{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9567084078711986, "global_step": 8022, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.936507936507937e-08, "loss": 1.2868, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.5873015873015874e-07, "loss": 1.365, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.3809523809523811e-07, "loss": 1.3393, "step": 3 }, { "epoch": 0.0, "learning_rate": 3.174603174603175e-07, "loss": 1.3114, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.9682539682539683e-07, "loss": 1.3627, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.7619047619047623e-07, "loss": 1.3527, "step": 6 }, { "epoch": 0.0, "learning_rate": 5.555555555555555e-07, "loss": 1.2243, "step": 7 }, { "epoch": 0.0, "learning_rate": 6.34920634920635e-07, "loss": 1.3605, "step": 8 }, { "epoch": 0.0, "learning_rate": 7.142857142857143e-07, "loss": 1.3415, "step": 9 }, { "epoch": 0.0, "learning_rate": 7.936507936507937e-07, "loss": 1.3203, "step": 10 }, { "epoch": 0.0, "learning_rate": 8.73015873015873e-07, "loss": 1.3125, "step": 11 }, { "epoch": 0.0, "learning_rate": 9.523809523809525e-07, "loss": 1.2333, "step": 12 }, { "epoch": 0.0, "learning_rate": 1.0317460317460317e-06, "loss": 1.3248, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.111111111111111e-06, "loss": 1.2656, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.1904761904761906e-06, "loss": 1.2556, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.26984126984127e-06, "loss": 1.2377, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.3492063492063493e-06, "loss": 1.2355, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.4285714285714286e-06, "loss": 1.154, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.507936507936508e-06, "loss": 1.2076, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.5873015873015873e-06, "loss": 1.1004, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.6666666666666667e-06, "loss": 1.1574, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.746031746031746e-06, "loss": 1.0882, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.8253968253968254e-06, "loss": 1.1384, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.904761904761905e-06, "loss": 1.1618, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.984126984126984e-06, "loss": 1.0815, "step": 25 }, { "epoch": 0.0, "learning_rate": 2.0634920634920634e-06, "loss": 1.096, "step": 26 }, { "epoch": 0.0, "learning_rate": 2.1428571428571427e-06, "loss": 1.1518, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.222222222222222e-06, "loss": 1.1473, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.301587301587302e-06, "loss": 1.1161, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.380952380952381e-06, "loss": 1.1412, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.4603174603174605e-06, "loss": 1.0357, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.53968253968254e-06, "loss": 1.077, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.6190476190476192e-06, "loss": 1.0776, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.6984126984126986e-06, "loss": 1.0619, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.7777777777777783e-06, "loss": 1.0279, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.8571428571428573e-06, "loss": 1.0558, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.936507936507937e-06, "loss": 1.0614, "step": 37 }, { "epoch": 0.0, "learning_rate": 3.015873015873016e-06, "loss": 1.0586, "step": 38 }, { "epoch": 0.0, "learning_rate": 3.0952380952380957e-06, "loss": 1.0324, "step": 39 }, { "epoch": 0.0, "learning_rate": 3.1746031746031746e-06, "loss": 1.0441, "step": 40 }, { "epoch": 0.0, "learning_rate": 3.2539682539682544e-06, "loss": 0.9286, "step": 41 }, { "epoch": 0.01, "learning_rate": 3.3333333333333333e-06, "loss": 0.9531, "step": 42 }, { "epoch": 0.01, "learning_rate": 3.412698412698413e-06, "loss": 0.9671, "step": 43 }, { "epoch": 0.01, "learning_rate": 3.492063492063492e-06, "loss": 1.0017, "step": 44 }, { "epoch": 0.01, "learning_rate": 3.5714285714285718e-06, "loss": 1.0179, "step": 45 }, { "epoch": 0.01, "learning_rate": 3.6507936507936507e-06, "loss": 1.0446, "step": 46 }, { "epoch": 0.01, "learning_rate": 3.7301587301587305e-06, "loss": 0.9609, "step": 47 }, { "epoch": 0.01, "learning_rate": 3.80952380952381e-06, "loss": 1.0045, "step": 48 }, { "epoch": 0.01, "learning_rate": 3.88888888888889e-06, "loss": 1.0017, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.968253968253968e-06, "loss": 0.986, "step": 50 }, { "epoch": 0.01, "learning_rate": 4.047619047619048e-06, "loss": 1.0033, "step": 51 }, { "epoch": 0.01, "learning_rate": 4.126984126984127e-06, "loss": 0.9381, "step": 52 }, { "epoch": 0.01, "learning_rate": 4.206349206349207e-06, "loss": 0.9157, "step": 53 }, { "epoch": 0.01, "learning_rate": 4.2857142857142855e-06, "loss": 0.9922, "step": 54 }, { "epoch": 0.01, "learning_rate": 4.365079365079366e-06, "loss": 0.9157, "step": 55 }, { "epoch": 0.01, "learning_rate": 4.444444444444444e-06, "loss": 0.981, "step": 56 }, { "epoch": 0.01, "learning_rate": 4.523809523809524e-06, "loss": 0.9392, "step": 57 }, { "epoch": 0.01, "learning_rate": 4.603174603174604e-06, "loss": 0.9559, "step": 58 }, { "epoch": 0.01, "learning_rate": 4.682539682539683e-06, "loss": 0.9671, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.761904761904762e-06, "loss": 0.9381, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.841269841269842e-06, "loss": 0.9704, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.920634920634921e-06, "loss": 0.933, "step": 62 }, { "epoch": 0.01, "learning_rate": 5e-06, "loss": 0.947, "step": 63 }, { "epoch": 0.01, "learning_rate": 5.07936507936508e-06, "loss": 0.9286, "step": 64 }, { "epoch": 0.01, "learning_rate": 5.15873015873016e-06, "loss": 0.9007, "step": 65 }, { "epoch": 0.01, "learning_rate": 5.2380952380952384e-06, "loss": 0.9548, "step": 66 }, { "epoch": 0.01, "learning_rate": 5.317460317460318e-06, "loss": 1.0039, "step": 67 }, { "epoch": 0.01, "learning_rate": 5.396825396825397e-06, "loss": 0.9347, "step": 68 }, { "epoch": 0.01, "learning_rate": 5.476190476190477e-06, "loss": 0.9743, "step": 69 }, { "epoch": 0.01, "learning_rate": 5.555555555555557e-06, "loss": 0.923, "step": 70 }, { "epoch": 0.01, "learning_rate": 5.634920634920635e-06, "loss": 0.918, "step": 71 }, { "epoch": 0.01, "learning_rate": 5.7142857142857145e-06, "loss": 0.9598, "step": 72 }, { "epoch": 0.01, "learning_rate": 5.793650793650795e-06, "loss": 0.9308, "step": 73 }, { "epoch": 0.01, "learning_rate": 5.873015873015874e-06, "loss": 0.8884, "step": 74 }, { "epoch": 0.01, "learning_rate": 5.9523809523809525e-06, "loss": 0.9933, "step": 75 }, { "epoch": 0.01, "learning_rate": 6.031746031746032e-06, "loss": 0.9224, "step": 76 }, { "epoch": 0.01, "learning_rate": 6.111111111111112e-06, "loss": 0.9079, "step": 77 }, { "epoch": 0.01, "learning_rate": 6.1904761904761914e-06, "loss": 0.8795, "step": 78 }, { "epoch": 0.01, "learning_rate": 6.26984126984127e-06, "loss": 0.9369, "step": 79 }, { "epoch": 0.01, "learning_rate": 6.349206349206349e-06, "loss": 0.8951, "step": 80 }, { "epoch": 0.01, "learning_rate": 6.4285714285714295e-06, "loss": 0.9581, "step": 81 }, { "epoch": 0.01, "learning_rate": 6.507936507936509e-06, "loss": 0.8549, "step": 82 }, { "epoch": 0.01, "learning_rate": 6.587301587301588e-06, "loss": 0.9598, "step": 83 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-06, "loss": 0.9542, "step": 84 }, { "epoch": 0.01, "learning_rate": 6.746031746031747e-06, "loss": 0.986, "step": 85 }, { "epoch": 0.01, "learning_rate": 6.825396825396826e-06, "loss": 0.9263, "step": 86 }, { "epoch": 0.01, "learning_rate": 6.9047619047619055e-06, "loss": 0.8549, "step": 87 }, { "epoch": 0.01, "learning_rate": 6.984126984126984e-06, "loss": 0.9436, "step": 88 }, { "epoch": 0.01, "learning_rate": 7.063492063492064e-06, "loss": 0.9369, "step": 89 }, { "epoch": 0.01, "learning_rate": 7.1428571428571436e-06, "loss": 0.9715, "step": 90 }, { "epoch": 0.01, "learning_rate": 7.222222222222223e-06, "loss": 0.9141, "step": 91 }, { "epoch": 0.01, "learning_rate": 7.301587301587301e-06, "loss": 0.8929, "step": 92 }, { "epoch": 0.01, "learning_rate": 7.380952380952382e-06, "loss": 0.9325, "step": 93 }, { "epoch": 0.01, "learning_rate": 7.460317460317461e-06, "loss": 0.9051, "step": 94 }, { "epoch": 0.01, "learning_rate": 7.53968253968254e-06, "loss": 0.894, "step": 95 }, { "epoch": 0.01, "learning_rate": 7.61904761904762e-06, "loss": 0.9023, "step": 96 }, { "epoch": 0.01, "learning_rate": 7.698412698412699e-06, "loss": 0.9738, "step": 97 }, { "epoch": 0.01, "learning_rate": 7.77777777777778e-06, "loss": 0.9163, "step": 98 }, { "epoch": 0.01, "learning_rate": 7.857142857142858e-06, "loss": 0.981, "step": 99 }, { "epoch": 0.01, "learning_rate": 7.936507936507936e-06, "loss": 0.9453, "step": 100 }, { "epoch": 0.01, "learning_rate": 8.015873015873016e-06, "loss": 0.8884, "step": 101 }, { "epoch": 0.01, "learning_rate": 8.095238095238097e-06, "loss": 0.8689, "step": 102 }, { "epoch": 0.01, "learning_rate": 8.174603174603175e-06, "loss": 0.8092, "step": 103 }, { "epoch": 0.01, "learning_rate": 8.253968253968254e-06, "loss": 0.8605, "step": 104 }, { "epoch": 0.01, "learning_rate": 8.333333333333334e-06, "loss": 0.8555, "step": 105 }, { "epoch": 0.01, "learning_rate": 8.412698412698414e-06, "loss": 0.8828, "step": 106 }, { "epoch": 0.01, "learning_rate": 8.492063492063492e-06, "loss": 0.8488, "step": 107 }, { "epoch": 0.01, "learning_rate": 8.571428571428571e-06, "loss": 0.889, "step": 108 }, { "epoch": 0.01, "learning_rate": 8.650793650793651e-06, "loss": 0.918, "step": 109 }, { "epoch": 0.01, "learning_rate": 8.730158730158731e-06, "loss": 0.8945, "step": 110 }, { "epoch": 0.01, "learning_rate": 8.80952380952381e-06, "loss": 0.9118, "step": 111 }, { "epoch": 0.01, "learning_rate": 8.888888888888888e-06, "loss": 0.9068, "step": 112 }, { "epoch": 0.01, "learning_rate": 8.968253968253968e-06, "loss": 0.9286, "step": 113 }, { "epoch": 0.01, "learning_rate": 9.047619047619049e-06, "loss": 0.9208, "step": 114 }, { "epoch": 0.01, "learning_rate": 9.126984126984127e-06, "loss": 0.9637, "step": 115 }, { "epoch": 0.01, "learning_rate": 9.206349206349207e-06, "loss": 0.9079, "step": 116 }, { "epoch": 0.01, "learning_rate": 9.285714285714288e-06, "loss": 0.8739, "step": 117 }, { "epoch": 0.01, "learning_rate": 9.365079365079366e-06, "loss": 0.9241, "step": 118 }, { "epoch": 0.01, "learning_rate": 9.444444444444445e-06, "loss": 0.9269, "step": 119 }, { "epoch": 0.01, "learning_rate": 9.523809523809525e-06, "loss": 0.8929, "step": 120 }, { "epoch": 0.01, "learning_rate": 9.603174603174605e-06, "loss": 0.9609, "step": 121 }, { "epoch": 0.01, "learning_rate": 9.682539682539683e-06, "loss": 0.8644, "step": 122 }, { "epoch": 0.01, "learning_rate": 9.761904761904762e-06, "loss": 0.9063, "step": 123 }, { "epoch": 0.01, "learning_rate": 9.841269841269842e-06, "loss": 0.9118, "step": 124 }, { "epoch": 0.01, "learning_rate": 9.920634920634922e-06, "loss": 0.933, "step": 125 }, { "epoch": 0.02, "learning_rate": 1e-05, "loss": 0.8577, "step": 126 }, { "epoch": 0.02, "learning_rate": 1.007936507936508e-05, "loss": 0.9085, "step": 127 }, { "epoch": 0.02, "learning_rate": 1.015873015873016e-05, "loss": 0.9375, "step": 128 }, { "epoch": 0.02, "learning_rate": 1.0238095238095238e-05, "loss": 0.8756, "step": 129 }, { "epoch": 0.02, "learning_rate": 1.031746031746032e-05, "loss": 0.9157, "step": 130 }, { "epoch": 0.02, "learning_rate": 1.0396825396825398e-05, "loss": 0.9012, "step": 131 }, { "epoch": 0.02, "learning_rate": 1.0476190476190477e-05, "loss": 0.88, "step": 132 }, { "epoch": 0.02, "learning_rate": 1.0555555555555557e-05, "loss": 0.9174, "step": 133 }, { "epoch": 0.02, "learning_rate": 1.0634920634920636e-05, "loss": 0.9515, "step": 134 }, { "epoch": 0.02, "learning_rate": 1.0714285714285714e-05, "loss": 0.9085, "step": 135 }, { "epoch": 0.02, "learning_rate": 1.0793650793650794e-05, "loss": 0.9113, "step": 136 }, { "epoch": 0.02, "learning_rate": 1.0873015873015873e-05, "loss": 0.8884, "step": 137 }, { "epoch": 0.02, "learning_rate": 1.0952380952380955e-05, "loss": 0.8951, "step": 138 }, { "epoch": 0.02, "learning_rate": 1.1031746031746033e-05, "loss": 0.8817, "step": 139 }, { "epoch": 0.02, "learning_rate": 1.1111111111111113e-05, "loss": 0.8599, "step": 140 }, { "epoch": 0.02, "learning_rate": 1.1190476190476192e-05, "loss": 0.9414, "step": 141 }, { "epoch": 0.02, "learning_rate": 1.126984126984127e-05, "loss": 0.8711, "step": 142 }, { "epoch": 0.02, "learning_rate": 1.134920634920635e-05, "loss": 0.8588, "step": 143 }, { "epoch": 0.02, "learning_rate": 1.1428571428571429e-05, "loss": 0.8544, "step": 144 }, { "epoch": 0.02, "learning_rate": 1.1507936507936508e-05, "loss": 0.9286, "step": 145 }, { "epoch": 0.02, "learning_rate": 1.158730158730159e-05, "loss": 0.923, "step": 146 }, { "epoch": 0.02, "learning_rate": 1.1666666666666668e-05, "loss": 0.8968, "step": 147 }, { "epoch": 0.02, "learning_rate": 1.1746031746031748e-05, "loss": 0.9531, "step": 148 }, { "epoch": 0.02, "learning_rate": 1.1825396825396827e-05, "loss": 0.9375, "step": 149 }, { "epoch": 0.02, "learning_rate": 1.1904761904761905e-05, "loss": 0.9247, "step": 150 }, { "epoch": 0.02, "learning_rate": 1.1984126984126985e-05, "loss": 0.8744, "step": 151 }, { "epoch": 0.02, "learning_rate": 1.2063492063492064e-05, "loss": 0.9258, "step": 152 }, { "epoch": 0.02, "learning_rate": 1.2142857142857142e-05, "loss": 0.8527, "step": 153 }, { "epoch": 0.02, "learning_rate": 1.2222222222222224e-05, "loss": 0.947, "step": 154 }, { "epoch": 0.02, "learning_rate": 1.2301587301587303e-05, "loss": 0.9565, "step": 155 }, { "epoch": 0.02, "learning_rate": 1.2380952380952383e-05, "loss": 0.9403, "step": 156 }, { "epoch": 0.02, "learning_rate": 1.2460317460317461e-05, "loss": 0.87, "step": 157 }, { "epoch": 0.02, "learning_rate": 1.253968253968254e-05, "loss": 0.9001, "step": 158 }, { "epoch": 0.02, "learning_rate": 1.261904761904762e-05, "loss": 0.8432, "step": 159 }, { "epoch": 0.02, "learning_rate": 1.2698412698412699e-05, "loss": 0.9392, "step": 160 }, { "epoch": 0.02, "learning_rate": 1.2777777777777777e-05, "loss": 0.8655, "step": 161 }, { "epoch": 0.02, "learning_rate": 1.2857142857142859e-05, "loss": 0.8588, "step": 162 }, { "epoch": 0.02, "learning_rate": 1.2936507936507937e-05, "loss": 0.9369, "step": 163 }, { "epoch": 0.02, "learning_rate": 1.3015873015873018e-05, "loss": 0.9213, "step": 164 }, { "epoch": 0.02, "learning_rate": 1.3095238095238096e-05, "loss": 0.9542, "step": 165 }, { "epoch": 0.02, "learning_rate": 1.3174603174603176e-05, "loss": 0.9012, "step": 166 }, { "epoch": 0.02, "learning_rate": 1.3253968253968255e-05, "loss": 0.8845, "step": 167 }, { "epoch": 0.02, "learning_rate": 1.3333333333333333e-05, "loss": 0.8717, "step": 168 }, { "epoch": 0.02, "learning_rate": 1.3412698412698413e-05, "loss": 0.8923, "step": 169 }, { "epoch": 0.02, "learning_rate": 1.3492063492063494e-05, "loss": 0.846, "step": 170 }, { "epoch": 0.02, "learning_rate": 1.3571428571428574e-05, "loss": 0.875, "step": 171 }, { "epoch": 0.02, "learning_rate": 1.3650793650793652e-05, "loss": 0.9247, "step": 172 }, { "epoch": 0.02, "learning_rate": 1.3730158730158731e-05, "loss": 0.9135, "step": 173 }, { "epoch": 0.02, "learning_rate": 1.3809523809523811e-05, "loss": 0.8778, "step": 174 }, { "epoch": 0.02, "learning_rate": 1.388888888888889e-05, "loss": 0.9057, "step": 175 }, { "epoch": 0.02, "learning_rate": 1.3968253968253968e-05, "loss": 0.9604, "step": 176 }, { "epoch": 0.02, "learning_rate": 1.4047619047619048e-05, "loss": 0.8694, "step": 177 }, { "epoch": 0.02, "learning_rate": 1.4126984126984128e-05, "loss": 0.9587, "step": 178 }, { "epoch": 0.02, "learning_rate": 1.4206349206349209e-05, "loss": 0.9565, "step": 179 }, { "epoch": 0.02, "learning_rate": 1.4285714285714287e-05, "loss": 0.9029, "step": 180 }, { "epoch": 0.02, "learning_rate": 1.4365079365079366e-05, "loss": 0.8979, "step": 181 }, { "epoch": 0.02, "learning_rate": 1.4444444444444446e-05, "loss": 0.9364, "step": 182 }, { "epoch": 0.02, "learning_rate": 1.4523809523809524e-05, "loss": 0.889, "step": 183 }, { "epoch": 0.02, "learning_rate": 1.4603174603174603e-05, "loss": 0.8789, "step": 184 }, { "epoch": 0.02, "learning_rate": 1.4682539682539683e-05, "loss": 0.8789, "step": 185 }, { "epoch": 0.02, "learning_rate": 1.4761904761904763e-05, "loss": 0.9029, "step": 186 }, { "epoch": 0.02, "learning_rate": 1.4841269841269843e-05, "loss": 0.9001, "step": 187 }, { "epoch": 0.02, "learning_rate": 1.4920634920634922e-05, "loss": 0.9498, "step": 188 }, { "epoch": 0.02, "learning_rate": 1.5000000000000002e-05, "loss": 0.9208, "step": 189 }, { "epoch": 0.02, "learning_rate": 1.507936507936508e-05, "loss": 0.9096, "step": 190 }, { "epoch": 0.02, "learning_rate": 1.5158730158730159e-05, "loss": 0.8956, "step": 191 }, { "epoch": 0.02, "learning_rate": 1.523809523809524e-05, "loss": 0.9074, "step": 192 }, { "epoch": 0.02, "learning_rate": 1.531746031746032e-05, "loss": 0.8767, "step": 193 }, { "epoch": 0.02, "learning_rate": 1.5396825396825398e-05, "loss": 0.9074, "step": 194 }, { "epoch": 0.02, "learning_rate": 1.5476190476190476e-05, "loss": 0.9169, "step": 195 }, { "epoch": 0.02, "learning_rate": 1.555555555555556e-05, "loss": 0.8276, "step": 196 }, { "epoch": 0.02, "learning_rate": 1.5634920634920637e-05, "loss": 0.8945, "step": 197 }, { "epoch": 0.02, "learning_rate": 1.5714285714285715e-05, "loss": 0.8789, "step": 198 }, { "epoch": 0.02, "learning_rate": 1.5793650793650794e-05, "loss": 0.9325, "step": 199 }, { "epoch": 0.02, "learning_rate": 1.5873015873015872e-05, "loss": 0.846, "step": 200 }, { "epoch": 0.02, "learning_rate": 1.5952380952380954e-05, "loss": 0.8655, "step": 201 }, { "epoch": 0.02, "learning_rate": 1.6031746031746033e-05, "loss": 0.8683, "step": 202 }, { "epoch": 0.02, "learning_rate": 1.6111111111111115e-05, "loss": 0.8962, "step": 203 }, { "epoch": 0.02, "learning_rate": 1.6190476190476193e-05, "loss": 0.8633, "step": 204 }, { "epoch": 0.02, "learning_rate": 1.626984126984127e-05, "loss": 0.8382, "step": 205 }, { "epoch": 0.02, "learning_rate": 1.634920634920635e-05, "loss": 0.9152, "step": 206 }, { "epoch": 0.02, "learning_rate": 1.642857142857143e-05, "loss": 0.8583, "step": 207 }, { "epoch": 0.02, "learning_rate": 1.6507936507936507e-05, "loss": 0.8544, "step": 208 }, { "epoch": 0.02, "learning_rate": 1.658730158730159e-05, "loss": 0.928, "step": 209 }, { "epoch": 0.03, "learning_rate": 1.6666666666666667e-05, "loss": 0.904, "step": 210 }, { "epoch": 0.03, "learning_rate": 1.674603174603175e-05, "loss": 0.923, "step": 211 }, { "epoch": 0.03, "learning_rate": 1.6825396825396828e-05, "loss": 0.8783, "step": 212 }, { "epoch": 0.03, "learning_rate": 1.6904761904761906e-05, "loss": 0.9196, "step": 213 }, { "epoch": 0.03, "learning_rate": 1.6984126984126985e-05, "loss": 0.9141, "step": 214 }, { "epoch": 0.03, "learning_rate": 1.7063492063492063e-05, "loss": 0.875, "step": 215 }, { "epoch": 0.03, "learning_rate": 1.7142857142857142e-05, "loss": 0.9224, "step": 216 }, { "epoch": 0.03, "learning_rate": 1.7222222222222224e-05, "loss": 0.8839, "step": 217 }, { "epoch": 0.03, "learning_rate": 1.7301587301587302e-05, "loss": 0.8756, "step": 218 }, { "epoch": 0.03, "learning_rate": 1.7380952380952384e-05, "loss": 0.9269, "step": 219 }, { "epoch": 0.03, "learning_rate": 1.7460317460317463e-05, "loss": 0.8594, "step": 220 }, { "epoch": 0.03, "learning_rate": 1.753968253968254e-05, "loss": 0.8862, "step": 221 }, { "epoch": 0.03, "learning_rate": 1.761904761904762e-05, "loss": 0.8627, "step": 222 }, { "epoch": 0.03, "learning_rate": 1.7698412698412698e-05, "loss": 0.8984, "step": 223 }, { "epoch": 0.03, "learning_rate": 1.7777777777777777e-05, "loss": 0.8599, "step": 224 }, { "epoch": 0.03, "learning_rate": 1.785714285714286e-05, "loss": 0.9012, "step": 225 }, { "epoch": 0.03, "learning_rate": 1.7936507936507937e-05, "loss": 0.9576, "step": 226 }, { "epoch": 0.03, "learning_rate": 1.801587301587302e-05, "loss": 0.8739, "step": 227 }, { "epoch": 0.03, "learning_rate": 1.8095238095238097e-05, "loss": 0.9074, "step": 228 }, { "epoch": 0.03, "learning_rate": 1.8174603174603176e-05, "loss": 0.9157, "step": 229 }, { "epoch": 0.03, "learning_rate": 1.8253968253968254e-05, "loss": 0.9012, "step": 230 }, { "epoch": 0.03, "learning_rate": 1.8333333333333333e-05, "loss": 0.9001, "step": 231 }, { "epoch": 0.03, "learning_rate": 1.8412698412698415e-05, "loss": 0.8376, "step": 232 }, { "epoch": 0.03, "learning_rate": 1.8492063492063493e-05, "loss": 0.9113, "step": 233 }, { "epoch": 0.03, "learning_rate": 1.8571428571428575e-05, "loss": 0.8398, "step": 234 }, { "epoch": 0.03, "learning_rate": 1.8650793650793654e-05, "loss": 0.9085, "step": 235 }, { "epoch": 0.03, "learning_rate": 1.8730158730158732e-05, "loss": 0.8973, "step": 236 }, { "epoch": 0.03, "learning_rate": 1.880952380952381e-05, "loss": 0.909, "step": 237 }, { "epoch": 0.03, "learning_rate": 1.888888888888889e-05, "loss": 0.923, "step": 238 }, { "epoch": 0.03, "learning_rate": 1.8968253968253968e-05, "loss": 0.8694, "step": 239 }, { "epoch": 0.03, "learning_rate": 1.904761904761905e-05, "loss": 0.9102, "step": 240 }, { "epoch": 0.03, "learning_rate": 1.9126984126984128e-05, "loss": 0.9481, "step": 241 }, { "epoch": 0.03, "learning_rate": 1.920634920634921e-05, "loss": 0.8544, "step": 242 }, { "epoch": 0.03, "learning_rate": 1.928571428571429e-05, "loss": 0.8979, "step": 243 }, { "epoch": 0.03, "learning_rate": 1.9365079365079367e-05, "loss": 0.8795, "step": 244 }, { "epoch": 0.03, "learning_rate": 1.9444444444444445e-05, "loss": 0.9023, "step": 245 }, { "epoch": 0.03, "learning_rate": 1.9523809523809524e-05, "loss": 0.9336, "step": 246 }, { "epoch": 0.03, "learning_rate": 1.9603174603174602e-05, "loss": 0.9191, "step": 247 }, { "epoch": 0.03, "learning_rate": 1.9682539682539684e-05, "loss": 0.9325, "step": 248 }, { "epoch": 0.03, "learning_rate": 1.9761904761904763e-05, "loss": 0.8772, "step": 249 }, { "epoch": 0.03, "learning_rate": 1.9841269841269845e-05, "loss": 0.9414, "step": 250 }, { "epoch": 0.03, "learning_rate": 1.9920634920634923e-05, "loss": 0.923, "step": 251 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 0.8477, "step": 252 }, { "epoch": 0.03, "learning_rate": 1.9999999253949546e-05, "loss": 0.8956, "step": 253 }, { "epoch": 0.03, "learning_rate": 1.9999997015798293e-05, "loss": 0.8739, "step": 254 }, { "epoch": 0.03, "learning_rate": 1.9999993285546573e-05, "loss": 0.8655, "step": 255 }, { "epoch": 0.03, "learning_rate": 1.9999988063194945e-05, "loss": 1.0, "step": 256 }, { "epoch": 0.03, "learning_rate": 1.9999981348744186e-05, "loss": 0.9459, "step": 257 }, { "epoch": 0.03, "learning_rate": 1.99999731421953e-05, "loss": 0.8661, "step": 258 }, { "epoch": 0.03, "learning_rate": 1.999996344354951e-05, "loss": 0.8532, "step": 259 }, { "epoch": 0.03, "learning_rate": 1.999995225280827e-05, "loss": 0.9682, "step": 260 }, { "epoch": 0.03, "learning_rate": 1.9999939569973235e-05, "loss": 0.9308, "step": 261 }, { "epoch": 0.03, "learning_rate": 1.9999925395046314e-05, "loss": 0.8761, "step": 262 }, { "epoch": 0.03, "learning_rate": 1.999990972802961e-05, "loss": 0.9347, "step": 263 }, { "epoch": 0.03, "learning_rate": 1.9999892568925467e-05, "loss": 0.9074, "step": 264 }, { "epoch": 0.03, "learning_rate": 1.999987391773644e-05, "loss": 0.9531, "step": 265 }, { "epoch": 0.03, "learning_rate": 1.999985377446532e-05, "loss": 0.8783, "step": 266 }, { "epoch": 0.03, "learning_rate": 1.9999832139115104e-05, "loss": 0.8884, "step": 267 }, { "epoch": 0.03, "learning_rate": 1.9999809011689027e-05, "loss": 0.9074, "step": 268 }, { "epoch": 0.03, "learning_rate": 1.9999784392190533e-05, "loss": 0.9286, "step": 269 }, { "epoch": 0.03, "learning_rate": 1.9999758280623303e-05, "loss": 0.9291, "step": 270 }, { "epoch": 0.03, "learning_rate": 1.999973067699123e-05, "loss": 0.9157, "step": 271 }, { "epoch": 0.03, "learning_rate": 1.999970158129843e-05, "loss": 0.8984, "step": 272 }, { "epoch": 0.03, "learning_rate": 1.9999670993549246e-05, "loss": 0.851, "step": 273 }, { "epoch": 0.03, "learning_rate": 1.9999638913748242e-05, "loss": 0.8828, "step": 274 }, { "epoch": 0.03, "learning_rate": 1.9999605341900205e-05, "loss": 0.8856, "step": 275 }, { "epoch": 0.03, "learning_rate": 1.9999570278010147e-05, "loss": 0.9213, "step": 276 }, { "epoch": 0.03, "learning_rate": 1.9999533722083296e-05, "loss": 0.928, "step": 277 }, { "epoch": 0.03, "learning_rate": 1.999949567412511e-05, "loss": 0.8142, "step": 278 }, { "epoch": 0.03, "learning_rate": 1.999945613414126e-05, "loss": 0.9235, "step": 279 }, { "epoch": 0.03, "learning_rate": 1.9999415102137653e-05, "loss": 0.9063, "step": 280 }, { "epoch": 0.03, "learning_rate": 1.9999372578120407e-05, "loss": 0.8666, "step": 281 }, { "epoch": 0.03, "learning_rate": 1.9999328562095868e-05, "loss": 0.9715, "step": 282 }, { "epoch": 0.03, "learning_rate": 1.9999283054070603e-05, "loss": 0.8811, "step": 283 }, { "epoch": 0.03, "learning_rate": 1.9999236054051407e-05, "loss": 0.8945, "step": 284 }, { "epoch": 0.03, "learning_rate": 1.9999187562045284e-05, "loss": 0.8711, "step": 285 }, { "epoch": 0.03, "learning_rate": 1.999913757805948e-05, "loss": 0.8845, "step": 286 }, { "epoch": 0.03, "learning_rate": 1.999908610210144e-05, "loss": 0.8767, "step": 287 }, { "epoch": 0.03, "learning_rate": 1.9999033134178858e-05, "loss": 0.9358, "step": 288 }, { "epoch": 0.03, "learning_rate": 1.999897867429963e-05, "loss": 0.9141, "step": 289 }, { "epoch": 0.03, "learning_rate": 1.9998922722471883e-05, "loss": 0.8404, "step": 290 }, { "epoch": 0.03, "learning_rate": 1.9998865278703967e-05, "loss": 0.9051, "step": 291 }, { "epoch": 0.03, "learning_rate": 1.9998806343004453e-05, "loss": 0.8722, "step": 292 }, { "epoch": 0.03, "learning_rate": 1.999874591538213e-05, "loss": 0.9743, "step": 293 }, { "epoch": 0.04, "learning_rate": 1.9998683995846023e-05, "loss": 0.9688, "step": 294 }, { "epoch": 0.04, "learning_rate": 1.9998620584405367e-05, "loss": 0.856, "step": 295 }, { "epoch": 0.04, "learning_rate": 1.999855568106962e-05, "loss": 0.8326, "step": 296 }, { "epoch": 0.04, "learning_rate": 1.999848928584847e-05, "loss": 0.8811, "step": 297 }, { "epoch": 0.04, "learning_rate": 1.9998421398751824e-05, "loss": 0.9118, "step": 298 }, { "epoch": 0.04, "learning_rate": 1.9998352019789814e-05, "loss": 0.8772, "step": 299 }, { "epoch": 0.04, "learning_rate": 1.9998281148972786e-05, "loss": 0.9079, "step": 300 }, { "epoch": 0.04, "learning_rate": 1.9998208786311316e-05, "loss": 0.9548, "step": 301 }, { "epoch": 0.04, "learning_rate": 1.9998134931816202e-05, "loss": 0.9364, "step": 302 }, { "epoch": 0.04, "learning_rate": 1.9998059585498466e-05, "loss": 0.9012, "step": 303 }, { "epoch": 0.04, "learning_rate": 1.9997982747369348e-05, "loss": 0.8884, "step": 304 }, { "epoch": 0.04, "learning_rate": 1.9997904417440318e-05, "loss": 0.9007, "step": 305 }, { "epoch": 0.04, "learning_rate": 1.9997824595723055e-05, "loss": 0.827, "step": 306 }, { "epoch": 0.04, "learning_rate": 1.9997743282229475e-05, "loss": 0.8705, "step": 307 }, { "epoch": 0.04, "learning_rate": 1.999766047697171e-05, "loss": 0.8689, "step": 308 }, { "epoch": 0.04, "learning_rate": 1.9997576179962115e-05, "loss": 0.909, "step": 309 }, { "epoch": 0.04, "learning_rate": 1.999749039121327e-05, "loss": 0.8739, "step": 310 }, { "epoch": 0.04, "learning_rate": 1.9997403110737968e-05, "loss": 0.8895, "step": 311 }, { "epoch": 0.04, "learning_rate": 1.9997314338549244e-05, "loss": 0.9213, "step": 312 }, { "epoch": 0.04, "learning_rate": 1.9997224074660335e-05, "loss": 0.861, "step": 313 }, { "epoch": 0.04, "learning_rate": 1.9997132319084707e-05, "loss": 0.8733, "step": 314 }, { "epoch": 0.04, "learning_rate": 1.999703907183606e-05, "loss": 0.9247, "step": 315 }, { "epoch": 0.04, "learning_rate": 1.99969443329283e-05, "loss": 0.9063, "step": 316 }, { "epoch": 0.04, "learning_rate": 1.999684810237557e-05, "loss": 0.8968, "step": 317 }, { "epoch": 0.04, "learning_rate": 1.999675038019222e-05, "loss": 0.9191, "step": 318 }, { "epoch": 0.04, "learning_rate": 1.999665116639284e-05, "loss": 0.9314, "step": 319 }, { "epoch": 0.04, "learning_rate": 1.9996550460992224e-05, "loss": 0.8811, "step": 320 }, { "epoch": 0.04, "learning_rate": 1.999644826400541e-05, "loss": 0.8644, "step": 321 }, { "epoch": 0.04, "learning_rate": 1.9996344575447636e-05, "loss": 0.8689, "step": 322 }, { "epoch": 0.04, "learning_rate": 1.9996239395334376e-05, "loss": 0.9035, "step": 323 }, { "epoch": 0.04, "learning_rate": 1.999613272368133e-05, "loss": 0.8878, "step": 324 }, { "epoch": 0.04, "learning_rate": 1.9996024560504407e-05, "loss": 0.9085, "step": 325 }, { "epoch": 0.04, "learning_rate": 1.9995914905819752e-05, "loss": 0.8666, "step": 326 }, { "epoch": 0.04, "learning_rate": 1.9995803759643722e-05, "loss": 0.8984, "step": 327 }, { "epoch": 0.04, "learning_rate": 1.99956911219929e-05, "loss": 0.9559, "step": 328 }, { "epoch": 0.04, "learning_rate": 1.99955769928841e-05, "loss": 0.9174, "step": 329 }, { "epoch": 0.04, "learning_rate": 1.9995461372334347e-05, "loss": 0.9302, "step": 330 }, { "epoch": 0.04, "learning_rate": 1.999534426036089e-05, "loss": 0.9146, "step": 331 }, { "epoch": 0.04, "learning_rate": 1.9995225656981207e-05, "loss": 0.8867, "step": 332 }, { "epoch": 0.04, "learning_rate": 1.9995105562212994e-05, "loss": 0.8761, "step": 333 }, { "epoch": 0.04, "learning_rate": 1.999498397607417e-05, "loss": 0.9224, "step": 334 }, { "epoch": 0.04, "learning_rate": 1.9994860898582872e-05, "loss": 0.9029, "step": 335 }, { "epoch": 0.04, "learning_rate": 1.9994736329757477e-05, "loss": 0.8767, "step": 336 }, { "epoch": 0.04, "learning_rate": 1.9994610269616558e-05, "loss": 0.9269, "step": 337 }, { "epoch": 0.04, "learning_rate": 1.9994482718178935e-05, "loss": 0.8594, "step": 338 }, { "epoch": 0.04, "learning_rate": 1.9994353675463633e-05, "loss": 0.8627, "step": 339 }, { "epoch": 0.04, "learning_rate": 1.999422314148991e-05, "loss": 0.904, "step": 340 }, { "epoch": 0.04, "learning_rate": 1.9994091116277245e-05, "loss": 0.9007, "step": 341 }, { "epoch": 0.04, "learning_rate": 1.999395759984533e-05, "loss": 0.8482, "step": 342 }, { "epoch": 0.04, "learning_rate": 1.999382259221409e-05, "loss": 0.8973, "step": 343 }, { "epoch": 0.04, "learning_rate": 1.9993686093403678e-05, "loss": 0.8538, "step": 344 }, { "epoch": 0.04, "learning_rate": 1.9993548103434448e-05, "loss": 0.9169, "step": 345 }, { "epoch": 0.04, "learning_rate": 1.9993408622327e-05, "loss": 0.8594, "step": 346 }, { "epoch": 0.04, "learning_rate": 1.999326765010214e-05, "loss": 0.8449, "step": 347 }, { "epoch": 0.04, "learning_rate": 1.99931251867809e-05, "loss": 0.9118, "step": 348 }, { "epoch": 0.04, "learning_rate": 1.9992981232384547e-05, "loss": 0.9609, "step": 349 }, { "epoch": 0.04, "learning_rate": 1.9992835786934552e-05, "loss": 0.8622, "step": 350 }, { "epoch": 0.04, "learning_rate": 1.999268885045262e-05, "loss": 0.9118, "step": 351 }, { "epoch": 0.04, "learning_rate": 1.9992540422960672e-05, "loss": 0.8672, "step": 352 }, { "epoch": 0.04, "learning_rate": 1.999239050448086e-05, "loss": 0.8415, "step": 353 }, { "epoch": 0.04, "learning_rate": 1.999223909503555e-05, "loss": 0.9202, "step": 354 }, { "epoch": 0.04, "learning_rate": 1.9992086194647337e-05, "loss": 0.8789, "step": 355 }, { "epoch": 0.04, "learning_rate": 1.999193180333903e-05, "loss": 0.8906, "step": 356 }, { "epoch": 0.04, "learning_rate": 1.9991775921133672e-05, "loss": 0.9314, "step": 357 }, { "epoch": 0.04, "learning_rate": 1.9991618548054518e-05, "loss": 0.9286, "step": 358 }, { "epoch": 0.04, "learning_rate": 1.999145968412505e-05, "loss": 0.9057, "step": 359 }, { "epoch": 0.04, "learning_rate": 1.9991299329368972e-05, "loss": 0.9163, "step": 360 }, { "epoch": 0.04, "learning_rate": 1.9991137483810214e-05, "loss": 0.8845, "step": 361 }, { "epoch": 0.04, "learning_rate": 1.999097414747292e-05, "loss": 0.9035, "step": 362 }, { "epoch": 0.04, "learning_rate": 1.9990809320381464e-05, "loss": 0.9408, "step": 363 }, { "epoch": 0.04, "learning_rate": 1.999064300256044e-05, "loss": 0.87, "step": 364 }, { "epoch": 0.04, "learning_rate": 1.999047519403466e-05, "loss": 0.8398, "step": 365 }, { "epoch": 0.04, "learning_rate": 1.9990305894829174e-05, "loss": 0.933, "step": 366 }, { "epoch": 0.04, "learning_rate": 1.999013510496923e-05, "loss": 0.8895, "step": 367 }, { "epoch": 0.04, "learning_rate": 1.9989962824480322e-05, "loss": 0.8962, "step": 368 }, { "epoch": 0.04, "learning_rate": 1.9989789053388147e-05, "loss": 0.9258, "step": 369 }, { "epoch": 0.04, "learning_rate": 1.998961379171864e-05, "loss": 0.904, "step": 370 }, { "epoch": 0.04, "learning_rate": 1.9989437039497953e-05, "loss": 0.8633, "step": 371 }, { "epoch": 0.04, "learning_rate": 1.9989258796752452e-05, "loss": 0.933, "step": 372 }, { "epoch": 0.04, "learning_rate": 1.9989079063508735e-05, "loss": 0.8867, "step": 373 }, { "epoch": 0.04, "learning_rate": 1.998889783979362e-05, "loss": 0.9224, "step": 374 }, { "epoch": 0.04, "learning_rate": 1.9988715125634154e-05, "loss": 0.8912, "step": 375 }, { "epoch": 0.04, "learning_rate": 1.998853092105759e-05, "loss": 0.8655, "step": 376 }, { "epoch": 0.04, "learning_rate": 1.9988345226091423e-05, "loss": 0.8549, "step": 377 }, { "epoch": 0.05, "learning_rate": 1.9988158040763353e-05, "loss": 0.8365, "step": 378 }, { "epoch": 0.05, "learning_rate": 1.998796936510131e-05, "loss": 0.856, "step": 379 }, { "epoch": 0.05, "learning_rate": 1.9987779199133452e-05, "loss": 0.8945, "step": 380 }, { "epoch": 0.05, "learning_rate": 1.998758754288815e-05, "loss": 0.8856, "step": 381 }, { "epoch": 0.05, "learning_rate": 1.9987394396394e-05, "loss": 0.9314, "step": 382 }, { "epoch": 0.05, "learning_rate": 1.998719975967982e-05, "loss": 0.8359, "step": 383 }, { "epoch": 0.05, "learning_rate": 1.998700363277466e-05, "loss": 0.8343, "step": 384 }, { "epoch": 0.05, "learning_rate": 1.9986806015707775e-05, "loss": 0.8717, "step": 385 }, { "epoch": 0.05, "learning_rate": 1.9986606908508656e-05, "loss": 0.928, "step": 386 }, { "epoch": 0.05, "learning_rate": 1.9986406311207012e-05, "loss": 0.9068, "step": 387 }, { "epoch": 0.05, "learning_rate": 1.9986204223832772e-05, "loss": 0.8136, "step": 388 }, { "epoch": 0.05, "learning_rate": 1.9986000646416092e-05, "loss": 0.9464, "step": 389 }, { "epoch": 0.05, "learning_rate": 1.9985795578987342e-05, "loss": 0.8426, "step": 390 }, { "epoch": 0.05, "learning_rate": 1.9985589021577128e-05, "loss": 0.957, "step": 391 }, { "epoch": 0.05, "learning_rate": 1.9985380974216268e-05, "loss": 0.8856, "step": 392 }, { "epoch": 0.05, "learning_rate": 1.99851714369358e-05, "loss": 0.8538, "step": 393 }, { "epoch": 0.05, "learning_rate": 1.9984960409766994e-05, "loss": 0.9018, "step": 394 }, { "epoch": 0.05, "learning_rate": 1.9984747892741336e-05, "loss": 0.8521, "step": 395 }, { "epoch": 0.05, "learning_rate": 1.9984533885890538e-05, "loss": 0.8722, "step": 396 }, { "epoch": 0.05, "learning_rate": 1.9984318389246527e-05, "loss": 0.8884, "step": 397 }, { "epoch": 0.05, "learning_rate": 1.998410140284146e-05, "loss": 0.8438, "step": 398 }, { "epoch": 0.05, "learning_rate": 1.9983882926707717e-05, "loss": 0.8521, "step": 399 }, { "epoch": 0.05, "learning_rate": 1.998366296087789e-05, "loss": 0.8895, "step": 400 }, { "epoch": 0.05, "learning_rate": 1.9983441505384808e-05, "loss": 0.904, "step": 401 }, { "epoch": 0.05, "learning_rate": 1.9983218560261504e-05, "loss": 0.8627, "step": 402 }, { "epoch": 0.05, "learning_rate": 1.9982994125541252e-05, "loss": 0.8945, "step": 403 }, { "epoch": 0.05, "learning_rate": 1.998276820125754e-05, "loss": 0.8873, "step": 404 }, { "epoch": 0.05, "learning_rate": 1.9982540787444074e-05, "loss": 0.8337, "step": 405 }, { "epoch": 0.05, "learning_rate": 1.998231188413479e-05, "loss": 0.9247, "step": 406 }, { "epoch": 0.05, "learning_rate": 1.9982081491363837e-05, "loss": 0.8906, "step": 407 }, { "epoch": 0.05, "learning_rate": 1.9981849609165597e-05, "loss": 0.899, "step": 408 }, { "epoch": 0.05, "learning_rate": 1.998161623757467e-05, "loss": 0.9068, "step": 409 }, { "epoch": 0.05, "learning_rate": 1.998138137662587e-05, "loss": 0.899, "step": 410 }, { "epoch": 0.05, "learning_rate": 1.9981145026354252e-05, "loss": 0.8365, "step": 411 }, { "epoch": 0.05, "learning_rate": 1.9980907186795074e-05, "loss": 0.8906, "step": 412 }, { "epoch": 0.05, "learning_rate": 1.9980667857983826e-05, "loss": 0.9113, "step": 413 }, { "epoch": 0.05, "learning_rate": 1.9980427039956218e-05, "loss": 0.9403, "step": 414 }, { "epoch": 0.05, "learning_rate": 1.9980184732748184e-05, "loss": 0.9018, "step": 415 }, { "epoch": 0.05, "learning_rate": 1.9979940936395873e-05, "loss": 0.8655, "step": 416 }, { "epoch": 0.05, "learning_rate": 1.997969565093567e-05, "loss": 0.8438, "step": 417 }, { "epoch": 0.05, "learning_rate": 1.997944887640417e-05, "loss": 0.889, "step": 418 }, { "epoch": 0.05, "learning_rate": 1.9979200612838193e-05, "loss": 0.9135, "step": 419 }, { "epoch": 0.05, "learning_rate": 1.9978950860274782e-05, "loss": 0.9129, "step": 420 }, { "epoch": 0.05, "learning_rate": 1.9978699618751208e-05, "loss": 0.8806, "step": 421 }, { "epoch": 0.05, "learning_rate": 1.9978446888304954e-05, "loss": 0.8627, "step": 422 }, { "epoch": 0.05, "learning_rate": 1.9978192668973733e-05, "loss": 0.8929, "step": 423 }, { "epoch": 0.05, "learning_rate": 1.997793696079547e-05, "loss": 0.8527, "step": 424 }, { "epoch": 0.05, "learning_rate": 1.9977679763808334e-05, "loss": 0.8984, "step": 425 }, { "epoch": 0.05, "learning_rate": 1.997742107805068e-05, "loss": 0.9079, "step": 426 }, { "epoch": 0.05, "learning_rate": 1.997716090356113e-05, "loss": 0.87, "step": 427 }, { "epoch": 0.05, "learning_rate": 1.997689924037849e-05, "loss": 0.8906, "step": 428 }, { "epoch": 0.05, "learning_rate": 1.9976636088541804e-05, "loss": 0.8175, "step": 429 }, { "epoch": 0.05, "learning_rate": 1.9976371448090334e-05, "loss": 0.8521, "step": 430 }, { "epoch": 0.05, "learning_rate": 1.997610531906358e-05, "loss": 0.8616, "step": 431 }, { "epoch": 0.05, "learning_rate": 1.997583770150124e-05, "loss": 0.894, "step": 432 }, { "epoch": 0.05, "learning_rate": 1.9975568595443245e-05, "loss": 0.9799, "step": 433 }, { "epoch": 0.05, "learning_rate": 1.9975298000929757e-05, "loss": 0.8705, "step": 434 }, { "epoch": 0.05, "learning_rate": 1.997502591800114e-05, "loss": 0.8371, "step": 435 }, { "epoch": 0.05, "learning_rate": 1.9974752346698005e-05, "loss": 0.9012, "step": 436 }, { "epoch": 0.05, "learning_rate": 1.9974477287061157e-05, "loss": 0.8956, "step": 437 }, { "epoch": 0.05, "learning_rate": 1.9974200739131652e-05, "loss": 0.7813, "step": 438 }, { "epoch": 0.05, "learning_rate": 1.997392270295074e-05, "loss": 0.933, "step": 439 }, { "epoch": 0.05, "learning_rate": 1.9973643178559914e-05, "loss": 0.832, "step": 440 }, { "epoch": 0.05, "learning_rate": 1.9973362166000887e-05, "loss": 0.8717, "step": 441 }, { "epoch": 0.05, "learning_rate": 1.9973079665315577e-05, "loss": 0.8521, "step": 442 }, { "epoch": 0.05, "learning_rate": 1.9972795676546146e-05, "loss": 0.8878, "step": 443 }, { "epoch": 0.05, "learning_rate": 1.9972510199734963e-05, "loss": 0.8532, "step": 444 }, { "epoch": 0.05, "learning_rate": 1.9972223234924623e-05, "loss": 0.9129, "step": 445 }, { "epoch": 0.05, "learning_rate": 1.997193478215795e-05, "loss": 0.8756, "step": 446 }, { "epoch": 0.05, "learning_rate": 1.9971644841477977e-05, "loss": 0.8839, "step": 447 }, { "epoch": 0.05, "learning_rate": 1.997135341292797e-05, "loss": 0.9118, "step": 448 }, { "epoch": 0.05, "learning_rate": 1.997106049655141e-05, "loss": 0.942, "step": 449 }, { "epoch": 0.05, "learning_rate": 1.9970766092392008e-05, "loss": 0.9872, "step": 450 }, { "epoch": 0.05, "learning_rate": 1.9970470200493694e-05, "loss": 0.8599, "step": 451 }, { "epoch": 0.05, "learning_rate": 1.9970172820900606e-05, "loss": 0.8594, "step": 452 }, { "epoch": 0.05, "learning_rate": 1.9969873953657125e-05, "loss": 0.8343, "step": 453 }, { "epoch": 0.05, "learning_rate": 1.9969573598807847e-05, "loss": 0.9314, "step": 454 }, { "epoch": 0.05, "learning_rate": 1.9969271756397582e-05, "loss": 0.9688, "step": 455 }, { "epoch": 0.05, "learning_rate": 1.9968968426471372e-05, "loss": 0.8862, "step": 456 }, { "epoch": 0.05, "learning_rate": 1.9968663609074473e-05, "loss": 0.8449, "step": 457 }, { "epoch": 0.05, "learning_rate": 1.9968357304252374e-05, "loss": 0.8655, "step": 458 }, { "epoch": 0.05, "learning_rate": 1.996804951205077e-05, "loss": 0.8482, "step": 459 }, { "epoch": 0.05, "learning_rate": 1.996774023251559e-05, "loss": 0.9051, "step": 460 }, { "epoch": 0.05, "learning_rate": 1.9967429465692986e-05, "loss": 0.9023, "step": 461 }, { "epoch": 0.06, "learning_rate": 1.9967117211629322e-05, "loss": 0.8968, "step": 462 }, { "epoch": 0.06, "learning_rate": 1.9966803470371187e-05, "loss": 0.8666, "step": 463 }, { "epoch": 0.06, "learning_rate": 1.9966488241965403e-05, "loss": 0.8767, "step": 464 }, { "epoch": 0.06, "learning_rate": 1.9966171526459003e-05, "loss": 0.8365, "step": 465 }, { "epoch": 0.06, "learning_rate": 1.996585332389924e-05, "loss": 0.9046, "step": 466 }, { "epoch": 0.06, "learning_rate": 1.9965533634333597e-05, "loss": 0.9085, "step": 467 }, { "epoch": 0.06, "learning_rate": 1.9965212457809767e-05, "loss": 0.8834, "step": 468 }, { "epoch": 0.06, "learning_rate": 1.9964889794375683e-05, "loss": 0.8627, "step": 469 }, { "epoch": 0.06, "learning_rate": 1.996456564407949e-05, "loss": 0.8566, "step": 470 }, { "epoch": 0.06, "learning_rate": 1.9964240006969543e-05, "loss": 0.8465, "step": 471 }, { "epoch": 0.06, "learning_rate": 1.996391288309444e-05, "loss": 0.8867, "step": 472 }, { "epoch": 0.06, "learning_rate": 1.9963584272502987e-05, "loss": 0.8655, "step": 473 }, { "epoch": 0.06, "learning_rate": 1.996325417524422e-05, "loss": 0.8878, "step": 474 }, { "epoch": 0.06, "learning_rate": 1.9962922591367387e-05, "loss": 0.8594, "step": 475 }, { "epoch": 0.06, "learning_rate": 1.996258952092197e-05, "loss": 0.8292, "step": 476 }, { "epoch": 0.06, "learning_rate": 1.9962254963957658e-05, "loss": 0.8756, "step": 477 }, { "epoch": 0.06, "learning_rate": 1.9961918920524384e-05, "loss": 0.9007, "step": 478 }, { "epoch": 0.06, "learning_rate": 1.9961581390672277e-05, "loss": 0.8627, "step": 479 }, { "epoch": 0.06, "learning_rate": 1.9961242374451703e-05, "loss": 0.8432, "step": 480 }, { "epoch": 0.06, "learning_rate": 1.9960901871913246e-05, "loss": 0.9358, "step": 481 }, { "epoch": 0.06, "learning_rate": 1.996055988310772e-05, "loss": 0.8711, "step": 482 }, { "epoch": 0.06, "learning_rate": 1.996021640808614e-05, "loss": 0.8404, "step": 483 }, { "epoch": 0.06, "learning_rate": 1.9959871446899766e-05, "loss": 0.9163, "step": 484 }, { "epoch": 0.06, "learning_rate": 1.9959524999600064e-05, "loss": 0.8493, "step": 485 }, { "epoch": 0.06, "learning_rate": 1.9959177066238733e-05, "loss": 0.9487, "step": 486 }, { "epoch": 0.06, "learning_rate": 1.995882764686768e-05, "loss": 0.9068, "step": 487 }, { "epoch": 0.06, "learning_rate": 1.9958476741539056e-05, "loss": 0.8895, "step": 488 }, { "epoch": 0.06, "learning_rate": 1.9958124350305207e-05, "loss": 0.9375, "step": 489 }, { "epoch": 0.06, "learning_rate": 1.9957770473218715e-05, "loss": 0.8119, "step": 490 }, { "epoch": 0.06, "learning_rate": 1.9957415110332385e-05, "loss": 0.8772, "step": 491 }, { "epoch": 0.06, "learning_rate": 1.995705826169924e-05, "loss": 0.9102, "step": 492 }, { "epoch": 0.06, "learning_rate": 1.995669992737252e-05, "loss": 0.8934, "step": 493 }, { "epoch": 0.06, "learning_rate": 1.9956340107405702e-05, "loss": 0.8901, "step": 494 }, { "epoch": 0.06, "learning_rate": 1.995597880185247e-05, "loss": 0.918, "step": 495 }, { "epoch": 0.06, "learning_rate": 1.9955616010766737e-05, "loss": 0.8772, "step": 496 }, { "epoch": 0.06, "learning_rate": 1.995525173420263e-05, "loss": 0.8717, "step": 497 }, { "epoch": 0.06, "learning_rate": 1.9954885972214503e-05, "loss": 0.8739, "step": 498 }, { "epoch": 0.06, "learning_rate": 1.9954518724856938e-05, "loss": 0.9358, "step": 499 }, { "epoch": 0.06, "learning_rate": 1.9954149992184725e-05, "loss": 0.8728, "step": 500 }, { "epoch": 0.06, "learning_rate": 1.9953779774252886e-05, "loss": 0.9012, "step": 501 }, { "epoch": 0.06, "learning_rate": 1.995340807111666e-05, "loss": 0.7667, "step": 502 }, { "epoch": 0.06, "learning_rate": 1.995303488283151e-05, "loss": 0.8722, "step": 503 }, { "epoch": 0.06, "learning_rate": 1.9952660209453118e-05, "loss": 0.8823, "step": 504 }, { "epoch": 0.06, "learning_rate": 1.9952284051037393e-05, "loss": 0.9174, "step": 505 }, { "epoch": 0.06, "learning_rate": 1.9951906407640455e-05, "loss": 0.9146, "step": 506 }, { "epoch": 0.06, "learning_rate": 1.9951527279318656e-05, "loss": 0.8237, "step": 507 }, { "epoch": 0.06, "learning_rate": 1.995114666612857e-05, "loss": 0.9196, "step": 508 }, { "epoch": 0.06, "learning_rate": 1.995076456812698e-05, "loss": 0.8571, "step": 509 }, { "epoch": 0.06, "learning_rate": 1.9950380985370903e-05, "loss": 0.9191, "step": 510 }, { "epoch": 0.06, "learning_rate": 1.9949995917917574e-05, "loss": 0.8119, "step": 511 }, { "epoch": 0.06, "learning_rate": 1.9949609365824444e-05, "loss": 0.8449, "step": 512 }, { "epoch": 0.06, "learning_rate": 1.99492213291492e-05, "loss": 0.9397, "step": 513 }, { "epoch": 0.06, "learning_rate": 1.9948831807949735e-05, "loss": 0.8622, "step": 514 }, { "epoch": 0.06, "learning_rate": 1.994844080228417e-05, "loss": 0.8398, "step": 515 }, { "epoch": 0.06, "learning_rate": 1.9948048312210843e-05, "loss": 0.9012, "step": 516 }, { "epoch": 0.06, "learning_rate": 1.9947654337788326e-05, "loss": 0.9085, "step": 517 }, { "epoch": 0.06, "learning_rate": 1.9947258879075397e-05, "loss": 0.9157, "step": 518 }, { "epoch": 0.06, "learning_rate": 1.994686193613107e-05, "loss": 0.8482, "step": 519 }, { "epoch": 0.06, "learning_rate": 1.994646350901456e-05, "loss": 0.8789, "step": 520 }, { "epoch": 0.06, "learning_rate": 1.994606359778533e-05, "loss": 0.8828, "step": 521 }, { "epoch": 0.06, "learning_rate": 1.9945662202503044e-05, "loss": 0.8315, "step": 522 }, { "epoch": 0.06, "learning_rate": 1.994525932322759e-05, "loss": 0.9269, "step": 523 }, { "epoch": 0.06, "learning_rate": 1.9944854960019092e-05, "loss": 0.8516, "step": 524 }, { "epoch": 0.06, "learning_rate": 1.9944449112937877e-05, "loss": 0.8549, "step": 525 }, { "epoch": 0.06, "learning_rate": 1.9944041782044507e-05, "loss": 0.9035, "step": 526 }, { "epoch": 0.06, "learning_rate": 1.994363296739976e-05, "loss": 0.87, "step": 527 }, { "epoch": 0.06, "learning_rate": 1.994322266906463e-05, "loss": 0.9637, "step": 528 }, { "epoch": 0.06, "learning_rate": 1.9942810887100335e-05, "loss": 0.8945, "step": 529 }, { "epoch": 0.06, "learning_rate": 1.9942397621568327e-05, "loss": 0.8594, "step": 530 }, { "epoch": 0.06, "learning_rate": 1.9941982872530266e-05, "loss": 0.8839, "step": 531 }, { "epoch": 0.06, "learning_rate": 1.9941566640048032e-05, "loss": 0.9146, "step": 532 }, { "epoch": 0.06, "learning_rate": 1.9941148924183736e-05, "loss": 0.8934, "step": 533 }, { "epoch": 0.06, "learning_rate": 1.9940729724999704e-05, "loss": 0.9107, "step": 534 }, { "epoch": 0.06, "learning_rate": 1.9940309042558487e-05, "loss": 0.8588, "step": 535 }, { "epoch": 0.06, "learning_rate": 1.993988687692285e-05, "loss": 0.8806, "step": 536 }, { "epoch": 0.06, "learning_rate": 1.9939463228155785e-05, "loss": 0.8387, "step": 537 }, { "epoch": 0.06, "learning_rate": 1.9939038096320508e-05, "loss": 0.8996, "step": 538 }, { "epoch": 0.06, "learning_rate": 1.9938611481480455e-05, "loss": 0.87, "step": 539 }, { "epoch": 0.06, "learning_rate": 1.9938183383699276e-05, "loss": 0.8862, "step": 540 }, { "epoch": 0.06, "learning_rate": 1.9937753803040847e-05, "loss": 0.9258, "step": 541 }, { "epoch": 0.06, "learning_rate": 1.993732273956927e-05, "loss": 0.8477, "step": 542 }, { "epoch": 0.06, "learning_rate": 1.993689019334886e-05, "loss": 0.9141, "step": 543 }, { "epoch": 0.06, "learning_rate": 1.9936456164444163e-05, "loss": 0.8767, "step": 544 }, { "epoch": 0.06, "learning_rate": 1.993602065291994e-05, "loss": 0.8499, "step": 545 }, { "epoch": 0.07, "learning_rate": 1.9935583658841162e-05, "loss": 0.8008, "step": 546 }, { "epoch": 0.07, "learning_rate": 1.993514518227305e-05, "loss": 0.9012, "step": 547 }, { "epoch": 0.07, "learning_rate": 1.9934705223281013e-05, "loss": 0.8834, "step": 548 }, { "epoch": 0.07, "learning_rate": 1.9934263781930712e-05, "loss": 0.8867, "step": 549 }, { "epoch": 0.07, "learning_rate": 1.9933820858288003e-05, "loss": 0.9319, "step": 550 }, { "epoch": 0.07, "learning_rate": 1.993337645241898e-05, "loss": 0.8733, "step": 551 }, { "epoch": 0.07, "learning_rate": 1.9932930564389954e-05, "loss": 0.8655, "step": 552 }, { "epoch": 0.07, "learning_rate": 1.993248319426745e-05, "loss": 0.899, "step": 553 }, { "epoch": 0.07, "learning_rate": 1.9932034342118228e-05, "loss": 0.8845, "step": 554 }, { "epoch": 0.07, "learning_rate": 1.9931584008009256e-05, "loss": 0.8806, "step": 555 }, { "epoch": 0.07, "learning_rate": 1.9931132192007733e-05, "loss": 0.8465, "step": 556 }, { "epoch": 0.07, "learning_rate": 1.993067889418107e-05, "loss": 0.8795, "step": 557 }, { "epoch": 0.07, "learning_rate": 1.9930224114596903e-05, "loss": 0.885, "step": 558 }, { "epoch": 0.07, "learning_rate": 1.9929767853323092e-05, "loss": 0.904, "step": 559 }, { "epoch": 0.07, "learning_rate": 1.9929310110427716e-05, "loss": 0.8901, "step": 560 }, { "epoch": 0.07, "learning_rate": 1.9928850885979073e-05, "loss": 0.8828, "step": 561 }, { "epoch": 0.07, "learning_rate": 1.9928390180045686e-05, "loss": 0.8767, "step": 562 }, { "epoch": 0.07, "learning_rate": 1.99279279926963e-05, "loss": 0.8728, "step": 563 }, { "epoch": 0.07, "learning_rate": 1.992746432399987e-05, "loss": 0.8817, "step": 564 }, { "epoch": 0.07, "learning_rate": 1.9926999174025587e-05, "loss": 0.8834, "step": 565 }, { "epoch": 0.07, "learning_rate": 1.992653254284285e-05, "loss": 0.8426, "step": 566 }, { "epoch": 0.07, "learning_rate": 1.9926064430521287e-05, "loss": 0.9029, "step": 567 }, { "epoch": 0.07, "learning_rate": 1.9925594837130754e-05, "loss": 0.8929, "step": 568 }, { "epoch": 0.07, "learning_rate": 1.9925123762741307e-05, "loss": 0.8482, "step": 569 }, { "epoch": 0.07, "learning_rate": 1.992465120742324e-05, "loss": 0.9208, "step": 570 }, { "epoch": 0.07, "learning_rate": 1.9924177171247062e-05, "loss": 0.8728, "step": 571 }, { "epoch": 0.07, "learning_rate": 1.9923701654283505e-05, "loss": 0.8873, "step": 572 }, { "epoch": 0.07, "learning_rate": 1.992322465660352e-05, "loss": 0.9325, "step": 573 }, { "epoch": 0.07, "learning_rate": 1.992274617827828e-05, "loss": 0.8482, "step": 574 }, { "epoch": 0.07, "learning_rate": 1.9922266219379183e-05, "loss": 0.9035, "step": 575 }, { "epoch": 0.07, "learning_rate": 1.9921784779977837e-05, "loss": 0.8705, "step": 576 }, { "epoch": 0.07, "learning_rate": 1.9921301860146082e-05, "loss": 0.8477, "step": 577 }, { "epoch": 0.07, "learning_rate": 1.9920817459955974e-05, "loss": 0.8828, "step": 578 }, { "epoch": 0.07, "learning_rate": 1.9920331579479787e-05, "loss": 0.8845, "step": 579 }, { "epoch": 0.07, "learning_rate": 1.9919844218790022e-05, "loss": 0.9152, "step": 580 }, { "epoch": 0.07, "learning_rate": 1.9919355377959397e-05, "loss": 0.8382, "step": 581 }, { "epoch": 0.07, "learning_rate": 1.9918865057060857e-05, "loss": 0.8767, "step": 582 }, { "epoch": 0.07, "learning_rate": 1.9918373256167553e-05, "loss": 0.8644, "step": 583 }, { "epoch": 0.07, "learning_rate": 1.991787997535288e-05, "loss": 0.9023, "step": 584 }, { "epoch": 0.07, "learning_rate": 1.9917385214690427e-05, "loss": 0.8834, "step": 585 }, { "epoch": 0.07, "learning_rate": 1.9916888974254023e-05, "loss": 0.9308, "step": 586 }, { "epoch": 0.07, "learning_rate": 1.9916391254117714e-05, "loss": 0.8834, "step": 587 }, { "epoch": 0.07, "learning_rate": 1.9915892054355763e-05, "loss": 0.9314, "step": 588 }, { "epoch": 0.07, "learning_rate": 1.9915391375042653e-05, "loss": 0.8778, "step": 589 }, { "epoch": 0.07, "learning_rate": 1.9914889216253096e-05, "loss": 0.8694, "step": 590 }, { "epoch": 0.07, "learning_rate": 1.9914385578062015e-05, "loss": 0.8304, "step": 591 }, { "epoch": 0.07, "learning_rate": 1.991388046054456e-05, "loss": 0.8326, "step": 592 }, { "epoch": 0.07, "learning_rate": 1.99133738637761e-05, "loss": 0.8739, "step": 593 }, { "epoch": 0.07, "learning_rate": 1.991286578783222e-05, "loss": 0.8415, "step": 594 }, { "epoch": 0.07, "learning_rate": 1.9912356232788736e-05, "loss": 0.8912, "step": 595 }, { "epoch": 0.07, "learning_rate": 1.991184519872168e-05, "loss": 0.88, "step": 596 }, { "epoch": 0.07, "learning_rate": 1.991133268570729e-05, "loss": 0.8778, "step": 597 }, { "epoch": 0.07, "learning_rate": 1.9910818693822053e-05, "loss": 0.8588, "step": 598 }, { "epoch": 0.07, "learning_rate": 1.9910303223142654e-05, "loss": 0.8499, "step": 599 }, { "epoch": 0.07, "learning_rate": 1.990978627374601e-05, "loss": 0.8566, "step": 600 }, { "epoch": 0.07, "learning_rate": 1.9909267845709254e-05, "loss": 0.9431, "step": 601 }, { "epoch": 0.07, "learning_rate": 1.990874793910974e-05, "loss": 0.8516, "step": 602 }, { "epoch": 0.07, "learning_rate": 1.9908226554025045e-05, "loss": 0.8862, "step": 603 }, { "epoch": 0.07, "learning_rate": 1.9907703690532965e-05, "loss": 0.8521, "step": 604 }, { "epoch": 0.07, "learning_rate": 1.990717934871151e-05, "loss": 0.8744, "step": 605 }, { "epoch": 0.07, "learning_rate": 1.9906653528638926e-05, "loss": 0.8694, "step": 606 }, { "epoch": 0.07, "learning_rate": 1.9906126230393667e-05, "loss": 0.8532, "step": 607 }, { "epoch": 0.07, "learning_rate": 1.990559745405441e-05, "loss": 0.8354, "step": 608 }, { "epoch": 0.07, "learning_rate": 1.9905067199700055e-05, "loss": 0.8443, "step": 609 }, { "epoch": 0.07, "learning_rate": 1.9904535467409722e-05, "loss": 0.8047, "step": 610 }, { "epoch": 0.07, "learning_rate": 1.9904002257262747e-05, "loss": 0.9213, "step": 611 }, { "epoch": 0.07, "learning_rate": 1.9903467569338698e-05, "loss": 0.8828, "step": 612 }, { "epoch": 0.07, "learning_rate": 1.9902931403717353e-05, "loss": 0.923, "step": 613 }, { "epoch": 0.07, "learning_rate": 1.9902393760478708e-05, "loss": 0.832, "step": 614 }, { "epoch": 0.07, "learning_rate": 1.9901854639702986e-05, "loss": 0.8398, "step": 615 }, { "epoch": 0.07, "learning_rate": 1.9901314041470635e-05, "loss": 0.846, "step": 616 }, { "epoch": 0.07, "learning_rate": 1.9900771965862313e-05, "loss": 0.9196, "step": 617 }, { "epoch": 0.07, "learning_rate": 1.9900228412958905e-05, "loss": 0.9023, "step": 618 }, { "epoch": 0.07, "learning_rate": 1.9899683382841513e-05, "loss": 0.8761, "step": 619 }, { "epoch": 0.07, "learning_rate": 1.9899136875591462e-05, "loss": 0.9436, "step": 620 }, { "epoch": 0.07, "learning_rate": 1.98985888912903e-05, "loss": 0.8951, "step": 621 }, { "epoch": 0.07, "learning_rate": 1.9898039430019788e-05, "loss": 0.8387, "step": 622 }, { "epoch": 0.07, "learning_rate": 1.9897488491861906e-05, "loss": 0.8415, "step": 623 }, { "epoch": 0.07, "learning_rate": 1.989693607689887e-05, "loss": 0.8917, "step": 624 }, { "epoch": 0.07, "learning_rate": 1.9896382185213097e-05, "loss": 0.8594, "step": 625 }, { "epoch": 0.07, "learning_rate": 1.989582681688724e-05, "loss": 0.9364, "step": 626 }, { "epoch": 0.07, "learning_rate": 1.9895269972004162e-05, "loss": 0.8761, "step": 627 }, { "epoch": 0.07, "learning_rate": 1.989471165064695e-05, "loss": 0.8438, "step": 628 }, { "epoch": 0.08, "learning_rate": 1.989415185289891e-05, "loss": 0.8895, "step": 629 }, { "epoch": 0.08, "learning_rate": 1.9893590578843574e-05, "loss": 0.8382, "step": 630 }, { "epoch": 0.08, "learning_rate": 1.9893027828564686e-05, "loss": 0.8471, "step": 631 }, { "epoch": 0.08, "learning_rate": 1.9892463602146214e-05, "loss": 0.8337, "step": 632 }, { "epoch": 0.08, "learning_rate": 1.989189789967235e-05, "loss": 0.8136, "step": 633 }, { "epoch": 0.08, "learning_rate": 1.9891330721227497e-05, "loss": 0.8683, "step": 634 }, { "epoch": 0.08, "learning_rate": 1.9890762066896286e-05, "loss": 0.8622, "step": 635 }, { "epoch": 0.08, "learning_rate": 1.989019193676357e-05, "loss": 0.8114, "step": 636 }, { "epoch": 0.08, "learning_rate": 1.988962033091441e-05, "loss": 0.8733, "step": 637 }, { "epoch": 0.08, "learning_rate": 1.98890472494341e-05, "loss": 0.9001, "step": 638 }, { "epoch": 0.08, "learning_rate": 1.9888472692408155e-05, "loss": 0.9403, "step": 639 }, { "epoch": 0.08, "learning_rate": 1.9887896659922294e-05, "loss": 0.9185, "step": 640 }, { "epoch": 0.08, "learning_rate": 1.9887319152062476e-05, "loss": 0.9342, "step": 641 }, { "epoch": 0.08, "learning_rate": 1.9886740168914863e-05, "loss": 0.8616, "step": 642 }, { "epoch": 0.08, "learning_rate": 1.988615971056585e-05, "loss": 0.9269, "step": 643 }, { "epoch": 0.08, "learning_rate": 1.988557777710205e-05, "loss": 0.8867, "step": 644 }, { "epoch": 0.08, "learning_rate": 1.9884994368610287e-05, "loss": 0.8471, "step": 645 }, { "epoch": 0.08, "learning_rate": 1.9884409485177613e-05, "loss": 0.9051, "step": 646 }, { "epoch": 0.08, "learning_rate": 1.9883823126891303e-05, "loss": 0.8806, "step": 647 }, { "epoch": 0.08, "learning_rate": 1.9883235293838842e-05, "loss": 0.8722, "step": 648 }, { "epoch": 0.08, "learning_rate": 1.9882645986107946e-05, "loss": 0.8599, "step": 649 }, { "epoch": 0.08, "learning_rate": 1.9882055203786536e-05, "loss": 0.9135, "step": 650 }, { "epoch": 0.08, "learning_rate": 1.9881462946962773e-05, "loss": 0.9096, "step": 651 }, { "epoch": 0.08, "learning_rate": 1.9880869215725024e-05, "loss": 0.8895, "step": 652 }, { "epoch": 0.08, "learning_rate": 1.988027401016188e-05, "loss": 0.9068, "step": 653 }, { "epoch": 0.08, "learning_rate": 1.9879677330362154e-05, "loss": 0.8415, "step": 654 }, { "epoch": 0.08, "learning_rate": 1.987907917641487e-05, "loss": 0.8744, "step": 655 }, { "epoch": 0.08, "learning_rate": 1.9878479548409285e-05, "loss": 0.8806, "step": 656 }, { "epoch": 0.08, "learning_rate": 1.9877878446434862e-05, "loss": 0.9057, "step": 657 }, { "epoch": 0.08, "learning_rate": 1.9877275870581302e-05, "loss": 0.8198, "step": 658 }, { "epoch": 0.08, "learning_rate": 1.9876671820938508e-05, "loss": 0.8438, "step": 659 }, { "epoch": 0.08, "learning_rate": 1.9876066297596615e-05, "loss": 0.8979, "step": 660 }, { "epoch": 0.08, "learning_rate": 1.987545930064597e-05, "loss": 0.8421, "step": 661 }, { "epoch": 0.08, "learning_rate": 1.9874850830177142e-05, "loss": 0.8834, "step": 662 }, { "epoch": 0.08, "learning_rate": 1.987424088628092e-05, "loss": 0.87, "step": 663 }, { "epoch": 0.08, "learning_rate": 1.987362946904832e-05, "loss": 0.8806, "step": 664 }, { "epoch": 0.08, "learning_rate": 1.9873016578570566e-05, "loss": 0.8711, "step": 665 }, { "epoch": 0.08, "learning_rate": 1.987240221493911e-05, "loss": 0.8828, "step": 666 }, { "epoch": 0.08, "learning_rate": 1.9871786378245622e-05, "loss": 0.8655, "step": 667 }, { "epoch": 0.08, "learning_rate": 1.9871169068581987e-05, "loss": 0.8633, "step": 668 }, { "epoch": 0.08, "learning_rate": 1.9870550286040318e-05, "loss": 0.8683, "step": 669 }, { "epoch": 0.08, "learning_rate": 1.986993003071294e-05, "loss": 0.8817, "step": 670 }, { "epoch": 0.08, "learning_rate": 1.9869308302692406e-05, "loss": 0.8499, "step": 671 }, { "epoch": 0.08, "learning_rate": 1.9868685102071482e-05, "loss": 0.88, "step": 672 }, { "epoch": 0.08, "learning_rate": 1.9868060428943154e-05, "loss": 0.8901, "step": 673 }, { "epoch": 0.08, "learning_rate": 1.9867434283400634e-05, "loss": 0.8783, "step": 674 }, { "epoch": 0.08, "learning_rate": 1.9866806665537338e-05, "loss": 0.856, "step": 675 }, { "epoch": 0.08, "learning_rate": 1.9866177575446927e-05, "loss": 0.8577, "step": 676 }, { "epoch": 0.08, "learning_rate": 1.9865547013223262e-05, "loss": 0.8398, "step": 677 }, { "epoch": 0.08, "learning_rate": 1.9864914978960428e-05, "loss": 0.8566, "step": 678 }, { "epoch": 0.08, "learning_rate": 1.986428147275273e-05, "loss": 0.9001, "step": 679 }, { "epoch": 0.08, "learning_rate": 1.98636464946947e-05, "loss": 0.8583, "step": 680 }, { "epoch": 0.08, "learning_rate": 1.9863010044881074e-05, "loss": 0.8438, "step": 681 }, { "epoch": 0.08, "learning_rate": 1.9862372123406824e-05, "loss": 0.87, "step": 682 }, { "epoch": 0.08, "learning_rate": 1.986173273036713e-05, "loss": 0.8577, "step": 683 }, { "epoch": 0.08, "learning_rate": 1.9861091865857395e-05, "loss": 0.8828, "step": 684 }, { "epoch": 0.08, "learning_rate": 1.986044952997325e-05, "loss": 0.9247, "step": 685 }, { "epoch": 0.08, "learning_rate": 1.9859805722810527e-05, "loss": 0.8761, "step": 686 }, { "epoch": 0.08, "learning_rate": 1.9859160444465298e-05, "loss": 0.889, "step": 687 }, { "epoch": 0.08, "learning_rate": 1.9858513695033842e-05, "loss": 0.7941, "step": 688 }, { "epoch": 0.08, "learning_rate": 1.9857865474612658e-05, "loss": 0.8521, "step": 689 }, { "epoch": 0.08, "learning_rate": 1.985721578329847e-05, "loss": 0.8343, "step": 690 }, { "epoch": 0.08, "learning_rate": 1.9856564621188218e-05, "loss": 0.8532, "step": 691 }, { "epoch": 0.08, "learning_rate": 1.985591198837906e-05, "loss": 0.8387, "step": 692 }, { "epoch": 0.08, "learning_rate": 1.9855257884968377e-05, "loss": 0.904, "step": 693 }, { "epoch": 0.08, "learning_rate": 1.9854602311053768e-05, "loss": 0.8828, "step": 694 }, { "epoch": 0.08, "learning_rate": 1.985394526673305e-05, "loss": 0.8549, "step": 695 }, { "epoch": 0.08, "learning_rate": 1.9853286752104264e-05, "loss": 0.8432, "step": 696 }, { "epoch": 0.08, "learning_rate": 1.985262676726566e-05, "loss": 0.9018, "step": 697 }, { "epoch": 0.08, "learning_rate": 1.9851965312315725e-05, "loss": 0.7924, "step": 698 }, { "epoch": 0.08, "learning_rate": 1.9851302387353144e-05, "loss": 0.8867, "step": 699 }, { "epoch": 0.08, "learning_rate": 1.9850637992476836e-05, "loss": 0.9001, "step": 700 }, { "epoch": 0.08, "learning_rate": 1.984997212778594e-05, "loss": 0.8878, "step": 701 }, { "epoch": 0.08, "learning_rate": 1.9849304793379804e-05, "loss": 0.8956, "step": 702 }, { "epoch": 0.08, "learning_rate": 1.9848635989358004e-05, "loss": 0.8789, "step": 703 }, { "epoch": 0.08, "learning_rate": 1.9847965715820332e-05, "loss": 0.8253, "step": 704 }, { "epoch": 0.08, "learning_rate": 1.9847293972866796e-05, "loss": 0.88, "step": 705 }, { "epoch": 0.08, "learning_rate": 1.984662076059763e-05, "loss": 0.8996, "step": 706 }, { "epoch": 0.08, "learning_rate": 1.984594607911329e-05, "loss": 0.8677, "step": 707 }, { "epoch": 0.08, "learning_rate": 1.9845269928514433e-05, "loss": 0.9157, "step": 708 }, { "epoch": 0.08, "learning_rate": 1.9844592308901953e-05, "loss": 0.8622, "step": 709 }, { "epoch": 0.08, "learning_rate": 1.984391322037696e-05, "loss": 0.8326, "step": 710 }, { "epoch": 0.08, "learning_rate": 1.984323266304078e-05, "loss": 0.8906, "step": 711 }, { "epoch": 0.08, "learning_rate": 1.984255063699496e-05, "loss": 0.8265, "step": 712 }, { "epoch": 0.09, "learning_rate": 1.9841867142341254e-05, "loss": 0.8689, "step": 713 }, { "epoch": 0.09, "learning_rate": 1.9841182179181665e-05, "loss": 0.8521, "step": 714 }, { "epoch": 0.09, "learning_rate": 1.9840495747618385e-05, "loss": 0.8181, "step": 715 }, { "epoch": 0.09, "learning_rate": 1.983980784775384e-05, "loss": 0.8767, "step": 716 }, { "epoch": 0.09, "learning_rate": 1.9839118479690666e-05, "loss": 0.8778, "step": 717 }, { "epoch": 0.09, "learning_rate": 1.9838427643531727e-05, "loss": 0.8588, "step": 718 }, { "epoch": 0.09, "learning_rate": 1.9837735339380105e-05, "loss": 0.8817, "step": 719 }, { "epoch": 0.09, "learning_rate": 1.98370415673391e-05, "loss": 0.8605, "step": 720 }, { "epoch": 0.09, "learning_rate": 1.9836346327512226e-05, "loss": 0.8577, "step": 721 }, { "epoch": 0.09, "learning_rate": 1.983564962000322e-05, "loss": 0.8828, "step": 722 }, { "epoch": 0.09, "learning_rate": 1.9834951444916038e-05, "loss": 0.8454, "step": 723 }, { "epoch": 0.09, "learning_rate": 1.9834251802354856e-05, "loss": 0.7969, "step": 724 }, { "epoch": 0.09, "learning_rate": 1.9833550692424067e-05, "loss": 0.8996, "step": 725 }, { "epoch": 0.09, "learning_rate": 1.9832848115228284e-05, "loss": 0.817, "step": 726 }, { "epoch": 0.09, "learning_rate": 1.9832144070872337e-05, "loss": 0.8259, "step": 727 }, { "epoch": 0.09, "learning_rate": 1.983143855946128e-05, "loss": 0.832, "step": 728 }, { "epoch": 0.09, "learning_rate": 1.9830731581100382e-05, "loss": 0.8895, "step": 729 }, { "epoch": 0.09, "learning_rate": 1.9830023135895128e-05, "loss": 0.8823, "step": 730 }, { "epoch": 0.09, "learning_rate": 1.9829313223951224e-05, "loss": 0.8577, "step": 731 }, { "epoch": 0.09, "learning_rate": 1.9828601845374604e-05, "loss": 0.861, "step": 732 }, { "epoch": 0.09, "learning_rate": 1.9827889000271403e-05, "loss": 0.8795, "step": 733 }, { "epoch": 0.09, "learning_rate": 1.9827174688747993e-05, "loss": 0.8365, "step": 734 }, { "epoch": 0.09, "learning_rate": 1.982645891091095e-05, "loss": 0.8599, "step": 735 }, { "epoch": 0.09, "learning_rate": 1.982574166686708e-05, "loss": 0.822, "step": 736 }, { "epoch": 0.09, "learning_rate": 1.98250229567234e-05, "loss": 0.8181, "step": 737 }, { "epoch": 0.09, "learning_rate": 1.982430278058715e-05, "loss": 0.8549, "step": 738 }, { "epoch": 0.09, "learning_rate": 1.9823581138565787e-05, "loss": 0.8767, "step": 739 }, { "epoch": 0.09, "learning_rate": 1.9822858030766993e-05, "loss": 0.947, "step": 740 }, { "epoch": 0.09, "learning_rate": 1.9822133457298653e-05, "loss": 0.8309, "step": 741 }, { "epoch": 0.09, "learning_rate": 1.9821407418268886e-05, "loss": 0.9118, "step": 742 }, { "epoch": 0.09, "learning_rate": 1.9820679913786022e-05, "loss": 0.8973, "step": 743 }, { "epoch": 0.09, "learning_rate": 1.981995094395862e-05, "loss": 0.8789, "step": 744 }, { "epoch": 0.09, "learning_rate": 1.981922050889544e-05, "loss": 0.8917, "step": 745 }, { "epoch": 0.09, "learning_rate": 1.9818488608705473e-05, "loss": 0.8499, "step": 746 }, { "epoch": 0.09, "learning_rate": 1.9817755243497926e-05, "loss": 0.8538, "step": 747 }, { "epoch": 0.09, "learning_rate": 1.9817020413382227e-05, "loss": 0.8756, "step": 748 }, { "epoch": 0.09, "learning_rate": 1.981628411846802e-05, "loss": 0.8655, "step": 749 }, { "epoch": 0.09, "learning_rate": 1.9815546358865162e-05, "loss": 0.9169, "step": 750 }, { "epoch": 0.09, "learning_rate": 1.981480713468374e-05, "loss": 0.8571, "step": 751 }, { "epoch": 0.09, "learning_rate": 1.981406644603405e-05, "loss": 0.8867, "step": 752 }, { "epoch": 0.09, "learning_rate": 1.9813324293026614e-05, "loss": 0.8209, "step": 753 }, { "epoch": 0.09, "learning_rate": 1.9812580675772165e-05, "loss": 0.8253, "step": 754 }, { "epoch": 0.09, "learning_rate": 1.9811835594381662e-05, "loss": 0.8426, "step": 755 }, { "epoch": 0.09, "learning_rate": 1.9811089048966277e-05, "loss": 0.8979, "step": 756 }, { "epoch": 0.09, "learning_rate": 1.98103410396374e-05, "loss": 0.8867, "step": 757 }, { "epoch": 0.09, "learning_rate": 1.9809591566506646e-05, "loss": 0.8806, "step": 758 }, { "epoch": 0.09, "learning_rate": 1.9808840629685837e-05, "loss": 0.875, "step": 759 }, { "epoch": 0.09, "learning_rate": 1.9808088229287026e-05, "loss": 0.8583, "step": 760 }, { "epoch": 0.09, "learning_rate": 1.9807334365422477e-05, "loss": 0.8588, "step": 761 }, { "epoch": 0.09, "learning_rate": 1.9806579038204676e-05, "loss": 0.8811, "step": 762 }, { "epoch": 0.09, "learning_rate": 1.980582224774632e-05, "loss": 0.7941, "step": 763 }, { "epoch": 0.09, "learning_rate": 1.9805063994160337e-05, "loss": 0.8488, "step": 764 }, { "epoch": 0.09, "learning_rate": 1.9804304277559866e-05, "loss": 0.8426, "step": 765 }, { "epoch": 0.09, "learning_rate": 1.9803543098058255e-05, "loss": 0.9196, "step": 766 }, { "epoch": 0.09, "learning_rate": 1.9802780455769088e-05, "loss": 0.8772, "step": 767 }, { "epoch": 0.09, "learning_rate": 1.9802016350806157e-05, "loss": 0.9699, "step": 768 }, { "epoch": 0.09, "learning_rate": 1.9801250783283472e-05, "loss": 0.9085, "step": 769 }, { "epoch": 0.09, "learning_rate": 1.980048375331527e-05, "loss": 0.7985, "step": 770 }, { "epoch": 0.09, "learning_rate": 1.9799715261015988e-05, "loss": 0.8566, "step": 771 }, { "epoch": 0.09, "learning_rate": 1.9798945306500303e-05, "loss": 0.8917, "step": 772 }, { "epoch": 0.09, "learning_rate": 1.9798173889883096e-05, "loss": 0.8315, "step": 773 }, { "epoch": 0.09, "learning_rate": 1.979740101127947e-05, "loss": 0.8493, "step": 774 }, { "epoch": 0.09, "learning_rate": 1.979662667080475e-05, "loss": 0.8839, "step": 775 }, { "epoch": 0.09, "learning_rate": 1.979585086857447e-05, "loss": 0.9079, "step": 776 }, { "epoch": 0.09, "learning_rate": 1.9795073604704393e-05, "loss": 0.9113, "step": 777 }, { "epoch": 0.09, "learning_rate": 1.9794294879310488e-05, "loss": 0.9141, "step": 778 }, { "epoch": 0.09, "learning_rate": 1.9793514692508955e-05, "loss": 0.8365, "step": 779 }, { "epoch": 0.09, "learning_rate": 1.97927330444162e-05, "loss": 0.8449, "step": 780 }, { "epoch": 0.09, "learning_rate": 1.9791949935148856e-05, "loss": 0.8577, "step": 781 }, { "epoch": 0.09, "learning_rate": 1.9791165364823774e-05, "loss": 0.9202, "step": 782 }, { "epoch": 0.09, "learning_rate": 1.9790379333558016e-05, "loss": 0.9018, "step": 783 }, { "epoch": 0.09, "learning_rate": 1.9789591841468862e-05, "loss": 0.8633, "step": 784 }, { "epoch": 0.09, "learning_rate": 1.978880288867382e-05, "loss": 0.8717, "step": 785 }, { "epoch": 0.09, "learning_rate": 1.978801247529061e-05, "loss": 0.8499, "step": 786 }, { "epoch": 0.09, "learning_rate": 1.9787220601437164e-05, "loss": 0.8398, "step": 787 }, { "epoch": 0.09, "learning_rate": 1.9786427267231642e-05, "loss": 0.8616, "step": 788 }, { "epoch": 0.09, "learning_rate": 1.978563247279242e-05, "loss": 0.8711, "step": 789 }, { "epoch": 0.09, "learning_rate": 1.9784836218238082e-05, "loss": 0.8259, "step": 790 }, { "epoch": 0.09, "learning_rate": 1.978403850368744e-05, "loss": 0.9085, "step": 791 }, { "epoch": 0.09, "learning_rate": 1.9783239329259525e-05, "loss": 0.8471, "step": 792 }, { "epoch": 0.09, "learning_rate": 1.978243869507358e-05, "loss": 0.8493, "step": 793 }, { "epoch": 0.09, "learning_rate": 1.978163660124906e-05, "loss": 0.841, "step": 794 }, { "epoch": 0.09, "learning_rate": 1.9780833047905655e-05, "loss": 0.8996, "step": 795 }, { "epoch": 0.09, "learning_rate": 1.9780028035163265e-05, "loss": 0.8571, "step": 796 }, { "epoch": 0.1, "learning_rate": 1.9779221563141997e-05, "loss": 0.8806, "step": 797 }, { "epoch": 0.1, "learning_rate": 1.977841363196219e-05, "loss": 0.9096, "step": 798 }, { "epoch": 0.1, "learning_rate": 1.9777604241744395e-05, "loss": 0.9018, "step": 799 }, { "epoch": 0.1, "learning_rate": 1.977679339260938e-05, "loss": 0.8488, "step": 800 }, { "epoch": 0.1, "learning_rate": 1.9775981084678134e-05, "loss": 0.8739, "step": 801 }, { "epoch": 0.1, "learning_rate": 1.977516731807186e-05, "loss": 0.8365, "step": 802 }, { "epoch": 0.1, "learning_rate": 1.977435209291198e-05, "loss": 0.7896, "step": 803 }, { "epoch": 0.1, "learning_rate": 1.9773535409320136e-05, "loss": 0.8594, "step": 804 }, { "epoch": 0.1, "learning_rate": 1.977271726741818e-05, "loss": 0.8823, "step": 805 }, { "epoch": 0.1, "learning_rate": 1.9771897667328194e-05, "loss": 0.7785, "step": 806 }, { "epoch": 0.1, "learning_rate": 1.9771076609172464e-05, "loss": 0.8761, "step": 807 }, { "epoch": 0.1, "learning_rate": 1.9770254093073505e-05, "loss": 0.8119, "step": 808 }, { "epoch": 0.1, "learning_rate": 1.9769430119154042e-05, "loss": 0.9063, "step": 809 }, { "epoch": 0.1, "learning_rate": 1.9768604687537026e-05, "loss": 0.8783, "step": 810 }, { "epoch": 0.1, "learning_rate": 1.976777779834561e-05, "loss": 0.8237, "step": 811 }, { "epoch": 0.1, "learning_rate": 1.976694945170318e-05, "loss": 0.856, "step": 812 }, { "epoch": 0.1, "learning_rate": 1.9766119647733334e-05, "loss": 0.8544, "step": 813 }, { "epoch": 0.1, "learning_rate": 1.976528838655989e-05, "loss": 0.8376, "step": 814 }, { "epoch": 0.1, "learning_rate": 1.976445566830687e-05, "loss": 0.8449, "step": 815 }, { "epoch": 0.1, "learning_rate": 1.9763621493098535e-05, "loss": 0.8588, "step": 816 }, { "epoch": 0.1, "learning_rate": 1.9762785861059348e-05, "loss": 0.8968, "step": 817 }, { "epoch": 0.1, "learning_rate": 1.976194877231399e-05, "loss": 0.8198, "step": 818 }, { "epoch": 0.1, "learning_rate": 1.976111022698737e-05, "loss": 0.8655, "step": 819 }, { "epoch": 0.1, "learning_rate": 1.9760270225204606e-05, "loss": 0.8599, "step": 820 }, { "epoch": 0.1, "learning_rate": 1.975942876709103e-05, "loss": 0.9007, "step": 821 }, { "epoch": 0.1, "learning_rate": 1.97585858527722e-05, "loss": 0.8549, "step": 822 }, { "epoch": 0.1, "learning_rate": 1.9757741482373887e-05, "loss": 0.8103, "step": 823 }, { "epoch": 0.1, "learning_rate": 1.9756895656022078e-05, "loss": 0.9174, "step": 824 }, { "epoch": 0.1, "learning_rate": 1.975604837384298e-05, "loss": 0.8616, "step": 825 }, { "epoch": 0.1, "learning_rate": 1.9755199635963014e-05, "loss": 0.8744, "step": 826 }, { "epoch": 0.1, "learning_rate": 1.9754349442508825e-05, "loss": 0.8616, "step": 827 }, { "epoch": 0.1, "learning_rate": 1.9753497793607267e-05, "loss": 0.8465, "step": 828 }, { "epoch": 0.1, "learning_rate": 1.9752644689385413e-05, "loss": 0.851, "step": 829 }, { "epoch": 0.1, "learning_rate": 1.9751790129970557e-05, "loss": 0.8421, "step": 830 }, { "epoch": 0.1, "learning_rate": 1.975093411549021e-05, "loss": 0.8733, "step": 831 }, { "epoch": 0.1, "learning_rate": 1.9750076646072097e-05, "loss": 0.8923, "step": 832 }, { "epoch": 0.1, "learning_rate": 1.9749217721844158e-05, "loss": 0.88, "step": 833 }, { "epoch": 0.1, "learning_rate": 1.9748357342934554e-05, "loss": 0.8404, "step": 834 }, { "epoch": 0.1, "learning_rate": 1.9747495509471663e-05, "loss": 0.8956, "step": 835 }, { "epoch": 0.1, "learning_rate": 1.9746632221584082e-05, "loss": 0.8348, "step": 836 }, { "epoch": 0.1, "learning_rate": 1.974576747940062e-05, "loss": 0.8047, "step": 837 }, { "epoch": 0.1, "learning_rate": 1.97449012830503e-05, "loss": 0.9174, "step": 838 }, { "epoch": 0.1, "learning_rate": 1.974403363266238e-05, "loss": 0.8315, "step": 839 }, { "epoch": 0.1, "learning_rate": 1.974316452836631e-05, "loss": 0.8862, "step": 840 }, { "epoch": 0.1, "learning_rate": 1.974229397029177e-05, "loss": 0.8298, "step": 841 }, { "epoch": 0.1, "learning_rate": 1.9741421958568665e-05, "loss": 0.875, "step": 842 }, { "epoch": 0.1, "learning_rate": 1.9740548493327103e-05, "loss": 0.8956, "step": 843 }, { "epoch": 0.1, "learning_rate": 1.973967357469741e-05, "loss": 0.8772, "step": 844 }, { "epoch": 0.1, "learning_rate": 1.9738797202810137e-05, "loss": 0.8834, "step": 845 }, { "epoch": 0.1, "learning_rate": 1.9737919377796046e-05, "loss": 0.8655, "step": 846 }, { "epoch": 0.1, "learning_rate": 1.973704009978612e-05, "loss": 0.8973, "step": 847 }, { "epoch": 0.1, "learning_rate": 1.9736159368911553e-05, "loss": 0.7868, "step": 848 }, { "epoch": 0.1, "learning_rate": 1.973527718530376e-05, "loss": 0.8828, "step": 849 }, { "epoch": 0.1, "learning_rate": 1.9734393549094376e-05, "loss": 0.8917, "step": 850 }, { "epoch": 0.1, "learning_rate": 1.973350846041524e-05, "loss": 0.8677, "step": 851 }, { "epoch": 0.1, "learning_rate": 1.973262191939842e-05, "loss": 0.8069, "step": 852 }, { "epoch": 0.1, "learning_rate": 1.9731733926176195e-05, "loss": 0.8638, "step": 853 }, { "epoch": 0.1, "learning_rate": 1.973084448088107e-05, "loss": 0.8438, "step": 854 }, { "epoch": 0.1, "learning_rate": 1.9729953583645752e-05, "loss": 0.8817, "step": 855 }, { "epoch": 0.1, "learning_rate": 1.9729061234603173e-05, "loss": 0.894, "step": 856 }, { "epoch": 0.1, "learning_rate": 1.972816743388648e-05, "loss": 0.8393, "step": 857 }, { "epoch": 0.1, "learning_rate": 1.972727218162904e-05, "loss": 0.7997, "step": 858 }, { "epoch": 0.1, "learning_rate": 1.9726375477964436e-05, "loss": 0.8566, "step": 859 }, { "epoch": 0.1, "learning_rate": 1.9725477323026457e-05, "loss": 0.8811, "step": 860 }, { "epoch": 0.1, "learning_rate": 1.972457771694912e-05, "loss": 0.8711, "step": 861 }, { "epoch": 0.1, "learning_rate": 1.972367665986666e-05, "loss": 0.8203, "step": 862 }, { "epoch": 0.1, "learning_rate": 1.972277415191352e-05, "loss": 0.798, "step": 863 }, { "epoch": 0.1, "learning_rate": 1.972187019322436e-05, "loss": 0.8454, "step": 864 }, { "epoch": 0.1, "learning_rate": 1.9720964783934066e-05, "loss": 0.8984, "step": 865 }, { "epoch": 0.1, "learning_rate": 1.972005792417773e-05, "loss": 0.8465, "step": 866 }, { "epoch": 0.1, "learning_rate": 1.9719149614090667e-05, "loss": 0.8343, "step": 867 }, { "epoch": 0.1, "learning_rate": 1.9718239853808405e-05, "loss": 0.8438, "step": 868 }, { "epoch": 0.1, "learning_rate": 1.971732864346669e-05, "loss": 0.8845, "step": 869 }, { "epoch": 0.1, "learning_rate": 1.9716415983201484e-05, "loss": 0.851, "step": 870 }, { "epoch": 0.1, "learning_rate": 1.9715501873148962e-05, "loss": 0.7963, "step": 871 }, { "epoch": 0.1, "learning_rate": 1.9714586313445522e-05, "loss": 0.856, "step": 872 }, { "epoch": 0.1, "learning_rate": 1.9713669304227773e-05, "loss": 0.8281, "step": 873 }, { "epoch": 0.1, "learning_rate": 1.9712750845632543e-05, "loss": 0.861, "step": 874 }, { "epoch": 0.1, "learning_rate": 1.9711830937796877e-05, "loss": 0.8739, "step": 875 }, { "epoch": 0.1, "learning_rate": 1.971090958085803e-05, "loss": 0.8605, "step": 876 }, { "epoch": 0.1, "learning_rate": 1.9709986774953484e-05, "loss": 0.8426, "step": 877 }, { "epoch": 0.1, "learning_rate": 1.9709062520220924e-05, "loss": 0.8789, "step": 878 }, { "epoch": 0.1, "learning_rate": 1.9708136816798262e-05, "loss": 0.8583, "step": 879 }, { "epoch": 0.1, "learning_rate": 1.970720966482362e-05, "loss": 0.9241, "step": 880 }, { "epoch": 0.11, "learning_rate": 1.970628106443534e-05, "loss": 0.8532, "step": 881 }, { "epoch": 0.11, "learning_rate": 1.9705351015771983e-05, "loss": 0.8337, "step": 882 }, { "epoch": 0.11, "learning_rate": 1.9704419518972312e-05, "loss": 0.9263, "step": 883 }, { "epoch": 0.11, "learning_rate": 1.9703486574175324e-05, "loss": 0.8644, "step": 884 }, { "epoch": 0.11, "learning_rate": 1.970255218152022e-05, "loss": 0.8689, "step": 885 }, { "epoch": 0.11, "learning_rate": 1.9701616341146424e-05, "loss": 0.8493, "step": 886 }, { "epoch": 0.11, "learning_rate": 1.9700679053193566e-05, "loss": 0.8666, "step": 887 }, { "epoch": 0.11, "learning_rate": 1.9699740317801507e-05, "loss": 0.9029, "step": 888 }, { "epoch": 0.11, "learning_rate": 1.969880013511031e-05, "loss": 0.8834, "step": 889 }, { "epoch": 0.11, "learning_rate": 1.969785850526026e-05, "loss": 0.8471, "step": 890 }, { "epoch": 0.11, "learning_rate": 1.9696915428391862e-05, "loss": 0.8616, "step": 891 }, { "epoch": 0.11, "learning_rate": 1.9695970904645828e-05, "loss": 0.9057, "step": 892 }, { "epoch": 0.11, "learning_rate": 1.9695024934163096e-05, "loss": 0.8823, "step": 893 }, { "epoch": 0.11, "learning_rate": 1.9694077517084807e-05, "loss": 0.8482, "step": 894 }, { "epoch": 0.11, "learning_rate": 1.9693128653552332e-05, "loss": 0.8281, "step": 895 }, { "epoch": 0.11, "learning_rate": 1.9692178343707248e-05, "loss": 0.9487, "step": 896 }, { "epoch": 0.11, "learning_rate": 1.9691226587691347e-05, "loss": 0.8365, "step": 897 }, { "epoch": 0.11, "learning_rate": 1.9690273385646647e-05, "loss": 0.841, "step": 898 }, { "epoch": 0.11, "learning_rate": 1.9689318737715374e-05, "loss": 0.8806, "step": 899 }, { "epoch": 0.11, "learning_rate": 1.9688362644039965e-05, "loss": 0.8705, "step": 900 }, { "epoch": 0.11, "learning_rate": 1.9687405104763092e-05, "loss": 0.8778, "step": 901 }, { "epoch": 0.11, "learning_rate": 1.9686446120027616e-05, "loss": 0.8142, "step": 902 }, { "epoch": 0.11, "learning_rate": 1.9685485689976632e-05, "loss": 0.8298, "step": 903 }, { "epoch": 0.11, "learning_rate": 1.968452381475345e-05, "loss": 0.8622, "step": 904 }, { "epoch": 0.11, "learning_rate": 1.9683560494501585e-05, "loss": 0.8488, "step": 905 }, { "epoch": 0.11, "learning_rate": 1.9682595729364777e-05, "loss": 0.8683, "step": 906 }, { "epoch": 0.11, "learning_rate": 1.9681629519486978e-05, "loss": 0.8493, "step": 907 }, { "epoch": 0.11, "learning_rate": 1.968066186501236e-05, "loss": 0.8789, "step": 908 }, { "epoch": 0.11, "learning_rate": 1.9679692766085297e-05, "loss": 0.9001, "step": 909 }, { "epoch": 0.11, "learning_rate": 1.9678722222850403e-05, "loss": 0.8661, "step": 910 }, { "epoch": 0.11, "learning_rate": 1.967775023545248e-05, "loss": 0.7545, "step": 911 }, { "epoch": 0.11, "learning_rate": 1.9676776804036564e-05, "loss": 0.9113, "step": 912 }, { "epoch": 0.11, "learning_rate": 1.96758019287479e-05, "loss": 0.8131, "step": 913 }, { "epoch": 0.11, "learning_rate": 1.9674825609731953e-05, "loss": 0.8862, "step": 914 }, { "epoch": 0.11, "learning_rate": 1.9673847847134388e-05, "loss": 0.8733, "step": 915 }, { "epoch": 0.11, "learning_rate": 1.9672868641101113e-05, "loss": 0.8465, "step": 916 }, { "epoch": 0.11, "learning_rate": 1.967188799177822e-05, "loss": 0.8789, "step": 917 }, { "epoch": 0.11, "learning_rate": 1.9670905899312046e-05, "loss": 0.8622, "step": 918 }, { "epoch": 0.11, "learning_rate": 1.9669922363849118e-05, "loss": 0.8566, "step": 919 }, { "epoch": 0.11, "learning_rate": 1.9668937385536196e-05, "loss": 0.9224, "step": 920 }, { "epoch": 0.11, "learning_rate": 1.9667950964520244e-05, "loss": 0.8884, "step": 921 }, { "epoch": 0.11, "learning_rate": 1.966696310094845e-05, "loss": 0.894, "step": 922 }, { "epoch": 0.11, "learning_rate": 1.966597379496821e-05, "loss": 0.9057, "step": 923 }, { "epoch": 0.11, "learning_rate": 1.966498304672714e-05, "loss": 0.9035, "step": 924 }, { "epoch": 0.11, "learning_rate": 1.966399085637307e-05, "loss": 0.9732, "step": 925 }, { "epoch": 0.11, "learning_rate": 1.9662997224054048e-05, "loss": 0.8616, "step": 926 }, { "epoch": 0.11, "learning_rate": 1.9662002149918328e-05, "loss": 0.8471, "step": 927 }, { "epoch": 0.11, "learning_rate": 1.9661005634114384e-05, "loss": 0.9001, "step": 928 }, { "epoch": 0.11, "learning_rate": 1.9660007676790913e-05, "loss": 0.8175, "step": 929 }, { "epoch": 0.11, "learning_rate": 1.9659008278096815e-05, "loss": 0.8828, "step": 930 }, { "epoch": 0.11, "learning_rate": 1.9658007438181216e-05, "loss": 0.8577, "step": 931 }, { "epoch": 0.11, "learning_rate": 1.9657005157193444e-05, "loss": 0.8605, "step": 932 }, { "epoch": 0.11, "learning_rate": 1.9656001435283054e-05, "loss": 0.8471, "step": 933 }, { "epoch": 0.11, "learning_rate": 1.965499627259981e-05, "loss": 0.8465, "step": 934 }, { "epoch": 0.11, "learning_rate": 1.9653989669293697e-05, "loss": 0.8214, "step": 935 }, { "epoch": 0.11, "learning_rate": 1.9652981625514903e-05, "loss": 0.8047, "step": 936 }, { "epoch": 0.11, "learning_rate": 1.9651972141413842e-05, "loss": 0.8811, "step": 937 }, { "epoch": 0.11, "learning_rate": 1.965096121714114e-05, "loss": 0.8438, "step": 938 }, { "epoch": 0.11, "learning_rate": 1.9649948852847636e-05, "loss": 0.8705, "step": 939 }, { "epoch": 0.11, "learning_rate": 1.9648935048684384e-05, "loss": 0.9079, "step": 940 }, { "epoch": 0.11, "learning_rate": 1.9647919804802657e-05, "loss": 0.8828, "step": 941 }, { "epoch": 0.11, "learning_rate": 1.9646903121353934e-05, "loss": 0.8516, "step": 942 }, { "epoch": 0.11, "learning_rate": 1.964588499848992e-05, "loss": 0.803, "step": 943 }, { "epoch": 0.11, "learning_rate": 1.9644865436362524e-05, "loss": 0.8605, "step": 944 }, { "epoch": 0.11, "learning_rate": 1.964384443512388e-05, "loss": 0.8945, "step": 945 }, { "epoch": 0.11, "learning_rate": 1.9642821994926335e-05, "loss": 0.8566, "step": 946 }, { "epoch": 0.11, "learning_rate": 1.9641798115922436e-05, "loss": 0.8209, "step": 947 }, { "epoch": 0.11, "learning_rate": 1.9640772798264964e-05, "loss": 0.7751, "step": 948 }, { "epoch": 0.11, "learning_rate": 1.9639746042106906e-05, "loss": 0.8214, "step": 949 }, { "epoch": 0.11, "learning_rate": 1.963871784760146e-05, "loss": 0.8426, "step": 950 }, { "epoch": 0.11, "learning_rate": 1.963768821490205e-05, "loss": 0.8599, "step": 951 }, { "epoch": 0.11, "learning_rate": 1.9636657144162304e-05, "loss": 0.8929, "step": 952 }, { "epoch": 0.11, "learning_rate": 1.9635624635536065e-05, "loss": 0.8599, "step": 953 }, { "epoch": 0.11, "learning_rate": 1.96345906891774e-05, "loss": 0.8633, "step": 954 }, { "epoch": 0.11, "learning_rate": 1.963355530524058e-05, "loss": 0.8343, "step": 955 }, { "epoch": 0.11, "learning_rate": 1.9632518483880095e-05, "loss": 0.8482, "step": 956 }, { "epoch": 0.11, "learning_rate": 1.963148022525065e-05, "loss": 0.803, "step": 957 }, { "epoch": 0.11, "learning_rate": 1.9630440529507164e-05, "loss": 0.8739, "step": 958 }, { "epoch": 0.11, "learning_rate": 1.962939939680477e-05, "loss": 0.8337, "step": 959 }, { "epoch": 0.11, "learning_rate": 1.9628356827298814e-05, "loss": 0.8119, "step": 960 }, { "epoch": 0.11, "learning_rate": 1.962731282114486e-05, "loss": 0.7489, "step": 961 }, { "epoch": 0.11, "learning_rate": 1.9626267378498684e-05, "loss": 0.7963, "step": 962 }, { "epoch": 0.11, "learning_rate": 1.9625220499516272e-05, "loss": 0.8365, "step": 963 }, { "epoch": 0.11, "learning_rate": 1.962417218435384e-05, "loss": 0.8237, "step": 964 }, { "epoch": 0.12, "learning_rate": 1.9623122433167793e-05, "loss": 0.8443, "step": 965 }, { "epoch": 0.12, "learning_rate": 1.9622071246114774e-05, "loss": 0.8253, "step": 966 }, { "epoch": 0.12, "learning_rate": 1.962101862335163e-05, "loss": 0.8158, "step": 967 }, { "epoch": 0.12, "learning_rate": 1.961996456503542e-05, "loss": 0.8789, "step": 968 }, { "epoch": 0.12, "learning_rate": 1.961890907132342e-05, "loss": 0.8588, "step": 969 }, { "epoch": 0.12, "learning_rate": 1.9617852142373126e-05, "loss": 0.8549, "step": 970 }, { "epoch": 0.12, "learning_rate": 1.9616793778342234e-05, "loss": 0.8292, "step": 971 }, { "epoch": 0.12, "learning_rate": 1.961573397938867e-05, "loss": 0.7606, "step": 972 }, { "epoch": 0.12, "learning_rate": 1.961467274567056e-05, "loss": 0.8627, "step": 973 }, { "epoch": 0.12, "learning_rate": 1.9613610077346257e-05, "loss": 0.8588, "step": 974 }, { "epoch": 0.12, "learning_rate": 1.9612545974574315e-05, "loss": 0.9063, "step": 975 }, { "epoch": 0.12, "learning_rate": 1.9611480437513516e-05, "loss": 0.8315, "step": 976 }, { "epoch": 0.12, "learning_rate": 1.9610413466322846e-05, "loss": 0.8566, "step": 977 }, { "epoch": 0.12, "learning_rate": 1.960934506116151e-05, "loss": 0.8594, "step": 978 }, { "epoch": 0.12, "learning_rate": 1.9608275222188917e-05, "loss": 0.8438, "step": 979 }, { "epoch": 0.12, "learning_rate": 1.9607203949564706e-05, "loss": 0.865, "step": 980 }, { "epoch": 0.12, "learning_rate": 1.9606131243448718e-05, "loss": 0.8415, "step": 981 }, { "epoch": 0.12, "learning_rate": 1.960505710400101e-05, "loss": 0.8069, "step": 982 }, { "epoch": 0.12, "learning_rate": 1.9603981531381863e-05, "loss": 0.8845, "step": 983 }, { "epoch": 0.12, "learning_rate": 1.9602904525751754e-05, "loss": 0.8465, "step": 984 }, { "epoch": 0.12, "learning_rate": 1.9601826087271387e-05, "loss": 0.8683, "step": 985 }, { "epoch": 0.12, "learning_rate": 1.9600746216101675e-05, "loss": 0.8309, "step": 986 }, { "epoch": 0.12, "learning_rate": 1.9599664912403748e-05, "loss": 0.8225, "step": 987 }, { "epoch": 0.12, "learning_rate": 1.959858217633894e-05, "loss": 0.8376, "step": 988 }, { "epoch": 0.12, "learning_rate": 1.9597498008068817e-05, "loss": 0.861, "step": 989 }, { "epoch": 0.12, "learning_rate": 1.959641240775514e-05, "loss": 0.8382, "step": 990 }, { "epoch": 0.12, "learning_rate": 1.9595325375559894e-05, "loss": 0.8811, "step": 991 }, { "epoch": 0.12, "learning_rate": 1.9594236911645272e-05, "loss": 0.8739, "step": 992 }, { "epoch": 0.12, "learning_rate": 1.9593147016173693e-05, "loss": 0.885, "step": 993 }, { "epoch": 0.12, "learning_rate": 1.959205568930777e-05, "loss": 0.8292, "step": 994 }, { "epoch": 0.12, "learning_rate": 1.9590962931210345e-05, "loss": 0.8175, "step": 995 }, { "epoch": 0.12, "learning_rate": 1.9589868742044466e-05, "loss": 0.87, "step": 996 }, { "epoch": 0.12, "learning_rate": 1.9588773121973402e-05, "loss": 0.8549, "step": 997 }, { "epoch": 0.12, "learning_rate": 1.9587676071160627e-05, "loss": 0.9235, "step": 998 }, { "epoch": 0.12, "learning_rate": 1.9586577589769834e-05, "loss": 0.8694, "step": 999 }, { "epoch": 0.12, "learning_rate": 1.958547767796492e-05, "loss": 0.8309, "step": 1000 }, { "epoch": 0.12, "learning_rate": 1.9584376335910014e-05, "loss": 0.8711, "step": 1001 }, { "epoch": 0.12, "learning_rate": 1.958327356376944e-05, "loss": 0.7785, "step": 1002 }, { "epoch": 0.12, "learning_rate": 1.9582169361707746e-05, "loss": 0.8549, "step": 1003 }, { "epoch": 0.12, "learning_rate": 1.958106372988969e-05, "loss": 0.8705, "step": 1004 }, { "epoch": 0.12, "learning_rate": 1.957995666848024e-05, "loss": 0.841, "step": 1005 }, { "epoch": 0.12, "learning_rate": 1.9578848177644586e-05, "loss": 0.909, "step": 1006 }, { "epoch": 0.12, "learning_rate": 1.957773825754812e-05, "loss": 0.8756, "step": 1007 }, { "epoch": 0.12, "learning_rate": 1.9576626908356458e-05, "loss": 0.865, "step": 1008 }, { "epoch": 0.12, "learning_rate": 1.9575514130235423e-05, "loss": 0.8337, "step": 1009 }, { "epoch": 0.12, "learning_rate": 1.9574399923351054e-05, "loss": 0.8387, "step": 1010 }, { "epoch": 0.12, "learning_rate": 1.95732842878696e-05, "loss": 0.8705, "step": 1011 }, { "epoch": 0.12, "learning_rate": 1.9572167223957526e-05, "loss": 0.856, "step": 1012 }, { "epoch": 0.12, "learning_rate": 1.957104873178151e-05, "loss": 0.7974, "step": 1013 }, { "epoch": 0.12, "learning_rate": 1.956992881150844e-05, "loss": 0.8499, "step": 1014 }, { "epoch": 0.12, "learning_rate": 1.956880746330542e-05, "loss": 0.904, "step": 1015 }, { "epoch": 0.12, "learning_rate": 1.9567684687339764e-05, "loss": 0.8666, "step": 1016 }, { "epoch": 0.12, "learning_rate": 1.9566560483779013e-05, "loss": 0.8532, "step": 1017 }, { "epoch": 0.12, "learning_rate": 1.9565434852790895e-05, "loss": 0.8761, "step": 1018 }, { "epoch": 0.12, "learning_rate": 1.956430779454337e-05, "loss": 0.8594, "step": 1019 }, { "epoch": 0.12, "learning_rate": 1.9563179309204612e-05, "loss": 0.827, "step": 1020 }, { "epoch": 0.12, "learning_rate": 1.9562049396942998e-05, "loss": 0.8259, "step": 1021 }, { "epoch": 0.12, "learning_rate": 1.9560918057927123e-05, "loss": 0.8382, "step": 1022 }, { "epoch": 0.12, "learning_rate": 1.9559785292325793e-05, "loss": 0.7573, "step": 1023 }, { "epoch": 0.12, "learning_rate": 1.955865110030803e-05, "loss": 0.8259, "step": 1024 }, { "epoch": 0.12, "learning_rate": 1.9557515482043067e-05, "loss": 0.8209, "step": 1025 }, { "epoch": 0.12, "learning_rate": 1.9556378437700346e-05, "loss": 0.8527, "step": 1026 }, { "epoch": 0.12, "learning_rate": 1.9555239967449528e-05, "loss": 0.8571, "step": 1027 }, { "epoch": 0.12, "learning_rate": 1.955410007146049e-05, "loss": 0.8365, "step": 1028 }, { "epoch": 0.12, "learning_rate": 1.9552958749903302e-05, "loss": 0.774, "step": 1029 }, { "epoch": 0.12, "learning_rate": 1.9551816002948273e-05, "loss": 0.8638, "step": 1030 }, { "epoch": 0.12, "learning_rate": 1.955067183076591e-05, "loss": 0.832, "step": 1031 }, { "epoch": 0.12, "learning_rate": 1.9549526233526934e-05, "loss": 0.7924, "step": 1032 }, { "epoch": 0.12, "learning_rate": 1.9548379211402276e-05, "loss": 0.8555, "step": 1033 }, { "epoch": 0.12, "learning_rate": 1.954723076456309e-05, "loss": 0.8683, "step": 1034 }, { "epoch": 0.12, "learning_rate": 1.954608089318073e-05, "loss": 0.8566, "step": 1035 }, { "epoch": 0.12, "learning_rate": 1.954492959742677e-05, "loss": 0.8315, "step": 1036 }, { "epoch": 0.12, "learning_rate": 1.9543776877473e-05, "loss": 0.8393, "step": 1037 }, { "epoch": 0.12, "learning_rate": 1.9542622733491408e-05, "loss": 0.9129, "step": 1038 }, { "epoch": 0.12, "learning_rate": 1.9541467165654212e-05, "loss": 0.8588, "step": 1039 }, { "epoch": 0.12, "learning_rate": 1.954031017413383e-05, "loss": 0.8253, "step": 1040 }, { "epoch": 0.12, "learning_rate": 1.9539151759102898e-05, "loss": 0.9018, "step": 1041 }, { "epoch": 0.12, "learning_rate": 1.9537991920734267e-05, "loss": 0.8343, "step": 1042 }, { "epoch": 0.12, "learning_rate": 1.953683065920099e-05, "loss": 0.8287, "step": 1043 }, { "epoch": 0.12, "learning_rate": 1.9535667974676343e-05, "loss": 0.8862, "step": 1044 }, { "epoch": 0.12, "learning_rate": 1.953450386733381e-05, "loss": 0.8309, "step": 1045 }, { "epoch": 0.12, "learning_rate": 1.9533338337347082e-05, "loss": 0.8186, "step": 1046 }, { "epoch": 0.12, "learning_rate": 1.9532171384890074e-05, "loss": 0.8359, "step": 1047 }, { "epoch": 0.12, "learning_rate": 1.9531003010136912e-05, "loss": 0.8817, "step": 1048 }, { "epoch": 0.13, "learning_rate": 1.9529833213261918e-05, "loss": 0.8627, "step": 1049 }, { "epoch": 0.13, "learning_rate": 1.9528661994439643e-05, "loss": 0.8064, "step": 1050 }, { "epoch": 0.13, "learning_rate": 1.9527489353844845e-05, "loss": 0.8198, "step": 1051 }, { "epoch": 0.13, "learning_rate": 1.9526315291652493e-05, "loss": 0.8544, "step": 1052 }, { "epoch": 0.13, "learning_rate": 1.9525139808037767e-05, "loss": 0.8817, "step": 1053 }, { "epoch": 0.13, "learning_rate": 1.9523962903176067e-05, "loss": 0.827, "step": 1054 }, { "epoch": 0.13, "learning_rate": 1.952278457724299e-05, "loss": 0.8253, "step": 1055 }, { "epoch": 0.13, "learning_rate": 1.952160483041436e-05, "loss": 0.8661, "step": 1056 }, { "epoch": 0.13, "learning_rate": 1.952042366286621e-05, "loss": 0.8594, "step": 1057 }, { "epoch": 0.13, "learning_rate": 1.9519241074774778e-05, "loss": 0.8092, "step": 1058 }, { "epoch": 0.13, "learning_rate": 1.9518057066316514e-05, "loss": 0.8761, "step": 1059 }, { "epoch": 0.13, "learning_rate": 1.9516871637668094e-05, "loss": 0.861, "step": 1060 }, { "epoch": 0.13, "learning_rate": 1.951568478900639e-05, "loss": 0.9124, "step": 1061 }, { "epoch": 0.13, "learning_rate": 1.951449652050849e-05, "loss": 0.808, "step": 1062 }, { "epoch": 0.13, "learning_rate": 1.9513306832351696e-05, "loss": 0.7985, "step": 1063 }, { "epoch": 0.13, "learning_rate": 1.9512115724713526e-05, "loss": 0.8002, "step": 1064 }, { "epoch": 0.13, "learning_rate": 1.95109231977717e-05, "loss": 0.8817, "step": 1065 }, { "epoch": 0.13, "learning_rate": 1.950972925170416e-05, "loss": 0.8315, "step": 1066 }, { "epoch": 0.13, "learning_rate": 1.9508533886689053e-05, "loss": 0.8203, "step": 1067 }, { "epoch": 0.13, "learning_rate": 1.950733710290474e-05, "loss": 0.8672, "step": 1068 }, { "epoch": 0.13, "learning_rate": 1.9506138900529786e-05, "loss": 0.8783, "step": 1069 }, { "epoch": 0.13, "learning_rate": 1.950493927974299e-05, "loss": 0.8432, "step": 1070 }, { "epoch": 0.13, "learning_rate": 1.950373824072333e-05, "loss": 0.8956, "step": 1071 }, { "epoch": 0.13, "learning_rate": 1.9502535783650028e-05, "loss": 0.9007, "step": 1072 }, { "epoch": 0.13, "learning_rate": 1.9501331908702493e-05, "loss": 0.88, "step": 1073 }, { "epoch": 0.13, "learning_rate": 1.950012661606036e-05, "loss": 0.8443, "step": 1074 }, { "epoch": 0.13, "learning_rate": 1.949891990590347e-05, "loss": 0.8694, "step": 1075 }, { "epoch": 0.13, "learning_rate": 1.9497711778411876e-05, "loss": 0.8571, "step": 1076 }, { "epoch": 0.13, "learning_rate": 1.949650223376584e-05, "loss": 0.8839, "step": 1077 }, { "epoch": 0.13, "learning_rate": 1.9495291272145843e-05, "loss": 0.7991, "step": 1078 }, { "epoch": 0.13, "learning_rate": 1.9494078893732574e-05, "loss": 0.8242, "step": 1079 }, { "epoch": 0.13, "learning_rate": 1.9492865098706926e-05, "loss": 0.8471, "step": 1080 }, { "epoch": 0.13, "learning_rate": 1.9491649887250013e-05, "loss": 0.8337, "step": 1081 }, { "epoch": 0.13, "learning_rate": 1.9490433259543153e-05, "loss": 0.8583, "step": 1082 }, { "epoch": 0.13, "learning_rate": 1.9489215215767885e-05, "loss": 0.8655, "step": 1083 }, { "epoch": 0.13, "learning_rate": 1.948799575610595e-05, "loss": 0.8867, "step": 1084 }, { "epoch": 0.13, "learning_rate": 1.9486774880739305e-05, "loss": 0.8298, "step": 1085 }, { "epoch": 0.13, "learning_rate": 1.9485552589850116e-05, "loss": 0.875, "step": 1086 }, { "epoch": 0.13, "learning_rate": 1.948432888362076e-05, "loss": 0.764, "step": 1087 }, { "epoch": 0.13, "learning_rate": 1.948310376223383e-05, "loss": 0.7824, "step": 1088 }, { "epoch": 0.13, "learning_rate": 1.9481877225872124e-05, "loss": 0.8142, "step": 1089 }, { "epoch": 0.13, "learning_rate": 1.948064927471865e-05, "loss": 0.8767, "step": 1090 }, { "epoch": 0.13, "learning_rate": 1.947941990895664e-05, "loss": 0.8984, "step": 1091 }, { "epoch": 0.13, "learning_rate": 1.947818912876952e-05, "loss": 0.8259, "step": 1092 }, { "epoch": 0.13, "learning_rate": 1.9476956934340936e-05, "loss": 0.851, "step": 1093 }, { "epoch": 0.13, "learning_rate": 1.9475723325854744e-05, "loss": 0.8164, "step": 1094 }, { "epoch": 0.13, "learning_rate": 1.9474488303495014e-05, "loss": 0.933, "step": 1095 }, { "epoch": 0.13, "learning_rate": 1.9473251867446023e-05, "loss": 0.865, "step": 1096 }, { "epoch": 0.13, "learning_rate": 1.9472014017892257e-05, "loss": 0.8432, "step": 1097 }, { "epoch": 0.13, "learning_rate": 1.9470774755018412e-05, "loss": 0.8516, "step": 1098 }, { "epoch": 0.13, "learning_rate": 1.946953407900941e-05, "loss": 0.9185, "step": 1099 }, { "epoch": 0.13, "learning_rate": 1.9468291990050364e-05, "loss": 0.8521, "step": 1100 }, { "epoch": 0.13, "learning_rate": 1.9467048488326606e-05, "loss": 0.851, "step": 1101 }, { "epoch": 0.13, "learning_rate": 1.9465803574023682e-05, "loss": 0.8432, "step": 1102 }, { "epoch": 0.13, "learning_rate": 1.9464557247327348e-05, "loss": 0.8694, "step": 1103 }, { "epoch": 0.13, "learning_rate": 1.9463309508423563e-05, "loss": 0.7997, "step": 1104 }, { "epoch": 0.13, "learning_rate": 1.9462060357498504e-05, "loss": 0.8359, "step": 1105 }, { "epoch": 0.13, "learning_rate": 1.946080979473856e-05, "loss": 0.8527, "step": 1106 }, { "epoch": 0.13, "learning_rate": 1.945955782033032e-05, "loss": 0.8376, "step": 1107 }, { "epoch": 0.13, "learning_rate": 1.94583044344606e-05, "loss": 0.8438, "step": 1108 }, { "epoch": 0.13, "learning_rate": 1.9457049637316413e-05, "loss": 0.9157, "step": 1109 }, { "epoch": 0.13, "learning_rate": 1.9455793429084992e-05, "loss": 0.8114, "step": 1110 }, { "epoch": 0.13, "learning_rate": 1.945453580995377e-05, "loss": 0.7969, "step": 1111 }, { "epoch": 0.13, "learning_rate": 1.94532767801104e-05, "loss": 0.8058, "step": 1112 }, { "epoch": 0.13, "learning_rate": 1.9452016339742736e-05, "loss": 0.8594, "step": 1113 }, { "epoch": 0.13, "learning_rate": 1.9450754489038857e-05, "loss": 0.9057, "step": 1114 }, { "epoch": 0.13, "learning_rate": 1.944949122818704e-05, "loss": 0.8371, "step": 1115 }, { "epoch": 0.13, "learning_rate": 1.9448226557375776e-05, "loss": 0.8544, "step": 1116 }, { "epoch": 0.13, "learning_rate": 1.9446960476793768e-05, "loss": 0.8627, "step": 1117 }, { "epoch": 0.13, "learning_rate": 1.9445692986629927e-05, "loss": 0.8923, "step": 1118 }, { "epoch": 0.13, "learning_rate": 1.9444424087073376e-05, "loss": 0.8192, "step": 1119 }, { "epoch": 0.13, "learning_rate": 1.9443153778313447e-05, "loss": 0.8443, "step": 1120 }, { "epoch": 0.13, "learning_rate": 1.944188206053968e-05, "loss": 0.8951, "step": 1121 }, { "epoch": 0.13, "learning_rate": 1.944060893394183e-05, "loss": 0.8404, "step": 1122 }, { "epoch": 0.13, "learning_rate": 1.943933439870987e-05, "loss": 0.8644, "step": 1123 }, { "epoch": 0.13, "learning_rate": 1.9438058455033958e-05, "loss": 0.7974, "step": 1124 }, { "epoch": 0.13, "learning_rate": 1.9436781103104484e-05, "loss": 0.8175, "step": 1125 }, { "epoch": 0.13, "learning_rate": 1.9435502343112043e-05, "loss": 0.8577, "step": 1126 }, { "epoch": 0.13, "learning_rate": 1.9434222175247442e-05, "loss": 0.8482, "step": 1127 }, { "epoch": 0.13, "learning_rate": 1.943294059970169e-05, "loss": 0.8125, "step": 1128 }, { "epoch": 0.13, "learning_rate": 1.9431657616666008e-05, "loss": 0.7556, "step": 1129 }, { "epoch": 0.13, "learning_rate": 1.9430373226331837e-05, "loss": 0.8594, "step": 1130 }, { "epoch": 0.13, "learning_rate": 1.942908742889082e-05, "loss": 0.8086, "step": 1131 }, { "epoch": 0.14, "learning_rate": 1.9427800224534808e-05, "loss": 0.8421, "step": 1132 }, { "epoch": 0.14, "learning_rate": 1.9426511613455865e-05, "loss": 0.9247, "step": 1133 }, { "epoch": 0.14, "learning_rate": 1.9425221595846268e-05, "loss": 0.8549, "step": 1134 }, { "epoch": 0.14, "learning_rate": 1.9423930171898494e-05, "loss": 0.8276, "step": 1135 }, { "epoch": 0.14, "learning_rate": 1.9422637341805245e-05, "loss": 0.8571, "step": 1136 }, { "epoch": 0.14, "learning_rate": 1.942134310575942e-05, "loss": 0.8253, "step": 1137 }, { "epoch": 0.14, "learning_rate": 1.942004746395413e-05, "loss": 0.8722, "step": 1138 }, { "epoch": 0.14, "learning_rate": 1.9418750416582704e-05, "loss": 0.8265, "step": 1139 }, { "epoch": 0.14, "learning_rate": 1.9417451963838666e-05, "loss": 0.8895, "step": 1140 }, { "epoch": 0.14, "learning_rate": 1.941615210591577e-05, "loss": 0.8114, "step": 1141 }, { "epoch": 0.14, "learning_rate": 1.9414850843007954e-05, "loss": 0.851, "step": 1142 }, { "epoch": 0.14, "learning_rate": 1.941354817530939e-05, "loss": 0.7768, "step": 1143 }, { "epoch": 0.14, "learning_rate": 1.9412244103014443e-05, "loss": 0.8242, "step": 1144 }, { "epoch": 0.14, "learning_rate": 1.9410938626317698e-05, "loss": 0.8315, "step": 1145 }, { "epoch": 0.14, "learning_rate": 1.9409631745413943e-05, "loss": 0.7612, "step": 1146 }, { "epoch": 0.14, "learning_rate": 1.940832346049818e-05, "loss": 0.8064, "step": 1147 }, { "epoch": 0.14, "learning_rate": 1.9407013771765618e-05, "loss": 0.8008, "step": 1148 }, { "epoch": 0.14, "learning_rate": 1.9405702679411675e-05, "loss": 0.7896, "step": 1149 }, { "epoch": 0.14, "learning_rate": 1.9404390183631975e-05, "loss": 0.8895, "step": 1150 }, { "epoch": 0.14, "learning_rate": 1.940307628462236e-05, "loss": 0.7941, "step": 1151 }, { "epoch": 0.14, "learning_rate": 1.9401760982578878e-05, "loss": 0.841, "step": 1152 }, { "epoch": 0.14, "learning_rate": 1.9400444277697782e-05, "loss": 0.8862, "step": 1153 }, { "epoch": 0.14, "learning_rate": 1.9399126170175543e-05, "loss": 0.8644, "step": 1154 }, { "epoch": 0.14, "learning_rate": 1.9397806660208825e-05, "loss": 0.8566, "step": 1155 }, { "epoch": 0.14, "learning_rate": 1.9396485747994527e-05, "loss": 0.8119, "step": 1156 }, { "epoch": 0.14, "learning_rate": 1.939516343372973e-05, "loss": 0.8198, "step": 1157 }, { "epoch": 0.14, "learning_rate": 1.9393839717611748e-05, "loss": 0.8432, "step": 1158 }, { "epoch": 0.14, "learning_rate": 1.939251459983808e-05, "loss": 0.8951, "step": 1159 }, { "epoch": 0.14, "learning_rate": 1.9391188080606456e-05, "loss": 0.8521, "step": 1160 }, { "epoch": 0.14, "learning_rate": 1.9389860160114803e-05, "loss": 0.8214, "step": 1161 }, { "epoch": 0.14, "learning_rate": 1.938853083856126e-05, "loss": 0.7818, "step": 1162 }, { "epoch": 0.14, "learning_rate": 1.9387200116144175e-05, "loss": 0.8633, "step": 1163 }, { "epoch": 0.14, "learning_rate": 1.9385867993062108e-05, "loss": 0.8588, "step": 1164 }, { "epoch": 0.14, "learning_rate": 1.9384534469513822e-05, "loss": 0.8471, "step": 1165 }, { "epoch": 0.14, "learning_rate": 1.9383199545698295e-05, "loss": 0.8259, "step": 1166 }, { "epoch": 0.14, "learning_rate": 1.938186322181471e-05, "loss": 0.8292, "step": 1167 }, { "epoch": 0.14, "learning_rate": 1.9380525498062454e-05, "loss": 0.7985, "step": 1168 }, { "epoch": 0.14, "learning_rate": 1.937918637464114e-05, "loss": 0.8186, "step": 1169 }, { "epoch": 0.14, "learning_rate": 1.937784585175057e-05, "loss": 0.8432, "step": 1170 }, { "epoch": 0.14, "learning_rate": 1.937650392959077e-05, "loss": 0.8432, "step": 1171 }, { "epoch": 0.14, "learning_rate": 1.9375160608361964e-05, "loss": 0.7813, "step": 1172 }, { "epoch": 0.14, "learning_rate": 1.9373815888264585e-05, "loss": 0.7985, "step": 1173 }, { "epoch": 0.14, "learning_rate": 1.9372469769499288e-05, "loss": 0.8398, "step": 1174 }, { "epoch": 0.14, "learning_rate": 1.9371122252266922e-05, "loss": 0.8633, "step": 1175 }, { "epoch": 0.14, "learning_rate": 1.9369773336768555e-05, "loss": 0.9118, "step": 1176 }, { "epoch": 0.14, "learning_rate": 1.9368423023205452e-05, "loss": 0.8354, "step": 1177 }, { "epoch": 0.14, "learning_rate": 1.9367071311779096e-05, "loss": 0.8041, "step": 1178 }, { "epoch": 0.14, "learning_rate": 1.936571820269118e-05, "loss": 0.8186, "step": 1179 }, { "epoch": 0.14, "learning_rate": 1.936436369614359e-05, "loss": 0.817, "step": 1180 }, { "epoch": 0.14, "learning_rate": 1.9363007792338448e-05, "loss": 0.8281, "step": 1181 }, { "epoch": 0.14, "learning_rate": 1.9361650491478062e-05, "loss": 0.8404, "step": 1182 }, { "epoch": 0.14, "learning_rate": 1.9360291793764953e-05, "loss": 0.8923, "step": 1183 }, { "epoch": 0.14, "learning_rate": 1.9358931699401847e-05, "loss": 0.8153, "step": 1184 }, { "epoch": 0.14, "learning_rate": 1.9357570208591693e-05, "loss": 0.88, "step": 1185 }, { "epoch": 0.14, "learning_rate": 1.935620732153764e-05, "loss": 0.8309, "step": 1186 }, { "epoch": 0.14, "learning_rate": 1.9354843038443038e-05, "loss": 0.8683, "step": 1187 }, { "epoch": 0.14, "learning_rate": 1.9353477359511453e-05, "loss": 0.8979, "step": 1188 }, { "epoch": 0.14, "learning_rate": 1.9352110284946662e-05, "loss": 0.8555, "step": 1189 }, { "epoch": 0.14, "learning_rate": 1.935074181495264e-05, "loss": 0.8253, "step": 1190 }, { "epoch": 0.14, "learning_rate": 1.9349371949733583e-05, "loss": 0.8862, "step": 1191 }, { "epoch": 0.14, "learning_rate": 1.9348000689493887e-05, "loss": 0.8259, "step": 1192 }, { "epoch": 0.14, "learning_rate": 1.9346628034438156e-05, "loss": 0.8901, "step": 1193 }, { "epoch": 0.14, "learning_rate": 1.9345253984771205e-05, "loss": 0.7656, "step": 1194 }, { "epoch": 0.14, "learning_rate": 1.9343878540698057e-05, "loss": 0.8672, "step": 1195 }, { "epoch": 0.14, "learning_rate": 1.934250170242394e-05, "loss": 0.8052, "step": 1196 }, { "epoch": 0.14, "learning_rate": 1.9341123470154294e-05, "loss": 0.8181, "step": 1197 }, { "epoch": 0.14, "learning_rate": 1.9339743844094764e-05, "loss": 0.8382, "step": 1198 }, { "epoch": 0.14, "learning_rate": 1.9338362824451205e-05, "loss": 0.8477, "step": 1199 }, { "epoch": 0.14, "learning_rate": 1.933698041142968e-05, "loss": 0.8895, "step": 1200 }, { "epoch": 0.14, "learning_rate": 1.9335596605236456e-05, "loss": 0.8108, "step": 1201 }, { "epoch": 0.14, "learning_rate": 1.9334211406078012e-05, "loss": 0.8331, "step": 1202 }, { "epoch": 0.14, "learning_rate": 1.9332824814161033e-05, "loss": 0.8248, "step": 1203 }, { "epoch": 0.14, "learning_rate": 1.9331436829692415e-05, "loss": 0.7757, "step": 1204 }, { "epoch": 0.14, "learning_rate": 1.9330047452879262e-05, "loss": 0.8633, "step": 1205 }, { "epoch": 0.14, "learning_rate": 1.9328656683928876e-05, "loss": 0.8198, "step": 1206 }, { "epoch": 0.14, "learning_rate": 1.9327264523048773e-05, "loss": 0.832, "step": 1207 }, { "epoch": 0.14, "learning_rate": 1.9325870970446686e-05, "loss": 0.8945, "step": 1208 }, { "epoch": 0.14, "learning_rate": 1.932447602633054e-05, "loss": 0.8147, "step": 1209 }, { "epoch": 0.14, "learning_rate": 1.932307969090848e-05, "loss": 0.8544, "step": 1210 }, { "epoch": 0.14, "learning_rate": 1.9321681964388847e-05, "loss": 0.8504, "step": 1211 }, { "epoch": 0.14, "learning_rate": 1.93202828469802e-05, "loss": 0.8097, "step": 1212 }, { "epoch": 0.14, "learning_rate": 1.9318882338891302e-05, "loss": 0.861, "step": 1213 }, { "epoch": 0.14, "learning_rate": 1.9317480440331122e-05, "loss": 0.8365, "step": 1214 }, { "epoch": 0.14, "learning_rate": 1.9316077151508838e-05, "loss": 0.8694, "step": 1215 }, { "epoch": 0.15, "learning_rate": 1.931467247263383e-05, "loss": 0.8404, "step": 1216 }, { "epoch": 0.15, "learning_rate": 1.9313266403915698e-05, "loss": 0.846, "step": 1217 }, { "epoch": 0.15, "learning_rate": 1.9311858945564233e-05, "loss": 0.8666, "step": 1218 }, { "epoch": 0.15, "learning_rate": 1.9310450097789456e-05, "loss": 0.8499, "step": 1219 }, { "epoch": 0.15, "learning_rate": 1.9309039860801564e-05, "loss": 0.9196, "step": 1220 }, { "epoch": 0.15, "learning_rate": 1.930762823481099e-05, "loss": 0.8633, "step": 1221 }, { "epoch": 0.15, "learning_rate": 1.9306215220028357e-05, "loss": 0.8304, "step": 1222 }, { "epoch": 0.15, "learning_rate": 1.9304800816664507e-05, "loss": 0.832, "step": 1223 }, { "epoch": 0.15, "learning_rate": 1.9303385024930478e-05, "loss": 0.8304, "step": 1224 }, { "epoch": 0.15, "learning_rate": 1.9301967845037523e-05, "loss": 0.8806, "step": 1225 }, { "epoch": 0.15, "learning_rate": 1.93005492771971e-05, "loss": 0.7835, "step": 1226 }, { "epoch": 0.15, "learning_rate": 1.9299129321620872e-05, "loss": 0.808, "step": 1227 }, { "epoch": 0.15, "learning_rate": 1.9297707978520707e-05, "loss": 0.8131, "step": 1228 }, { "epoch": 0.15, "learning_rate": 1.9296285248108692e-05, "loss": 0.8387, "step": 1229 }, { "epoch": 0.15, "learning_rate": 1.929486113059711e-05, "loss": 0.8398, "step": 1230 }, { "epoch": 0.15, "learning_rate": 1.929343562619845e-05, "loss": 0.8823, "step": 1231 }, { "epoch": 0.15, "learning_rate": 1.9292008735125414e-05, "loss": 0.9107, "step": 1232 }, { "epoch": 0.15, "learning_rate": 1.929058045759091e-05, "loss": 0.8287, "step": 1233 }, { "epoch": 0.15, "learning_rate": 1.9289150793808048e-05, "loss": 0.8382, "step": 1234 }, { "epoch": 0.15, "learning_rate": 1.9287719743990153e-05, "loss": 0.88, "step": 1235 }, { "epoch": 0.15, "learning_rate": 1.9286287308350747e-05, "loss": 0.832, "step": 1236 }, { "epoch": 0.15, "learning_rate": 1.9284853487103566e-05, "loss": 0.8856, "step": 1237 }, { "epoch": 0.15, "learning_rate": 1.9283418280462555e-05, "loss": 0.8298, "step": 1238 }, { "epoch": 0.15, "learning_rate": 1.9281981688641853e-05, "loss": 0.8945, "step": 1239 }, { "epoch": 0.15, "learning_rate": 1.928054371185582e-05, "loss": 0.8493, "step": 1240 }, { "epoch": 0.15, "learning_rate": 1.927910435031901e-05, "loss": 0.8008, "step": 1241 }, { "epoch": 0.15, "learning_rate": 1.9277663604246202e-05, "loss": 0.88, "step": 1242 }, { "epoch": 0.15, "learning_rate": 1.9276221473852356e-05, "loss": 0.8108, "step": 1243 }, { "epoch": 0.15, "learning_rate": 1.9274777959352665e-05, "loss": 0.7941, "step": 1244 }, { "epoch": 0.15, "learning_rate": 1.9273333060962507e-05, "loss": 0.8047, "step": 1245 }, { "epoch": 0.15, "learning_rate": 1.927188677889748e-05, "loss": 0.8454, "step": 1246 }, { "epoch": 0.15, "learning_rate": 1.9270439113373386e-05, "loss": 0.8398, "step": 1247 }, { "epoch": 0.15, "learning_rate": 1.9268990064606222e-05, "loss": 0.8739, "step": 1248 }, { "epoch": 0.15, "learning_rate": 1.9267539632812208e-05, "loss": 0.8672, "step": 1249 }, { "epoch": 0.15, "learning_rate": 1.926608781820776e-05, "loss": 0.8198, "step": 1250 }, { "epoch": 0.15, "learning_rate": 1.9264634621009508e-05, "loss": 0.8532, "step": 1251 }, { "epoch": 0.15, "learning_rate": 1.926318004143428e-05, "loss": 0.784, "step": 1252 }, { "epoch": 0.15, "learning_rate": 1.9261724079699117e-05, "loss": 0.8516, "step": 1253 }, { "epoch": 0.15, "learning_rate": 1.9260266736021256e-05, "loss": 0.8259, "step": 1254 }, { "epoch": 0.15, "learning_rate": 1.9258808010618152e-05, "loss": 0.8404, "step": 1255 }, { "epoch": 0.15, "learning_rate": 1.9257347903707466e-05, "loss": 0.8398, "step": 1256 }, { "epoch": 0.15, "learning_rate": 1.9255886415507054e-05, "loss": 0.8823, "step": 1257 }, { "epoch": 0.15, "learning_rate": 1.9254423546234986e-05, "loss": 0.8186, "step": 1258 }, { "epoch": 0.15, "learning_rate": 1.925295929610954e-05, "loss": 0.7723, "step": 1259 }, { "epoch": 0.15, "learning_rate": 1.9251493665349196e-05, "loss": 0.8331, "step": 1260 }, { "epoch": 0.15, "learning_rate": 1.9250026654172637e-05, "loss": 0.7885, "step": 1261 }, { "epoch": 0.15, "learning_rate": 1.924855826279876e-05, "loss": 0.8331, "step": 1262 }, { "epoch": 0.15, "learning_rate": 1.924708849144666e-05, "loss": 0.8633, "step": 1263 }, { "epoch": 0.15, "learning_rate": 1.924561734033565e-05, "loss": 0.8644, "step": 1264 }, { "epoch": 0.15, "learning_rate": 1.924414480968523e-05, "loss": 0.8237, "step": 1265 }, { "epoch": 0.15, "learning_rate": 1.9242670899715123e-05, "loss": 0.8571, "step": 1266 }, { "epoch": 0.15, "learning_rate": 1.924119561064525e-05, "loss": 0.8566, "step": 1267 }, { "epoch": 0.15, "learning_rate": 1.9239718942695738e-05, "loss": 0.8661, "step": 1268 }, { "epoch": 0.15, "learning_rate": 1.923824089608692e-05, "loss": 0.8064, "step": 1269 }, { "epoch": 0.15, "learning_rate": 1.9236761471039337e-05, "loss": 0.8404, "step": 1270 }, { "epoch": 0.15, "learning_rate": 1.9235280667773736e-05, "loss": 0.8521, "step": 1271 }, { "epoch": 0.15, "learning_rate": 1.9233798486511063e-05, "loss": 0.8722, "step": 1272 }, { "epoch": 0.15, "learning_rate": 1.923231492747248e-05, "loss": 0.8449, "step": 1273 }, { "epoch": 0.15, "learning_rate": 1.9230829990879343e-05, "loss": 0.856, "step": 1274 }, { "epoch": 0.15, "learning_rate": 1.9229343676953224e-05, "loss": 0.8292, "step": 1275 }, { "epoch": 0.15, "learning_rate": 1.9227855985915894e-05, "loss": 0.8488, "step": 1276 }, { "epoch": 0.15, "learning_rate": 1.9226366917989334e-05, "loss": 0.8131, "step": 1277 }, { "epoch": 0.15, "learning_rate": 1.9224876473395727e-05, "loss": 0.8393, "step": 1278 }, { "epoch": 0.15, "learning_rate": 1.9223384652357457e-05, "loss": 0.8912, "step": 1279 }, { "epoch": 0.15, "learning_rate": 1.9221891455097126e-05, "loss": 0.8778, "step": 1280 }, { "epoch": 0.15, "learning_rate": 1.922039688183753e-05, "loss": 0.827, "step": 1281 }, { "epoch": 0.15, "learning_rate": 1.9218900932801677e-05, "loss": 0.8862, "step": 1282 }, { "epoch": 0.15, "learning_rate": 1.921740360821278e-05, "loss": 0.8516, "step": 1283 }, { "epoch": 0.15, "learning_rate": 1.9215904908294244e-05, "loss": 0.8248, "step": 1284 }, { "epoch": 0.15, "learning_rate": 1.92144048332697e-05, "loss": 0.8683, "step": 1285 }, { "epoch": 0.15, "learning_rate": 1.9212903383362974e-05, "loss": 0.7879, "step": 1286 }, { "epoch": 0.15, "learning_rate": 1.921140055879809e-05, "loss": 0.7946, "step": 1287 }, { "epoch": 0.15, "learning_rate": 1.9209896359799297e-05, "loss": 0.8968, "step": 1288 }, { "epoch": 0.15, "learning_rate": 1.9208390786591024e-05, "loss": 0.8521, "step": 1289 }, { "epoch": 0.15, "learning_rate": 1.920688383939793e-05, "loss": 0.8627, "step": 1290 }, { "epoch": 0.15, "learning_rate": 1.9205375518444854e-05, "loss": 0.8214, "step": 1291 }, { "epoch": 0.15, "learning_rate": 1.920386582395686e-05, "loss": 0.8633, "step": 1292 }, { "epoch": 0.15, "learning_rate": 1.920235475615921e-05, "loss": 0.8337, "step": 1293 }, { "epoch": 0.15, "learning_rate": 1.9200842315277368e-05, "loss": 0.8276, "step": 1294 }, { "epoch": 0.15, "learning_rate": 1.9199328501537005e-05, "loss": 0.8393, "step": 1295 }, { "epoch": 0.15, "learning_rate": 1.9197813315164e-05, "loss": 0.8181, "step": 1296 }, { "epoch": 0.15, "learning_rate": 1.919629675638443e-05, "loss": 0.8108, "step": 1297 }, { "epoch": 0.15, "learning_rate": 1.919477882542459e-05, "loss": 0.827, "step": 1298 }, { "epoch": 0.15, "learning_rate": 1.919325952251096e-05, "loss": 0.8477, "step": 1299 }, { "epoch": 0.16, "learning_rate": 1.919173884787024e-05, "loss": 0.8058, "step": 1300 }, { "epoch": 0.16, "learning_rate": 1.9190216801729327e-05, "loss": 0.8287, "step": 1301 }, { "epoch": 0.16, "learning_rate": 1.9188693384315334e-05, "loss": 0.9135, "step": 1302 }, { "epoch": 0.16, "learning_rate": 1.918716859585556e-05, "loss": 0.8477, "step": 1303 }, { "epoch": 0.16, "learning_rate": 1.9185642436577525e-05, "loss": 0.8527, "step": 1304 }, { "epoch": 0.16, "learning_rate": 1.9184114906708946e-05, "loss": 0.8873, "step": 1305 }, { "epoch": 0.16, "learning_rate": 1.9182586006477745e-05, "loss": 0.8119, "step": 1306 }, { "epoch": 0.16, "learning_rate": 1.918105573611205e-05, "loss": 0.8795, "step": 1307 }, { "epoch": 0.16, "learning_rate": 1.9179524095840193e-05, "loss": 0.8783, "step": 1308 }, { "epoch": 0.16, "learning_rate": 1.9177991085890707e-05, "loss": 0.8276, "step": 1309 }, { "epoch": 0.16, "learning_rate": 1.9176456706492337e-05, "loss": 0.8566, "step": 1310 }, { "epoch": 0.16, "learning_rate": 1.917492095787403e-05, "loss": 0.8689, "step": 1311 }, { "epoch": 0.16, "learning_rate": 1.917338384026493e-05, "loss": 0.8019, "step": 1312 }, { "epoch": 0.16, "learning_rate": 1.917184535389439e-05, "loss": 0.8365, "step": 1313 }, { "epoch": 0.16, "learning_rate": 1.9170305498991967e-05, "loss": 0.8929, "step": 1314 }, { "epoch": 0.16, "learning_rate": 1.916876427578743e-05, "loss": 0.7907, "step": 1315 }, { "epoch": 0.16, "learning_rate": 1.916722168451074e-05, "loss": 0.8398, "step": 1316 }, { "epoch": 0.16, "learning_rate": 1.9165677725392066e-05, "loss": 0.7902, "step": 1317 }, { "epoch": 0.16, "learning_rate": 1.9164132398661785e-05, "loss": 0.8683, "step": 1318 }, { "epoch": 0.16, "learning_rate": 1.9162585704550473e-05, "loss": 0.8092, "step": 1319 }, { "epoch": 0.16, "learning_rate": 1.9161037643288916e-05, "loss": 0.8281, "step": 1320 }, { "epoch": 0.16, "learning_rate": 1.91594882151081e-05, "loss": 0.8532, "step": 1321 }, { "epoch": 0.16, "learning_rate": 1.915793742023921e-05, "loss": 0.8538, "step": 1322 }, { "epoch": 0.16, "learning_rate": 1.9156385258913643e-05, "loss": 0.832, "step": 1323 }, { "epoch": 0.16, "learning_rate": 1.9154831731363e-05, "loss": 0.7969, "step": 1324 }, { "epoch": 0.16, "learning_rate": 1.9153276837819078e-05, "loss": 0.8555, "step": 1325 }, { "epoch": 0.16, "learning_rate": 1.9151720578513887e-05, "loss": 0.8504, "step": 1326 }, { "epoch": 0.16, "learning_rate": 1.9150162953679638e-05, "loss": 0.8192, "step": 1327 }, { "epoch": 0.16, "learning_rate": 1.914860396354874e-05, "loss": 0.8192, "step": 1328 }, { "epoch": 0.16, "learning_rate": 1.914704360835381e-05, "loss": 0.8164, "step": 1329 }, { "epoch": 0.16, "learning_rate": 1.9145481888327673e-05, "loss": 0.8499, "step": 1330 }, { "epoch": 0.16, "learning_rate": 1.9143918803703347e-05, "loss": 0.8326, "step": 1331 }, { "epoch": 0.16, "learning_rate": 1.9142354354714067e-05, "loss": 0.8544, "step": 1332 }, { "epoch": 0.16, "learning_rate": 1.914078854159326e-05, "loss": 0.808, "step": 1333 }, { "epoch": 0.16, "learning_rate": 1.913922136457456e-05, "loss": 0.8728, "step": 1334 }, { "epoch": 0.16, "learning_rate": 1.9137652823891814e-05, "loss": 0.8588, "step": 1335 }, { "epoch": 0.16, "learning_rate": 1.9136082919779053e-05, "loss": 0.8828, "step": 1336 }, { "epoch": 0.16, "learning_rate": 1.9134511652470527e-05, "loss": 0.8895, "step": 1337 }, { "epoch": 0.16, "learning_rate": 1.913293902220069e-05, "loss": 0.8616, "step": 1338 }, { "epoch": 0.16, "learning_rate": 1.913136502920419e-05, "loss": 0.8823, "step": 1339 }, { "epoch": 0.16, "learning_rate": 1.912978967371588e-05, "loss": 0.8142, "step": 1340 }, { "epoch": 0.16, "learning_rate": 1.912821295597082e-05, "loss": 0.8677, "step": 1341 }, { "epoch": 0.16, "learning_rate": 1.9126634876204275e-05, "loss": 0.8114, "step": 1342 }, { "epoch": 0.16, "learning_rate": 1.9125055434651712e-05, "loss": 0.7924, "step": 1343 }, { "epoch": 0.16, "learning_rate": 1.9123474631548795e-05, "loss": 0.856, "step": 1344 }, { "epoch": 0.16, "learning_rate": 1.9121892467131395e-05, "loss": 0.8493, "step": 1345 }, { "epoch": 0.16, "learning_rate": 1.9120308941635593e-05, "loss": 0.9263, "step": 1346 }, { "epoch": 0.16, "learning_rate": 1.911872405529766e-05, "loss": 0.8432, "step": 1347 }, { "epoch": 0.16, "learning_rate": 1.9117137808354084e-05, "loss": 0.8225, "step": 1348 }, { "epoch": 0.16, "learning_rate": 1.9115550201041542e-05, "loss": 0.8036, "step": 1349 }, { "epoch": 0.16, "learning_rate": 1.911396123359693e-05, "loss": 0.8103, "step": 1350 }, { "epoch": 0.16, "learning_rate": 1.9112370906257326e-05, "loss": 0.7383, "step": 1351 }, { "epoch": 0.16, "learning_rate": 1.9110779219260034e-05, "loss": 0.8203, "step": 1352 }, { "epoch": 0.16, "learning_rate": 1.9109186172842543e-05, "loss": 0.885, "step": 1353 }, { "epoch": 0.16, "learning_rate": 1.9107591767242554e-05, "loss": 0.8917, "step": 1354 }, { "epoch": 0.16, "learning_rate": 1.9105996002697965e-05, "loss": 0.8276, "step": 1355 }, { "epoch": 0.16, "learning_rate": 1.910439887944689e-05, "loss": 0.8482, "step": 1356 }, { "epoch": 0.16, "learning_rate": 1.9102800397727623e-05, "loss": 0.8828, "step": 1357 }, { "epoch": 0.16, "learning_rate": 1.9101200557778683e-05, "loss": 0.8672, "step": 1358 }, { "epoch": 0.16, "learning_rate": 1.909959935983878e-05, "loss": 0.8421, "step": 1359 }, { "epoch": 0.16, "learning_rate": 1.9097996804146827e-05, "loss": 0.8331, "step": 1360 }, { "epoch": 0.16, "learning_rate": 1.9096392890941943e-05, "loss": 0.8627, "step": 1361 }, { "epoch": 0.16, "learning_rate": 1.9094787620463445e-05, "loss": 0.8795, "step": 1362 }, { "epoch": 0.16, "learning_rate": 1.909318099295086e-05, "loss": 0.8761, "step": 1363 }, { "epoch": 0.16, "learning_rate": 1.9091573008643912e-05, "loss": 0.8052, "step": 1364 }, { "epoch": 0.16, "learning_rate": 1.9089963667782524e-05, "loss": 0.8538, "step": 1365 }, { "epoch": 0.16, "learning_rate": 1.9088352970606832e-05, "loss": 0.889, "step": 1366 }, { "epoch": 0.16, "learning_rate": 1.9086740917357164e-05, "loss": 0.8594, "step": 1367 }, { "epoch": 0.16, "learning_rate": 1.908512750827406e-05, "loss": 0.8119, "step": 1368 }, { "epoch": 0.16, "learning_rate": 1.908351274359825e-05, "loss": 0.8253, "step": 1369 }, { "epoch": 0.16, "learning_rate": 1.908189662357068e-05, "loss": 0.8945, "step": 1370 }, { "epoch": 0.16, "learning_rate": 1.9080279148432485e-05, "loss": 0.8287, "step": 1371 }, { "epoch": 0.16, "learning_rate": 1.907866031842501e-05, "loss": 0.88, "step": 1372 }, { "epoch": 0.16, "learning_rate": 1.9077040133789806e-05, "loss": 0.8917, "step": 1373 }, { "epoch": 0.16, "learning_rate": 1.9075418594768615e-05, "loss": 0.8287, "step": 1374 }, { "epoch": 0.16, "learning_rate": 1.907379570160339e-05, "loss": 0.8287, "step": 1375 }, { "epoch": 0.16, "learning_rate": 1.907217145453628e-05, "loss": 0.7718, "step": 1376 }, { "epoch": 0.16, "learning_rate": 1.9070545853809644e-05, "loss": 0.8292, "step": 1377 }, { "epoch": 0.16, "learning_rate": 1.9068918899666035e-05, "loss": 0.8482, "step": 1378 }, { "epoch": 0.16, "learning_rate": 1.906729059234821e-05, "loss": 0.8237, "step": 1379 }, { "epoch": 0.16, "learning_rate": 1.906566093209913e-05, "loss": 0.8482, "step": 1380 }, { "epoch": 0.16, "learning_rate": 1.906402991916196e-05, "loss": 0.8594, "step": 1381 }, { "epoch": 0.16, "learning_rate": 1.906239755378006e-05, "loss": 0.865, "step": 1382 }, { "epoch": 0.16, "learning_rate": 1.9060763836196988e-05, "loss": 0.8532, "step": 1383 }, { "epoch": 0.17, "learning_rate": 1.905912876665653e-05, "loss": 0.8516, "step": 1384 }, { "epoch": 0.17, "learning_rate": 1.9057492345402634e-05, "loss": 0.8477, "step": 1385 }, { "epoch": 0.17, "learning_rate": 1.905585457267949e-05, "loss": 0.856, "step": 1386 }, { "epoch": 0.17, "learning_rate": 1.9054215448731454e-05, "loss": 0.7651, "step": 1387 }, { "epoch": 0.17, "learning_rate": 1.9052574973803107e-05, "loss": 0.8309, "step": 1388 }, { "epoch": 0.17, "learning_rate": 1.9050933148139226e-05, "loss": 0.8387, "step": 1389 }, { "epoch": 0.17, "learning_rate": 1.9049289971984785e-05, "loss": 0.8705, "step": 1390 }, { "epoch": 0.17, "learning_rate": 1.9047645445584965e-05, "loss": 0.9007, "step": 1391 }, { "epoch": 0.17, "learning_rate": 1.9045999569185142e-05, "loss": 0.8343, "step": 1392 }, { "epoch": 0.17, "learning_rate": 1.9044352343030897e-05, "loss": 0.7835, "step": 1393 }, { "epoch": 0.17, "learning_rate": 1.9042703767368023e-05, "loss": 0.7969, "step": 1394 }, { "epoch": 0.17, "learning_rate": 1.904105384244249e-05, "loss": 0.8488, "step": 1395 }, { "epoch": 0.17, "learning_rate": 1.9039402568500492e-05, "loss": 0.8566, "step": 1396 }, { "epoch": 0.17, "learning_rate": 1.9037749945788417e-05, "loss": 0.8276, "step": 1397 }, { "epoch": 0.17, "learning_rate": 1.9036095974552845e-05, "loss": 0.8912, "step": 1398 }, { "epoch": 0.17, "learning_rate": 1.9034440655040568e-05, "loss": 0.8605, "step": 1399 }, { "epoch": 0.17, "learning_rate": 1.9032783987498585e-05, "loss": 0.8002, "step": 1400 }, { "epoch": 0.17, "learning_rate": 1.903112597217408e-05, "loss": 0.8354, "step": 1401 }, { "epoch": 0.17, "learning_rate": 1.902946660931444e-05, "loss": 0.8265, "step": 1402 }, { "epoch": 0.17, "learning_rate": 1.902780589916727e-05, "loss": 0.8175, "step": 1403 }, { "epoch": 0.17, "learning_rate": 1.9026143841980357e-05, "loss": 0.8443, "step": 1404 }, { "epoch": 0.17, "learning_rate": 1.9024480438001702e-05, "loss": 0.8438, "step": 1405 }, { "epoch": 0.17, "learning_rate": 1.90228156874795e-05, "loss": 0.851, "step": 1406 }, { "epoch": 0.17, "learning_rate": 1.9021149590662143e-05, "loss": 0.8499, "step": 1407 }, { "epoch": 0.17, "learning_rate": 1.9019482147798237e-05, "loss": 0.8181, "step": 1408 }, { "epoch": 0.17, "learning_rate": 1.901781335913658e-05, "loss": 0.8482, "step": 1409 }, { "epoch": 0.17, "learning_rate": 1.901614322492617e-05, "loss": 0.8482, "step": 1410 }, { "epoch": 0.17, "learning_rate": 1.9014471745416207e-05, "loss": 0.8315, "step": 1411 }, { "epoch": 0.17, "learning_rate": 1.9012798920856097e-05, "loss": 0.8292, "step": 1412 }, { "epoch": 0.17, "learning_rate": 1.9011124751495438e-05, "loss": 0.8571, "step": 1413 }, { "epoch": 0.17, "learning_rate": 1.9009449237584033e-05, "loss": 0.8432, "step": 1414 }, { "epoch": 0.17, "learning_rate": 1.9007772379371886e-05, "loss": 0.8265, "step": 1415 }, { "epoch": 0.17, "learning_rate": 1.9006094177109203e-05, "loss": 0.8376, "step": 1416 }, { "epoch": 0.17, "learning_rate": 1.9004414631046392e-05, "loss": 0.8013, "step": 1417 }, { "epoch": 0.17, "learning_rate": 1.9002733741434048e-05, "loss": 0.8432, "step": 1418 }, { "epoch": 0.17, "learning_rate": 1.900105150852299e-05, "loss": 0.8175, "step": 1419 }, { "epoch": 0.17, "learning_rate": 1.899936793256421e-05, "loss": 0.9325, "step": 1420 }, { "epoch": 0.17, "learning_rate": 1.8997683013808924e-05, "loss": 0.9001, "step": 1421 }, { "epoch": 0.17, "learning_rate": 1.8995996752508534e-05, "loss": 0.8013, "step": 1422 }, { "epoch": 0.17, "learning_rate": 1.899430914891465e-05, "loss": 0.8192, "step": 1423 }, { "epoch": 0.17, "learning_rate": 1.899262020327908e-05, "loss": 0.8186, "step": 1424 }, { "epoch": 0.17, "learning_rate": 1.899092991585383e-05, "loss": 0.8036, "step": 1425 }, { "epoch": 0.17, "learning_rate": 1.898923828689111e-05, "loss": 0.856, "step": 1426 }, { "epoch": 0.17, "learning_rate": 1.8987545316643325e-05, "loss": 0.8438, "step": 1427 }, { "epoch": 0.17, "learning_rate": 1.898585100536309e-05, "loss": 0.8694, "step": 1428 }, { "epoch": 0.17, "learning_rate": 1.8984155353303203e-05, "loss": 0.774, "step": 1429 }, { "epoch": 0.17, "learning_rate": 1.8982458360716677e-05, "loss": 0.8237, "step": 1430 }, { "epoch": 0.17, "learning_rate": 1.8980760027856725e-05, "loss": 0.8175, "step": 1431 }, { "epoch": 0.17, "learning_rate": 1.897906035497675e-05, "loss": 0.8131, "step": 1432 }, { "epoch": 0.17, "learning_rate": 1.897735934233036e-05, "loss": 0.808, "step": 1433 }, { "epoch": 0.17, "learning_rate": 1.897565699017137e-05, "loss": 0.8186, "step": 1434 }, { "epoch": 0.17, "learning_rate": 1.897395329875378e-05, "loss": 0.8711, "step": 1435 }, { "epoch": 0.17, "learning_rate": 1.89722482683318e-05, "loss": 0.8393, "step": 1436 }, { "epoch": 0.17, "learning_rate": 1.897054189915984e-05, "loss": 0.8309, "step": 1437 }, { "epoch": 0.17, "learning_rate": 1.8968834191492506e-05, "loss": 0.8633, "step": 1438 }, { "epoch": 0.17, "learning_rate": 1.896712514558461e-05, "loss": 0.7813, "step": 1439 }, { "epoch": 0.17, "learning_rate": 1.8965414761691147e-05, "loss": 0.832, "step": 1440 }, { "epoch": 0.17, "learning_rate": 1.8963703040067336e-05, "loss": 0.7813, "step": 1441 }, { "epoch": 0.17, "learning_rate": 1.8961989980968577e-05, "loss": 0.8382, "step": 1442 }, { "epoch": 0.17, "learning_rate": 1.896027558465048e-05, "loss": 0.8477, "step": 1443 }, { "epoch": 0.17, "learning_rate": 1.8958559851368844e-05, "loss": 0.8454, "step": 1444 }, { "epoch": 0.17, "learning_rate": 1.8956842781379677e-05, "loss": 0.8142, "step": 1445 }, { "epoch": 0.17, "learning_rate": 1.895512437493918e-05, "loss": 0.8371, "step": 1446 }, { "epoch": 0.17, "learning_rate": 1.8953404632303764e-05, "loss": 0.8728, "step": 1447 }, { "epoch": 0.17, "learning_rate": 1.8951683553730026e-05, "loss": 0.8845, "step": 1448 }, { "epoch": 0.17, "learning_rate": 1.894996113947477e-05, "loss": 0.8276, "step": 1449 }, { "epoch": 0.17, "learning_rate": 1.8948237389794998e-05, "loss": 0.8694, "step": 1450 }, { "epoch": 0.17, "learning_rate": 1.894651230494791e-05, "loss": 0.8326, "step": 1451 }, { "epoch": 0.17, "learning_rate": 1.894478588519091e-05, "loss": 0.846, "step": 1452 }, { "epoch": 0.17, "learning_rate": 1.894305813078159e-05, "loss": 0.8248, "step": 1453 }, { "epoch": 0.17, "learning_rate": 1.894132904197775e-05, "loss": 0.7946, "step": 1454 }, { "epoch": 0.17, "learning_rate": 1.8939598619037392e-05, "loss": 0.889, "step": 1455 }, { "epoch": 0.17, "learning_rate": 1.893786686221871e-05, "loss": 0.861, "step": 1456 }, { "epoch": 0.17, "learning_rate": 1.8936133771780097e-05, "loss": 0.9157, "step": 1457 }, { "epoch": 0.17, "learning_rate": 1.8934399347980156e-05, "loss": 0.875, "step": 1458 }, { "epoch": 0.17, "learning_rate": 1.8932663591077668e-05, "loss": 0.7885, "step": 1459 }, { "epoch": 0.17, "learning_rate": 1.8930926501331635e-05, "loss": 0.7746, "step": 1460 }, { "epoch": 0.17, "learning_rate": 1.892918807900125e-05, "loss": 0.9068, "step": 1461 }, { "epoch": 0.17, "learning_rate": 1.8927448324345892e-05, "loss": 0.8371, "step": 1462 }, { "epoch": 0.17, "learning_rate": 1.8925707237625163e-05, "loss": 0.8248, "step": 1463 }, { "epoch": 0.17, "learning_rate": 1.892396481909884e-05, "loss": 0.8175, "step": 1464 }, { "epoch": 0.17, "learning_rate": 1.8922221069026914e-05, "loss": 0.7907, "step": 1465 }, { "epoch": 0.17, "learning_rate": 1.8920475987669573e-05, "loss": 0.8856, "step": 1466 }, { "epoch": 0.17, "learning_rate": 1.8918729575287195e-05, "loss": 0.9118, "step": 1467 }, { "epoch": 0.18, "learning_rate": 1.8916981832140363e-05, "loss": 0.8722, "step": 1468 }, { "epoch": 0.18, "learning_rate": 1.8915232758489865e-05, "loss": 0.8304, "step": 1469 }, { "epoch": 0.18, "learning_rate": 1.8913482354596674e-05, "loss": 0.8432, "step": 1470 }, { "epoch": 0.18, "learning_rate": 1.8911730620721965e-05, "loss": 0.8583, "step": 1471 }, { "epoch": 0.18, "learning_rate": 1.8909977557127123e-05, "loss": 0.8594, "step": 1472 }, { "epoch": 0.18, "learning_rate": 1.8908223164073717e-05, "loss": 0.899, "step": 1473 }, { "epoch": 0.18, "learning_rate": 1.890646744182352e-05, "loss": 0.8677, "step": 1474 }, { "epoch": 0.18, "learning_rate": 1.8904710390638506e-05, "loss": 0.8052, "step": 1475 }, { "epoch": 0.18, "learning_rate": 1.8902952010780846e-05, "loss": 0.8398, "step": 1476 }, { "epoch": 0.18, "learning_rate": 1.8901192302512904e-05, "loss": 0.8203, "step": 1477 }, { "epoch": 0.18, "learning_rate": 1.889943126609725e-05, "loss": 0.8393, "step": 1478 }, { "epoch": 0.18, "learning_rate": 1.8897668901796646e-05, "loss": 0.8398, "step": 1479 }, { "epoch": 0.18, "learning_rate": 1.889590520987405e-05, "loss": 0.885, "step": 1480 }, { "epoch": 0.18, "learning_rate": 1.8894140190592634e-05, "loss": 0.8477, "step": 1481 }, { "epoch": 0.18, "learning_rate": 1.8892373844215748e-05, "loss": 0.8767, "step": 1482 }, { "epoch": 0.18, "learning_rate": 1.889060617100695e-05, "loss": 0.88, "step": 1483 }, { "epoch": 0.18, "learning_rate": 1.8888837171229996e-05, "loss": 0.8438, "step": 1484 }, { "epoch": 0.18, "learning_rate": 1.888706684514884e-05, "loss": 0.8292, "step": 1485 }, { "epoch": 0.18, "learning_rate": 1.888529519302763e-05, "loss": 0.7863, "step": 1486 }, { "epoch": 0.18, "learning_rate": 1.8883522215130715e-05, "loss": 0.8867, "step": 1487 }, { "epoch": 0.18, "learning_rate": 1.888174791172264e-05, "loss": 0.8415, "step": 1488 }, { "epoch": 0.18, "learning_rate": 1.8879972283068154e-05, "loss": 0.8449, "step": 1489 }, { "epoch": 0.18, "learning_rate": 1.8878195329432195e-05, "loss": 0.8878, "step": 1490 }, { "epoch": 0.18, "learning_rate": 1.88764170510799e-05, "loss": 0.8075, "step": 1491 }, { "epoch": 0.18, "learning_rate": 1.8874637448276607e-05, "loss": 0.7941, "step": 1492 }, { "epoch": 0.18, "learning_rate": 1.8872856521287857e-05, "loss": 0.8298, "step": 1493 }, { "epoch": 0.18, "learning_rate": 1.8871074270379373e-05, "loss": 0.7813, "step": 1494 }, { "epoch": 0.18, "learning_rate": 1.8869290695817093e-05, "loss": 0.7533, "step": 1495 }, { "epoch": 0.18, "learning_rate": 1.8867505797867136e-05, "loss": 0.87, "step": 1496 }, { "epoch": 0.18, "learning_rate": 1.8865719576795837e-05, "loss": 0.8231, "step": 1497 }, { "epoch": 0.18, "learning_rate": 1.8863932032869708e-05, "loss": 0.8097, "step": 1498 }, { "epoch": 0.18, "learning_rate": 1.8862143166355476e-05, "loss": 0.7835, "step": 1499 }, { "epoch": 0.18, "learning_rate": 1.8860352977520055e-05, "loss": 0.8566, "step": 1500 }, { "epoch": 0.18, "learning_rate": 1.8858561466630562e-05, "loss": 0.8287, "step": 1501 }, { "epoch": 0.18, "learning_rate": 1.8856768633954303e-05, "loss": 0.8175, "step": 1502 }, { "epoch": 0.18, "learning_rate": 1.8854974479758788e-05, "loss": 0.8555, "step": 1503 }, { "epoch": 0.18, "learning_rate": 1.8853179004311727e-05, "loss": 0.8666, "step": 1504 }, { "epoch": 0.18, "learning_rate": 1.8851382207881023e-05, "loss": 0.8521, "step": 1505 }, { "epoch": 0.18, "learning_rate": 1.884958409073477e-05, "loss": 0.8504, "step": 1506 }, { "epoch": 0.18, "learning_rate": 1.8847784653141267e-05, "loss": 0.8136, "step": 1507 }, { "epoch": 0.18, "learning_rate": 1.8845983895369017e-05, "loss": 0.8387, "step": 1508 }, { "epoch": 0.18, "learning_rate": 1.8844181817686698e-05, "loss": 0.8287, "step": 1509 }, { "epoch": 0.18, "learning_rate": 1.884237842036321e-05, "loss": 0.8443, "step": 1510 }, { "epoch": 0.18, "learning_rate": 1.884057370366763e-05, "loss": 0.8956, "step": 1511 }, { "epoch": 0.18, "learning_rate": 1.8838767667869243e-05, "loss": 0.8376, "step": 1512 }, { "epoch": 0.18, "learning_rate": 1.8836960313237527e-05, "loss": 0.8527, "step": 1513 }, { "epoch": 0.18, "learning_rate": 1.883515164004216e-05, "loss": 0.7963, "step": 1514 }, { "epoch": 0.18, "learning_rate": 1.8833341648553013e-05, "loss": 0.8432, "step": 1515 }, { "epoch": 0.18, "learning_rate": 1.883153033904015e-05, "loss": 0.8315, "step": 1516 }, { "epoch": 0.18, "learning_rate": 1.8829717711773844e-05, "loss": 0.8438, "step": 1517 }, { "epoch": 0.18, "learning_rate": 1.882790376702455e-05, "loss": 0.8527, "step": 1518 }, { "epoch": 0.18, "learning_rate": 1.8826088505062937e-05, "loss": 0.8588, "step": 1519 }, { "epoch": 0.18, "learning_rate": 1.8824271926159854e-05, "loss": 0.8599, "step": 1520 }, { "epoch": 0.18, "learning_rate": 1.8822454030586352e-05, "loss": 0.8622, "step": 1521 }, { "epoch": 0.18, "learning_rate": 1.8820634818613678e-05, "loss": 0.8789, "step": 1522 }, { "epoch": 0.18, "learning_rate": 1.8818814290513282e-05, "loss": 0.8203, "step": 1523 }, { "epoch": 0.18, "learning_rate": 1.8816992446556804e-05, "loss": 0.8108, "step": 1524 }, { "epoch": 0.18, "learning_rate": 1.881516928701608e-05, "loss": 0.8767, "step": 1525 }, { "epoch": 0.18, "learning_rate": 1.8813344812163144e-05, "loss": 0.8198, "step": 1526 }, { "epoch": 0.18, "learning_rate": 1.8811519022270224e-05, "loss": 0.8192, "step": 1527 }, { "epoch": 0.18, "learning_rate": 1.8809691917609748e-05, "loss": 0.8086, "step": 1528 }, { "epoch": 0.18, "learning_rate": 1.880786349845434e-05, "loss": 0.7868, "step": 1529 }, { "epoch": 0.18, "learning_rate": 1.880603376507682e-05, "loss": 0.861, "step": 1530 }, { "epoch": 0.18, "learning_rate": 1.88042027177502e-05, "loss": 0.8147, "step": 1531 }, { "epoch": 0.18, "learning_rate": 1.8802370356747688e-05, "loss": 0.8326, "step": 1532 }, { "epoch": 0.18, "learning_rate": 1.880053668234269e-05, "loss": 0.8164, "step": 1533 }, { "epoch": 0.18, "learning_rate": 1.8798701694808817e-05, "loss": 0.894, "step": 1534 }, { "epoch": 0.18, "learning_rate": 1.8796865394419866e-05, "loss": 0.8337, "step": 1535 }, { "epoch": 0.18, "learning_rate": 1.8795027781449825e-05, "loss": 0.8571, "step": 1536 }, { "epoch": 0.18, "learning_rate": 1.879318885617289e-05, "loss": 0.8354, "step": 1537 }, { "epoch": 0.18, "learning_rate": 1.8791348618863442e-05, "loss": 0.851, "step": 1538 }, { "epoch": 0.18, "learning_rate": 1.8789507069796067e-05, "loss": 0.8544, "step": 1539 }, { "epoch": 0.18, "learning_rate": 1.8787664209245542e-05, "loss": 0.88, "step": 1540 }, { "epoch": 0.18, "learning_rate": 1.8785820037486843e-05, "loss": 0.8393, "step": 1541 }, { "epoch": 0.18, "learning_rate": 1.8783974554795133e-05, "loss": 0.8008, "step": 1542 }, { "epoch": 0.18, "learning_rate": 1.8782127761445782e-05, "loss": 0.8343, "step": 1543 }, { "epoch": 0.18, "learning_rate": 1.8780279657714344e-05, "loss": 0.8923, "step": 1544 }, { "epoch": 0.18, "learning_rate": 1.8778430243876583e-05, "loss": 0.8248, "step": 1545 }, { "epoch": 0.18, "learning_rate": 1.877657952020844e-05, "loss": 0.8343, "step": 1546 }, { "epoch": 0.18, "learning_rate": 1.8774727486986078e-05, "loss": 0.8326, "step": 1547 }, { "epoch": 0.18, "learning_rate": 1.877287414448582e-05, "loss": 0.8326, "step": 1548 }, { "epoch": 0.18, "learning_rate": 1.8771019492984216e-05, "loss": 0.8365, "step": 1549 }, { "epoch": 0.18, "learning_rate": 1.8769163532757996e-05, "loss": 0.8895, "step": 1550 }, { "epoch": 0.18, "learning_rate": 1.8767306264084082e-05, "loss": 0.8198, "step": 1551 }, { "epoch": 0.19, "learning_rate": 1.8765447687239606e-05, "loss": 0.8147, "step": 1552 }, { "epoch": 0.19, "learning_rate": 1.876358780250188e-05, "loss": 0.8164, "step": 1553 }, { "epoch": 0.19, "learning_rate": 1.876172661014842e-05, "loss": 0.8214, "step": 1554 }, { "epoch": 0.19, "learning_rate": 1.8759864110456936e-05, "loss": 0.7494, "step": 1555 }, { "epoch": 0.19, "learning_rate": 1.8758000303705333e-05, "loss": 0.8477, "step": 1556 }, { "epoch": 0.19, "learning_rate": 1.87561351901717e-05, "loss": 0.8588, "step": 1557 }, { "epoch": 0.19, "learning_rate": 1.8754268770134346e-05, "loss": 0.8482, "step": 1558 }, { "epoch": 0.19, "learning_rate": 1.875240104387175e-05, "loss": 0.8058, "step": 1559 }, { "epoch": 0.19, "learning_rate": 1.8750532011662594e-05, "loss": 0.861, "step": 1560 }, { "epoch": 0.19, "learning_rate": 1.874866167378576e-05, "loss": 0.8114, "step": 1561 }, { "epoch": 0.19, "learning_rate": 1.8746790030520326e-05, "loss": 0.8761, "step": 1562 }, { "epoch": 0.19, "learning_rate": 1.874491708214555e-05, "loss": 0.8823, "step": 1563 }, { "epoch": 0.19, "learning_rate": 1.8743042828940904e-05, "loss": 0.8153, "step": 1564 }, { "epoch": 0.19, "learning_rate": 1.8741167271186037e-05, "loss": 0.7935, "step": 1565 }, { "epoch": 0.19, "learning_rate": 1.8739290409160808e-05, "loss": 0.7863, "step": 1566 }, { "epoch": 0.19, "learning_rate": 1.873741224314526e-05, "loss": 0.8387, "step": 1567 }, { "epoch": 0.19, "learning_rate": 1.873553277341964e-05, "loss": 0.8013, "step": 1568 }, { "epoch": 0.19, "learning_rate": 1.8733652000264374e-05, "loss": 0.8516, "step": 1569 }, { "epoch": 0.19, "learning_rate": 1.8731769923960098e-05, "loss": 0.8359, "step": 1570 }, { "epoch": 0.19, "learning_rate": 1.872988654478764e-05, "loss": 0.8354, "step": 1571 }, { "epoch": 0.19, "learning_rate": 1.8728001863028016e-05, "loss": 0.8599, "step": 1572 }, { "epoch": 0.19, "learning_rate": 1.8726115878962438e-05, "loss": 0.851, "step": 1573 }, { "epoch": 0.19, "learning_rate": 1.8724228592872315e-05, "loss": 0.8343, "step": 1574 }, { "epoch": 0.19, "learning_rate": 1.8722340005039248e-05, "loss": 0.7863, "step": 1575 }, { "epoch": 0.19, "learning_rate": 1.8720450115745038e-05, "loss": 0.7835, "step": 1576 }, { "epoch": 0.19, "learning_rate": 1.871855892527167e-05, "loss": 0.861, "step": 1577 }, { "epoch": 0.19, "learning_rate": 1.8716666433901328e-05, "loss": 0.846, "step": 1578 }, { "epoch": 0.19, "learning_rate": 1.87147726419164e-05, "loss": 0.7846, "step": 1579 }, { "epoch": 0.19, "learning_rate": 1.8712877549599448e-05, "loss": 0.7985, "step": 1580 }, { "epoch": 0.19, "learning_rate": 1.8710981157233244e-05, "loss": 0.8075, "step": 1581 }, { "epoch": 0.19, "learning_rate": 1.870908346510075e-05, "loss": 0.8142, "step": 1582 }, { "epoch": 0.19, "learning_rate": 1.8707184473485118e-05, "loss": 0.7985, "step": 1583 }, { "epoch": 0.19, "learning_rate": 1.8705284182669697e-05, "loss": 0.8019, "step": 1584 }, { "epoch": 0.19, "learning_rate": 1.8703382592938034e-05, "loss": 0.8153, "step": 1585 }, { "epoch": 0.19, "learning_rate": 1.870147970457386e-05, "loss": 0.8421, "step": 1586 }, { "epoch": 0.19, "learning_rate": 1.8699575517861105e-05, "loss": 0.832, "step": 1587 }, { "epoch": 0.19, "learning_rate": 1.8697670033083898e-05, "loss": 0.8594, "step": 1588 }, { "epoch": 0.19, "learning_rate": 1.8695763250526552e-05, "loss": 0.8449, "step": 1589 }, { "epoch": 0.19, "learning_rate": 1.8693855170473577e-05, "loss": 0.8566, "step": 1590 }, { "epoch": 0.19, "learning_rate": 1.8691945793209685e-05, "loss": 0.8002, "step": 1591 }, { "epoch": 0.19, "learning_rate": 1.869003511901977e-05, "loss": 0.8242, "step": 1592 }, { "epoch": 0.19, "learning_rate": 1.8688123148188917e-05, "loss": 0.8153, "step": 1593 }, { "epoch": 0.19, "learning_rate": 1.8686209881002423e-05, "loss": 0.8493, "step": 1594 }, { "epoch": 0.19, "learning_rate": 1.868429531774576e-05, "loss": 0.8119, "step": 1595 }, { "epoch": 0.19, "learning_rate": 1.8682379458704606e-05, "loss": 0.8348, "step": 1596 }, { "epoch": 0.19, "learning_rate": 1.8680462304164816e-05, "loss": 0.817, "step": 1597 }, { "epoch": 0.19, "learning_rate": 1.867854385441246e-05, "loss": 0.8142, "step": 1598 }, { "epoch": 0.19, "learning_rate": 1.8676624109733785e-05, "loss": 0.8516, "step": 1599 }, { "epoch": 0.19, "learning_rate": 1.8674703070415235e-05, "loss": 0.8951, "step": 1600 }, { "epoch": 0.19, "learning_rate": 1.867278073674345e-05, "loss": 0.8292, "step": 1601 }, { "epoch": 0.19, "learning_rate": 1.8670857109005263e-05, "loss": 0.8175, "step": 1602 }, { "epoch": 0.19, "learning_rate": 1.8668932187487695e-05, "loss": 0.7628, "step": 1603 }, { "epoch": 0.19, "learning_rate": 1.866700597247797e-05, "loss": 0.8571, "step": 1604 }, { "epoch": 0.19, "learning_rate": 1.866507846426349e-05, "loss": 0.8499, "step": 1605 }, { "epoch": 0.19, "learning_rate": 1.8663149663131864e-05, "loss": 0.8114, "step": 1606 }, { "epoch": 0.19, "learning_rate": 1.866121956937089e-05, "loss": 0.7595, "step": 1607 }, { "epoch": 0.19, "learning_rate": 1.8659288183268555e-05, "loss": 0.8315, "step": 1608 }, { "epoch": 0.19, "learning_rate": 1.8657355505113043e-05, "loss": 0.8186, "step": 1609 }, { "epoch": 0.19, "learning_rate": 1.8655421535192728e-05, "loss": 0.8633, "step": 1610 }, { "epoch": 0.19, "learning_rate": 1.8653486273796175e-05, "loss": 0.7863, "step": 1611 }, { "epoch": 0.19, "learning_rate": 1.865154972121215e-05, "loss": 0.8248, "step": 1612 }, { "epoch": 0.19, "learning_rate": 1.86496118777296e-05, "loss": 0.8683, "step": 1613 }, { "epoch": 0.19, "learning_rate": 1.8647672743637676e-05, "loss": 0.8309, "step": 1614 }, { "epoch": 0.19, "learning_rate": 1.8645732319225716e-05, "loss": 0.8599, "step": 1615 }, { "epoch": 0.19, "learning_rate": 1.8643790604783247e-05, "loss": 0.8488, "step": 1616 }, { "epoch": 0.19, "learning_rate": 1.8641847600599994e-05, "loss": 0.8069, "step": 1617 }, { "epoch": 0.19, "learning_rate": 1.8639903306965878e-05, "loss": 0.8767, "step": 1618 }, { "epoch": 0.19, "learning_rate": 1.8637957724170997e-05, "loss": 0.8041, "step": 1619 }, { "epoch": 0.19, "learning_rate": 1.8636010852505664e-05, "loss": 0.8683, "step": 1620 }, { "epoch": 0.19, "learning_rate": 1.863406269226036e-05, "loss": 0.8354, "step": 1621 }, { "epoch": 0.19, "learning_rate": 1.8632113243725778e-05, "loss": 0.8555, "step": 1622 }, { "epoch": 0.19, "learning_rate": 1.863016250719279e-05, "loss": 0.8214, "step": 1623 }, { "epoch": 0.19, "learning_rate": 1.8628210482952474e-05, "loss": 0.9046, "step": 1624 }, { "epoch": 0.19, "learning_rate": 1.8626257171296083e-05, "loss": 0.8499, "step": 1625 }, { "epoch": 0.19, "learning_rate": 1.8624302572515074e-05, "loss": 0.8393, "step": 1626 }, { "epoch": 0.19, "learning_rate": 1.8622346686901093e-05, "loss": 0.8013, "step": 1627 }, { "epoch": 0.19, "learning_rate": 1.8620389514745976e-05, "loss": 0.8382, "step": 1628 }, { "epoch": 0.19, "learning_rate": 1.8618431056341758e-05, "loss": 0.9085, "step": 1629 }, { "epoch": 0.19, "learning_rate": 1.8616471311980653e-05, "loss": 0.7958, "step": 1630 }, { "epoch": 0.19, "learning_rate": 1.8614510281955086e-05, "loss": 0.8756, "step": 1631 }, { "epoch": 0.19, "learning_rate": 1.861254796655765e-05, "loss": 0.8253, "step": 1632 }, { "epoch": 0.19, "learning_rate": 1.861058436608115e-05, "loss": 0.8304, "step": 1633 }, { "epoch": 0.19, "learning_rate": 1.860861948081857e-05, "loss": 0.7539, "step": 1634 }, { "epoch": 0.19, "learning_rate": 1.8606653311063096e-05, "loss": 0.8549, "step": 1635 }, { "epoch": 0.2, "learning_rate": 1.8604685857108096e-05, "loss": 0.8153, "step": 1636 }, { "epoch": 0.2, "learning_rate": 1.860271711924714e-05, "loss": 0.8504, "step": 1637 }, { "epoch": 0.2, "learning_rate": 1.8600747097773974e-05, "loss": 0.8376, "step": 1638 }, { "epoch": 0.2, "learning_rate": 1.8598775792982552e-05, "loss": 0.8309, "step": 1639 }, { "epoch": 0.2, "learning_rate": 1.8596803205167012e-05, "loss": 0.8544, "step": 1640 }, { "epoch": 0.2, "learning_rate": 1.8594829334621683e-05, "loss": 0.851, "step": 1641 }, { "epoch": 0.2, "learning_rate": 1.8592854181641086e-05, "loss": 0.8069, "step": 1642 }, { "epoch": 0.2, "learning_rate": 1.8590877746519934e-05, "loss": 0.8231, "step": 1643 }, { "epoch": 0.2, "learning_rate": 1.8588900029553133e-05, "loss": 0.7958, "step": 1644 }, { "epoch": 0.2, "learning_rate": 1.8586921031035772e-05, "loss": 0.8292, "step": 1645 }, { "epoch": 0.2, "learning_rate": 1.8584940751263145e-05, "loss": 0.8298, "step": 1646 }, { "epoch": 0.2, "learning_rate": 1.858295919053073e-05, "loss": 0.7729, "step": 1647 }, { "epoch": 0.2, "learning_rate": 1.858097634913419e-05, "loss": 0.8644, "step": 1648 }, { "epoch": 0.2, "learning_rate": 1.8578992227369387e-05, "loss": 0.8382, "step": 1649 }, { "epoch": 0.2, "learning_rate": 1.857700682553237e-05, "loss": 0.8817, "step": 1650 }, { "epoch": 0.2, "learning_rate": 1.8575020143919387e-05, "loss": 0.8672, "step": 1651 }, { "epoch": 0.2, "learning_rate": 1.8573032182826865e-05, "loss": 0.7924, "step": 1652 }, { "epoch": 0.2, "learning_rate": 1.8571042942551437e-05, "loss": 0.8689, "step": 1653 }, { "epoch": 0.2, "learning_rate": 1.8569052423389907e-05, "loss": 0.8248, "step": 1654 }, { "epoch": 0.2, "learning_rate": 1.856706062563928e-05, "loss": 0.7785, "step": 1655 }, { "epoch": 0.2, "learning_rate": 1.856506754959676e-05, "loss": 0.9118, "step": 1656 }, { "epoch": 0.2, "learning_rate": 1.8563073195559736e-05, "loss": 0.7868, "step": 1657 }, { "epoch": 0.2, "learning_rate": 1.856107756382578e-05, "loss": 0.8778, "step": 1658 }, { "epoch": 0.2, "learning_rate": 1.8559080654692655e-05, "loss": 0.7997, "step": 1659 }, { "epoch": 0.2, "learning_rate": 1.855708246845833e-05, "loss": 0.8203, "step": 1660 }, { "epoch": 0.2, "learning_rate": 1.8555083005420948e-05, "loss": 0.8203, "step": 1661 }, { "epoch": 0.2, "learning_rate": 1.8553082265878856e-05, "loss": 0.8711, "step": 1662 }, { "epoch": 0.2, "learning_rate": 1.855108025013058e-05, "loss": 0.7935, "step": 1663 }, { "epoch": 0.2, "learning_rate": 1.8549076958474835e-05, "loss": 0.779, "step": 1664 }, { "epoch": 0.2, "learning_rate": 1.8547072391210546e-05, "loss": 0.8114, "step": 1665 }, { "epoch": 0.2, "learning_rate": 1.8545066548636806e-05, "loss": 0.8521, "step": 1666 }, { "epoch": 0.2, "learning_rate": 1.8543059431052905e-05, "loss": 0.8666, "step": 1667 }, { "epoch": 0.2, "learning_rate": 1.854105103875833e-05, "loss": 0.8471, "step": 1668 }, { "epoch": 0.2, "learning_rate": 1.8539041372052753e-05, "loss": 0.8343, "step": 1669 }, { "epoch": 0.2, "learning_rate": 1.8537030431236035e-05, "loss": 0.8421, "step": 1670 }, { "epoch": 0.2, "learning_rate": 1.8535018216608226e-05, "loss": 0.8566, "step": 1671 }, { "epoch": 0.2, "learning_rate": 1.8533004728469576e-05, "loss": 0.856, "step": 1672 }, { "epoch": 0.2, "learning_rate": 1.853098996712051e-05, "loss": 0.8583, "step": 1673 }, { "epoch": 0.2, "learning_rate": 1.852897393286166e-05, "loss": 0.8544, "step": 1674 }, { "epoch": 0.2, "learning_rate": 1.8526956625993825e-05, "loss": 0.8622, "step": 1675 }, { "epoch": 0.2, "learning_rate": 1.852493804681802e-05, "loss": 0.8465, "step": 1676 }, { "epoch": 0.2, "learning_rate": 1.8522918195635433e-05, "loss": 0.8192, "step": 1677 }, { "epoch": 0.2, "learning_rate": 1.8520897072747444e-05, "loss": 0.8996, "step": 1678 }, { "epoch": 0.2, "learning_rate": 1.851887467845563e-05, "loss": 0.8181, "step": 1679 }, { "epoch": 0.2, "learning_rate": 1.8516851013061744e-05, "loss": 0.8705, "step": 1680 }, { "epoch": 0.2, "learning_rate": 1.8514826076867747e-05, "loss": 0.793, "step": 1681 }, { "epoch": 0.2, "learning_rate": 1.851279987017578e-05, "loss": 0.8125, "step": 1682 }, { "epoch": 0.2, "learning_rate": 1.851077239328816e-05, "loss": 0.8309, "step": 1683 }, { "epoch": 0.2, "learning_rate": 1.8508743646507423e-05, "loss": 0.8449, "step": 1684 }, { "epoch": 0.2, "learning_rate": 1.850671363013627e-05, "loss": 0.8426, "step": 1685 }, { "epoch": 0.2, "learning_rate": 1.8504682344477603e-05, "loss": 0.8555, "step": 1686 }, { "epoch": 0.2, "learning_rate": 1.8502649789834505e-05, "loss": 0.8158, "step": 1687 }, { "epoch": 0.2, "learning_rate": 1.8500615966510263e-05, "loss": 0.8465, "step": 1688 }, { "epoch": 0.2, "learning_rate": 1.8498580874808335e-05, "loss": 0.8097, "step": 1689 }, { "epoch": 0.2, "learning_rate": 1.849654451503238e-05, "loss": 0.8421, "step": 1690 }, { "epoch": 0.2, "learning_rate": 1.8494506887486245e-05, "loss": 0.8125, "step": 1691 }, { "epoch": 0.2, "learning_rate": 1.8492467992473965e-05, "loss": 0.8175, "step": 1692 }, { "epoch": 0.2, "learning_rate": 1.8490427830299763e-05, "loss": 0.8555, "step": 1693 }, { "epoch": 0.2, "learning_rate": 1.848838640126805e-05, "loss": 0.832, "step": 1694 }, { "epoch": 0.2, "learning_rate": 1.848634370568343e-05, "loss": 0.8304, "step": 1695 }, { "epoch": 0.2, "learning_rate": 1.8484299743850693e-05, "loss": 0.822, "step": 1696 }, { "epoch": 0.2, "learning_rate": 1.8482254516074818e-05, "loss": 0.8956, "step": 1697 }, { "epoch": 0.2, "learning_rate": 1.8480208022660976e-05, "loss": 0.8097, "step": 1698 }, { "epoch": 0.2, "learning_rate": 1.847816026391452e-05, "loss": 0.8783, "step": 1699 }, { "epoch": 0.2, "learning_rate": 1.8476111240141e-05, "loss": 0.8544, "step": 1700 }, { "epoch": 0.2, "learning_rate": 1.847406095164615e-05, "loss": 0.8326, "step": 1701 }, { "epoch": 0.2, "learning_rate": 1.8472009398735898e-05, "loss": 0.8404, "step": 1702 }, { "epoch": 0.2, "learning_rate": 1.8469956581716347e-05, "loss": 0.8454, "step": 1703 }, { "epoch": 0.2, "learning_rate": 1.8467902500893806e-05, "loss": 0.8404, "step": 1704 }, { "epoch": 0.2, "learning_rate": 1.8465847156574763e-05, "loss": 0.8136, "step": 1705 }, { "epoch": 0.2, "learning_rate": 1.846379054906589e-05, "loss": 0.8432, "step": 1706 }, { "epoch": 0.2, "learning_rate": 1.8461732678674064e-05, "loss": 0.8398, "step": 1707 }, { "epoch": 0.2, "learning_rate": 1.845967354570633e-05, "loss": 0.8315, "step": 1708 }, { "epoch": 0.2, "learning_rate": 1.845761315046994e-05, "loss": 0.8309, "step": 1709 }, { "epoch": 0.2, "learning_rate": 1.8455551493272316e-05, "loss": 0.7919, "step": 1710 }, { "epoch": 0.2, "learning_rate": 1.845348857442109e-05, "loss": 0.827, "step": 1711 }, { "epoch": 0.2, "learning_rate": 1.845142439422406e-05, "loss": 0.8856, "step": 1712 }, { "epoch": 0.2, "learning_rate": 1.844935895298923e-05, "loss": 0.8153, "step": 1713 }, { "epoch": 0.2, "learning_rate": 1.8447292251024777e-05, "loss": 0.8147, "step": 1714 }, { "epoch": 0.2, "learning_rate": 1.844522428863908e-05, "loss": 0.8108, "step": 1715 }, { "epoch": 0.2, "learning_rate": 1.84431550661407e-05, "loss": 0.7215, "step": 1716 }, { "epoch": 0.2, "learning_rate": 1.8441084583838386e-05, "loss": 0.846, "step": 1717 }, { "epoch": 0.2, "learning_rate": 1.8439012842041067e-05, "loss": 0.8767, "step": 1718 }, { "epoch": 0.21, "learning_rate": 1.8436939841057875e-05, "loss": 0.8092, "step": 1719 }, { "epoch": 0.21, "learning_rate": 1.843486558119812e-05, "loss": 0.8599, "step": 1720 }, { "epoch": 0.21, "learning_rate": 1.8432790062771308e-05, "loss": 0.8504, "step": 1721 }, { "epoch": 0.21, "learning_rate": 1.8430713286087118e-05, "loss": 0.8756, "step": 1722 }, { "epoch": 0.21, "learning_rate": 1.8428635251455436e-05, "loss": 0.832, "step": 1723 }, { "epoch": 0.21, "learning_rate": 1.8426555959186318e-05, "loss": 0.8331, "step": 1724 }, { "epoch": 0.21, "learning_rate": 1.8424475409590016e-05, "loss": 0.8343, "step": 1725 }, { "epoch": 0.21, "learning_rate": 1.8422393602976974e-05, "loss": 0.8432, "step": 1726 }, { "epoch": 0.21, "learning_rate": 1.8420310539657814e-05, "loss": 0.8343, "step": 1727 }, { "epoch": 0.21, "learning_rate": 1.841822621994335e-05, "loss": 0.8209, "step": 1728 }, { "epoch": 0.21, "learning_rate": 1.841614064414459e-05, "loss": 0.7868, "step": 1729 }, { "epoch": 0.21, "learning_rate": 1.8414053812572715e-05, "loss": 0.8058, "step": 1730 }, { "epoch": 0.21, "learning_rate": 1.8411965725539105e-05, "loss": 0.8315, "step": 1731 }, { "epoch": 0.21, "learning_rate": 1.8409876383355324e-05, "loss": 0.7958, "step": 1732 }, { "epoch": 0.21, "learning_rate": 1.8407785786333122e-05, "loss": 0.8052, "step": 1733 }, { "epoch": 0.21, "learning_rate": 1.8405693934784436e-05, "loss": 0.7779, "step": 1734 }, { "epoch": 0.21, "learning_rate": 1.8403600829021392e-05, "loss": 0.8577, "step": 1735 }, { "epoch": 0.21, "learning_rate": 1.8401506469356304e-05, "loss": 0.8359, "step": 1736 }, { "epoch": 0.21, "learning_rate": 1.839941085610167e-05, "loss": 0.8086, "step": 1737 }, { "epoch": 0.21, "learning_rate": 1.839731398957018e-05, "loss": 0.8158, "step": 1738 }, { "epoch": 0.21, "learning_rate": 1.8395215870074704e-05, "loss": 0.8421, "step": 1739 }, { "epoch": 0.21, "learning_rate": 1.8393116497928303e-05, "loss": 0.8203, "step": 1740 }, { "epoch": 0.21, "learning_rate": 1.8391015873444226e-05, "loss": 0.7958, "step": 1741 }, { "epoch": 0.21, "learning_rate": 1.8388913996935907e-05, "loss": 0.8845, "step": 1742 }, { "epoch": 0.21, "learning_rate": 1.8386810868716966e-05, "loss": 0.8186, "step": 1743 }, { "epoch": 0.21, "learning_rate": 1.8384706489101208e-05, "loss": 0.8516, "step": 1744 }, { "epoch": 0.21, "learning_rate": 1.8382600858402636e-05, "loss": 0.8571, "step": 1745 }, { "epoch": 0.21, "learning_rate": 1.8380493976935427e-05, "loss": 0.8365, "step": 1746 }, { "epoch": 0.21, "learning_rate": 1.8378385845013945e-05, "loss": 0.7695, "step": 1747 }, { "epoch": 0.21, "learning_rate": 1.8376276462952752e-05, "loss": 0.8214, "step": 1748 }, { "epoch": 0.21, "learning_rate": 1.837416583106658e-05, "loss": 0.8404, "step": 1749 }, { "epoch": 0.21, "learning_rate": 1.8372053949670367e-05, "loss": 0.8225, "step": 1750 }, { "epoch": 0.21, "learning_rate": 1.836994081907922e-05, "loss": 0.8443, "step": 1751 }, { "epoch": 0.21, "learning_rate": 1.836782643960844e-05, "loss": 0.8912, "step": 1752 }, { "epoch": 0.21, "learning_rate": 1.836571081157352e-05, "loss": 0.8806, "step": 1753 }, { "epoch": 0.21, "learning_rate": 1.8363593935290124e-05, "loss": 0.7863, "step": 1754 }, { "epoch": 0.21, "learning_rate": 1.8361475811074114e-05, "loss": 0.7762, "step": 1755 }, { "epoch": 0.21, "learning_rate": 1.8359356439241537e-05, "loss": 0.822, "step": 1756 }, { "epoch": 0.21, "learning_rate": 1.835723582010863e-05, "loss": 0.7902, "step": 1757 }, { "epoch": 0.21, "learning_rate": 1.83551139539918e-05, "loss": 0.8783, "step": 1758 }, { "epoch": 0.21, "learning_rate": 1.835299084120766e-05, "loss": 0.8175, "step": 1759 }, { "epoch": 0.21, "learning_rate": 1.835086648207299e-05, "loss": 0.8465, "step": 1760 }, { "epoch": 0.21, "learning_rate": 1.834874087690478e-05, "loss": 0.8047, "step": 1761 }, { "epoch": 0.21, "learning_rate": 1.8346614026020178e-05, "loss": 0.8265, "step": 1762 }, { "epoch": 0.21, "learning_rate": 1.834448592973654e-05, "loss": 0.8689, "step": 1763 }, { "epoch": 0.21, "learning_rate": 1.834235658837139e-05, "loss": 0.8421, "step": 1764 }, { "epoch": 0.21, "learning_rate": 1.8340226002242464e-05, "loss": 0.8125, "step": 1765 }, { "epoch": 0.21, "learning_rate": 1.833809417166765e-05, "loss": 0.8917, "step": 1766 }, { "epoch": 0.21, "learning_rate": 1.833596109696505e-05, "loss": 0.8733, "step": 1767 }, { "epoch": 0.21, "learning_rate": 1.833382677845293e-05, "loss": 0.8164, "step": 1768 }, { "epoch": 0.21, "learning_rate": 1.833169121644976e-05, "loss": 0.827, "step": 1769 }, { "epoch": 0.21, "learning_rate": 1.832955441127419e-05, "loss": 0.8164, "step": 1770 }, { "epoch": 0.21, "learning_rate": 1.8327416363245042e-05, "loss": 0.8203, "step": 1771 }, { "epoch": 0.21, "learning_rate": 1.832527707268134e-05, "loss": 0.8225, "step": 1772 }, { "epoch": 0.21, "learning_rate": 1.832313653990229e-05, "loss": 0.7478, "step": 1773 }, { "epoch": 0.21, "learning_rate": 1.832099476522728e-05, "loss": 0.8069, "step": 1774 }, { "epoch": 0.21, "learning_rate": 1.831885174897588e-05, "loss": 0.8583, "step": 1775 }, { "epoch": 0.21, "learning_rate": 1.8316707491467855e-05, "loss": 0.8795, "step": 1776 }, { "epoch": 0.21, "learning_rate": 1.831456199302315e-05, "loss": 0.8142, "step": 1777 }, { "epoch": 0.21, "learning_rate": 1.831241525396189e-05, "loss": 0.7779, "step": 1778 }, { "epoch": 0.21, "learning_rate": 1.8310267274604395e-05, "loss": 0.8482, "step": 1779 }, { "epoch": 0.21, "learning_rate": 1.830811805527116e-05, "loss": 0.8309, "step": 1780 }, { "epoch": 0.21, "learning_rate": 1.8305967596282877e-05, "loss": 0.8504, "step": 1781 }, { "epoch": 0.21, "learning_rate": 1.8303815897960414e-05, "loss": 0.8064, "step": 1782 }, { "epoch": 0.21, "learning_rate": 1.830166296062482e-05, "loss": 0.8058, "step": 1783 }, { "epoch": 0.21, "learning_rate": 1.8299508784597344e-05, "loss": 0.8465, "step": 1784 }, { "epoch": 0.21, "learning_rate": 1.8297353370199406e-05, "loss": 0.8426, "step": 1785 }, { "epoch": 0.21, "learning_rate": 1.8295196717752612e-05, "loss": 0.8482, "step": 1786 }, { "epoch": 0.21, "learning_rate": 1.8293038827578765e-05, "loss": 0.8231, "step": 1787 }, { "epoch": 0.21, "learning_rate": 1.8290879699999836e-05, "loss": 0.8901, "step": 1788 }, { "epoch": 0.21, "learning_rate": 1.8288719335337998e-05, "loss": 0.8036, "step": 1789 }, { "epoch": 0.21, "learning_rate": 1.8286557733915588e-05, "loss": 0.8237, "step": 1790 }, { "epoch": 0.21, "learning_rate": 1.8284394896055143e-05, "loss": 0.7924, "step": 1791 }, { "epoch": 0.21, "learning_rate": 1.828223082207938e-05, "loss": 0.8086, "step": 1792 }, { "epoch": 0.21, "learning_rate": 1.828006551231121e-05, "loss": 0.8164, "step": 1793 }, { "epoch": 0.21, "learning_rate": 1.8277898967073706e-05, "loss": 0.8538, "step": 1794 }, { "epoch": 0.21, "learning_rate": 1.8275731186690144e-05, "loss": 0.851, "step": 1795 }, { "epoch": 0.21, "learning_rate": 1.827356217148398e-05, "loss": 0.784, "step": 1796 }, { "epoch": 0.21, "learning_rate": 1.8271391921778846e-05, "loss": 0.8744, "step": 1797 }, { "epoch": 0.21, "learning_rate": 1.8269220437898574e-05, "loss": 0.8103, "step": 1798 }, { "epoch": 0.21, "learning_rate": 1.826704772016717e-05, "loss": 0.8214, "step": 1799 }, { "epoch": 0.21, "learning_rate": 1.8264873768908816e-05, "loss": 0.755, "step": 1800 }, { "epoch": 0.21, "learning_rate": 1.82626985844479e-05, "loss": 0.8398, "step": 1801 }, { "epoch": 0.21, "learning_rate": 1.826052216710897e-05, "loss": 0.8862, "step": 1802 }, { "epoch": 0.22, "learning_rate": 1.8258344517216784e-05, "loss": 0.7946, "step": 1803 }, { "epoch": 0.22, "learning_rate": 1.8256165635096255e-05, "loss": 0.8259, "step": 1804 }, { "epoch": 0.22, "learning_rate": 1.82539855210725e-05, "loss": 0.8259, "step": 1805 }, { "epoch": 0.22, "learning_rate": 1.8251804175470815e-05, "loss": 0.8292, "step": 1806 }, { "epoch": 0.22, "learning_rate": 1.824962159861668e-05, "loss": 0.8292, "step": 1807 }, { "epoch": 0.22, "learning_rate": 1.824743779083575e-05, "loss": 0.8198, "step": 1808 }, { "epoch": 0.22, "learning_rate": 1.824525275245388e-05, "loss": 0.8181, "step": 1809 }, { "epoch": 0.22, "learning_rate": 1.8243066483797093e-05, "loss": 0.7913, "step": 1810 }, { "epoch": 0.22, "learning_rate": 1.8240878985191607e-05, "loss": 0.7723, "step": 1811 }, { "epoch": 0.22, "learning_rate": 1.8238690256963817e-05, "loss": 0.8337, "step": 1812 }, { "epoch": 0.22, "learning_rate": 1.8236500299440307e-05, "loss": 0.8477, "step": 1813 }, { "epoch": 0.22, "learning_rate": 1.8234309112947832e-05, "loss": 0.8008, "step": 1814 }, { "epoch": 0.22, "learning_rate": 1.8232116697813347e-05, "loss": 0.8164, "step": 1815 }, { "epoch": 0.22, "learning_rate": 1.822992305436398e-05, "loss": 0.7266, "step": 1816 }, { "epoch": 0.22, "learning_rate": 1.8227728182927046e-05, "loss": 0.7846, "step": 1817 }, { "epoch": 0.22, "learning_rate": 1.822553208383004e-05, "loss": 0.817, "step": 1818 }, { "epoch": 0.22, "learning_rate": 1.8223334757400638e-05, "loss": 0.8348, "step": 1819 }, { "epoch": 0.22, "learning_rate": 1.8221136203966715e-05, "loss": 0.8566, "step": 1820 }, { "epoch": 0.22, "learning_rate": 1.8218936423856308e-05, "loss": 0.8214, "step": 1821 }, { "epoch": 0.22, "learning_rate": 1.8216735417397647e-05, "loss": 0.7818, "step": 1822 }, { "epoch": 0.22, "learning_rate": 1.8214533184919148e-05, "loss": 0.8387, "step": 1823 }, { "epoch": 0.22, "learning_rate": 1.8212329726749404e-05, "loss": 0.7829, "step": 1824 }, { "epoch": 0.22, "learning_rate": 1.8210125043217195e-05, "loss": 0.8443, "step": 1825 }, { "epoch": 0.22, "learning_rate": 1.820791913465148e-05, "loss": 0.7511, "step": 1826 }, { "epoch": 0.22, "learning_rate": 1.8205712001381403e-05, "loss": 0.8125, "step": 1827 }, { "epoch": 0.22, "learning_rate": 1.8203503643736293e-05, "loss": 0.7902, "step": 1828 }, { "epoch": 0.22, "learning_rate": 1.8201294062045653e-05, "loss": 0.8092, "step": 1829 }, { "epoch": 0.22, "learning_rate": 1.8199083256639186e-05, "loss": 0.8471, "step": 1830 }, { "epoch": 0.22, "learning_rate": 1.8196871227846756e-05, "loss": 0.8555, "step": 1831 }, { "epoch": 0.22, "learning_rate": 1.819465797599842e-05, "loss": 0.8661, "step": 1832 }, { "epoch": 0.22, "learning_rate": 1.8192443501424426e-05, "loss": 0.827, "step": 1833 }, { "epoch": 0.22, "learning_rate": 1.819022780445519e-05, "loss": 0.7734, "step": 1834 }, { "epoch": 0.22, "learning_rate": 1.8188010885421317e-05, "loss": 0.846, "step": 1835 }, { "epoch": 0.22, "learning_rate": 1.8185792744653596e-05, "loss": 0.8387, "step": 1836 }, { "epoch": 0.22, "learning_rate": 1.8183573382482992e-05, "loss": 0.798, "step": 1837 }, { "epoch": 0.22, "learning_rate": 1.8181352799240662e-05, "loss": 0.8493, "step": 1838 }, { "epoch": 0.22, "learning_rate": 1.8179130995257932e-05, "loss": 0.8287, "step": 1839 }, { "epoch": 0.22, "learning_rate": 1.8176907970866323e-05, "loss": 0.8683, "step": 1840 }, { "epoch": 0.22, "learning_rate": 1.817468372639753e-05, "loss": 0.9035, "step": 1841 }, { "epoch": 0.22, "learning_rate": 1.8172458262183434e-05, "loss": 0.8231, "step": 1842 }, { "epoch": 0.22, "learning_rate": 1.81702315785561e-05, "loss": 0.8276, "step": 1843 }, { "epoch": 0.22, "learning_rate": 1.8168003675847766e-05, "loss": 0.8638, "step": 1844 }, { "epoch": 0.22, "learning_rate": 1.8165774554390857e-05, "loss": 0.8443, "step": 1845 }, { "epoch": 0.22, "learning_rate": 1.816354421451799e-05, "loss": 0.7813, "step": 1846 }, { "epoch": 0.22, "learning_rate": 1.816131265656194e-05, "loss": 0.8147, "step": 1847 }, { "epoch": 0.22, "learning_rate": 1.815907988085569e-05, "loss": 0.808, "step": 1848 }, { "epoch": 0.22, "learning_rate": 1.8156845887732388e-05, "loss": 0.8538, "step": 1849 }, { "epoch": 0.22, "learning_rate": 1.8154610677525366e-05, "loss": 0.8683, "step": 1850 }, { "epoch": 0.22, "learning_rate": 1.8152374250568143e-05, "loss": 0.8661, "step": 1851 }, { "epoch": 0.22, "learning_rate": 1.815013660719442e-05, "loss": 0.8761, "step": 1852 }, { "epoch": 0.22, "learning_rate": 1.8147897747738065e-05, "loss": 0.8142, "step": 1853 }, { "epoch": 0.22, "learning_rate": 1.814565767253315e-05, "loss": 0.8086, "step": 1854 }, { "epoch": 0.22, "learning_rate": 1.814341638191391e-05, "loss": 0.8577, "step": 1855 }, { "epoch": 0.22, "learning_rate": 1.814117387621477e-05, "loss": 0.7958, "step": 1856 }, { "epoch": 0.22, "learning_rate": 1.8138930155770334e-05, "loss": 0.8287, "step": 1857 }, { "epoch": 0.22, "learning_rate": 1.813668522091539e-05, "loss": 0.8036, "step": 1858 }, { "epoch": 0.22, "learning_rate": 1.8134439071984902e-05, "loss": 0.8114, "step": 1859 }, { "epoch": 0.22, "learning_rate": 1.813219170931402e-05, "loss": 0.8147, "step": 1860 }, { "epoch": 0.22, "learning_rate": 1.8129943133238074e-05, "loss": 0.8153, "step": 1861 }, { "epoch": 0.22, "learning_rate": 1.8127693344092573e-05, "loss": 0.8477, "step": 1862 }, { "epoch": 0.22, "learning_rate": 1.8125442342213206e-05, "loss": 0.8304, "step": 1863 }, { "epoch": 0.22, "learning_rate": 1.8123190127935845e-05, "loss": 0.8555, "step": 1864 }, { "epoch": 0.22, "learning_rate": 1.812093670159655e-05, "loss": 0.8571, "step": 1865 }, { "epoch": 0.22, "learning_rate": 1.8118682063531548e-05, "loss": 0.8158, "step": 1866 }, { "epoch": 0.22, "learning_rate": 1.811642621407726e-05, "loss": 0.8248, "step": 1867 }, { "epoch": 0.22, "learning_rate": 1.811416915357027e-05, "loss": 0.7656, "step": 1868 }, { "epoch": 0.22, "learning_rate": 1.811191088234737e-05, "loss": 0.8175, "step": 1869 }, { "epoch": 0.22, "learning_rate": 1.8109651400745504e-05, "loss": 0.8276, "step": 1870 }, { "epoch": 0.22, "learning_rate": 1.8107390709101812e-05, "loss": 0.7829, "step": 1871 }, { "epoch": 0.22, "learning_rate": 1.8105128807753618e-05, "loss": 0.8354, "step": 1872 }, { "epoch": 0.22, "learning_rate": 1.8102865697038415e-05, "loss": 0.8382, "step": 1873 }, { "epoch": 0.22, "learning_rate": 1.8100601377293886e-05, "loss": 0.7907, "step": 1874 }, { "epoch": 0.22, "learning_rate": 1.8098335848857885e-05, "loss": 0.8147, "step": 1875 }, { "epoch": 0.22, "learning_rate": 1.809606911206846e-05, "loss": 0.841, "step": 1876 }, { "epoch": 0.22, "learning_rate": 1.8093801167263822e-05, "loss": 0.8387, "step": 1877 }, { "epoch": 0.22, "learning_rate": 1.809153201478237e-05, "loss": 0.8119, "step": 1878 }, { "epoch": 0.22, "learning_rate": 1.8089261654962693e-05, "loss": 0.8348, "step": 1879 }, { "epoch": 0.22, "learning_rate": 1.808699008814355e-05, "loss": 0.8432, "step": 1880 }, { "epoch": 0.22, "learning_rate": 1.8084717314663876e-05, "loss": 0.8315, "step": 1881 }, { "epoch": 0.22, "learning_rate": 1.80824433348628e-05, "loss": 0.8142, "step": 1882 }, { "epoch": 0.22, "learning_rate": 1.8080168149079614e-05, "loss": 0.8778, "step": 1883 }, { "epoch": 0.22, "learning_rate": 1.8077891757653808e-05, "loss": 0.8248, "step": 1884 }, { "epoch": 0.22, "learning_rate": 1.807561416092503e-05, "loss": 0.8398, "step": 1885 }, { "epoch": 0.22, "learning_rate": 1.8073335359233132e-05, "loss": 0.8142, "step": 1886 }, { "epoch": 0.23, "learning_rate": 1.807105535291813e-05, "loss": 0.841, "step": 1887 }, { "epoch": 0.23, "learning_rate": 1.8068774142320222e-05, "loss": 0.798, "step": 1888 }, { "epoch": 0.23, "learning_rate": 1.8066491727779795e-05, "loss": 0.8231, "step": 1889 }, { "epoch": 0.23, "learning_rate": 1.8064208109637394e-05, "loss": 0.8555, "step": 1890 }, { "epoch": 0.23, "learning_rate": 1.8061923288233772e-05, "loss": 0.8371, "step": 1891 }, { "epoch": 0.23, "learning_rate": 1.8059637263909842e-05, "loss": 0.8304, "step": 1892 }, { "epoch": 0.23, "learning_rate": 1.80573500370067e-05, "loss": 0.8538, "step": 1893 }, { "epoch": 0.23, "learning_rate": 1.8055061607865628e-05, "loss": 0.822, "step": 1894 }, { "epoch": 0.23, "learning_rate": 1.805277197682808e-05, "loss": 0.8421, "step": 1895 }, { "epoch": 0.23, "learning_rate": 1.805048114423569e-05, "loss": 0.856, "step": 1896 }, { "epoch": 0.23, "learning_rate": 1.8048189110430278e-05, "loss": 0.8108, "step": 1897 }, { "epoch": 0.23, "learning_rate": 1.8045895875753835e-05, "loss": 0.8242, "step": 1898 }, { "epoch": 0.23, "learning_rate": 1.8043601440548535e-05, "loss": 0.8571, "step": 1899 }, { "epoch": 0.23, "learning_rate": 1.8041305805156733e-05, "loss": 0.8711, "step": 1900 }, { "epoch": 0.23, "learning_rate": 1.8039008969920958e-05, "loss": 0.7874, "step": 1901 }, { "epoch": 0.23, "learning_rate": 1.8036710935183924e-05, "loss": 0.8717, "step": 1902 }, { "epoch": 0.23, "learning_rate": 1.8034411701288516e-05, "loss": 0.7813, "step": 1903 }, { "epoch": 0.23, "learning_rate": 1.803211126857781e-05, "loss": 0.8661, "step": 1904 }, { "epoch": 0.23, "learning_rate": 1.802980963739505e-05, "loss": 0.8281, "step": 1905 }, { "epoch": 0.23, "learning_rate": 1.8027506808083665e-05, "loss": 0.8951, "step": 1906 }, { "epoch": 0.23, "learning_rate": 1.8025202780987254e-05, "loss": 0.8002, "step": 1907 }, { "epoch": 0.23, "learning_rate": 1.8022897556449606e-05, "loss": 0.8231, "step": 1908 }, { "epoch": 0.23, "learning_rate": 1.8020591134814686e-05, "loss": 0.8069, "step": 1909 }, { "epoch": 0.23, "learning_rate": 1.801828351642663e-05, "loss": 0.8516, "step": 1910 }, { "epoch": 0.23, "learning_rate": 1.801597470162976e-05, "loss": 0.7885, "step": 1911 }, { "epoch": 0.23, "learning_rate": 1.8013664690768577e-05, "loss": 0.8125, "step": 1912 }, { "epoch": 0.23, "learning_rate": 1.8011353484187753e-05, "loss": 0.8538, "step": 1913 }, { "epoch": 0.23, "learning_rate": 1.800904108223215e-05, "loss": 0.8209, "step": 1914 }, { "epoch": 0.23, "learning_rate": 1.8006727485246794e-05, "loss": 0.8119, "step": 1915 }, { "epoch": 0.23, "learning_rate": 1.8004412693576902e-05, "loss": 0.875, "step": 1916 }, { "epoch": 0.23, "learning_rate": 1.8002096707567865e-05, "loss": 0.8281, "step": 1917 }, { "epoch": 0.23, "learning_rate": 1.799977952756525e-05, "loss": 0.8382, "step": 1918 }, { "epoch": 0.23, "learning_rate": 1.7997461153914802e-05, "loss": 0.8108, "step": 1919 }, { "epoch": 0.23, "learning_rate": 1.7995141586962447e-05, "loss": 0.8661, "step": 1920 }, { "epoch": 0.23, "learning_rate": 1.7992820827054286e-05, "loss": 0.8119, "step": 1921 }, { "epoch": 0.23, "learning_rate": 1.7990498874536606e-05, "loss": 0.8198, "step": 1922 }, { "epoch": 0.23, "learning_rate": 1.7988175729755855e-05, "loss": 0.8092, "step": 1923 }, { "epoch": 0.23, "learning_rate": 1.7985851393058683e-05, "loss": 0.8131, "step": 1924 }, { "epoch": 0.23, "learning_rate": 1.7983525864791894e-05, "loss": 0.8728, "step": 1925 }, { "epoch": 0.23, "learning_rate": 1.7981199145302485e-05, "loss": 0.8477, "step": 1926 }, { "epoch": 0.23, "learning_rate": 1.797887123493762e-05, "loss": 0.8064, "step": 1927 }, { "epoch": 0.23, "learning_rate": 1.797654213404466e-05, "loss": 0.8577, "step": 1928 }, { "epoch": 0.23, "learning_rate": 1.7974211842971114e-05, "loss": 0.7902, "step": 1929 }, { "epoch": 0.23, "learning_rate": 1.7971880362064696e-05, "loss": 0.9001, "step": 1930 }, { "epoch": 0.23, "learning_rate": 1.7969547691673284e-05, "loss": 0.8287, "step": 1931 }, { "epoch": 0.23, "learning_rate": 1.7967213832144936e-05, "loss": 0.8343, "step": 1932 }, { "epoch": 0.23, "learning_rate": 1.7964878783827885e-05, "loss": 0.7478, "step": 1933 }, { "epoch": 0.23, "learning_rate": 1.796254254707055e-05, "loss": 0.8052, "step": 1934 }, { "epoch": 0.23, "learning_rate": 1.796020512222151e-05, "loss": 0.8214, "step": 1935 }, { "epoch": 0.23, "learning_rate": 1.795786650962954e-05, "loss": 0.8058, "step": 1936 }, { "epoch": 0.23, "learning_rate": 1.7955526709643585e-05, "loss": 0.7768, "step": 1937 }, { "epoch": 0.23, "learning_rate": 1.7953185722612767e-05, "loss": 0.8002, "step": 1938 }, { "epoch": 0.23, "learning_rate": 1.795084354888638e-05, "loss": 0.8616, "step": 1939 }, { "epoch": 0.23, "learning_rate": 1.7948500188813906e-05, "loss": 0.8666, "step": 1940 }, { "epoch": 0.23, "learning_rate": 1.7946155642744993e-05, "loss": 0.7891, "step": 1941 }, { "epoch": 0.23, "learning_rate": 1.7943809911029472e-05, "loss": 0.8265, "step": 1942 }, { "epoch": 0.23, "learning_rate": 1.7941462994017355e-05, "loss": 0.8767, "step": 1943 }, { "epoch": 0.23, "learning_rate": 1.7939114892058817e-05, "loss": 0.8728, "step": 1944 }, { "epoch": 0.23, "learning_rate": 1.7936765605504228e-05, "loss": 0.8086, "step": 1945 }, { "epoch": 0.23, "learning_rate": 1.7934415134704117e-05, "loss": 0.8203, "step": 1946 }, { "epoch": 0.23, "learning_rate": 1.7932063480009203e-05, "loss": 0.851, "step": 1947 }, { "epoch": 0.23, "learning_rate": 1.7929710641770372e-05, "loss": 0.8158, "step": 1948 }, { "epoch": 0.23, "learning_rate": 1.7927356620338697e-05, "loss": 0.822, "step": 1949 }, { "epoch": 0.23, "learning_rate": 1.7925001416065418e-05, "loss": 0.8298, "step": 1950 }, { "epoch": 0.23, "learning_rate": 1.7922645029301956e-05, "loss": 0.8689, "step": 1951 }, { "epoch": 0.23, "learning_rate": 1.7920287460399906e-05, "loss": 0.8086, "step": 1952 }, { "epoch": 0.23, "learning_rate": 1.7917928709711048e-05, "loss": 0.7868, "step": 1953 }, { "epoch": 0.23, "learning_rate": 1.791556877758732e-05, "loss": 0.798, "step": 1954 }, { "epoch": 0.23, "learning_rate": 1.791320766438086e-05, "loss": 0.8772, "step": 1955 }, { "epoch": 0.23, "learning_rate": 1.791084537044396e-05, "loss": 0.8069, "step": 1956 }, { "epoch": 0.23, "learning_rate": 1.7908481896129102e-05, "loss": 0.8555, "step": 1957 }, { "epoch": 0.23, "learning_rate": 1.790611724178894e-05, "loss": 0.8906, "step": 1958 }, { "epoch": 0.23, "learning_rate": 1.7903751407776307e-05, "loss": 0.7567, "step": 1959 }, { "epoch": 0.23, "learning_rate": 1.7901384394444203e-05, "loss": 0.8198, "step": 1960 }, { "epoch": 0.23, "learning_rate": 1.7899016202145815e-05, "loss": 0.7578, "step": 1961 }, { "epoch": 0.23, "learning_rate": 1.7896646831234505e-05, "loss": 0.7941, "step": 1962 }, { "epoch": 0.23, "learning_rate": 1.7894276282063798e-05, "loss": 0.8153, "step": 1963 }, { "epoch": 0.23, "learning_rate": 1.789190455498741e-05, "loss": 0.7796, "step": 1964 }, { "epoch": 0.23, "learning_rate": 1.7889531650359222e-05, "loss": 0.8733, "step": 1965 }, { "epoch": 0.23, "learning_rate": 1.78871575685333e-05, "loss": 0.8103, "step": 1966 }, { "epoch": 0.23, "learning_rate": 1.788478230986388e-05, "loss": 0.8583, "step": 1967 }, { "epoch": 0.23, "learning_rate": 1.7882405874705372e-05, "loss": 0.8382, "step": 1968 }, { "epoch": 0.23, "learning_rate": 1.7880028263412364e-05, "loss": 0.7617, "step": 1969 }, { "epoch": 0.23, "learning_rate": 1.7877649476339627e-05, "loss": 0.7606, "step": 1970 }, { "epoch": 0.24, "learning_rate": 1.7875269513842092e-05, "loss": 0.7645, "step": 1971 }, { "epoch": 0.24, "learning_rate": 1.787288837627487e-05, "loss": 0.8158, "step": 1972 }, { "epoch": 0.24, "learning_rate": 1.7870506063993265e-05, "loss": 0.8504, "step": 1973 }, { "epoch": 0.24, "learning_rate": 1.786812257735273e-05, "loss": 0.8331, "step": 1974 }, { "epoch": 0.24, "learning_rate": 1.786573791670891e-05, "loss": 0.7645, "step": 1975 }, { "epoch": 0.24, "learning_rate": 1.7863352082417615e-05, "loss": 0.8108, "step": 1976 }, { "epoch": 0.24, "learning_rate": 1.7860965074834844e-05, "loss": 0.8153, "step": 1977 }, { "epoch": 0.24, "learning_rate": 1.785857689431676e-05, "loss": 0.8136, "step": 1978 }, { "epoch": 0.24, "learning_rate": 1.78561875412197e-05, "loss": 0.7946, "step": 1979 }, { "epoch": 0.24, "learning_rate": 1.7853797015900177e-05, "loss": 0.8231, "step": 1980 }, { "epoch": 0.24, "learning_rate": 1.7851405318714893e-05, "loss": 0.8393, "step": 1981 }, { "epoch": 0.24, "learning_rate": 1.78490124500207e-05, "loss": 0.8131, "step": 1982 }, { "epoch": 0.24, "learning_rate": 1.784661841017465e-05, "loss": 0.7997, "step": 1983 }, { "epoch": 0.24, "learning_rate": 1.7844223199533953e-05, "loss": 0.8214, "step": 1984 }, { "epoch": 0.24, "learning_rate": 1.7841826818455994e-05, "loss": 0.8198, "step": 1985 }, { "epoch": 0.24, "learning_rate": 1.7839429267298346e-05, "loss": 0.7556, "step": 1986 }, { "epoch": 0.24, "learning_rate": 1.783703054641874e-05, "loss": 0.7974, "step": 1987 }, { "epoch": 0.24, "learning_rate": 1.783463065617509e-05, "loss": 0.8415, "step": 1988 }, { "epoch": 0.24, "learning_rate": 1.783222959692549e-05, "loss": 0.7997, "step": 1989 }, { "epoch": 0.24, "learning_rate": 1.78298273690282e-05, "loss": 0.8231, "step": 1990 }, { "epoch": 0.24, "learning_rate": 1.7827423972841654e-05, "loss": 0.7221, "step": 1991 }, { "epoch": 0.24, "learning_rate": 1.7825019408724464e-05, "loss": 0.8041, "step": 1992 }, { "epoch": 0.24, "learning_rate": 1.7822613677035417e-05, "loss": 0.8304, "step": 1993 }, { "epoch": 0.24, "learning_rate": 1.782020677813347e-05, "loss": 0.8013, "step": 1994 }, { "epoch": 0.24, "learning_rate": 1.7817798712377757e-05, "loss": 0.8594, "step": 1995 }, { "epoch": 0.24, "learning_rate": 1.7815389480127584e-05, "loss": 0.8867, "step": 1996 }, { "epoch": 0.24, "learning_rate": 1.781297908174244e-05, "loss": 0.8287, "step": 1997 }, { "epoch": 0.24, "learning_rate": 1.781056751758197e-05, "loss": 0.8292, "step": 1998 }, { "epoch": 0.24, "learning_rate": 1.7808154788006017e-05, "loss": 0.8449, "step": 1999 }, { "epoch": 0.24, "learning_rate": 1.780574089337457e-05, "loss": 0.7935, "step": 2000 }, { "epoch": 0.24, "learning_rate": 1.7803325834047818e-05, "loss": 0.832, "step": 2001 }, { "epoch": 0.24, "learning_rate": 1.7800909610386106e-05, "loss": 0.8627, "step": 2002 }, { "epoch": 0.24, "learning_rate": 1.779849222274996e-05, "loss": 0.8158, "step": 2003 }, { "epoch": 0.24, "learning_rate": 1.7796073671500084e-05, "loss": 0.822, "step": 2004 }, { "epoch": 0.24, "learning_rate": 1.779365395699734e-05, "loss": 0.8209, "step": 2005 }, { "epoch": 0.24, "learning_rate": 1.779123307960278e-05, "loss": 0.8214, "step": 2006 }, { "epoch": 0.24, "learning_rate": 1.7788811039677627e-05, "loss": 0.7907, "step": 2007 }, { "epoch": 0.24, "learning_rate": 1.7786387837583266e-05, "loss": 0.7879, "step": 2008 }, { "epoch": 0.24, "learning_rate": 1.7783963473681268e-05, "loss": 0.8131, "step": 2009 }, { "epoch": 0.24, "learning_rate": 1.7781537948333372e-05, "loss": 0.8365, "step": 2010 }, { "epoch": 0.24, "learning_rate": 1.7779111261901487e-05, "loss": 0.8605, "step": 2011 }, { "epoch": 0.24, "learning_rate": 1.7776683414747706e-05, "loss": 0.7985, "step": 2012 }, { "epoch": 0.24, "learning_rate": 1.7774254407234282e-05, "loss": 0.779, "step": 2013 }, { "epoch": 0.24, "learning_rate": 1.7771824239723653e-05, "loss": 0.8136, "step": 2014 }, { "epoch": 0.24, "learning_rate": 1.776939291257842e-05, "loss": 0.8013, "step": 2015 }, { "epoch": 0.24, "learning_rate": 1.7766960426161363e-05, "loss": 0.8717, "step": 2016 }, { "epoch": 0.24, "learning_rate": 1.7764526780835435e-05, "loss": 0.8203, "step": 2017 }, { "epoch": 0.24, "learning_rate": 1.7762091976963755e-05, "loss": 0.7974, "step": 2018 }, { "epoch": 0.24, "learning_rate": 1.7759656014909628e-05, "loss": 0.8504, "step": 2019 }, { "epoch": 0.24, "learning_rate": 1.775721889503652e-05, "loss": 0.8276, "step": 2020 }, { "epoch": 0.24, "learning_rate": 1.7754780617708074e-05, "loss": 0.8287, "step": 2021 }, { "epoch": 0.24, "learning_rate": 1.7752341183288106e-05, "loss": 0.846, "step": 2022 }, { "epoch": 0.24, "learning_rate": 1.7749900592140602e-05, "loss": 0.8432, "step": 2023 }, { "epoch": 0.24, "learning_rate": 1.774745884462973e-05, "loss": 0.8142, "step": 2024 }, { "epoch": 0.24, "learning_rate": 1.7745015941119813e-05, "loss": 0.7985, "step": 2025 }, { "epoch": 0.24, "learning_rate": 1.7742571881975366e-05, "loss": 0.8069, "step": 2026 }, { "epoch": 0.24, "learning_rate": 1.774012666756106e-05, "loss": 0.894, "step": 2027 }, { "epoch": 0.24, "learning_rate": 1.7737680298241754e-05, "loss": 0.8566, "step": 2028 }, { "epoch": 0.24, "learning_rate": 1.7735232774382464e-05, "loss": 0.8895, "step": 2029 }, { "epoch": 0.24, "learning_rate": 1.7732784096348385e-05, "loss": 0.8242, "step": 2030 }, { "epoch": 0.24, "learning_rate": 1.7730334264504888e-05, "loss": 0.8209, "step": 2031 }, { "epoch": 0.24, "learning_rate": 1.7727883279217513e-05, "loss": 0.8644, "step": 2032 }, { "epoch": 0.24, "learning_rate": 1.772543114085197e-05, "loss": 0.8086, "step": 2033 }, { "epoch": 0.24, "learning_rate": 1.7722977849774142e-05, "loss": 0.8644, "step": 2034 }, { "epoch": 0.24, "learning_rate": 1.7720523406350088e-05, "loss": 0.803, "step": 2035 }, { "epoch": 0.24, "learning_rate": 1.7718067810946032e-05, "loss": 0.8387, "step": 2036 }, { "epoch": 0.24, "learning_rate": 1.7715611063928375e-05, "loss": 0.8404, "step": 2037 }, { "epoch": 0.24, "learning_rate": 1.7713153165663686e-05, "loss": 0.8756, "step": 2038 }, { "epoch": 0.24, "learning_rate": 1.7710694116518716e-05, "loss": 0.8002, "step": 2039 }, { "epoch": 0.24, "learning_rate": 1.7708233916860373e-05, "loss": 0.8214, "step": 2040 }, { "epoch": 0.24, "learning_rate": 1.7705772567055747e-05, "loss": 0.8359, "step": 2041 }, { "epoch": 0.24, "learning_rate": 1.7703310067472088e-05, "loss": 0.8516, "step": 2042 }, { "epoch": 0.24, "learning_rate": 1.770084641847684e-05, "loss": 0.8521, "step": 2043 }, { "epoch": 0.24, "learning_rate": 1.769838162043759e-05, "loss": 0.8225, "step": 2044 }, { "epoch": 0.24, "learning_rate": 1.7695915673722124e-05, "loss": 0.8097, "step": 2045 }, { "epoch": 0.24, "learning_rate": 1.769344857869838e-05, "loss": 0.8125, "step": 2046 }, { "epoch": 0.24, "learning_rate": 1.7690980335734467e-05, "loss": 0.8142, "step": 2047 }, { "epoch": 0.24, "learning_rate": 1.768851094519868e-05, "loss": 0.8599, "step": 2048 }, { "epoch": 0.24, "learning_rate": 1.7686040407459476e-05, "loss": 0.7907, "step": 2049 }, { "epoch": 0.24, "learning_rate": 1.7683568722885483e-05, "loss": 0.7807, "step": 2050 }, { "epoch": 0.24, "learning_rate": 1.7681095891845502e-05, "loss": 0.8583, "step": 2051 }, { "epoch": 0.24, "learning_rate": 1.76786219147085e-05, "loss": 0.8343, "step": 2052 }, { "epoch": 0.24, "learning_rate": 1.7676146791843625e-05, "loss": 0.8744, "step": 2053 }, { "epoch": 0.24, "learning_rate": 1.767367052362019e-05, "loss": 0.8153, "step": 2054 }, { "epoch": 0.25, "learning_rate": 1.7671193110407677e-05, "loss": 0.8013, "step": 2055 }, { "epoch": 0.25, "learning_rate": 1.766871455257574e-05, "loss": 0.8315, "step": 2056 }, { "epoch": 0.25, "learning_rate": 1.7666234850494205e-05, "loss": 0.8421, "step": 2057 }, { "epoch": 0.25, "learning_rate": 1.7663754004533072e-05, "loss": 0.8225, "step": 2058 }, { "epoch": 0.25, "learning_rate": 1.7661272015062506e-05, "loss": 0.8371, "step": 2059 }, { "epoch": 0.25, "learning_rate": 1.7658788882452848e-05, "loss": 0.7924, "step": 2060 }, { "epoch": 0.25, "learning_rate": 1.76563046070746e-05, "loss": 0.7439, "step": 2061 }, { "epoch": 0.25, "learning_rate": 1.7653819189298446e-05, "loss": 0.8705, "step": 2062 }, { "epoch": 0.25, "learning_rate": 1.765133262949523e-05, "loss": 0.8281, "step": 2063 }, { "epoch": 0.25, "learning_rate": 1.764884492803598e-05, "loss": 0.8968, "step": 2064 }, { "epoch": 0.25, "learning_rate": 1.764635608529188e-05, "loss": 0.798, "step": 2065 }, { "epoch": 0.25, "learning_rate": 1.7643866101634293e-05, "loss": 0.8393, "step": 2066 }, { "epoch": 0.25, "learning_rate": 1.764137497743475e-05, "loss": 0.8142, "step": 2067 }, { "epoch": 0.25, "learning_rate": 1.7638882713064948e-05, "loss": 0.8449, "step": 2068 }, { "epoch": 0.25, "learning_rate": 1.7636389308896764e-05, "loss": 0.8438, "step": 2069 }, { "epoch": 0.25, "learning_rate": 1.7633894765302234e-05, "loss": 0.7846, "step": 2070 }, { "epoch": 0.25, "learning_rate": 1.7631399082653572e-05, "loss": 0.7879, "step": 2071 }, { "epoch": 0.25, "learning_rate": 1.7628902261323158e-05, "loss": 0.8198, "step": 2072 }, { "epoch": 0.25, "learning_rate": 1.7626404301683543e-05, "loss": 0.8666, "step": 2073 }, { "epoch": 0.25, "learning_rate": 1.762390520410744e-05, "loss": 0.7963, "step": 2074 }, { "epoch": 0.25, "learning_rate": 1.762140496896776e-05, "loss": 0.8231, "step": 2075 }, { "epoch": 0.25, "learning_rate": 1.7618903596637543e-05, "loss": 0.8326, "step": 2076 }, { "epoch": 0.25, "learning_rate": 1.761640108749003e-05, "loss": 0.8348, "step": 2077 }, { "epoch": 0.25, "learning_rate": 1.7613897441898616e-05, "loss": 0.8449, "step": 2078 }, { "epoch": 0.25, "learning_rate": 1.7611392660236873e-05, "loss": 0.8231, "step": 2079 }, { "epoch": 0.25, "learning_rate": 1.7608886742878535e-05, "loss": 0.8421, "step": 2080 }, { "epoch": 0.25, "learning_rate": 1.7606379690197513e-05, "loss": 0.7411, "step": 2081 }, { "epoch": 0.25, "learning_rate": 1.760387150256789e-05, "loss": 0.841, "step": 2082 }, { "epoch": 0.25, "learning_rate": 1.7601362180363902e-05, "loss": 0.8359, "step": 2083 }, { "epoch": 0.25, "learning_rate": 1.7598851723959973e-05, "loss": 0.8633, "step": 2084 }, { "epoch": 0.25, "learning_rate": 1.7596340133730686e-05, "loss": 0.8633, "step": 2085 }, { "epoch": 0.25, "learning_rate": 1.7593827410050796e-05, "loss": 0.7879, "step": 2086 }, { "epoch": 0.25, "learning_rate": 1.759131355329523e-05, "loss": 0.7372, "step": 2087 }, { "epoch": 0.25, "learning_rate": 1.7588798563839073e-05, "loss": 0.7963, "step": 2088 }, { "epoch": 0.25, "learning_rate": 1.7586282442057597e-05, "loss": 0.8276, "step": 2089 }, { "epoch": 0.25, "learning_rate": 1.758376518832622e-05, "loss": 0.784, "step": 2090 }, { "epoch": 0.25, "learning_rate": 1.7581246803020552e-05, "loss": 0.8136, "step": 2091 }, { "epoch": 0.25, "learning_rate": 1.757872728651636e-05, "loss": 0.7935, "step": 2092 }, { "epoch": 0.25, "learning_rate": 1.757620663918958e-05, "loss": 0.8097, "step": 2093 }, { "epoch": 0.25, "learning_rate": 1.7573684861416312e-05, "loss": 0.8477, "step": 2094 }, { "epoch": 0.25, "learning_rate": 1.757116195357284e-05, "loss": 0.7773, "step": 2095 }, { "epoch": 0.25, "learning_rate": 1.7568637916035603e-05, "loss": 0.8013, "step": 2096 }, { "epoch": 0.25, "learning_rate": 1.7566112749181215e-05, "loss": 0.8036, "step": 2097 }, { "epoch": 0.25, "learning_rate": 1.7563586453386454e-05, "loss": 0.8622, "step": 2098 }, { "epoch": 0.25, "learning_rate": 1.7561059029028268e-05, "loss": 0.8203, "step": 2099 }, { "epoch": 0.25, "learning_rate": 1.755853047648378e-05, "loss": 0.8588, "step": 2100 }, { "epoch": 0.25, "learning_rate": 1.7556000796130264e-05, "loss": 0.7952, "step": 2101 }, { "epoch": 0.25, "learning_rate": 1.7553469988345188e-05, "loss": 0.7896, "step": 2102 }, { "epoch": 0.25, "learning_rate": 1.7550938053506162e-05, "loss": 0.7913, "step": 2103 }, { "epoch": 0.25, "learning_rate": 1.7548404991990985e-05, "loss": 0.822, "step": 2104 }, { "epoch": 0.25, "learning_rate": 1.7545870804177612e-05, "loss": 0.8041, "step": 2105 }, { "epoch": 0.25, "learning_rate": 1.7543335490444166e-05, "loss": 0.8382, "step": 2106 }, { "epoch": 0.25, "learning_rate": 1.754079905116895e-05, "loss": 0.8326, "step": 2107 }, { "epoch": 0.25, "learning_rate": 1.7538261486730418e-05, "loss": 0.7684, "step": 2108 }, { "epoch": 0.25, "learning_rate": 1.75357227975072e-05, "loss": 0.8761, "step": 2109 }, { "epoch": 0.25, "learning_rate": 1.7533182983878104e-05, "loss": 0.798, "step": 2110 }, { "epoch": 0.25, "learning_rate": 1.7530642046222082e-05, "loss": 0.8566, "step": 2111 }, { "epoch": 0.25, "learning_rate": 1.752809998491828e-05, "loss": 0.8717, "step": 2112 }, { "epoch": 0.25, "learning_rate": 1.7525556800345992e-05, "loss": 0.8655, "step": 2113 }, { "epoch": 0.25, "learning_rate": 1.752301249288469e-05, "loss": 0.8583, "step": 2114 }, { "epoch": 0.25, "learning_rate": 1.7520467062914005e-05, "loss": 0.8633, "step": 2115 }, { "epoch": 0.25, "learning_rate": 1.7517920510813748e-05, "loss": 0.7656, "step": 2116 }, { "epoch": 0.25, "learning_rate": 1.7515372836963886e-05, "loss": 0.7852, "step": 2117 }, { "epoch": 0.25, "learning_rate": 1.7512824041744557e-05, "loss": 0.8186, "step": 2118 }, { "epoch": 0.25, "learning_rate": 1.7510274125536073e-05, "loss": 0.8287, "step": 2119 }, { "epoch": 0.25, "learning_rate": 1.75077230887189e-05, "loss": 0.8499, "step": 2120 }, { "epoch": 0.25, "learning_rate": 1.750517093167368e-05, "loss": 0.8583, "step": 2121 }, { "epoch": 0.25, "learning_rate": 1.7502617654781226e-05, "loss": 0.8142, "step": 2122 }, { "epoch": 0.25, "learning_rate": 1.7500063258422506e-05, "loss": 0.8181, "step": 2123 }, { "epoch": 0.25, "learning_rate": 1.7497507742978665e-05, "loss": 0.8002, "step": 2124 }, { "epoch": 0.25, "learning_rate": 1.749495110883101e-05, "loss": 0.7813, "step": 2125 }, { "epoch": 0.25, "learning_rate": 1.7492393356361018e-05, "loss": 0.8315, "step": 2126 }, { "epoch": 0.25, "learning_rate": 1.7489834485950333e-05, "loss": 0.7511, "step": 2127 }, { "epoch": 0.25, "learning_rate": 1.748727449798076e-05, "loss": 0.8131, "step": 2128 }, { "epoch": 0.25, "learning_rate": 1.748471339283428e-05, "loss": 0.8571, "step": 2129 }, { "epoch": 0.25, "learning_rate": 1.748215117089303e-05, "loss": 0.8672, "step": 2130 }, { "epoch": 0.25, "learning_rate": 1.7479587832539325e-05, "loss": 0.87, "step": 2131 }, { "epoch": 0.25, "learning_rate": 1.7477023378155635e-05, "loss": 0.9074, "step": 2132 }, { "epoch": 0.25, "learning_rate": 1.747445780812461e-05, "loss": 0.8092, "step": 2133 }, { "epoch": 0.25, "learning_rate": 1.7471891122829054e-05, "loss": 0.8103, "step": 2134 }, { "epoch": 0.25, "learning_rate": 1.7469323322651945e-05, "loss": 0.8683, "step": 2135 }, { "epoch": 0.25, "learning_rate": 1.746675440797642e-05, "loss": 0.8555, "step": 2136 }, { "epoch": 0.25, "learning_rate": 1.7464184379185785e-05, "loss": 0.8092, "step": 2137 }, { "epoch": 0.25, "learning_rate": 1.7461613236663527e-05, "loss": 0.8404, "step": 2138 }, { "epoch": 0.26, "learning_rate": 1.7459040980793276e-05, "loss": 0.7952, "step": 2139 }, { "epoch": 0.26, "learning_rate": 1.7456467611958842e-05, "loss": 0.8086, "step": 2140 }, { "epoch": 0.26, "learning_rate": 1.7453893130544196e-05, "loss": 0.7785, "step": 2141 }, { "epoch": 0.26, "learning_rate": 1.7451317536933477e-05, "loss": 0.8962, "step": 2142 }, { "epoch": 0.26, "learning_rate": 1.7448740831510988e-05, "loss": 0.8292, "step": 2143 }, { "epoch": 0.26, "learning_rate": 1.7446163014661203e-05, "loss": 0.7946, "step": 2144 }, { "epoch": 0.26, "learning_rate": 1.744358408676876e-05, "loss": 0.8521, "step": 2145 }, { "epoch": 0.26, "learning_rate": 1.7441004048218454e-05, "loss": 0.8331, "step": 2146 }, { "epoch": 0.26, "learning_rate": 1.7438422899395256e-05, "loss": 0.8103, "step": 2147 }, { "epoch": 0.26, "learning_rate": 1.74358406406843e-05, "loss": 0.8934, "step": 2148 }, { "epoch": 0.26, "learning_rate": 1.7433257272470886e-05, "loss": 0.8315, "step": 2149 }, { "epoch": 0.26, "learning_rate": 1.743067279514048e-05, "loss": 0.827, "step": 2150 }, { "epoch": 0.26, "learning_rate": 1.7428087209078707e-05, "loss": 0.7885, "step": 2151 }, { "epoch": 0.26, "learning_rate": 1.7425500514671365e-05, "loss": 0.8019, "step": 2152 }, { "epoch": 0.26, "learning_rate": 1.7422912712304417e-05, "loss": 0.7785, "step": 2153 }, { "epoch": 0.26, "learning_rate": 1.7420323802363987e-05, "loss": 0.8421, "step": 2154 }, { "epoch": 0.26, "learning_rate": 1.7417733785236362e-05, "loss": 0.8292, "step": 2155 }, { "epoch": 0.26, "learning_rate": 1.7415142661308007e-05, "loss": 0.8231, "step": 2156 }, { "epoch": 0.26, "learning_rate": 1.7412550430965542e-05, "loss": 0.7863, "step": 2157 }, { "epoch": 0.26, "learning_rate": 1.7409957094595752e-05, "loss": 0.8192, "step": 2158 }, { "epoch": 0.26, "learning_rate": 1.7407362652585585e-05, "loss": 0.8242, "step": 2159 }, { "epoch": 0.26, "learning_rate": 1.7404767105322163e-05, "loss": 0.769, "step": 2160 }, { "epoch": 0.26, "learning_rate": 1.7402170453192773e-05, "loss": 0.7813, "step": 2161 }, { "epoch": 0.26, "learning_rate": 1.739957269658485e-05, "loss": 0.8047, "step": 2162 }, { "epoch": 0.26, "learning_rate": 1.7396973835886016e-05, "loss": 0.8125, "step": 2163 }, { "epoch": 0.26, "learning_rate": 1.7394373871484037e-05, "loss": 0.8304, "step": 2164 }, { "epoch": 0.26, "learning_rate": 1.7391772803766862e-05, "loss": 0.7824, "step": 2165 }, { "epoch": 0.26, "learning_rate": 1.7389170633122594e-05, "loss": 0.7891, "step": 2166 }, { "epoch": 0.26, "learning_rate": 1.7386567359939502e-05, "loss": 0.8276, "step": 2167 }, { "epoch": 0.26, "learning_rate": 1.7383962984606024e-05, "loss": 0.8002, "step": 2168 }, { "epoch": 0.26, "learning_rate": 1.7381357507510753e-05, "loss": 0.832, "step": 2169 }, { "epoch": 0.26, "learning_rate": 1.7378750929042457e-05, "loss": 0.8041, "step": 2170 }, { "epoch": 0.26, "learning_rate": 1.7376143249590068e-05, "loss": 0.8415, "step": 2171 }, { "epoch": 0.26, "learning_rate": 1.7373534469542667e-05, "loss": 0.7913, "step": 2172 }, { "epoch": 0.26, "learning_rate": 1.737092458928952e-05, "loss": 0.8705, "step": 2173 }, { "epoch": 0.26, "learning_rate": 1.736831360922004e-05, "loss": 0.8426, "step": 2174 }, { "epoch": 0.26, "learning_rate": 1.736570152972382e-05, "loss": 0.8878, "step": 2175 }, { "epoch": 0.26, "learning_rate": 1.7363088351190604e-05, "loss": 0.8477, "step": 2176 }, { "epoch": 0.26, "learning_rate": 1.7360474074010303e-05, "loss": 0.8655, "step": 2177 }, { "epoch": 0.26, "learning_rate": 1.7357858698572995e-05, "loss": 0.8348, "step": 2178 }, { "epoch": 0.26, "learning_rate": 1.735524222526892e-05, "loss": 0.865, "step": 2179 }, { "epoch": 0.26, "learning_rate": 1.7352624654488487e-05, "loss": 0.8331, "step": 2180 }, { "epoch": 0.26, "learning_rate": 1.7350005986622254e-05, "loss": 0.8304, "step": 2181 }, { "epoch": 0.26, "learning_rate": 1.7347386222060964e-05, "loss": 0.827, "step": 2182 }, { "epoch": 0.26, "learning_rate": 1.73447653611955e-05, "loss": 0.841, "step": 2183 }, { "epoch": 0.26, "learning_rate": 1.7342143404416933e-05, "loss": 0.8064, "step": 2184 }, { "epoch": 0.26, "learning_rate": 1.733952035211648e-05, "loss": 0.8131, "step": 2185 }, { "epoch": 0.26, "learning_rate": 1.7336896204685524e-05, "loss": 0.8131, "step": 2186 }, { "epoch": 0.26, "learning_rate": 1.733427096251562e-05, "loss": 0.8287, "step": 2187 }, { "epoch": 0.26, "learning_rate": 1.7331644625998475e-05, "loss": 0.7852, "step": 2188 }, { "epoch": 0.26, "learning_rate": 1.732901719552597e-05, "loss": 0.8544, "step": 2189 }, { "epoch": 0.26, "learning_rate": 1.732638867149014e-05, "loss": 0.7913, "step": 2190 }, { "epoch": 0.26, "learning_rate": 1.7323759054283194e-05, "loss": 0.8298, "step": 2191 }, { "epoch": 0.26, "learning_rate": 1.732112834429749e-05, "loss": 0.8164, "step": 2192 }, { "epoch": 0.26, "learning_rate": 1.7318496541925557e-05, "loss": 0.8717, "step": 2193 }, { "epoch": 0.26, "learning_rate": 1.731586364756009e-05, "loss": 0.7785, "step": 2194 }, { "epoch": 0.26, "learning_rate": 1.7313229661593943e-05, "loss": 0.8064, "step": 2195 }, { "epoch": 0.26, "learning_rate": 1.7310594584420133e-05, "loss": 0.7874, "step": 2196 }, { "epoch": 0.26, "learning_rate": 1.730795841643184e-05, "loss": 0.7807, "step": 2197 }, { "epoch": 0.26, "learning_rate": 1.73053211580224e-05, "loss": 0.8259, "step": 2198 }, { "epoch": 0.26, "learning_rate": 1.7302682809585333e-05, "loss": 0.8198, "step": 2199 }, { "epoch": 0.26, "learning_rate": 1.7300043371514293e-05, "loss": 0.7919, "step": 2200 }, { "epoch": 0.26, "learning_rate": 1.729740284420312e-05, "loss": 0.8192, "step": 2201 }, { "epoch": 0.26, "learning_rate": 1.7294761228045805e-05, "loss": 0.7924, "step": 2202 }, { "epoch": 0.26, "learning_rate": 1.7292118523436498e-05, "loss": 0.7974, "step": 2203 }, { "epoch": 0.26, "learning_rate": 1.7289474730769527e-05, "loss": 0.7628, "step": 2204 }, { "epoch": 0.26, "learning_rate": 1.7286829850439366e-05, "loss": 0.7863, "step": 2205 }, { "epoch": 0.26, "learning_rate": 1.728418388284066e-05, "loss": 0.8047, "step": 2206 }, { "epoch": 0.26, "learning_rate": 1.7281536828368213e-05, "loss": 0.8666, "step": 2207 }, { "epoch": 0.26, "learning_rate": 1.7278888687416993e-05, "loss": 0.8008, "step": 2208 }, { "epoch": 0.26, "learning_rate": 1.7276239460382128e-05, "loss": 0.8705, "step": 2209 }, { "epoch": 0.26, "learning_rate": 1.7273589147658913e-05, "loss": 0.8086, "step": 2210 }, { "epoch": 0.26, "learning_rate": 1.72709377496428e-05, "loss": 0.8767, "step": 2211 }, { "epoch": 0.26, "learning_rate": 1.72682852667294e-05, "loss": 0.8917, "step": 2212 }, { "epoch": 0.26, "learning_rate": 1.7265631699314495e-05, "loss": 0.8331, "step": 2213 }, { "epoch": 0.26, "learning_rate": 1.726297704779402e-05, "loss": 0.7891, "step": 2214 }, { "epoch": 0.26, "learning_rate": 1.726032131256408e-05, "loss": 0.7667, "step": 2215 }, { "epoch": 0.26, "learning_rate": 1.725766449402094e-05, "loss": 0.8432, "step": 2216 }, { "epoch": 0.26, "learning_rate": 1.7255006592561017e-05, "loss": 0.7891, "step": 2217 }, { "epoch": 0.26, "learning_rate": 1.72523476085809e-05, "loss": 0.8025, "step": 2218 }, { "epoch": 0.26, "learning_rate": 1.7249687542477335e-05, "loss": 0.8086, "step": 2219 }, { "epoch": 0.26, "learning_rate": 1.724702639464723e-05, "loss": 0.817, "step": 2220 }, { "epoch": 0.26, "learning_rate": 1.724436416548766e-05, "loss": 0.8365, "step": 2221 }, { "epoch": 0.26, "learning_rate": 1.7241700855395854e-05, "loss": 0.865, "step": 2222 }, { "epoch": 0.27, "learning_rate": 1.72390364647692e-05, "loss": 0.8231, "step": 2223 }, { "epoch": 0.27, "learning_rate": 1.7236370994005257e-05, "loss": 0.8728, "step": 2224 }, { "epoch": 0.27, "learning_rate": 1.7233704443501743e-05, "loss": 0.8376, "step": 2225 }, { "epoch": 0.27, "learning_rate": 1.7231036813656525e-05, "loss": 0.8571, "step": 2226 }, { "epoch": 0.27, "learning_rate": 1.722836810486765e-05, "loss": 0.7813, "step": 2227 }, { "epoch": 0.27, "learning_rate": 1.7225698317533307e-05, "loss": 0.8092, "step": 2228 }, { "epoch": 0.27, "learning_rate": 1.7223027452051867e-05, "loss": 0.808, "step": 2229 }, { "epoch": 0.27, "learning_rate": 1.7220355508821838e-05, "loss": 0.8225, "step": 2230 }, { "epoch": 0.27, "learning_rate": 1.7217682488241907e-05, "loss": 0.8192, "step": 2231 }, { "epoch": 0.27, "learning_rate": 1.7215008390710917e-05, "loss": 0.7746, "step": 2232 }, { "epoch": 0.27, "learning_rate": 1.7212333216627865e-05, "loss": 0.8114, "step": 2233 }, { "epoch": 0.27, "learning_rate": 1.720965696639192e-05, "loss": 0.7818, "step": 2234 }, { "epoch": 0.27, "learning_rate": 1.7206979640402403e-05, "loss": 0.822, "step": 2235 }, { "epoch": 0.27, "learning_rate": 1.7204301239058793e-05, "loss": 0.8499, "step": 2236 }, { "epoch": 0.27, "learning_rate": 1.720162176276074e-05, "loss": 0.8393, "step": 2237 }, { "epoch": 0.27, "learning_rate": 1.719894121190805e-05, "loss": 0.8153, "step": 2238 }, { "epoch": 0.27, "learning_rate": 1.719625958690069e-05, "loss": 0.8075, "step": 2239 }, { "epoch": 0.27, "learning_rate": 1.7193576888138777e-05, "loss": 0.8477, "step": 2240 }, { "epoch": 0.27, "learning_rate": 1.71908931160226e-05, "loss": 0.8119, "step": 2241 }, { "epoch": 0.27, "learning_rate": 1.718820827095261e-05, "loss": 0.8432, "step": 2242 }, { "epoch": 0.27, "learning_rate": 1.718552235332941e-05, "loss": 0.8047, "step": 2243 }, { "epoch": 0.27, "learning_rate": 1.718283536355376e-05, "loss": 0.7896, "step": 2244 }, { "epoch": 0.27, "learning_rate": 1.71801473020266e-05, "loss": 0.7695, "step": 2245 }, { "epoch": 0.27, "learning_rate": 1.7177458169149e-05, "loss": 0.7952, "step": 2246 }, { "epoch": 0.27, "learning_rate": 1.7174767965322216e-05, "loss": 0.8493, "step": 2247 }, { "epoch": 0.27, "learning_rate": 1.717207669094765e-05, "loss": 0.865, "step": 2248 }, { "epoch": 0.27, "learning_rate": 1.7169384346426868e-05, "loss": 0.774, "step": 2249 }, { "epoch": 0.27, "learning_rate": 1.7166690932161594e-05, "loss": 0.8555, "step": 2250 }, { "epoch": 0.27, "learning_rate": 1.7163996448553717e-05, "loss": 0.7997, "step": 2251 }, { "epoch": 0.27, "learning_rate": 1.7161300896005273e-05, "loss": 0.8153, "step": 2252 }, { "epoch": 0.27, "learning_rate": 1.7158604274918475e-05, "loss": 0.8069, "step": 2253 }, { "epoch": 0.27, "learning_rate": 1.7155906585695676e-05, "loss": 0.8108, "step": 2254 }, { "epoch": 0.27, "learning_rate": 1.7153207828739407e-05, "loss": 0.8382, "step": 2255 }, { "epoch": 0.27, "learning_rate": 1.7150508004452347e-05, "loss": 0.8359, "step": 2256 }, { "epoch": 0.27, "learning_rate": 1.7147807113237335e-05, "loss": 0.779, "step": 2257 }, { "epoch": 0.27, "learning_rate": 1.7145105155497373e-05, "loss": 0.7997, "step": 2258 }, { "epoch": 0.27, "learning_rate": 1.714240213163562e-05, "loss": 0.8214, "step": 2259 }, { "epoch": 0.27, "learning_rate": 1.71396980420554e-05, "loss": 0.7997, "step": 2260 }, { "epoch": 0.27, "learning_rate": 1.7136992887160174e-05, "loss": 0.7807, "step": 2261 }, { "epoch": 0.27, "learning_rate": 1.7134286667353598e-05, "loss": 0.7969, "step": 2262 }, { "epoch": 0.27, "learning_rate": 1.7131579383039456e-05, "loss": 0.8622, "step": 2263 }, { "epoch": 0.27, "learning_rate": 1.7128871034621705e-05, "loss": 0.865, "step": 2264 }, { "epoch": 0.27, "learning_rate": 1.7126161622504458e-05, "loss": 0.8644, "step": 2265 }, { "epoch": 0.27, "learning_rate": 1.7123451147091986e-05, "loss": 0.745, "step": 2266 }, { "epoch": 0.27, "learning_rate": 1.7120739608788722e-05, "loss": 0.7757, "step": 2267 }, { "epoch": 0.27, "learning_rate": 1.7118027007999252e-05, "loss": 0.8337, "step": 2268 }, { "epoch": 0.27, "learning_rate": 1.7115313345128322e-05, "loss": 0.8638, "step": 2269 }, { "epoch": 0.27, "learning_rate": 1.711259862058084e-05, "loss": 0.7958, "step": 2270 }, { "epoch": 0.27, "learning_rate": 1.7109882834761874e-05, "loss": 0.8092, "step": 2271 }, { "epoch": 0.27, "learning_rate": 1.7107165988076637e-05, "loss": 0.8482, "step": 2272 }, { "epoch": 0.27, "learning_rate": 1.710444808093052e-05, "loss": 0.8097, "step": 2273 }, { "epoch": 0.27, "learning_rate": 1.710172911372906e-05, "loss": 0.8086, "step": 2274 }, { "epoch": 0.27, "learning_rate": 1.7099009086877948e-05, "loss": 0.7762, "step": 2275 }, { "epoch": 0.27, "learning_rate": 1.7096288000783043e-05, "loss": 0.8376, "step": 2276 }, { "epoch": 0.27, "learning_rate": 1.7093565855850363e-05, "loss": 0.8147, "step": 2277 }, { "epoch": 0.27, "learning_rate": 1.709084265248607e-05, "loss": 0.8839, "step": 2278 }, { "epoch": 0.27, "learning_rate": 1.7088118391096507e-05, "loss": 0.798, "step": 2279 }, { "epoch": 0.27, "learning_rate": 1.708539307208815e-05, "loss": 0.8521, "step": 2280 }, { "epoch": 0.27, "learning_rate": 1.7082666695867645e-05, "loss": 0.8013, "step": 2281 }, { "epoch": 0.27, "learning_rate": 1.70799392628418e-05, "loss": 0.8315, "step": 2282 }, { "epoch": 0.27, "learning_rate": 1.7077210773417575e-05, "loss": 0.8337, "step": 2283 }, { "epoch": 0.27, "learning_rate": 1.707448122800208e-05, "loss": 0.8756, "step": 2284 }, { "epoch": 0.27, "learning_rate": 1.70717506270026e-05, "loss": 0.8119, "step": 2285 }, { "epoch": 0.27, "learning_rate": 1.7069018970826566e-05, "loss": 0.8069, "step": 2286 }, { "epoch": 0.27, "learning_rate": 1.7066286259881568e-05, "loss": 0.8566, "step": 2287 }, { "epoch": 0.27, "learning_rate": 1.7063552494575354e-05, "loss": 0.7991, "step": 2288 }, { "epoch": 0.27, "learning_rate": 1.706081767531583e-05, "loss": 0.8292, "step": 2289 }, { "epoch": 0.27, "learning_rate": 1.7058081802511056e-05, "loss": 0.8393, "step": 2290 }, { "epoch": 0.27, "learning_rate": 1.705534487656925e-05, "loss": 0.8097, "step": 2291 }, { "epoch": 0.27, "learning_rate": 1.70526068978988e-05, "loss": 0.8298, "step": 2292 }, { "epoch": 0.27, "learning_rate": 1.7049867866908227e-05, "loss": 0.8304, "step": 2293 }, { "epoch": 0.27, "learning_rate": 1.7047127784006227e-05, "loss": 0.8242, "step": 2294 }, { "epoch": 0.27, "learning_rate": 1.7044386649601653e-05, "loss": 0.7863, "step": 2295 }, { "epoch": 0.27, "learning_rate": 1.7041644464103504e-05, "loss": 0.8599, "step": 2296 }, { "epoch": 0.27, "learning_rate": 1.7038901227920943e-05, "loss": 0.7891, "step": 2297 }, { "epoch": 0.27, "learning_rate": 1.7036156941463288e-05, "loss": 0.8164, "step": 2298 }, { "epoch": 0.27, "learning_rate": 1.7033411605140018e-05, "loss": 0.7589, "step": 2299 }, { "epoch": 0.27, "learning_rate": 1.703066521936076e-05, "loss": 0.7444, "step": 2300 }, { "epoch": 0.27, "learning_rate": 1.7027917784535306e-05, "loss": 0.7746, "step": 2301 }, { "epoch": 0.27, "learning_rate": 1.7025169301073595e-05, "loss": 0.8655, "step": 2302 }, { "epoch": 0.27, "learning_rate": 1.7022419769385735e-05, "loss": 0.7533, "step": 2303 }, { "epoch": 0.27, "learning_rate": 1.7019669189881982e-05, "loss": 0.8047, "step": 2304 }, { "epoch": 0.27, "learning_rate": 1.7016917562972753e-05, "loss": 0.8142, "step": 2305 }, { "epoch": 0.28, "learning_rate": 1.7014164889068613e-05, "loss": 0.7852, "step": 2306 }, { "epoch": 0.28, "learning_rate": 1.7011411168580293e-05, "loss": 0.7941, "step": 2307 }, { "epoch": 0.28, "learning_rate": 1.700865640191867e-05, "loss": 0.8443, "step": 2308 }, { "epoch": 0.28, "learning_rate": 1.700590058949479e-05, "loss": 0.7416, "step": 2309 }, { "epoch": 0.28, "learning_rate": 1.7003143731719848e-05, "loss": 0.8248, "step": 2310 }, { "epoch": 0.28, "learning_rate": 1.700038582900519e-05, "loss": 0.7536, "step": 2311 }, { "epoch": 0.28, "learning_rate": 1.699762688176232e-05, "loss": 0.8538, "step": 2312 }, { "epoch": 0.28, "learning_rate": 1.699486689040291e-05, "loss": 0.75, "step": 2313 }, { "epoch": 0.28, "learning_rate": 1.6992105855338773e-05, "loss": 0.8265, "step": 2314 }, { "epoch": 0.28, "learning_rate": 1.6989343776981887e-05, "loss": 0.8421, "step": 2315 }, { "epoch": 0.28, "learning_rate": 1.698658065574438e-05, "loss": 0.8309, "step": 2316 }, { "epoch": 0.28, "learning_rate": 1.6983816492038537e-05, "loss": 0.8878, "step": 2317 }, { "epoch": 0.28, "learning_rate": 1.69810512862768e-05, "loss": 0.8337, "step": 2318 }, { "epoch": 0.28, "learning_rate": 1.697828503887176e-05, "loss": 0.827, "step": 2319 }, { "epoch": 0.28, "learning_rate": 1.6975517750236177e-05, "loss": 0.7919, "step": 2320 }, { "epoch": 0.28, "learning_rate": 1.6972749420782958e-05, "loss": 0.8281, "step": 2321 }, { "epoch": 0.28, "learning_rate": 1.696998005092516e-05, "loss": 0.8644, "step": 2322 }, { "epoch": 0.28, "learning_rate": 1.6967209641076002e-05, "loss": 0.8069, "step": 2323 }, { "epoch": 0.28, "learning_rate": 1.6964438191648862e-05, "loss": 0.8125, "step": 2324 }, { "epoch": 0.28, "learning_rate": 1.6961665703057267e-05, "loss": 0.8465, "step": 2325 }, { "epoch": 0.28, "learning_rate": 1.6958892175714897e-05, "loss": 0.8733, "step": 2326 }, { "epoch": 0.28, "learning_rate": 1.695611761003559e-05, "loss": 0.7628, "step": 2327 }, { "epoch": 0.28, "learning_rate": 1.695334200643334e-05, "loss": 0.8477, "step": 2328 }, { "epoch": 0.28, "learning_rate": 1.69505653653223e-05, "loss": 0.8248, "step": 2329 }, { "epoch": 0.28, "learning_rate": 1.6947787687116764e-05, "loss": 0.7528, "step": 2330 }, { "epoch": 0.28, "learning_rate": 1.69450089722312e-05, "loss": 0.8136, "step": 2331 }, { "epoch": 0.28, "learning_rate": 1.6942229221080215e-05, "loss": 0.8214, "step": 2332 }, { "epoch": 0.28, "learning_rate": 1.6939448434078572e-05, "loss": 0.8605, "step": 2333 }, { "epoch": 0.28, "learning_rate": 1.69366666116412e-05, "loss": 0.702, "step": 2334 }, { "epoch": 0.28, "learning_rate": 1.6933883754183168e-05, "loss": 0.8013, "step": 2335 }, { "epoch": 0.28, "learning_rate": 1.693109986211971e-05, "loss": 0.7606, "step": 2336 }, { "epoch": 0.28, "learning_rate": 1.6928314935866212e-05, "loss": 0.7723, "step": 2337 }, { "epoch": 0.28, "learning_rate": 1.692552897583821e-05, "loss": 0.8393, "step": 2338 }, { "epoch": 0.28, "learning_rate": 1.69227419824514e-05, "loss": 0.8142, "step": 2339 }, { "epoch": 0.28, "learning_rate": 1.691995395612163e-05, "loss": 0.9012, "step": 2340 }, { "epoch": 0.28, "learning_rate": 1.6917164897264897e-05, "loss": 0.75, "step": 2341 }, { "epoch": 0.28, "learning_rate": 1.691437480629736e-05, "loss": 0.8638, "step": 2342 }, { "epoch": 0.28, "learning_rate": 1.6911583683635334e-05, "loss": 0.7807, "step": 2343 }, { "epoch": 0.28, "learning_rate": 1.690879152969527e-05, "loss": 0.8108, "step": 2344 }, { "epoch": 0.28, "learning_rate": 1.6905998344893796e-05, "loss": 0.8449, "step": 2345 }, { "epoch": 0.28, "learning_rate": 1.690320412964768e-05, "loss": 0.8265, "step": 2346 }, { "epoch": 0.28, "learning_rate": 1.690040888437385e-05, "loss": 0.8343, "step": 2347 }, { "epoch": 0.28, "learning_rate": 1.689761260948938e-05, "loss": 0.8052, "step": 2348 }, { "epoch": 0.28, "learning_rate": 1.6894815305411503e-05, "loss": 0.8186, "step": 2349 }, { "epoch": 0.28, "learning_rate": 1.689201697255761e-05, "loss": 0.8504, "step": 2350 }, { "epoch": 0.28, "learning_rate": 1.688921761134523e-05, "loss": 0.8041, "step": 2351 }, { "epoch": 0.28, "learning_rate": 1.688641722219207e-05, "loss": 0.8142, "step": 2352 }, { "epoch": 0.28, "learning_rate": 1.6883615805515966e-05, "loss": 0.7377, "step": 2353 }, { "epoch": 0.28, "learning_rate": 1.6880813361734922e-05, "loss": 0.7879, "step": 2354 }, { "epoch": 0.28, "learning_rate": 1.687800989126709e-05, "loss": 0.8203, "step": 2355 }, { "epoch": 0.28, "learning_rate": 1.6875205394530777e-05, "loss": 0.8343, "step": 2356 }, { "epoch": 0.28, "learning_rate": 1.687239987194444e-05, "loss": 0.7863, "step": 2357 }, { "epoch": 0.28, "learning_rate": 1.686959332392669e-05, "loss": 0.8253, "step": 2358 }, { "epoch": 0.28, "learning_rate": 1.6866785750896295e-05, "loss": 0.7405, "step": 2359 }, { "epoch": 0.28, "learning_rate": 1.6863977153272174e-05, "loss": 0.8331, "step": 2360 }, { "epoch": 0.28, "learning_rate": 1.6861167531473398e-05, "loss": 0.7729, "step": 2361 }, { "epoch": 0.28, "learning_rate": 1.685835688591919e-05, "loss": 0.8125, "step": 2362 }, { "epoch": 0.28, "learning_rate": 1.6855545217028924e-05, "loss": 0.7958, "step": 2363 }, { "epoch": 0.28, "learning_rate": 1.6852732525222135e-05, "loss": 0.8242, "step": 2364 }, { "epoch": 0.28, "learning_rate": 1.6849918810918504e-05, "loss": 0.803, "step": 2365 }, { "epoch": 0.28, "learning_rate": 1.6847104074537857e-05, "loss": 0.8175, "step": 2366 }, { "epoch": 0.28, "learning_rate": 1.684428831650019e-05, "loss": 0.8013, "step": 2367 }, { "epoch": 0.28, "learning_rate": 1.684147153722564e-05, "loss": 0.8488, "step": 2368 }, { "epoch": 0.28, "learning_rate": 1.68386537371345e-05, "loss": 0.8158, "step": 2369 }, { "epoch": 0.28, "learning_rate": 1.6835834916647216e-05, "loss": 0.7896, "step": 2370 }, { "epoch": 0.28, "learning_rate": 1.6833015076184377e-05, "loss": 0.7533, "step": 2371 }, { "epoch": 0.28, "learning_rate": 1.683019421616674e-05, "loss": 0.8672, "step": 2372 }, { "epoch": 0.28, "learning_rate": 1.68273723370152e-05, "loss": 0.8421, "step": 2373 }, { "epoch": 0.28, "learning_rate": 1.6824549439150813e-05, "loss": 0.8203, "step": 2374 }, { "epoch": 0.28, "learning_rate": 1.682172552299478e-05, "loss": 0.8265, "step": 2375 }, { "epoch": 0.28, "learning_rate": 1.6818900588968462e-05, "loss": 0.8337, "step": 2376 }, { "epoch": 0.28, "learning_rate": 1.681607463749337e-05, "loss": 0.8315, "step": 2377 }, { "epoch": 0.28, "learning_rate": 1.6813247668991154e-05, "loss": 0.841, "step": 2378 }, { "epoch": 0.28, "learning_rate": 1.6810419683883637e-05, "loss": 0.808, "step": 2379 }, { "epoch": 0.28, "learning_rate": 1.680759068259278e-05, "loss": 0.798, "step": 2380 }, { "epoch": 0.28, "learning_rate": 1.6804760665540695e-05, "loss": 0.8119, "step": 2381 }, { "epoch": 0.28, "learning_rate": 1.6801929633149652e-05, "loss": 0.7757, "step": 2382 }, { "epoch": 0.28, "learning_rate": 1.679909758584207e-05, "loss": 0.7924, "step": 2383 }, { "epoch": 0.28, "learning_rate": 1.6796264524040516e-05, "loss": 0.793, "step": 2384 }, { "epoch": 0.28, "learning_rate": 1.6793430448167717e-05, "loss": 0.7154, "step": 2385 }, { "epoch": 0.28, "learning_rate": 1.679059535864654e-05, "loss": 0.8354, "step": 2386 }, { "epoch": 0.28, "learning_rate": 1.678775925590001e-05, "loss": 0.8036, "step": 2387 }, { "epoch": 0.28, "learning_rate": 1.6784922140351306e-05, "loss": 0.8092, "step": 2388 }, { "epoch": 0.28, "learning_rate": 1.678208401242375e-05, "loss": 0.8175, "step": 2389 }, { "epoch": 0.29, "learning_rate": 1.6779244872540823e-05, "loss": 0.7757, "step": 2390 }, { "epoch": 0.29, "learning_rate": 1.6776404721126147e-05, "loss": 0.8789, "step": 2391 }, { "epoch": 0.29, "learning_rate": 1.677356355860351e-05, "loss": 0.8259, "step": 2392 }, { "epoch": 0.29, "learning_rate": 1.6770721385396836e-05, "loss": 0.8164, "step": 2393 }, { "epoch": 0.29, "learning_rate": 1.6767878201930207e-05, "loss": 0.846, "step": 2394 }, { "epoch": 0.29, "learning_rate": 1.6765034008627857e-05, "loss": 0.7997, "step": 2395 }, { "epoch": 0.29, "learning_rate": 1.6762188805914167e-05, "loss": 0.7695, "step": 2396 }, { "epoch": 0.29, "learning_rate": 1.6759342594213666e-05, "loss": 0.8337, "step": 2397 }, { "epoch": 0.29, "learning_rate": 1.6756495373951044e-05, "loss": 0.8153, "step": 2398 }, { "epoch": 0.29, "learning_rate": 1.675364714555113e-05, "loss": 0.7734, "step": 2399 }, { "epoch": 0.29, "learning_rate": 1.6750797909438914e-05, "loss": 0.8225, "step": 2400 }, { "epoch": 0.29, "learning_rate": 1.6747947666039524e-05, "loss": 0.7818, "step": 2401 }, { "epoch": 0.29, "learning_rate": 1.674509641577825e-05, "loss": 0.8119, "step": 2402 }, { "epoch": 0.29, "learning_rate": 1.6742244159080527e-05, "loss": 0.904, "step": 2403 }, { "epoch": 0.29, "learning_rate": 1.6739390896371936e-05, "loss": 0.8343, "step": 2404 }, { "epoch": 0.29, "learning_rate": 1.6736536628078213e-05, "loss": 0.7924, "step": 2405 }, { "epoch": 0.29, "learning_rate": 1.6733681354625255e-05, "loss": 0.8348, "step": 2406 }, { "epoch": 0.29, "learning_rate": 1.6730825076439083e-05, "loss": 0.8337, "step": 2407 }, { "epoch": 0.29, "learning_rate": 1.672796779394589e-05, "loss": 0.7997, "step": 2408 }, { "epoch": 0.29, "learning_rate": 1.672510950757201e-05, "loss": 0.8393, "step": 2409 }, { "epoch": 0.29, "learning_rate": 1.6722250217743928e-05, "loss": 0.8521, "step": 2410 }, { "epoch": 0.29, "learning_rate": 1.6719389924888277e-05, "loss": 0.7712, "step": 2411 }, { "epoch": 0.29, "learning_rate": 1.6716528629431845e-05, "loss": 0.8164, "step": 2412 }, { "epoch": 0.29, "learning_rate": 1.6713666331801565e-05, "loss": 0.7907, "step": 2413 }, { "epoch": 0.29, "learning_rate": 1.671080303242452e-05, "loss": 0.7712, "step": 2414 }, { "epoch": 0.29, "learning_rate": 1.6707938731727945e-05, "loss": 0.7651, "step": 2415 }, { "epoch": 0.29, "learning_rate": 1.6705073430139217e-05, "loss": 0.7723, "step": 2416 }, { "epoch": 0.29, "learning_rate": 1.6702207128085876e-05, "loss": 0.7762, "step": 2417 }, { "epoch": 0.29, "learning_rate": 1.66993398259956e-05, "loss": 0.8415, "step": 2418 }, { "epoch": 0.29, "learning_rate": 1.6696471524296212e-05, "loss": 0.8175, "step": 2419 }, { "epoch": 0.29, "learning_rate": 1.6693602223415705e-05, "loss": 0.7919, "step": 2420 }, { "epoch": 0.29, "learning_rate": 1.6690731923782197e-05, "loss": 0.8136, "step": 2421 }, { "epoch": 0.29, "learning_rate": 1.668786062582397e-05, "loss": 0.8164, "step": 2422 }, { "epoch": 0.29, "learning_rate": 1.6684988329969454e-05, "loss": 0.8147, "step": 2423 }, { "epoch": 0.29, "learning_rate": 1.6682115036647214e-05, "loss": 0.7634, "step": 2424 }, { "epoch": 0.29, "learning_rate": 1.667924074628599e-05, "loss": 0.8304, "step": 2425 }, { "epoch": 0.29, "learning_rate": 1.6676365459314637e-05, "loss": 0.8454, "step": 2426 }, { "epoch": 0.29, "learning_rate": 1.6673489176162188e-05, "loss": 0.7762, "step": 2427 }, { "epoch": 0.29, "learning_rate": 1.6670611897257813e-05, "loss": 0.7974, "step": 2428 }, { "epoch": 0.29, "learning_rate": 1.666773362303083e-05, "loss": 0.8198, "step": 2429 }, { "epoch": 0.29, "learning_rate": 1.6664854353910705e-05, "loss": 0.8834, "step": 2430 }, { "epoch": 0.29, "learning_rate": 1.6661974090327054e-05, "loss": 0.7852, "step": 2431 }, { "epoch": 0.29, "learning_rate": 1.6659092832709643e-05, "loss": 0.8493, "step": 2432 }, { "epoch": 0.29, "learning_rate": 1.6656210581488385e-05, "loss": 0.8259, "step": 2433 }, { "epoch": 0.29, "learning_rate": 1.6653327337093342e-05, "loss": 0.8644, "step": 2434 }, { "epoch": 0.29, "learning_rate": 1.665044309995472e-05, "loss": 0.8343, "step": 2435 }, { "epoch": 0.29, "learning_rate": 1.6647557870502874e-05, "loss": 0.7857, "step": 2436 }, { "epoch": 0.29, "learning_rate": 1.6644671649168315e-05, "loss": 0.8666, "step": 2437 }, { "epoch": 0.29, "learning_rate": 1.6641784436381695e-05, "loss": 0.8298, "step": 2438 }, { "epoch": 0.29, "learning_rate": 1.6638896232573817e-05, "loss": 0.8153, "step": 2439 }, { "epoch": 0.29, "learning_rate": 1.6636007038175623e-05, "loss": 0.8337, "step": 2440 }, { "epoch": 0.29, "learning_rate": 1.6633116853618217e-05, "loss": 0.7533, "step": 2441 }, { "epoch": 0.29, "learning_rate": 1.663022567933284e-05, "loss": 0.8086, "step": 2442 }, { "epoch": 0.29, "learning_rate": 1.6627333515750887e-05, "loss": 0.7935, "step": 2443 }, { "epoch": 0.29, "learning_rate": 1.6624440363303896e-05, "loss": 0.774, "step": 2444 }, { "epoch": 0.29, "learning_rate": 1.6621546222423556e-05, "loss": 0.832, "step": 2445 }, { "epoch": 0.29, "learning_rate": 1.66186510935417e-05, "loss": 0.7896, "step": 2446 }, { "epoch": 0.29, "learning_rate": 1.661575497709031e-05, "loss": 0.7885, "step": 2447 }, { "epoch": 0.29, "learning_rate": 1.661285787350152e-05, "loss": 0.8465, "step": 2448 }, { "epoch": 0.29, "learning_rate": 1.660995978320761e-05, "loss": 0.8276, "step": 2449 }, { "epoch": 0.29, "learning_rate": 1.660706070664099e-05, "loss": 0.8527, "step": 2450 }, { "epoch": 0.29, "learning_rate": 1.6604160644234242e-05, "loss": 0.7952, "step": 2451 }, { "epoch": 0.29, "learning_rate": 1.6601259596420084e-05, "loss": 0.8153, "step": 2452 }, { "epoch": 0.29, "learning_rate": 1.6598357563631382e-05, "loss": 0.8214, "step": 2453 }, { "epoch": 0.29, "learning_rate": 1.6595454546301145e-05, "loss": 0.8069, "step": 2454 }, { "epoch": 0.29, "learning_rate": 1.6592550544862537e-05, "loss": 0.8237, "step": 2455 }, { "epoch": 0.29, "learning_rate": 1.6589645559748863e-05, "loss": 0.7835, "step": 2456 }, { "epoch": 0.29, "learning_rate": 1.6586739591393574e-05, "loss": 0.8209, "step": 2457 }, { "epoch": 0.29, "learning_rate": 1.658383264023027e-05, "loss": 0.7818, "step": 2458 }, { "epoch": 0.29, "learning_rate": 1.6580924706692695e-05, "loss": 0.7785, "step": 2459 }, { "epoch": 0.29, "learning_rate": 1.657801579121475e-05, "loss": 0.8359, "step": 2460 }, { "epoch": 0.29, "learning_rate": 1.6575105894230467e-05, "loss": 0.7896, "step": 2461 }, { "epoch": 0.29, "learning_rate": 1.6572195016174037e-05, "loss": 0.8516, "step": 2462 }, { "epoch": 0.29, "learning_rate": 1.6569283157479787e-05, "loss": 0.8365, "step": 2463 }, { "epoch": 0.29, "learning_rate": 1.6566370318582203e-05, "loss": 0.7662, "step": 2464 }, { "epoch": 0.29, "learning_rate": 1.6563456499915906e-05, "loss": 0.8052, "step": 2465 }, { "epoch": 0.29, "learning_rate": 1.6560541701915662e-05, "loss": 0.841, "step": 2466 }, { "epoch": 0.29, "learning_rate": 1.6557625925016395e-05, "loss": 0.8153, "step": 2467 }, { "epoch": 0.29, "learning_rate": 1.6554709169653168e-05, "loss": 0.7545, "step": 2468 }, { "epoch": 0.29, "learning_rate": 1.655179143626119e-05, "loss": 0.7511, "step": 2469 }, { "epoch": 0.29, "learning_rate": 1.6548872725275817e-05, "loss": 0.7533, "step": 2470 }, { "epoch": 0.29, "learning_rate": 1.6545953037132544e-05, "loss": 0.7902, "step": 2471 }, { "epoch": 0.29, "learning_rate": 1.654303237226702e-05, "loss": 0.8108, "step": 2472 }, { "epoch": 0.29, "learning_rate": 1.6540110731115047e-05, "loss": 0.8192, "step": 2473 }, { "epoch": 0.3, "learning_rate": 1.6537188114112552e-05, "loss": 0.7829, "step": 2474 }, { "epoch": 0.3, "learning_rate": 1.6534264521695626e-05, "loss": 0.8181, "step": 2475 }, { "epoch": 0.3, "learning_rate": 1.6531339954300494e-05, "loss": 0.7779, "step": 2476 }, { "epoch": 0.3, "learning_rate": 1.6528414412363534e-05, "loss": 0.8119, "step": 2477 }, { "epoch": 0.3, "learning_rate": 1.6525487896321263e-05, "loss": 0.7746, "step": 2478 }, { "epoch": 0.3, "learning_rate": 1.652256040661035e-05, "loss": 0.8192, "step": 2479 }, { "epoch": 0.3, "learning_rate": 1.6519631943667604e-05, "loss": 0.7768, "step": 2480 }, { "epoch": 0.3, "learning_rate": 1.6516702507929984e-05, "loss": 0.827, "step": 2481 }, { "epoch": 0.3, "learning_rate": 1.6513772099834587e-05, "loss": 0.7896, "step": 2482 }, { "epoch": 0.3, "learning_rate": 1.6510840719818665e-05, "loss": 0.7997, "step": 2483 }, { "epoch": 0.3, "learning_rate": 1.6507908368319606e-05, "loss": 0.8052, "step": 2484 }, { "epoch": 0.3, "learning_rate": 1.650497504577494e-05, "loss": 0.7779, "step": 2485 }, { "epoch": 0.3, "learning_rate": 1.6502040752622365e-05, "loss": 0.8125, "step": 2486 }, { "epoch": 0.3, "learning_rate": 1.649910548929969e-05, "loss": 0.8376, "step": 2487 }, { "epoch": 0.3, "learning_rate": 1.6496169256244897e-05, "loss": 0.808, "step": 2488 }, { "epoch": 0.3, "learning_rate": 1.6493232053896097e-05, "loss": 0.8198, "step": 2489 }, { "epoch": 0.3, "learning_rate": 1.649029388269155e-05, "loss": 0.8298, "step": 2490 }, { "epoch": 0.3, "learning_rate": 1.6487354743069663e-05, "loss": 0.8108, "step": 2491 }, { "epoch": 0.3, "learning_rate": 1.6484414635468985e-05, "loss": 0.7729, "step": 2492 }, { "epoch": 0.3, "learning_rate": 1.6481473560328206e-05, "loss": 0.7561, "step": 2493 }, { "epoch": 0.3, "learning_rate": 1.647853151808617e-05, "loss": 0.8555, "step": 2494 }, { "epoch": 0.3, "learning_rate": 1.647558850918185e-05, "loss": 0.7868, "step": 2495 }, { "epoch": 0.3, "learning_rate": 1.6472644534054388e-05, "loss": 0.7059, "step": 2496 }, { "epoch": 0.3, "learning_rate": 1.646969959314304e-05, "loss": 0.8136, "step": 2497 }, { "epoch": 0.3, "learning_rate": 1.6466753686887228e-05, "loss": 0.8203, "step": 2498 }, { "epoch": 0.3, "learning_rate": 1.646380681572651e-05, "loss": 0.8354, "step": 2499 }, { "epoch": 0.3, "learning_rate": 1.6460858980100585e-05, "loss": 0.7835, "step": 2500 }, { "epoch": 0.3, "learning_rate": 1.645791018044931e-05, "loss": 0.8114, "step": 2501 }, { "epoch": 0.3, "learning_rate": 1.6454960417212666e-05, "loss": 0.8337, "step": 2502 }, { "epoch": 0.3, "learning_rate": 1.6452009690830787e-05, "loss": 0.774, "step": 2503 }, { "epoch": 0.3, "learning_rate": 1.644905800174396e-05, "loss": 0.7796, "step": 2504 }, { "epoch": 0.3, "learning_rate": 1.64461053503926e-05, "loss": 0.769, "step": 2505 }, { "epoch": 0.3, "learning_rate": 1.644315173721727e-05, "loss": 0.7813, "step": 2506 }, { "epoch": 0.3, "learning_rate": 1.6440197162658685e-05, "loss": 0.8482, "step": 2507 }, { "epoch": 0.3, "learning_rate": 1.6437241627157697e-05, "loss": 0.7818, "step": 2508 }, { "epoch": 0.3, "learning_rate": 1.6434285131155295e-05, "loss": 0.7919, "step": 2509 }, { "epoch": 0.3, "learning_rate": 1.6431327675092625e-05, "loss": 0.841, "step": 2510 }, { "epoch": 0.3, "learning_rate": 1.6428369259410967e-05, "loss": 0.8209, "step": 2511 }, { "epoch": 0.3, "learning_rate": 1.6425409884551748e-05, "loss": 0.7383, "step": 2512 }, { "epoch": 0.3, "learning_rate": 1.6422449550956536e-05, "loss": 0.8348, "step": 2513 }, { "epoch": 0.3, "learning_rate": 1.6419488259067038e-05, "loss": 0.8426, "step": 2514 }, { "epoch": 0.3, "learning_rate": 1.6416526009325117e-05, "loss": 0.7522, "step": 2515 }, { "epoch": 0.3, "learning_rate": 1.6413562802172762e-05, "loss": 0.9023, "step": 2516 }, { "epoch": 0.3, "learning_rate": 1.6410598638052117e-05, "loss": 0.8811, "step": 2517 }, { "epoch": 0.3, "learning_rate": 1.6407633517405467e-05, "loss": 0.7891, "step": 2518 }, { "epoch": 0.3, "learning_rate": 1.6404667440675235e-05, "loss": 0.8549, "step": 2519 }, { "epoch": 0.3, "learning_rate": 1.640170040830399e-05, "loss": 0.8393, "step": 2520 }, { "epoch": 0.3, "learning_rate": 1.6398732420734452e-05, "loss": 0.8387, "step": 2521 }, { "epoch": 0.3, "learning_rate": 1.639576347840946e-05, "loss": 0.7746, "step": 2522 }, { "epoch": 0.3, "learning_rate": 1.639279358177202e-05, "loss": 0.8404, "step": 2523 }, { "epoch": 0.3, "learning_rate": 1.6389822731265265e-05, "loss": 0.8348, "step": 2524 }, { "epoch": 0.3, "learning_rate": 1.6386850927332478e-05, "loss": 0.8304, "step": 2525 }, { "epoch": 0.3, "learning_rate": 1.6383878170417083e-05, "loss": 0.8566, "step": 2526 }, { "epoch": 0.3, "learning_rate": 1.6380904460962647e-05, "loss": 0.7706, "step": 2527 }, { "epoch": 0.3, "learning_rate": 1.6377929799412874e-05, "loss": 0.8326, "step": 2528 }, { "epoch": 0.3, "learning_rate": 1.6374954186211617e-05, "loss": 0.7824, "step": 2529 }, { "epoch": 0.3, "learning_rate": 1.637197762180286e-05, "loss": 0.8041, "step": 2530 }, { "epoch": 0.3, "learning_rate": 1.6369000106630747e-05, "loss": 0.7623, "step": 2531 }, { "epoch": 0.3, "learning_rate": 1.636602164113955e-05, "loss": 0.8393, "step": 2532 }, { "epoch": 0.3, "learning_rate": 1.6363042225773678e-05, "loss": 0.8438, "step": 2533 }, { "epoch": 0.3, "learning_rate": 1.63600618609777e-05, "loss": 0.7768, "step": 2534 }, { "epoch": 0.3, "learning_rate": 1.635708054719631e-05, "loss": 0.7556, "step": 2535 }, { "epoch": 0.3, "learning_rate": 1.635409828487436e-05, "loss": 0.7667, "step": 2536 }, { "epoch": 0.3, "learning_rate": 1.635111507445682e-05, "loss": 0.8231, "step": 2537 }, { "epoch": 0.3, "learning_rate": 1.634813091638882e-05, "loss": 0.7679, "step": 2538 }, { "epoch": 0.3, "learning_rate": 1.634514581111563e-05, "loss": 0.7868, "step": 2539 }, { "epoch": 0.3, "learning_rate": 1.6342159759082655e-05, "loss": 0.851, "step": 2540 }, { "epoch": 0.3, "learning_rate": 1.633917276073545e-05, "loss": 0.8292, "step": 2541 }, { "epoch": 0.3, "learning_rate": 1.6336184816519694e-05, "loss": 0.8371, "step": 2542 }, { "epoch": 0.3, "learning_rate": 1.6333195926881226e-05, "loss": 0.7924, "step": 2543 }, { "epoch": 0.3, "learning_rate": 1.633020609226602e-05, "loss": 0.832, "step": 2544 }, { "epoch": 0.3, "learning_rate": 1.6327215313120182e-05, "loss": 0.7701, "step": 2545 }, { "epoch": 0.3, "learning_rate": 1.6324223589889975e-05, "loss": 0.8175, "step": 2546 }, { "epoch": 0.3, "learning_rate": 1.632123092302179e-05, "loss": 0.7824, "step": 2547 }, { "epoch": 0.3, "learning_rate": 1.631823731296216e-05, "loss": 0.7907, "step": 2548 }, { "epoch": 0.3, "learning_rate": 1.631524276015777e-05, "loss": 0.8209, "step": 2549 }, { "epoch": 0.3, "learning_rate": 1.6312247265055428e-05, "loss": 0.7667, "step": 2550 }, { "epoch": 0.3, "learning_rate": 1.63092508281021e-05, "loss": 0.793, "step": 2551 }, { "epoch": 0.3, "learning_rate": 1.630625344974488e-05, "loss": 0.7779, "step": 2552 }, { "epoch": 0.3, "learning_rate": 1.630325513043101e-05, "loss": 0.7885, "step": 2553 }, { "epoch": 0.3, "learning_rate": 1.6300255870607867e-05, "loss": 0.7863, "step": 2554 }, { "epoch": 0.3, "learning_rate": 1.629725567072297e-05, "loss": 0.8025, "step": 2555 }, { "epoch": 0.3, "learning_rate": 1.6294254531223982e-05, "loss": 0.8281, "step": 2556 }, { "epoch": 0.3, "learning_rate": 1.6291252452558706e-05, "loss": 0.8934, "step": 2557 }, { "epoch": 0.31, "learning_rate": 1.6288249435175078e-05, "loss": 0.8477, "step": 2558 }, { "epoch": 0.31, "learning_rate": 1.628524547952118e-05, "loss": 0.8119, "step": 2559 }, { "epoch": 0.31, "learning_rate": 1.6282240586045224e-05, "loss": 0.803, "step": 2560 }, { "epoch": 0.31, "learning_rate": 1.6279234755195583e-05, "loss": 0.8052, "step": 2561 }, { "epoch": 0.31, "learning_rate": 1.6276227987420753e-05, "loss": 0.8477, "step": 2562 }, { "epoch": 0.31, "learning_rate": 1.6273220283169372e-05, "loss": 0.7896, "step": 2563 }, { "epoch": 0.31, "learning_rate": 1.6270211642890223e-05, "loss": 0.7946, "step": 2564 }, { "epoch": 0.31, "learning_rate": 1.6267202067032224e-05, "loss": 0.7589, "step": 2565 }, { "epoch": 0.31, "learning_rate": 1.6264191556044436e-05, "loss": 0.8025, "step": 2566 }, { "epoch": 0.31, "learning_rate": 1.6261180110376048e-05, "loss": 0.7891, "step": 2567 }, { "epoch": 0.31, "learning_rate": 1.6258167730476412e-05, "loss": 0.8376, "step": 2568 }, { "epoch": 0.31, "learning_rate": 1.6255154416794997e-05, "loss": 0.7662, "step": 2569 }, { "epoch": 0.31, "learning_rate": 1.6252140169781424e-05, "loss": 0.7556, "step": 2570 }, { "epoch": 0.31, "learning_rate": 1.6249124989885446e-05, "loss": 0.8158, "step": 2571 }, { "epoch": 0.31, "learning_rate": 1.6246108877556957e-05, "loss": 0.736, "step": 2572 }, { "epoch": 0.31, "learning_rate": 1.6243091833245994e-05, "loss": 0.8343, "step": 2573 }, { "epoch": 0.31, "learning_rate": 1.6240073857402735e-05, "loss": 0.8404, "step": 2574 }, { "epoch": 0.31, "learning_rate": 1.6237054950477485e-05, "loss": 0.8209, "step": 2575 }, { "epoch": 0.31, "learning_rate": 1.6234035112920696e-05, "loss": 0.7757, "step": 2576 }, { "epoch": 0.31, "learning_rate": 1.623101434518296e-05, "loss": 0.8482, "step": 2577 }, { "epoch": 0.31, "learning_rate": 1.6227992647715008e-05, "loss": 0.8086, "step": 2578 }, { "epoch": 0.31, "learning_rate": 1.6224970020967704e-05, "loss": 0.8298, "step": 2579 }, { "epoch": 0.31, "learning_rate": 1.622194646539206e-05, "loss": 0.7785, "step": 2580 }, { "epoch": 0.31, "learning_rate": 1.6218921981439216e-05, "loss": 0.7628, "step": 2581 }, { "epoch": 0.31, "learning_rate": 1.6215896569560455e-05, "loss": 0.803, "step": 2582 }, { "epoch": 0.31, "learning_rate": 1.62128702302072e-05, "loss": 0.7913, "step": 2583 }, { "epoch": 0.31, "learning_rate": 1.620984296383102e-05, "loss": 0.8532, "step": 2584 }, { "epoch": 0.31, "learning_rate": 1.6206814770883595e-05, "loss": 0.8047, "step": 2585 }, { "epoch": 0.31, "learning_rate": 1.620378565181678e-05, "loss": 0.8292, "step": 2586 }, { "epoch": 0.31, "learning_rate": 1.620075560708254e-05, "loss": 0.7779, "step": 2587 }, { "epoch": 0.31, "learning_rate": 1.6197724637132994e-05, "loss": 0.8359, "step": 2588 }, { "epoch": 0.31, "learning_rate": 1.6194692742420388e-05, "loss": 0.8281, "step": 2589 }, { "epoch": 0.31, "learning_rate": 1.6191659923397115e-05, "loss": 0.8571, "step": 2590 }, { "epoch": 0.31, "learning_rate": 1.61886261805157e-05, "loss": 0.8153, "step": 2591 }, { "epoch": 0.31, "learning_rate": 1.618559151422881e-05, "loss": 0.8265, "step": 2592 }, { "epoch": 0.31, "learning_rate": 1.618255592498925e-05, "loss": 0.8131, "step": 2593 }, { "epoch": 0.31, "learning_rate": 1.617951941324995e-05, "loss": 0.8108, "step": 2594 }, { "epoch": 0.31, "learning_rate": 1.6176481979464002e-05, "loss": 0.7266, "step": 2595 }, { "epoch": 0.31, "learning_rate": 1.6173443624084613e-05, "loss": 0.7846, "step": 2596 }, { "epoch": 0.31, "learning_rate": 1.617040434756514e-05, "loss": 0.8175, "step": 2597 }, { "epoch": 0.31, "learning_rate": 1.616736415035907e-05, "loss": 0.8181, "step": 2598 }, { "epoch": 0.31, "learning_rate": 1.6164323032920037e-05, "loss": 0.8404, "step": 2599 }, { "epoch": 0.31, "learning_rate": 1.61612809957018e-05, "loss": 0.774, "step": 2600 }, { "epoch": 0.31, "learning_rate": 1.615823803915827e-05, "loss": 0.7779, "step": 2601 }, { "epoch": 0.31, "learning_rate": 1.6155194163743474e-05, "loss": 0.8158, "step": 2602 }, { "epoch": 0.31, "learning_rate": 1.6152149369911602e-05, "loss": 0.7969, "step": 2603 }, { "epoch": 0.31, "learning_rate": 1.614910365811696e-05, "loss": 0.8298, "step": 2604 }, { "epoch": 0.31, "learning_rate": 1.6146057028814e-05, "loss": 0.7494, "step": 2605 }, { "epoch": 0.31, "learning_rate": 1.6143009482457315e-05, "loss": 0.8248, "step": 2606 }, { "epoch": 0.31, "learning_rate": 1.6139961019501624e-05, "loss": 0.8627, "step": 2607 }, { "epoch": 0.31, "learning_rate": 1.6136911640401785e-05, "loss": 0.7305, "step": 2608 }, { "epoch": 0.31, "learning_rate": 1.6133861345612812e-05, "loss": 0.8521, "step": 2609 }, { "epoch": 0.31, "learning_rate": 1.613081013558982e-05, "loss": 0.8225, "step": 2610 }, { "epoch": 0.31, "learning_rate": 1.6127758010788093e-05, "loss": 0.7734, "step": 2611 }, { "epoch": 0.31, "learning_rate": 1.6124704971663033e-05, "loss": 0.7919, "step": 2612 }, { "epoch": 0.31, "learning_rate": 1.612165101867019e-05, "loss": 0.7835, "step": 2613 }, { "epoch": 0.31, "learning_rate": 1.611859615226524e-05, "loss": 0.8354, "step": 2614 }, { "epoch": 0.31, "learning_rate": 1.6115540372904003e-05, "loss": 0.8225, "step": 2615 }, { "epoch": 0.31, "learning_rate": 1.6112483681042427e-05, "loss": 0.7997, "step": 2616 }, { "epoch": 0.31, "learning_rate": 1.6109426077136603e-05, "loss": 0.8292, "step": 2617 }, { "epoch": 0.31, "learning_rate": 1.6106367561642758e-05, "loss": 0.7868, "step": 2618 }, { "epoch": 0.31, "learning_rate": 1.610330813501726e-05, "loss": 0.7863, "step": 2619 }, { "epoch": 0.31, "learning_rate": 1.610024779771659e-05, "loss": 0.8728, "step": 2620 }, { "epoch": 0.31, "learning_rate": 1.60971865501974e-05, "loss": 0.8583, "step": 2621 }, { "epoch": 0.31, "learning_rate": 1.6094124392916444e-05, "loss": 0.7985, "step": 2622 }, { "epoch": 0.31, "learning_rate": 1.609106132633063e-05, "loss": 0.8036, "step": 2623 }, { "epoch": 0.31, "learning_rate": 1.6087997350897006e-05, "loss": 0.8058, "step": 2624 }, { "epoch": 0.31, "learning_rate": 1.608493246707274e-05, "loss": 0.8348, "step": 2625 }, { "epoch": 0.31, "learning_rate": 1.608186667531515e-05, "loss": 0.8594, "step": 2626 }, { "epoch": 0.31, "learning_rate": 1.6078799976081673e-05, "loss": 0.7846, "step": 2627 }, { "epoch": 0.31, "learning_rate": 1.6075732369829903e-05, "loss": 0.8041, "step": 2628 }, { "epoch": 0.31, "learning_rate": 1.6072663857017553e-05, "loss": 0.817, "step": 2629 }, { "epoch": 0.31, "learning_rate": 1.6069594438102476e-05, "loss": 0.8198, "step": 2630 }, { "epoch": 0.31, "learning_rate": 1.6066524113542658e-05, "loss": 0.7863, "step": 2631 }, { "epoch": 0.31, "learning_rate": 1.6063452883796225e-05, "loss": 0.7489, "step": 2632 }, { "epoch": 0.31, "learning_rate": 1.6060380749321437e-05, "loss": 0.793, "step": 2633 }, { "epoch": 0.31, "learning_rate": 1.6057307710576687e-05, "loss": 0.7913, "step": 2634 }, { "epoch": 0.31, "learning_rate": 1.6054233768020497e-05, "loss": 0.7746, "step": 2635 }, { "epoch": 0.31, "learning_rate": 1.605115892211154e-05, "loss": 0.8114, "step": 2636 }, { "epoch": 0.31, "learning_rate": 1.6048083173308606e-05, "loss": 0.7679, "step": 2637 }, { "epoch": 0.31, "learning_rate": 1.6045006522070633e-05, "loss": 0.7584, "step": 2638 }, { "epoch": 0.31, "learning_rate": 1.6041928968856688e-05, "loss": 0.8772, "step": 2639 }, { "epoch": 0.31, "learning_rate": 1.6038850514125966e-05, "loss": 0.8315, "step": 2640 }, { "epoch": 0.31, "learning_rate": 1.6035771158337814e-05, "loss": 0.8103, "step": 2641 }, { "epoch": 0.32, "learning_rate": 1.6032690901951696e-05, "loss": 0.8086, "step": 2642 }, { "epoch": 0.32, "learning_rate": 1.6029609745427216e-05, "loss": 0.7919, "step": 2643 }, { "epoch": 0.32, "learning_rate": 1.6026527689224123e-05, "loss": 0.7366, "step": 2644 }, { "epoch": 0.32, "learning_rate": 1.602344473380228e-05, "loss": 0.7422, "step": 2645 }, { "epoch": 0.32, "learning_rate": 1.6020360879621704e-05, "loss": 0.8036, "step": 2646 }, { "epoch": 0.32, "learning_rate": 1.601727612714253e-05, "loss": 0.8103, "step": 2647 }, { "epoch": 0.32, "learning_rate": 1.6014190476825037e-05, "loss": 0.8147, "step": 2648 }, { "epoch": 0.32, "learning_rate": 1.6011103929129635e-05, "loss": 0.8198, "step": 2649 }, { "epoch": 0.32, "learning_rate": 1.6008016484516873e-05, "loss": 0.8298, "step": 2650 }, { "epoch": 0.32, "learning_rate": 1.600492814344742e-05, "loss": 0.7662, "step": 2651 }, { "epoch": 0.32, "learning_rate": 1.6001838906382093e-05, "loss": 0.87, "step": 2652 }, { "epoch": 0.32, "learning_rate": 1.5998748773781834e-05, "loss": 0.7628, "step": 2653 }, { "epoch": 0.32, "learning_rate": 1.599565774610773e-05, "loss": 0.8823, "step": 2654 }, { "epoch": 0.32, "learning_rate": 1.5992565823820983e-05, "loss": 0.8086, "step": 2655 }, { "epoch": 0.32, "learning_rate": 1.5989473007382942e-05, "loss": 0.822, "step": 2656 }, { "epoch": 0.32, "learning_rate": 1.5986379297255092e-05, "loss": 0.7997, "step": 2657 }, { "epoch": 0.32, "learning_rate": 1.5983284693899043e-05, "loss": 0.7857, "step": 2658 }, { "epoch": 0.32, "learning_rate": 1.5980189197776538e-05, "loss": 0.8348, "step": 2659 }, { "epoch": 0.32, "learning_rate": 1.5977092809349456e-05, "loss": 0.846, "step": 2660 }, { "epoch": 0.32, "learning_rate": 1.5973995529079818e-05, "loss": 0.851, "step": 2661 }, { "epoch": 0.32, "learning_rate": 1.597089735742976e-05, "loss": 0.8125, "step": 2662 }, { "epoch": 0.32, "learning_rate": 1.5967798294861562e-05, "loss": 0.8192, "step": 2663 }, { "epoch": 0.32, "learning_rate": 1.596469834183764e-05, "loss": 0.8075, "step": 2664 }, { "epoch": 0.32, "learning_rate": 1.596159749882053e-05, "loss": 0.8225, "step": 2665 }, { "epoch": 0.32, "learning_rate": 1.5958495766272916e-05, "loss": 0.8387, "step": 2666 }, { "epoch": 0.32, "learning_rate": 1.5955393144657612e-05, "loss": 0.8052, "step": 2667 }, { "epoch": 0.32, "learning_rate": 1.5952289634437547e-05, "loss": 0.8125, "step": 2668 }, { "epoch": 0.32, "learning_rate": 1.594918523607581e-05, "loss": 0.803, "step": 2669 }, { "epoch": 0.32, "learning_rate": 1.59460799500356e-05, "loss": 0.7852, "step": 2670 }, { "epoch": 0.32, "learning_rate": 1.5942973776780254e-05, "loss": 0.8164, "step": 2671 }, { "epoch": 0.32, "learning_rate": 1.593986671677326e-05, "loss": 0.7946, "step": 2672 }, { "epoch": 0.32, "learning_rate": 1.5936758770478206e-05, "loss": 0.8259, "step": 2673 }, { "epoch": 0.32, "learning_rate": 1.5933649938358834e-05, "loss": 0.8041, "step": 2674 }, { "epoch": 0.32, "learning_rate": 1.5930540220879015e-05, "loss": 0.7941, "step": 2675 }, { "epoch": 0.32, "learning_rate": 1.5927429618502752e-05, "loss": 0.7963, "step": 2676 }, { "epoch": 0.32, "learning_rate": 1.5924318131694177e-05, "loss": 0.8722, "step": 2677 }, { "epoch": 0.32, "learning_rate": 1.592120576091755e-05, "loss": 0.7589, "step": 2678 }, { "epoch": 0.32, "learning_rate": 1.5918092506637278e-05, "loss": 0.8253, "step": 2679 }, { "epoch": 0.32, "learning_rate": 1.591497836931788e-05, "loss": 0.8114, "step": 2680 }, { "epoch": 0.32, "learning_rate": 1.591186334942402e-05, "loss": 0.8616, "step": 2681 }, { "epoch": 0.32, "learning_rate": 1.5908747447420493e-05, "loss": 0.8265, "step": 2682 }, { "epoch": 0.32, "learning_rate": 1.590563066377222e-05, "loss": 0.7584, "step": 2683 }, { "epoch": 0.32, "learning_rate": 1.5902512998944263e-05, "loss": 0.8019, "step": 2684 }, { "epoch": 0.32, "learning_rate": 1.5899394453401798e-05, "loss": 0.8153, "step": 2685 }, { "epoch": 0.32, "learning_rate": 1.5896275027610154e-05, "loss": 0.8086, "step": 2686 }, { "epoch": 0.32, "learning_rate": 1.5893154722034774e-05, "loss": 0.8052, "step": 2687 }, { "epoch": 0.32, "learning_rate": 1.589003353714124e-05, "loss": 0.8203, "step": 2688 }, { "epoch": 0.32, "learning_rate": 1.5886911473395268e-05, "loss": 0.7985, "step": 2689 }, { "epoch": 0.32, "learning_rate": 1.58837885312627e-05, "loss": 0.8209, "step": 2690 }, { "epoch": 0.32, "learning_rate": 1.5880664711209503e-05, "loss": 0.803, "step": 2691 }, { "epoch": 0.32, "learning_rate": 1.5877540013701796e-05, "loss": 0.8331, "step": 2692 }, { "epoch": 0.32, "learning_rate": 1.5874414439205804e-05, "loss": 0.8287, "step": 2693 }, { "epoch": 0.32, "learning_rate": 1.58712879881879e-05, "loss": 0.8432, "step": 2694 }, { "epoch": 0.32, "learning_rate": 1.5868160661114584e-05, "loss": 0.8661, "step": 2695 }, { "epoch": 0.32, "learning_rate": 1.586503245845248e-05, "loss": 0.8449, "step": 2696 }, { "epoch": 0.32, "learning_rate": 1.5861903380668343e-05, "loss": 0.7009, "step": 2697 }, { "epoch": 0.32, "learning_rate": 1.5858773428229074e-05, "loss": 0.8092, "step": 2698 }, { "epoch": 0.32, "learning_rate": 1.585564260160169e-05, "loss": 0.8331, "step": 2699 }, { "epoch": 0.32, "learning_rate": 1.5852510901253337e-05, "loss": 0.7907, "step": 2700 }, { "epoch": 0.32, "learning_rate": 1.58493783276513e-05, "loss": 0.8259, "step": 2701 }, { "epoch": 0.32, "learning_rate": 1.5846244881262993e-05, "loss": 0.755, "step": 2702 }, { "epoch": 0.32, "learning_rate": 1.584311056255595e-05, "loss": 0.8164, "step": 2703 }, { "epoch": 0.32, "learning_rate": 1.5839975371997852e-05, "loss": 0.7762, "step": 2704 }, { "epoch": 0.32, "learning_rate": 1.58368393100565e-05, "loss": 0.803, "step": 2705 }, { "epoch": 0.32, "learning_rate": 1.5833702377199817e-05, "loss": 0.8231, "step": 2706 }, { "epoch": 0.32, "learning_rate": 1.5830564573895873e-05, "loss": 0.7779, "step": 2707 }, { "epoch": 0.32, "learning_rate": 1.5827425900612855e-05, "loss": 0.7813, "step": 2708 }, { "epoch": 0.32, "learning_rate": 1.5824286357819093e-05, "loss": 0.8237, "step": 2709 }, { "epoch": 0.32, "learning_rate": 1.582114594598303e-05, "loss": 0.7718, "step": 2710 }, { "epoch": 0.32, "learning_rate": 1.581800466557325e-05, "loss": 0.8376, "step": 2711 }, { "epoch": 0.32, "learning_rate": 1.5814862517058465e-05, "loss": 0.8058, "step": 2712 }, { "epoch": 0.32, "learning_rate": 1.5811719500907518e-05, "loss": 0.7868, "step": 2713 }, { "epoch": 0.32, "learning_rate": 1.580857561758937e-05, "loss": 0.8086, "step": 2714 }, { "epoch": 0.32, "learning_rate": 1.5805430867573125e-05, "loss": 0.8253, "step": 2715 }, { "epoch": 0.32, "learning_rate": 1.5802285251328016e-05, "loss": 0.8599, "step": 2716 }, { "epoch": 0.32, "learning_rate": 1.5799138769323393e-05, "loss": 0.8092, "step": 2717 }, { "epoch": 0.32, "learning_rate": 1.5795991422028746e-05, "loss": 0.7628, "step": 2718 }, { "epoch": 0.32, "learning_rate": 1.5792843209913694e-05, "loss": 0.7584, "step": 2719 }, { "epoch": 0.32, "learning_rate": 1.578969413344798e-05, "loss": 0.7461, "step": 2720 }, { "epoch": 0.32, "learning_rate": 1.578654419310147e-05, "loss": 0.7706, "step": 2721 }, { "epoch": 0.32, "learning_rate": 1.5783393389344183e-05, "loss": 0.803, "step": 2722 }, { "epoch": 0.32, "learning_rate": 1.5780241722646238e-05, "loss": 0.7656, "step": 2723 }, { "epoch": 0.32, "learning_rate": 1.57770891934779e-05, "loss": 0.7779, "step": 2724 }, { "epoch": 0.32, "learning_rate": 1.577393580230955e-05, "loss": 0.8359, "step": 2725 }, { "epoch": 0.33, "learning_rate": 1.5770781549611724e-05, "loss": 0.7556, "step": 2726 }, { "epoch": 0.33, "learning_rate": 1.5767626435855056e-05, "loss": 0.8488, "step": 2727 }, { "epoch": 0.33, "learning_rate": 1.5764470461510315e-05, "loss": 0.7349, "step": 2728 }, { "epoch": 0.33, "learning_rate": 1.5761313627048418e-05, "loss": 0.8326, "step": 2729 }, { "epoch": 0.33, "learning_rate": 1.575815593294039e-05, "loss": 0.8142, "step": 2730 }, { "epoch": 0.33, "learning_rate": 1.5754997379657385e-05, "loss": 0.8516, "step": 2731 }, { "epoch": 0.33, "learning_rate": 1.5751837967670702e-05, "loss": 0.8354, "step": 2732 }, { "epoch": 0.33, "learning_rate": 1.574867769745175e-05, "loss": 0.8103, "step": 2733 }, { "epoch": 0.33, "learning_rate": 1.574551656947208e-05, "loss": 0.8493, "step": 2734 }, { "epoch": 0.33, "learning_rate": 1.5742354584203355e-05, "loss": 0.7946, "step": 2735 }, { "epoch": 0.33, "learning_rate": 1.5739191742117382e-05, "loss": 0.7935, "step": 2736 }, { "epoch": 0.33, "learning_rate": 1.5736028043686083e-05, "loss": 0.8147, "step": 2737 }, { "epoch": 0.33, "learning_rate": 1.5732863489381524e-05, "loss": 0.8086, "step": 2738 }, { "epoch": 0.33, "learning_rate": 1.5729698079675874e-05, "loss": 0.7935, "step": 2739 }, { "epoch": 0.33, "learning_rate": 1.5726531815041455e-05, "loss": 0.7924, "step": 2740 }, { "epoch": 0.33, "learning_rate": 1.5723364695950703e-05, "loss": 0.8248, "step": 2741 }, { "epoch": 0.33, "learning_rate": 1.5720196722876184e-05, "loss": 0.7963, "step": 2742 }, { "epoch": 0.33, "learning_rate": 1.571702789629059e-05, "loss": 0.7545, "step": 2743 }, { "epoch": 0.33, "learning_rate": 1.5713858216666742e-05, "loss": 0.8298, "step": 2744 }, { "epoch": 0.33, "learning_rate": 1.5710687684477594e-05, "loss": 0.7891, "step": 2745 }, { "epoch": 0.33, "learning_rate": 1.570751630019621e-05, "loss": 0.7584, "step": 2746 }, { "epoch": 0.33, "learning_rate": 1.5704344064295803e-05, "loss": 0.7807, "step": 2747 }, { "epoch": 0.33, "learning_rate": 1.57011709772497e-05, "loss": 0.7193, "step": 2748 }, { "epoch": 0.33, "learning_rate": 1.5697997039531356e-05, "loss": 0.8041, "step": 2749 }, { "epoch": 0.33, "learning_rate": 1.5694822251614353e-05, "loss": 0.8164, "step": 2750 }, { "epoch": 0.33, "learning_rate": 1.5691646613972404e-05, "loss": 0.7946, "step": 2751 }, { "epoch": 0.33, "learning_rate": 1.5688470127079345e-05, "loss": 0.8281, "step": 2752 }, { "epoch": 0.33, "learning_rate": 1.568529279140914e-05, "loss": 0.755, "step": 2753 }, { "epoch": 0.33, "learning_rate": 1.568211460743588e-05, "loss": 0.8069, "step": 2754 }, { "epoch": 0.33, "learning_rate": 1.5678935575633785e-05, "loss": 0.8097, "step": 2755 }, { "epoch": 0.33, "learning_rate": 1.567575569647719e-05, "loss": 0.8465, "step": 2756 }, { "epoch": 0.33, "learning_rate": 1.5672574970440578e-05, "loss": 0.7561, "step": 2757 }, { "epoch": 0.33, "learning_rate": 1.5669393397998532e-05, "loss": 0.745, "step": 2758 }, { "epoch": 0.33, "learning_rate": 1.5666210979625784e-05, "loss": 0.7958, "step": 2759 }, { "epoch": 0.33, "learning_rate": 1.566302771579718e-05, "loss": 0.8532, "step": 2760 }, { "epoch": 0.33, "learning_rate": 1.5659843606987696e-05, "loss": 0.8465, "step": 2761 }, { "epoch": 0.33, "learning_rate": 1.565665865367243e-05, "loss": 0.8248, "step": 2762 }, { "epoch": 0.33, "learning_rate": 1.5653472856326608e-05, "loss": 0.7567, "step": 2763 }, { "epoch": 0.33, "learning_rate": 1.565028621542559e-05, "loss": 0.8203, "step": 2764 }, { "epoch": 0.33, "learning_rate": 1.5647098731444852e-05, "loss": 0.7561, "step": 2765 }, { "epoch": 0.33, "learning_rate": 1.5643910404859995e-05, "loss": 0.8237, "step": 2766 }, { "epoch": 0.33, "learning_rate": 1.564072123614676e-05, "loss": 0.8114, "step": 2767 }, { "epoch": 0.33, "learning_rate": 1.5637531225780988e-05, "loss": 0.8186, "step": 2768 }, { "epoch": 0.33, "learning_rate": 1.563434037423867e-05, "loss": 0.769, "step": 2769 }, { "epoch": 0.33, "learning_rate": 1.5631148681995914e-05, "loss": 0.7974, "step": 2770 }, { "epoch": 0.33, "learning_rate": 1.562795614952895e-05, "loss": 0.7779, "step": 2771 }, { "epoch": 0.33, "learning_rate": 1.5624762777314132e-05, "loss": 0.7525, "step": 2772 }, { "epoch": 0.33, "learning_rate": 1.5621568565827955e-05, "loss": 0.7628, "step": 2773 }, { "epoch": 0.33, "learning_rate": 1.5618373515547016e-05, "loss": 0.8108, "step": 2774 }, { "epoch": 0.33, "learning_rate": 1.5615177626948054e-05, "loss": 0.7718, "step": 2775 }, { "epoch": 0.33, "learning_rate": 1.5611980900507927e-05, "loss": 0.8343, "step": 2776 }, { "epoch": 0.33, "learning_rate": 1.560878333670362e-05, "loss": 0.7584, "step": 2777 }, { "epoch": 0.33, "learning_rate": 1.560558493601224e-05, "loss": 0.8488, "step": 2778 }, { "epoch": 0.33, "learning_rate": 1.560238569891102e-05, "loss": 0.8025, "step": 2779 }, { "epoch": 0.33, "learning_rate": 1.559918562587732e-05, "loss": 0.8438, "step": 2780 }, { "epoch": 0.33, "learning_rate": 1.5595984717388623e-05, "loss": 0.7701, "step": 2781 }, { "epoch": 0.33, "learning_rate": 1.5592782973922537e-05, "loss": 0.779, "step": 2782 }, { "epoch": 0.33, "learning_rate": 1.5589580395956796e-05, "loss": 0.8438, "step": 2783 }, { "epoch": 0.33, "learning_rate": 1.5586376983969255e-05, "loss": 0.7952, "step": 2784 }, { "epoch": 0.33, "learning_rate": 1.5583172738437892e-05, "loss": 0.8097, "step": 2785 }, { "epoch": 0.33, "learning_rate": 1.557996765984082e-05, "loss": 0.8075, "step": 2786 }, { "epoch": 0.33, "learning_rate": 1.5576761748656264e-05, "loss": 0.827, "step": 2787 }, { "epoch": 0.33, "learning_rate": 1.557355500536258e-05, "loss": 0.7522, "step": 2788 }, { "epoch": 0.33, "learning_rate": 1.5570347430438245e-05, "loss": 0.8571, "step": 2789 }, { "epoch": 0.33, "learning_rate": 1.5567139024361866e-05, "loss": 0.8359, "step": 2790 }, { "epoch": 0.33, "learning_rate": 1.556392978761216e-05, "loss": 0.7902, "step": 2791 }, { "epoch": 0.33, "learning_rate": 1.5560719720667988e-05, "loss": 0.7868, "step": 2792 }, { "epoch": 0.33, "learning_rate": 1.555750882400832e-05, "loss": 0.7952, "step": 2793 }, { "epoch": 0.33, "learning_rate": 1.5554297098112256e-05, "loss": 0.7706, "step": 2794 }, { "epoch": 0.33, "learning_rate": 1.5551084543459016e-05, "loss": 0.8477, "step": 2795 }, { "epoch": 0.33, "learning_rate": 1.5547871160527944e-05, "loss": 0.8359, "step": 2796 }, { "epoch": 0.33, "learning_rate": 1.554465694979851e-05, "loss": 0.8041, "step": 2797 }, { "epoch": 0.33, "learning_rate": 1.554144191175031e-05, "loss": 0.7985, "step": 2798 }, { "epoch": 0.33, "learning_rate": 1.5538226046863058e-05, "loss": 0.8365, "step": 2799 }, { "epoch": 0.33, "learning_rate": 1.553500935561659e-05, "loss": 0.8304, "step": 2800 }, { "epoch": 0.33, "learning_rate": 1.553179183849088e-05, "loss": 0.8259, "step": 2801 }, { "epoch": 0.33, "learning_rate": 1.5528573495966e-05, "loss": 0.8544, "step": 2802 }, { "epoch": 0.33, "learning_rate": 1.5525354328522162e-05, "loss": 0.8315, "step": 2803 }, { "epoch": 0.33, "learning_rate": 1.5522134336639704e-05, "loss": 0.8594, "step": 2804 }, { "epoch": 0.33, "learning_rate": 1.5518913520799082e-05, "loss": 0.8002, "step": 2805 }, { "epoch": 0.33, "learning_rate": 1.551569188148087e-05, "loss": 0.7863, "step": 2806 }, { "epoch": 0.33, "learning_rate": 1.5512469419165766e-05, "loss": 0.7946, "step": 2807 }, { "epoch": 0.33, "learning_rate": 1.5509246134334604e-05, "loss": 0.8359, "step": 2808 }, { "epoch": 0.34, "learning_rate": 1.550602202746832e-05, "loss": 0.8131, "step": 2809 }, { "epoch": 0.34, "learning_rate": 1.550279709904799e-05, "loss": 0.7712, "step": 2810 }, { "epoch": 0.34, "learning_rate": 1.5499571349554804e-05, "loss": 0.7517, "step": 2811 }, { "epoch": 0.34, "learning_rate": 1.5496344779470075e-05, "loss": 0.7991, "step": 2812 }, { "epoch": 0.34, "learning_rate": 1.549311738927524e-05, "loss": 0.8069, "step": 2813 }, { "epoch": 0.34, "learning_rate": 1.5489889179451864e-05, "loss": 0.7935, "step": 2814 }, { "epoch": 0.34, "learning_rate": 1.548666015048162e-05, "loss": 0.8382, "step": 2815 }, { "epoch": 0.34, "learning_rate": 1.5483430302846317e-05, "loss": 0.7885, "step": 2816 }, { "epoch": 0.34, "learning_rate": 1.548019963702788e-05, "loss": 0.7779, "step": 2817 }, { "epoch": 0.34, "learning_rate": 1.547696815350835e-05, "loss": 0.8158, "step": 2818 }, { "epoch": 0.34, "learning_rate": 1.5473735852769908e-05, "loss": 0.7835, "step": 2819 }, { "epoch": 0.34, "learning_rate": 1.547050273529484e-05, "loss": 0.7991, "step": 2820 }, { "epoch": 0.34, "learning_rate": 1.5467268801565563e-05, "loss": 0.7734, "step": 2821 }, { "epoch": 0.34, "learning_rate": 1.546403405206461e-05, "loss": 0.7718, "step": 2822 }, { "epoch": 0.34, "learning_rate": 1.5460798487274636e-05, "loss": 0.7651, "step": 2823 }, { "epoch": 0.34, "learning_rate": 1.545756210767842e-05, "loss": 0.7238, "step": 2824 }, { "epoch": 0.34, "learning_rate": 1.5454324913758873e-05, "loss": 0.7701, "step": 2825 }, { "epoch": 0.34, "learning_rate": 1.5451086905999004e-05, "loss": 0.8052, "step": 2826 }, { "epoch": 0.34, "learning_rate": 1.5447848084881964e-05, "loss": 0.8164, "step": 2827 }, { "epoch": 0.34, "learning_rate": 1.5444608450891013e-05, "loss": 0.7946, "step": 2828 }, { "epoch": 0.34, "learning_rate": 1.544136800450954e-05, "loss": 0.8248, "step": 2829 }, { "epoch": 0.34, "learning_rate": 1.5438126746221053e-05, "loss": 0.8281, "step": 2830 }, { "epoch": 0.34, "learning_rate": 1.5434884676509175e-05, "loss": 0.7372, "step": 2831 }, { "epoch": 0.34, "learning_rate": 1.5431641795857665e-05, "loss": 0.8499, "step": 2832 }, { "epoch": 0.34, "learning_rate": 1.5428398104750383e-05, "loss": 0.8337, "step": 2833 }, { "epoch": 0.34, "learning_rate": 1.5425153603671326e-05, "loss": 0.7857, "step": 2834 }, { "epoch": 0.34, "learning_rate": 1.5421908293104612e-05, "loss": 0.8153, "step": 2835 }, { "epoch": 0.34, "learning_rate": 1.541866217353446e-05, "loss": 0.9124, "step": 2836 }, { "epoch": 0.34, "learning_rate": 1.5415415245445234e-05, "loss": 0.8142, "step": 2837 }, { "epoch": 0.34, "learning_rate": 1.541216750932141e-05, "loss": 0.808, "step": 2838 }, { "epoch": 0.34, "learning_rate": 1.5408918965647575e-05, "loss": 0.7706, "step": 2839 }, { "epoch": 0.34, "learning_rate": 1.540566961490845e-05, "loss": 0.8365, "step": 2840 }, { "epoch": 0.34, "learning_rate": 1.5402419457588867e-05, "loss": 0.8086, "step": 2841 }, { "epoch": 0.34, "learning_rate": 1.539916849417379e-05, "loss": 0.8577, "step": 2842 }, { "epoch": 0.34, "learning_rate": 1.5395916725148287e-05, "loss": 0.8689, "step": 2843 }, { "epoch": 0.34, "learning_rate": 1.539266415099756e-05, "loss": 0.7829, "step": 2844 }, { "epoch": 0.34, "learning_rate": 1.538941077220692e-05, "loss": 0.726, "step": 2845 }, { "epoch": 0.34, "learning_rate": 1.5386156589261812e-05, "loss": 0.7662, "step": 2846 }, { "epoch": 0.34, "learning_rate": 1.5382901602647788e-05, "loss": 0.8276, "step": 2847 }, { "epoch": 0.34, "learning_rate": 1.5379645812850527e-05, "loss": 0.8516, "step": 2848 }, { "epoch": 0.34, "learning_rate": 1.5376389220355822e-05, "loss": 0.8426, "step": 2849 }, { "epoch": 0.34, "learning_rate": 1.5373131825649595e-05, "loss": 0.7706, "step": 2850 }, { "epoch": 0.34, "learning_rate": 1.5369873629217872e-05, "loss": 0.8622, "step": 2851 }, { "epoch": 0.34, "learning_rate": 1.5366614631546825e-05, "loss": 0.8633, "step": 2852 }, { "epoch": 0.34, "learning_rate": 1.5363354833122715e-05, "loss": 0.8231, "step": 2853 }, { "epoch": 0.34, "learning_rate": 1.5360094234431942e-05, "loss": 0.7974, "step": 2854 }, { "epoch": 0.34, "learning_rate": 1.5356832835961023e-05, "loss": 0.7718, "step": 2855 }, { "epoch": 0.34, "learning_rate": 1.5353570638196584e-05, "loss": 0.8443, "step": 2856 }, { "epoch": 0.34, "learning_rate": 1.5350307641625388e-05, "loss": 0.8164, "step": 2857 }, { "epoch": 0.34, "learning_rate": 1.53470438467343e-05, "loss": 0.714, "step": 2858 }, { "epoch": 0.34, "learning_rate": 1.534377925401031e-05, "loss": 0.8142, "step": 2859 }, { "epoch": 0.34, "learning_rate": 1.5340513863940533e-05, "loss": 0.7656, "step": 2860 }, { "epoch": 0.34, "learning_rate": 1.5337247677012196e-05, "loss": 0.822, "step": 2861 }, { "epoch": 0.34, "learning_rate": 1.5333980693712646e-05, "loss": 0.8013, "step": 2862 }, { "epoch": 0.34, "learning_rate": 1.5330712914529352e-05, "loss": 0.726, "step": 2863 }, { "epoch": 0.34, "learning_rate": 1.53274443399499e-05, "loss": 0.7489, "step": 2864 }, { "epoch": 0.34, "learning_rate": 1.5324174970461992e-05, "loss": 0.7935, "step": 2865 }, { "epoch": 0.34, "learning_rate": 1.532090480655345e-05, "loss": 0.7829, "step": 2866 }, { "epoch": 0.34, "learning_rate": 1.5317633848712218e-05, "loss": 0.7723, "step": 2867 }, { "epoch": 0.34, "learning_rate": 1.531436209742636e-05, "loss": 0.7924, "step": 2868 }, { "epoch": 0.34, "learning_rate": 1.5311089553184045e-05, "loss": 0.7773, "step": 2869 }, { "epoch": 0.34, "learning_rate": 1.5307816216473574e-05, "loss": 0.8449, "step": 2870 }, { "epoch": 0.34, "learning_rate": 1.530454208778336e-05, "loss": 0.7405, "step": 2871 }, { "epoch": 0.34, "learning_rate": 1.5301267167601947e-05, "loss": 0.8387, "step": 2872 }, { "epoch": 0.34, "learning_rate": 1.529799145641797e-05, "loss": 0.7941, "step": 2873 }, { "epoch": 0.34, "learning_rate": 1.5294714954720206e-05, "loss": 0.7874, "step": 2874 }, { "epoch": 0.34, "learning_rate": 1.5291437662997545e-05, "loss": 0.8521, "step": 2875 }, { "epoch": 0.34, "learning_rate": 1.5288159581738984e-05, "loss": 0.8147, "step": 2876 }, { "epoch": 0.34, "learning_rate": 1.528488071143365e-05, "loss": 0.8175, "step": 2877 }, { "epoch": 0.34, "learning_rate": 1.5281601052570787e-05, "loss": 0.8471, "step": 2878 }, { "epoch": 0.34, "learning_rate": 1.527832060563975e-05, "loss": 0.8304, "step": 2879 }, { "epoch": 0.34, "learning_rate": 1.5275039371130015e-05, "loss": 0.8013, "step": 2880 }, { "epoch": 0.34, "learning_rate": 1.5271757349531172e-05, "loss": 0.7405, "step": 2881 }, { "epoch": 0.34, "learning_rate": 1.526847454133294e-05, "loss": 0.7662, "step": 2882 }, { "epoch": 0.34, "learning_rate": 1.5265190947025136e-05, "loss": 0.8125, "step": 2883 }, { "epoch": 0.34, "learning_rate": 1.5261906567097713e-05, "loss": 0.75, "step": 2884 }, { "epoch": 0.34, "learning_rate": 1.5258621402040737e-05, "loss": 0.8471, "step": 2885 }, { "epoch": 0.34, "learning_rate": 1.5255335452344378e-05, "loss": 0.7338, "step": 2886 }, { "epoch": 0.34, "learning_rate": 1.5252048718498937e-05, "loss": 0.7533, "step": 2887 }, { "epoch": 0.34, "learning_rate": 1.5248761200994832e-05, "loss": 0.7333, "step": 2888 }, { "epoch": 0.34, "learning_rate": 1.5245472900322587e-05, "loss": 0.774, "step": 2889 }, { "epoch": 0.34, "learning_rate": 1.5242183816972856e-05, "loss": 0.7985, "step": 2890 }, { "epoch": 0.34, "learning_rate": 1.5238893951436397e-05, "loss": 0.7874, "step": 2891 }, { "epoch": 0.34, "learning_rate": 1.5235603304204096e-05, "loss": 0.793, "step": 2892 }, { "epoch": 0.35, "learning_rate": 1.5232311875766953e-05, "loss": 0.8164, "step": 2893 }, { "epoch": 0.35, "learning_rate": 1.5229019666616074e-05, "loss": 0.8214, "step": 2894 }, { "epoch": 0.35, "learning_rate": 1.5225726677242696e-05, "loss": 0.7885, "step": 2895 }, { "epoch": 0.35, "learning_rate": 1.5222432908138163e-05, "loss": 0.8454, "step": 2896 }, { "epoch": 0.35, "learning_rate": 1.5219138359793943e-05, "loss": 0.7946, "step": 2897 }, { "epoch": 0.35, "learning_rate": 1.5215843032701611e-05, "loss": 0.822, "step": 2898 }, { "epoch": 0.35, "learning_rate": 1.5212546927352865e-05, "loss": 0.76, "step": 2899 }, { "epoch": 0.35, "learning_rate": 1.5209250044239521e-05, "loss": 0.7852, "step": 2900 }, { "epoch": 0.35, "learning_rate": 1.5205952383853499e-05, "loss": 0.7935, "step": 2901 }, { "epoch": 0.35, "learning_rate": 1.5202653946686847e-05, "loss": 0.7907, "step": 2902 }, { "epoch": 0.35, "learning_rate": 1.5199354733231731e-05, "loss": 0.7874, "step": 2903 }, { "epoch": 0.35, "learning_rate": 1.519605474398042e-05, "loss": 0.8532, "step": 2904 }, { "epoch": 0.35, "learning_rate": 1.5192753979425306e-05, "loss": 0.7567, "step": 2905 }, { "epoch": 0.35, "learning_rate": 1.5189452440058898e-05, "loss": 0.7679, "step": 2906 }, { "epoch": 0.35, "learning_rate": 1.518615012637382e-05, "loss": 0.7785, "step": 2907 }, { "epoch": 0.35, "learning_rate": 1.5182847038862808e-05, "loss": 0.8477, "step": 2908 }, { "epoch": 0.35, "learning_rate": 1.517954317801872e-05, "loss": 0.7785, "step": 2909 }, { "epoch": 0.35, "learning_rate": 1.517623854433452e-05, "loss": 0.7673, "step": 2910 }, { "epoch": 0.35, "learning_rate": 1.5172933138303298e-05, "loss": 0.8052, "step": 2911 }, { "epoch": 0.35, "learning_rate": 1.516962696041825e-05, "loss": 0.8064, "step": 2912 }, { "epoch": 0.35, "learning_rate": 1.5166320011172695e-05, "loss": 0.779, "step": 2913 }, { "epoch": 0.35, "learning_rate": 1.5163012291060058e-05, "loss": 0.8242, "step": 2914 }, { "epoch": 0.35, "learning_rate": 1.5159703800573886e-05, "loss": 0.7824, "step": 2915 }, { "epoch": 0.35, "learning_rate": 1.5156394540207844e-05, "loss": 0.8265, "step": 2916 }, { "epoch": 0.35, "learning_rate": 1.51530845104557e-05, "loss": 0.7807, "step": 2917 }, { "epoch": 0.35, "learning_rate": 1.5149773711811349e-05, "loss": 0.8019, "step": 2918 }, { "epoch": 0.35, "learning_rate": 1.514646214476879e-05, "loss": 0.7762, "step": 2919 }, { "epoch": 0.35, "learning_rate": 1.514314980982215e-05, "loss": 0.7963, "step": 2920 }, { "epoch": 0.35, "learning_rate": 1.5139836707465655e-05, "loss": 0.7667, "step": 2921 }, { "epoch": 0.35, "learning_rate": 1.5136522838193659e-05, "loss": 0.8075, "step": 2922 }, { "epoch": 0.35, "learning_rate": 1.5133208202500624e-05, "loss": 0.8125, "step": 2923 }, { "epoch": 0.35, "learning_rate": 1.512989280088112e-05, "loss": 0.7561, "step": 2924 }, { "epoch": 0.35, "learning_rate": 1.512657663382985e-05, "loss": 0.7974, "step": 2925 }, { "epoch": 0.35, "learning_rate": 1.5123259701841613e-05, "loss": 0.798, "step": 2926 }, { "epoch": 0.35, "learning_rate": 1.5119942005411325e-05, "loss": 0.7985, "step": 2927 }, { "epoch": 0.35, "learning_rate": 1.511662354503403e-05, "loss": 0.7271, "step": 2928 }, { "epoch": 0.35, "learning_rate": 1.5113304321204867e-05, "loss": 0.7746, "step": 2929 }, { "epoch": 0.35, "learning_rate": 1.5109984334419103e-05, "loss": 0.793, "step": 2930 }, { "epoch": 0.35, "learning_rate": 1.5106663585172108e-05, "loss": 0.8265, "step": 2931 }, { "epoch": 0.35, "learning_rate": 1.5103342073959373e-05, "loss": 0.7997, "step": 2932 }, { "epoch": 0.35, "learning_rate": 1.5100019801276507e-05, "loss": 0.8186, "step": 2933 }, { "epoch": 0.35, "learning_rate": 1.5096696767619219e-05, "loss": 0.8404, "step": 2934 }, { "epoch": 0.35, "learning_rate": 1.5093372973483345e-05, "loss": 0.8186, "step": 2935 }, { "epoch": 0.35, "learning_rate": 1.5090048419364824e-05, "loss": 0.7684, "step": 2936 }, { "epoch": 0.35, "learning_rate": 1.5086723105759716e-05, "loss": 0.8265, "step": 2937 }, { "epoch": 0.35, "learning_rate": 1.5083397033164188e-05, "loss": 0.7852, "step": 2938 }, { "epoch": 0.35, "learning_rate": 1.5080070202074529e-05, "loss": 0.7857, "step": 2939 }, { "epoch": 0.35, "learning_rate": 1.507674261298713e-05, "loss": 0.8331, "step": 2940 }, { "epoch": 0.35, "learning_rate": 1.5073414266398503e-05, "loss": 0.8092, "step": 2941 }, { "epoch": 0.35, "learning_rate": 1.5070085162805273e-05, "loss": 0.7762, "step": 2942 }, { "epoch": 0.35, "learning_rate": 1.5066755302704174e-05, "loss": 0.7807, "step": 2943 }, { "epoch": 0.35, "learning_rate": 1.5063424686592054e-05, "loss": 0.8181, "step": 2944 }, { "epoch": 0.35, "learning_rate": 1.5060093314965879e-05, "loss": 0.8225, "step": 2945 }, { "epoch": 0.35, "learning_rate": 1.5056761188322715e-05, "loss": 0.7969, "step": 2946 }, { "epoch": 0.35, "learning_rate": 1.5053428307159756e-05, "loss": 0.8326, "step": 2947 }, { "epoch": 0.35, "learning_rate": 1.50500946719743e-05, "loss": 0.7294, "step": 2948 }, { "epoch": 0.35, "learning_rate": 1.5046760283263756e-05, "loss": 0.8404, "step": 2949 }, { "epoch": 0.35, "learning_rate": 1.5043425141525652e-05, "loss": 0.8047, "step": 2950 }, { "epoch": 0.35, "learning_rate": 1.5040089247257623e-05, "loss": 0.8214, "step": 2951 }, { "epoch": 0.35, "learning_rate": 1.5036752600957418e-05, "loss": 0.8393, "step": 2952 }, { "epoch": 0.35, "learning_rate": 1.50334152031229e-05, "loss": 0.8092, "step": 2953 }, { "epoch": 0.35, "learning_rate": 1.5030077054252041e-05, "loss": 0.7913, "step": 2954 }, { "epoch": 0.35, "learning_rate": 1.5026738154842925e-05, "loss": 0.808, "step": 2955 }, { "epoch": 0.35, "learning_rate": 1.5023398505393755e-05, "loss": 0.8198, "step": 2956 }, { "epoch": 0.35, "learning_rate": 1.5020058106402833e-05, "loss": 0.7215, "step": 2957 }, { "epoch": 0.35, "learning_rate": 1.5016716958368584e-05, "loss": 0.8354, "step": 2958 }, { "epoch": 0.35, "learning_rate": 1.5013375061789543e-05, "loss": 0.8532, "step": 2959 }, { "epoch": 0.35, "learning_rate": 1.5010032417164353e-05, "loss": 0.7985, "step": 2960 }, { "epoch": 0.35, "learning_rate": 1.500668902499177e-05, "loss": 0.7868, "step": 2961 }, { "epoch": 0.35, "learning_rate": 1.5003344885770657e-05, "loss": 0.8242, "step": 2962 }, { "epoch": 0.35, "learning_rate": 1.5000000000000002e-05, "loss": 0.7868, "step": 2963 }, { "epoch": 0.35, "learning_rate": 1.4996654368178889e-05, "loss": 0.8153, "step": 2964 }, { "epoch": 0.35, "learning_rate": 1.4993307990806524e-05, "loss": 0.731, "step": 2965 }, { "epoch": 0.35, "learning_rate": 1.498996086838222e-05, "loss": 0.8432, "step": 2966 }, { "epoch": 0.35, "learning_rate": 1.4986613001405404e-05, "loss": 0.851, "step": 2967 }, { "epoch": 0.35, "learning_rate": 1.4983264390375602e-05, "loss": 0.8181, "step": 2968 }, { "epoch": 0.35, "learning_rate": 1.497991503579247e-05, "loss": 0.7846, "step": 2969 }, { "epoch": 0.35, "learning_rate": 1.4976564938155757e-05, "loss": 0.793, "step": 2970 }, { "epoch": 0.35, "learning_rate": 1.4973214097965343e-05, "loss": 0.7997, "step": 2971 }, { "epoch": 0.35, "learning_rate": 1.4969862515721197e-05, "loss": 0.7533, "step": 2972 }, { "epoch": 0.35, "learning_rate": 1.4966510191923416e-05, "loss": 0.8237, "step": 2973 }, { "epoch": 0.35, "learning_rate": 1.4963157127072194e-05, "loss": 0.7907, "step": 2974 }, { "epoch": 0.35, "learning_rate": 1.4959803321667843e-05, "loss": 0.7941, "step": 2975 }, { "epoch": 0.35, "learning_rate": 1.495644877621079e-05, "loss": 0.8393, "step": 2976 }, { "epoch": 0.36, "learning_rate": 1.4953093491201562e-05, "loss": 0.784, "step": 2977 }, { "epoch": 0.36, "learning_rate": 1.4949737467140808e-05, "loss": 0.7824, "step": 2978 }, { "epoch": 0.36, "learning_rate": 1.4946380704529273e-05, "loss": 0.7891, "step": 2979 }, { "epoch": 0.36, "learning_rate": 1.4943023203867819e-05, "loss": 0.8309, "step": 2980 }, { "epoch": 0.36, "learning_rate": 1.4939664965657428e-05, "loss": 0.798, "step": 2981 }, { "epoch": 0.36, "learning_rate": 1.4936305990399174e-05, "loss": 0.8103, "step": 2982 }, { "epoch": 0.36, "learning_rate": 1.4932946278594256e-05, "loss": 0.7388, "step": 2983 }, { "epoch": 0.36, "learning_rate": 1.4929585830743971e-05, "loss": 0.8125, "step": 2984 }, { "epoch": 0.36, "learning_rate": 1.4926224647349741e-05, "loss": 0.7623, "step": 2985 }, { "epoch": 0.36, "learning_rate": 1.492286272891308e-05, "loss": 0.7891, "step": 2986 }, { "epoch": 0.36, "learning_rate": 1.4919500075935623e-05, "loss": 0.7801, "step": 2987 }, { "epoch": 0.36, "learning_rate": 1.4916136688919112e-05, "loss": 0.8158, "step": 2988 }, { "epoch": 0.36, "learning_rate": 1.4912772568365395e-05, "loss": 0.7667, "step": 2989 }, { "epoch": 0.36, "learning_rate": 1.4909407714776438e-05, "loss": 0.8092, "step": 2990 }, { "epoch": 0.36, "learning_rate": 1.490604212865431e-05, "loss": 0.8008, "step": 2991 }, { "epoch": 0.36, "learning_rate": 1.4902675810501191e-05, "loss": 0.7667, "step": 2992 }, { "epoch": 0.36, "learning_rate": 1.4899308760819364e-05, "loss": 0.8119, "step": 2993 }, { "epoch": 0.36, "learning_rate": 1.4895940980111232e-05, "loss": 0.7902, "step": 2994 }, { "epoch": 0.36, "learning_rate": 1.48925724688793e-05, "loss": 0.7829, "step": 2995 }, { "epoch": 0.36, "learning_rate": 1.4889203227626186e-05, "loss": 0.7667, "step": 2996 }, { "epoch": 0.36, "learning_rate": 1.4885833256854612e-05, "loss": 0.7835, "step": 2997 }, { "epoch": 0.36, "learning_rate": 1.4882462557067414e-05, "loss": 0.7506, "step": 2998 }, { "epoch": 0.36, "learning_rate": 1.4879091128767533e-05, "loss": 0.7863, "step": 2999 }, { "epoch": 0.36, "learning_rate": 1.4875718972458018e-05, "loss": 0.7718, "step": 3000 }, { "epoch": 0.36, "learning_rate": 1.4872346088642036e-05, "loss": 0.8052, "step": 3001 }, { "epoch": 0.36, "learning_rate": 1.4868972477822845e-05, "loss": 0.7673, "step": 3002 }, { "epoch": 0.36, "learning_rate": 1.4865598140503831e-05, "loss": 0.8527, "step": 3003 }, { "epoch": 0.36, "learning_rate": 1.4862223077188475e-05, "loss": 0.7734, "step": 3004 }, { "epoch": 0.36, "learning_rate": 1.4858847288380369e-05, "loss": 0.8092, "step": 3005 }, { "epoch": 0.36, "learning_rate": 1.485547077458322e-05, "loss": 0.8181, "step": 3006 }, { "epoch": 0.36, "learning_rate": 1.485209353630083e-05, "loss": 0.7104, "step": 3007 }, { "epoch": 0.36, "learning_rate": 1.4848715574037127e-05, "loss": 0.8259, "step": 3008 }, { "epoch": 0.36, "learning_rate": 1.4845336888296127e-05, "loss": 0.8086, "step": 3009 }, { "epoch": 0.36, "learning_rate": 1.4841957479581973e-05, "loss": 0.8823, "step": 3010 }, { "epoch": 0.36, "learning_rate": 1.48385773483989e-05, "loss": 0.8583, "step": 3011 }, { "epoch": 0.36, "learning_rate": 1.483519649525126e-05, "loss": 0.7589, "step": 3012 }, { "epoch": 0.36, "learning_rate": 1.4831814920643513e-05, "loss": 0.8432, "step": 3013 }, { "epoch": 0.36, "learning_rate": 1.4828432625080218e-05, "loss": 0.7684, "step": 3014 }, { "epoch": 0.36, "learning_rate": 1.4825049609066051e-05, "loss": 0.8192, "step": 3015 }, { "epoch": 0.36, "learning_rate": 1.4821665873105797e-05, "loss": 0.8097, "step": 3016 }, { "epoch": 0.36, "learning_rate": 1.4818281417704338e-05, "loss": 0.8343, "step": 3017 }, { "epoch": 0.36, "learning_rate": 1.481489624336667e-05, "loss": 0.7701, "step": 3018 }, { "epoch": 0.36, "learning_rate": 1.4811510350597893e-05, "loss": 0.7701, "step": 3019 }, { "epoch": 0.36, "learning_rate": 1.4808123739903218e-05, "loss": 0.7634, "step": 3020 }, { "epoch": 0.36, "learning_rate": 1.4804736411787963e-05, "loss": 0.7617, "step": 3021 }, { "epoch": 0.36, "learning_rate": 1.4801348366757551e-05, "loss": 0.832, "step": 3022 }, { "epoch": 0.36, "learning_rate": 1.4797959605317514e-05, "loss": 0.7511, "step": 3023 }, { "epoch": 0.36, "learning_rate": 1.4794570127973487e-05, "loss": 0.7801, "step": 3024 }, { "epoch": 0.36, "learning_rate": 1.4791179935231211e-05, "loss": 0.784, "step": 3025 }, { "epoch": 0.36, "learning_rate": 1.4787789027596544e-05, "loss": 0.8248, "step": 3026 }, { "epoch": 0.36, "learning_rate": 1.4784397405575437e-05, "loss": 0.7813, "step": 3027 }, { "epoch": 0.36, "learning_rate": 1.4781005069673962e-05, "loss": 0.7863, "step": 3028 }, { "epoch": 0.36, "learning_rate": 1.477761202039828e-05, "loss": 0.8198, "step": 3029 }, { "epoch": 0.36, "learning_rate": 1.4774218258254678e-05, "loss": 0.8131, "step": 3030 }, { "epoch": 0.36, "learning_rate": 1.4770823783749532e-05, "loss": 0.8309, "step": 3031 }, { "epoch": 0.36, "learning_rate": 1.4767428597389338e-05, "loss": 0.8237, "step": 3032 }, { "epoch": 0.36, "learning_rate": 1.4764032699680686e-05, "loss": 0.8354, "step": 3033 }, { "epoch": 0.36, "learning_rate": 1.476063609113028e-05, "loss": 0.7511, "step": 3034 }, { "epoch": 0.36, "learning_rate": 1.4757238772244933e-05, "loss": 0.774, "step": 3035 }, { "epoch": 0.36, "learning_rate": 1.4753840743531556e-05, "loss": 0.8343, "step": 3036 }, { "epoch": 0.36, "learning_rate": 1.4750442005497166e-05, "loss": 0.7494, "step": 3037 }, { "epoch": 0.36, "learning_rate": 1.4747042558648892e-05, "loss": 0.7907, "step": 3038 }, { "epoch": 0.36, "learning_rate": 1.4743642403493965e-05, "loss": 0.7824, "step": 3039 }, { "epoch": 0.36, "learning_rate": 1.4740241540539724e-05, "loss": 0.8125, "step": 3040 }, { "epoch": 0.36, "learning_rate": 1.4736839970293613e-05, "loss": 0.7695, "step": 3041 }, { "epoch": 0.36, "learning_rate": 1.4733437693263177e-05, "loss": 0.769, "step": 3042 }, { "epoch": 0.36, "learning_rate": 1.4730034709956072e-05, "loss": 0.8979, "step": 3043 }, { "epoch": 0.36, "learning_rate": 1.4726631020880055e-05, "loss": 0.8527, "step": 3044 }, { "epoch": 0.36, "learning_rate": 1.4723226626542996e-05, "loss": 0.8013, "step": 3045 }, { "epoch": 0.36, "learning_rate": 1.4719821527452863e-05, "loss": 0.803, "step": 3046 }, { "epoch": 0.36, "learning_rate": 1.4716415724117728e-05, "loss": 0.7779, "step": 3047 }, { "epoch": 0.36, "learning_rate": 1.4713009217045773e-05, "loss": 0.8438, "step": 3048 }, { "epoch": 0.36, "learning_rate": 1.4709602006745285e-05, "loss": 0.7723, "step": 3049 }, { "epoch": 0.36, "learning_rate": 1.470619409372465e-05, "loss": 0.8008, "step": 3050 }, { "epoch": 0.36, "learning_rate": 1.470278547849237e-05, "loss": 0.8041, "step": 3051 }, { "epoch": 0.36, "learning_rate": 1.4699376161557038e-05, "loss": 0.8331, "step": 3052 }, { "epoch": 0.36, "learning_rate": 1.469596614342736e-05, "loss": 0.8075, "step": 3053 }, { "epoch": 0.36, "learning_rate": 1.4692555424612147e-05, "loss": 0.7489, "step": 3054 }, { "epoch": 0.36, "learning_rate": 1.4689144005620314e-05, "loss": 0.8114, "step": 3055 }, { "epoch": 0.36, "learning_rate": 1.4685731886960876e-05, "loss": 0.7751, "step": 3056 }, { "epoch": 0.36, "learning_rate": 1.4682319069142956e-05, "loss": 0.8387, "step": 3057 }, { "epoch": 0.36, "learning_rate": 1.4678905552675779e-05, "loss": 0.846, "step": 3058 }, { "epoch": 0.36, "learning_rate": 1.4675491338068683e-05, "loss": 0.7729, "step": 3059 }, { "epoch": 0.36, "learning_rate": 1.4672076425831095e-05, "loss": 0.846, "step": 3060 }, { "epoch": 0.37, "learning_rate": 1.4668660816472562e-05, "loss": 0.8164, "step": 3061 }, { "epoch": 0.37, "learning_rate": 1.466524451050272e-05, "loss": 0.793, "step": 3062 }, { "epoch": 0.37, "learning_rate": 1.4661827508431321e-05, "loss": 0.7813, "step": 3063 }, { "epoch": 0.37, "learning_rate": 1.4658409810768216e-05, "loss": 0.7924, "step": 3064 }, { "epoch": 0.37, "learning_rate": 1.4654991418023356e-05, "loss": 0.8371, "step": 3065 }, { "epoch": 0.37, "learning_rate": 1.4651572330706805e-05, "loss": 0.8164, "step": 3066 }, { "epoch": 0.37, "learning_rate": 1.4648152549328722e-05, "loss": 0.8438, "step": 3067 }, { "epoch": 0.37, "learning_rate": 1.4644732074399374e-05, "loss": 0.7461, "step": 3068 }, { "epoch": 0.37, "learning_rate": 1.4641310906429131e-05, "loss": 0.8516, "step": 3069 }, { "epoch": 0.37, "learning_rate": 1.4637889045928463e-05, "loss": 0.7891, "step": 3070 }, { "epoch": 0.37, "learning_rate": 1.4634466493407953e-05, "loss": 0.8298, "step": 3071 }, { "epoch": 0.37, "learning_rate": 1.4631043249378272e-05, "loss": 0.7679, "step": 3072 }, { "epoch": 0.37, "learning_rate": 1.4627619314350207e-05, "loss": 0.8477, "step": 3073 }, { "epoch": 0.37, "learning_rate": 1.4624194688834643e-05, "loss": 0.8158, "step": 3074 }, { "epoch": 0.37, "learning_rate": 1.4620769373342568e-05, "loss": 0.8404, "step": 3075 }, { "epoch": 0.37, "learning_rate": 1.4617343368385073e-05, "loss": 0.7991, "step": 3076 }, { "epoch": 0.37, "learning_rate": 1.4613916674473352e-05, "loss": 0.8504, "step": 3077 }, { "epoch": 0.37, "learning_rate": 1.4610489292118706e-05, "loss": 0.8315, "step": 3078 }, { "epoch": 0.37, "learning_rate": 1.4607061221832534e-05, "loss": 0.841, "step": 3079 }, { "epoch": 0.37, "learning_rate": 1.4603632464126338e-05, "loss": 0.7416, "step": 3080 }, { "epoch": 0.37, "learning_rate": 1.4600203019511724e-05, "loss": 0.8443, "step": 3081 }, { "epoch": 0.37, "learning_rate": 1.4596772888500395e-05, "loss": 0.7813, "step": 3082 }, { "epoch": 0.37, "learning_rate": 1.4593342071604164e-05, "loss": 0.8309, "step": 3083 }, { "epoch": 0.37, "learning_rate": 1.4589910569334947e-05, "loss": 0.7997, "step": 3084 }, { "epoch": 0.37, "learning_rate": 1.4586478382204754e-05, "loss": 0.8354, "step": 3085 }, { "epoch": 0.37, "learning_rate": 1.4583045510725706e-05, "loss": 0.8315, "step": 3086 }, { "epoch": 0.37, "learning_rate": 1.457961195541002e-05, "loss": 0.8013, "step": 3087 }, { "epoch": 0.37, "learning_rate": 1.4576177716770017e-05, "loss": 0.8538, "step": 3088 }, { "epoch": 0.37, "learning_rate": 1.457274279531812e-05, "loss": 0.7126, "step": 3089 }, { "epoch": 0.37, "learning_rate": 1.4569307191566852e-05, "loss": 0.8265, "step": 3090 }, { "epoch": 0.37, "learning_rate": 1.4565870906028845e-05, "loss": 0.7751, "step": 3091 }, { "epoch": 0.37, "learning_rate": 1.4562433939216825e-05, "loss": 0.7863, "step": 3092 }, { "epoch": 0.37, "learning_rate": 1.4558996291643616e-05, "loss": 0.8304, "step": 3093 }, { "epoch": 0.37, "learning_rate": 1.4555557963822162e-05, "loss": 0.7506, "step": 3094 }, { "epoch": 0.37, "learning_rate": 1.4552118956265484e-05, "loss": 0.8075, "step": 3095 }, { "epoch": 0.37, "learning_rate": 1.4548679269486727e-05, "loss": 0.7634, "step": 3096 }, { "epoch": 0.37, "learning_rate": 1.4545238903999116e-05, "loss": 0.8203, "step": 3097 }, { "epoch": 0.37, "learning_rate": 1.4541797860316e-05, "loss": 0.798, "step": 3098 }, { "epoch": 0.37, "learning_rate": 1.4538356138950811e-05, "loss": 0.827, "step": 3099 }, { "epoch": 0.37, "learning_rate": 1.4534913740417087e-05, "loss": 0.7985, "step": 3100 }, { "epoch": 0.37, "learning_rate": 1.4531470665228471e-05, "loss": 0.7723, "step": 3101 }, { "epoch": 0.37, "learning_rate": 1.4528026913898706e-05, "loss": 0.8242, "step": 3102 }, { "epoch": 0.37, "learning_rate": 1.452458248694163e-05, "loss": 0.7813, "step": 3103 }, { "epoch": 0.37, "learning_rate": 1.4521137384871192e-05, "loss": 0.7623, "step": 3104 }, { "epoch": 0.37, "learning_rate": 1.4517691608201432e-05, "loss": 0.7628, "step": 3105 }, { "epoch": 0.37, "learning_rate": 1.4514245157446498e-05, "loss": 0.7746, "step": 3106 }, { "epoch": 0.37, "learning_rate": 1.451079803312063e-05, "loss": 0.7271, "step": 3107 }, { "epoch": 0.37, "learning_rate": 1.4507350235738176e-05, "loss": 0.7896, "step": 3108 }, { "epoch": 0.37, "learning_rate": 1.4503901765813587e-05, "loss": 0.7673, "step": 3109 }, { "epoch": 0.37, "learning_rate": 1.45004526238614e-05, "loss": 0.846, "step": 3110 }, { "epoch": 0.37, "learning_rate": 1.4497002810396273e-05, "loss": 0.7221, "step": 3111 }, { "epoch": 0.37, "learning_rate": 1.4493552325932945e-05, "loss": 0.8371, "step": 3112 }, { "epoch": 0.37, "learning_rate": 1.4490101170986263e-05, "loss": 0.7941, "step": 3113 }, { "epoch": 0.37, "learning_rate": 1.4486649346071179e-05, "loss": 0.7818, "step": 3114 }, { "epoch": 0.37, "learning_rate": 1.4483196851702736e-05, "loss": 0.8304, "step": 3115 }, { "epoch": 0.37, "learning_rate": 1.4479743688396086e-05, "loss": 0.7634, "step": 3116 }, { "epoch": 0.37, "learning_rate": 1.4476289856666467e-05, "loss": 0.779, "step": 3117 }, { "epoch": 0.37, "learning_rate": 1.4472835357029236e-05, "loss": 0.8354, "step": 3118 }, { "epoch": 0.37, "learning_rate": 1.4469380189999833e-05, "loss": 0.7757, "step": 3119 }, { "epoch": 0.37, "learning_rate": 1.4465924356093802e-05, "loss": 0.7656, "step": 3120 }, { "epoch": 0.37, "learning_rate": 1.4462467855826793e-05, "loss": 0.7891, "step": 3121 }, { "epoch": 0.37, "learning_rate": 1.4459010689714547e-05, "loss": 0.8259, "step": 3122 }, { "epoch": 0.37, "learning_rate": 1.4455552858272915e-05, "loss": 0.7589, "step": 3123 }, { "epoch": 0.37, "learning_rate": 1.4452094362017831e-05, "loss": 0.7907, "step": 3124 }, { "epoch": 0.37, "learning_rate": 1.4448635201465341e-05, "loss": 0.8175, "step": 3125 }, { "epoch": 0.37, "learning_rate": 1.4445175377131593e-05, "loss": 0.7472, "step": 3126 }, { "epoch": 0.37, "learning_rate": 1.4441714889532818e-05, "loss": 0.8393, "step": 3127 }, { "epoch": 0.37, "learning_rate": 1.443825373918536e-05, "loss": 0.7723, "step": 3128 }, { "epoch": 0.37, "learning_rate": 1.4434791926605658e-05, "loss": 0.8432, "step": 3129 }, { "epoch": 0.37, "learning_rate": 1.443132945231025e-05, "loss": 0.8025, "step": 3130 }, { "epoch": 0.37, "learning_rate": 1.442786631681577e-05, "loss": 0.8125, "step": 3131 }, { "epoch": 0.37, "learning_rate": 1.4424402520638954e-05, "loss": 0.7896, "step": 3132 }, { "epoch": 0.37, "learning_rate": 1.4420938064296633e-05, "loss": 0.8387, "step": 3133 }, { "epoch": 0.37, "learning_rate": 1.4417472948305743e-05, "loss": 0.8421, "step": 3134 }, { "epoch": 0.37, "learning_rate": 1.4414007173183312e-05, "loss": 0.7467, "step": 3135 }, { "epoch": 0.37, "learning_rate": 1.4410540739446468e-05, "loss": 0.8075, "step": 3136 }, { "epoch": 0.37, "learning_rate": 1.4407073647612442e-05, "loss": 0.88, "step": 3137 }, { "epoch": 0.37, "learning_rate": 1.4403605898198551e-05, "loss": 0.7941, "step": 3138 }, { "epoch": 0.37, "learning_rate": 1.4400137491722225e-05, "loss": 0.8845, "step": 3139 }, { "epoch": 0.37, "learning_rate": 1.4396668428700982e-05, "loss": 0.7472, "step": 3140 }, { "epoch": 0.37, "learning_rate": 1.4393198709652442e-05, "loss": 0.7718, "step": 3141 }, { "epoch": 0.37, "learning_rate": 1.4389728335094327e-05, "loss": 0.769, "step": 3142 }, { "epoch": 0.37, "learning_rate": 1.4386257305544444e-05, "loss": 0.721, "step": 3143 }, { "epoch": 0.37, "learning_rate": 1.4382785621520711e-05, "loss": 0.8147, "step": 3144 }, { "epoch": 0.38, "learning_rate": 1.4379313283541133e-05, "loss": 0.7952, "step": 3145 }, { "epoch": 0.38, "learning_rate": 1.4375840292123823e-05, "loss": 0.8482, "step": 3146 }, { "epoch": 0.38, "learning_rate": 1.4372366647786986e-05, "loss": 0.7656, "step": 3147 }, { "epoch": 0.38, "learning_rate": 1.4368892351048923e-05, "loss": 0.8158, "step": 3148 }, { "epoch": 0.38, "learning_rate": 1.4365417402428034e-05, "loss": 0.8242, "step": 3149 }, { "epoch": 0.38, "learning_rate": 1.4361941802442816e-05, "loss": 0.8449, "step": 3150 }, { "epoch": 0.38, "learning_rate": 1.4358465551611864e-05, "loss": 0.7556, "step": 3151 }, { "epoch": 0.38, "learning_rate": 1.4354988650453874e-05, "loss": 0.7706, "step": 3152 }, { "epoch": 0.38, "learning_rate": 1.4351511099487624e-05, "loss": 0.8108, "step": 3153 }, { "epoch": 0.38, "learning_rate": 1.4348032899232015e-05, "loss": 0.7634, "step": 3154 }, { "epoch": 0.38, "learning_rate": 1.4344554050206017e-05, "loss": 0.827, "step": 3155 }, { "epoch": 0.38, "learning_rate": 1.4341074552928711e-05, "loss": 0.7539, "step": 3156 }, { "epoch": 0.38, "learning_rate": 1.433759440791928e-05, "loss": 0.8393, "step": 3157 }, { "epoch": 0.38, "learning_rate": 1.433411361569699e-05, "loss": 0.8443, "step": 3158 }, { "epoch": 0.38, "learning_rate": 1.4330632176781215e-05, "loss": 0.7779, "step": 3159 }, { "epoch": 0.38, "learning_rate": 1.4327150091691415e-05, "loss": 0.7539, "step": 3160 }, { "epoch": 0.38, "learning_rate": 1.432366736094716e-05, "loss": 0.7757, "step": 3161 }, { "epoch": 0.38, "learning_rate": 1.4320183985068104e-05, "loss": 0.793, "step": 3162 }, { "epoch": 0.38, "learning_rate": 1.4316699964573997e-05, "loss": 0.7634, "step": 3163 }, { "epoch": 0.38, "learning_rate": 1.4313215299984702e-05, "loss": 0.8086, "step": 3164 }, { "epoch": 0.38, "learning_rate": 1.4309729991820154e-05, "loss": 0.764, "step": 3165 }, { "epoch": 0.38, "learning_rate": 1.4306244040600404e-05, "loss": 0.7801, "step": 3166 }, { "epoch": 0.38, "learning_rate": 1.4302757446845588e-05, "loss": 0.7433, "step": 3167 }, { "epoch": 0.38, "learning_rate": 1.4299270211075942e-05, "loss": 0.8125, "step": 3168 }, { "epoch": 0.38, "learning_rate": 1.4295782333811799e-05, "loss": 0.827, "step": 3169 }, { "epoch": 0.38, "learning_rate": 1.4292293815573577e-05, "loss": 0.7567, "step": 3170 }, { "epoch": 0.38, "learning_rate": 1.4288804656881806e-05, "loss": 0.784, "step": 3171 }, { "epoch": 0.38, "learning_rate": 1.4285314858257105e-05, "loss": 0.7701, "step": 3172 }, { "epoch": 0.38, "learning_rate": 1.428182442022018e-05, "loss": 0.822, "step": 3173 }, { "epoch": 0.38, "learning_rate": 1.4278333343291846e-05, "loss": 0.7852, "step": 3174 }, { "epoch": 0.38, "learning_rate": 1.4274841627993003e-05, "loss": 0.7852, "step": 3175 }, { "epoch": 0.38, "learning_rate": 1.427134927484465e-05, "loss": 0.7679, "step": 3176 }, { "epoch": 0.38, "learning_rate": 1.4267856284367887e-05, "loss": 0.8203, "step": 3177 }, { "epoch": 0.38, "learning_rate": 1.4264362657083894e-05, "loss": 0.7545, "step": 3178 }, { "epoch": 0.38, "learning_rate": 1.4260868393513967e-05, "loss": 0.8047, "step": 3179 }, { "epoch": 0.38, "learning_rate": 1.4257373494179473e-05, "loss": 0.7846, "step": 3180 }, { "epoch": 0.38, "learning_rate": 1.4253877959601896e-05, "loss": 0.8214, "step": 3181 }, { "epoch": 0.38, "learning_rate": 1.42503817903028e-05, "loss": 0.7701, "step": 3182 }, { "epoch": 0.38, "learning_rate": 1.4246884986803848e-05, "loss": 0.7829, "step": 3183 }, { "epoch": 0.38, "learning_rate": 1.4243387549626806e-05, "loss": 0.7857, "step": 3184 }, { "epoch": 0.38, "learning_rate": 1.4239889479293516e-05, "loss": 0.8203, "step": 3185 }, { "epoch": 0.38, "learning_rate": 1.4236390776325933e-05, "loss": 0.7227, "step": 3186 }, { "epoch": 0.38, "learning_rate": 1.4232891441246097e-05, "loss": 0.8265, "step": 3187 }, { "epoch": 0.38, "learning_rate": 1.4229391474576142e-05, "loss": 0.8326, "step": 3188 }, { "epoch": 0.38, "learning_rate": 1.4225890876838302e-05, "loss": 0.7506, "step": 3189 }, { "epoch": 0.38, "learning_rate": 1.4222389648554896e-05, "loss": 0.7779, "step": 3190 }, { "epoch": 0.38, "learning_rate": 1.4218887790248348e-05, "loss": 0.8058, "step": 3191 }, { "epoch": 0.38, "learning_rate": 1.421538530244117e-05, "loss": 0.8153, "step": 3192 }, { "epoch": 0.38, "learning_rate": 1.4211882185655967e-05, "loss": 0.8092, "step": 3193 }, { "epoch": 0.38, "learning_rate": 1.420837844041544e-05, "loss": 0.8075, "step": 3194 }, { "epoch": 0.38, "learning_rate": 1.420487406724238e-05, "loss": 0.8304, "step": 3195 }, { "epoch": 0.38, "learning_rate": 1.4201369066659678e-05, "loss": 0.8186, "step": 3196 }, { "epoch": 0.38, "learning_rate": 1.4197863439190317e-05, "loss": 0.7768, "step": 3197 }, { "epoch": 0.38, "learning_rate": 1.4194357185357368e-05, "loss": 0.8052, "step": 3198 }, { "epoch": 0.38, "learning_rate": 1.4190850305684002e-05, "loss": 0.8242, "step": 3199 }, { "epoch": 0.38, "learning_rate": 1.4187342800693484e-05, "loss": 0.7718, "step": 3200 }, { "epoch": 0.38, "learning_rate": 1.418383467090916e-05, "loss": 0.7768, "step": 3201 }, { "epoch": 0.38, "learning_rate": 1.4180325916854487e-05, "loss": 0.8237, "step": 3202 }, { "epoch": 0.38, "learning_rate": 1.4176816539053003e-05, "loss": 0.8147, "step": 3203 }, { "epoch": 0.38, "learning_rate": 1.4173306538028342e-05, "loss": 0.7355, "step": 3204 }, { "epoch": 0.38, "learning_rate": 1.4169795914304232e-05, "loss": 0.7941, "step": 3205 }, { "epoch": 0.38, "learning_rate": 1.4166284668404495e-05, "loss": 0.8103, "step": 3206 }, { "epoch": 0.38, "learning_rate": 1.4162772800853044e-05, "loss": 0.7902, "step": 3207 }, { "epoch": 0.38, "learning_rate": 1.4159260312173882e-05, "loss": 0.7377, "step": 3208 }, { "epoch": 0.38, "learning_rate": 1.4155747202891112e-05, "loss": 0.7355, "step": 3209 }, { "epoch": 0.38, "learning_rate": 1.4152233473528923e-05, "loss": 0.8371, "step": 3210 }, { "epoch": 0.38, "learning_rate": 1.41487191246116e-05, "loss": 0.7997, "step": 3211 }, { "epoch": 0.38, "learning_rate": 1.414520415666352e-05, "loss": 0.7935, "step": 3212 }, { "epoch": 0.38, "learning_rate": 1.4141688570209147e-05, "loss": 0.8203, "step": 3213 }, { "epoch": 0.38, "learning_rate": 1.4138172365773046e-05, "loss": 0.7751, "step": 3214 }, { "epoch": 0.38, "learning_rate": 1.413465554387987e-05, "loss": 0.8025, "step": 3215 }, { "epoch": 0.38, "learning_rate": 1.4131138105054362e-05, "loss": 0.7584, "step": 3216 }, { "epoch": 0.38, "learning_rate": 1.4127620049821365e-05, "loss": 0.8013, "step": 3217 }, { "epoch": 0.38, "learning_rate": 1.4124101378705803e-05, "loss": 0.7734, "step": 3218 }, { "epoch": 0.38, "learning_rate": 1.41205820922327e-05, "loss": 0.7796, "step": 3219 }, { "epoch": 0.38, "learning_rate": 1.4117062190927166e-05, "loss": 0.7991, "step": 3220 }, { "epoch": 0.38, "learning_rate": 1.4113541675314407e-05, "loss": 0.8393, "step": 3221 }, { "epoch": 0.38, "learning_rate": 1.4110020545919723e-05, "loss": 0.8025, "step": 3222 }, { "epoch": 0.38, "learning_rate": 1.4106498803268495e-05, "loss": 0.8465, "step": 3223 }, { "epoch": 0.38, "learning_rate": 1.410297644788621e-05, "loss": 0.7885, "step": 3224 }, { "epoch": 0.38, "learning_rate": 1.4099453480298434e-05, "loss": 0.8064, "step": 3225 }, { "epoch": 0.38, "learning_rate": 1.4095929901030831e-05, "loss": 0.7941, "step": 3226 }, { "epoch": 0.38, "learning_rate": 1.4092405710609156e-05, "loss": 0.7338, "step": 3227 }, { "epoch": 0.38, "learning_rate": 1.4088880909559251e-05, "loss": 0.8203, "step": 3228 }, { "epoch": 0.39, "learning_rate": 1.4085355498407054e-05, "loss": 0.8153, "step": 3229 }, { "epoch": 0.39, "learning_rate": 1.408182947767859e-05, "loss": 0.8717, "step": 3230 }, { "epoch": 0.39, "learning_rate": 1.4078302847899978e-05, "loss": 0.7706, "step": 3231 }, { "epoch": 0.39, "learning_rate": 1.4074775609597428e-05, "loss": 0.841, "step": 3232 }, { "epoch": 0.39, "learning_rate": 1.4071247763297237e-05, "loss": 0.7327, "step": 3233 }, { "epoch": 0.39, "learning_rate": 1.4067719309525796e-05, "loss": 0.7701, "step": 3234 }, { "epoch": 0.39, "learning_rate": 1.4064190248809588e-05, "loss": 0.7712, "step": 3235 }, { "epoch": 0.39, "learning_rate": 1.4060660581675183e-05, "loss": 0.7801, "step": 3236 }, { "epoch": 0.39, "learning_rate": 1.4057130308649243e-05, "loss": 0.7679, "step": 3237 }, { "epoch": 0.39, "learning_rate": 1.405359943025852e-05, "loss": 0.8131, "step": 3238 }, { "epoch": 0.39, "learning_rate": 1.4050067947029855e-05, "loss": 0.7985, "step": 3239 }, { "epoch": 0.39, "learning_rate": 1.4046535859490185e-05, "loss": 0.779, "step": 3240 }, { "epoch": 0.39, "learning_rate": 1.404300316816653e-05, "loss": 0.784, "step": 3241 }, { "epoch": 0.39, "learning_rate": 1.4039469873586004e-05, "loss": 0.7712, "step": 3242 }, { "epoch": 0.39, "learning_rate": 1.4035935976275812e-05, "loss": 0.7628, "step": 3243 }, { "epoch": 0.39, "learning_rate": 1.4032401476763244e-05, "loss": 0.8722, "step": 3244 }, { "epoch": 0.39, "learning_rate": 1.4028866375575687e-05, "loss": 0.8064, "step": 3245 }, { "epoch": 0.39, "learning_rate": 1.4025330673240607e-05, "loss": 0.8147, "step": 3246 }, { "epoch": 0.39, "learning_rate": 1.4021794370285573e-05, "loss": 0.8181, "step": 3247 }, { "epoch": 0.39, "learning_rate": 1.4018257467238234e-05, "loss": 0.8097, "step": 3248 }, { "epoch": 0.39, "learning_rate": 1.4014719964626333e-05, "loss": 0.7533, "step": 3249 }, { "epoch": 0.39, "learning_rate": 1.4011181862977702e-05, "loss": 0.7924, "step": 3250 }, { "epoch": 0.39, "learning_rate": 1.400764316282026e-05, "loss": 0.7958, "step": 3251 }, { "epoch": 0.39, "learning_rate": 1.4004103864682016e-05, "loss": 0.8019, "step": 3252 }, { "epoch": 0.39, "learning_rate": 1.4000563969091067e-05, "loss": 0.8097, "step": 3253 }, { "epoch": 0.39, "learning_rate": 1.3997023476575606e-05, "loss": 0.8125, "step": 3254 }, { "epoch": 0.39, "learning_rate": 1.3993482387663908e-05, "loss": 0.7472, "step": 3255 }, { "epoch": 0.39, "learning_rate": 1.3989940702884339e-05, "loss": 0.7506, "step": 3256 }, { "epoch": 0.39, "learning_rate": 1.3986398422765357e-05, "loss": 0.7344, "step": 3257 }, { "epoch": 0.39, "learning_rate": 1.39828555478355e-05, "loss": 0.8186, "step": 3258 }, { "epoch": 0.39, "learning_rate": 1.3979312078623405e-05, "loss": 0.779, "step": 3259 }, { "epoch": 0.39, "learning_rate": 1.3975768015657794e-05, "loss": 0.8125, "step": 3260 }, { "epoch": 0.39, "learning_rate": 1.3972223359467472e-05, "loss": 0.8259, "step": 3261 }, { "epoch": 0.39, "learning_rate": 1.3968678110581344e-05, "loss": 0.7941, "step": 3262 }, { "epoch": 0.39, "learning_rate": 1.3965132269528395e-05, "loss": 0.8192, "step": 3263 }, { "epoch": 0.39, "learning_rate": 1.3961585836837697e-05, "loss": 0.7868, "step": 3264 }, { "epoch": 0.39, "learning_rate": 1.3958038813038415e-05, "loss": 0.7868, "step": 3265 }, { "epoch": 0.39, "learning_rate": 1.3954491198659801e-05, "loss": 0.8225, "step": 3266 }, { "epoch": 0.39, "learning_rate": 1.3950942994231196e-05, "loss": 0.7768, "step": 3267 }, { "epoch": 0.39, "learning_rate": 1.3947394200282024e-05, "loss": 0.7461, "step": 3268 }, { "epoch": 0.39, "learning_rate": 1.3943844817341809e-05, "loss": 0.7617, "step": 3269 }, { "epoch": 0.39, "learning_rate": 1.394029484594015e-05, "loss": 0.7662, "step": 3270 }, { "epoch": 0.39, "learning_rate": 1.3936744286606735e-05, "loss": 0.7913, "step": 3271 }, { "epoch": 0.39, "learning_rate": 1.3933193139871348e-05, "loss": 0.808, "step": 3272 }, { "epoch": 0.39, "learning_rate": 1.3929641406263854e-05, "loss": 0.8158, "step": 3273 }, { "epoch": 0.39, "learning_rate": 1.3926089086314208e-05, "loss": 0.7517, "step": 3274 }, { "epoch": 0.39, "learning_rate": 1.3922536180552453e-05, "loss": 0.7517, "step": 3275 }, { "epoch": 0.39, "learning_rate": 1.3918982689508715e-05, "loss": 0.8192, "step": 3276 }, { "epoch": 0.39, "learning_rate": 1.3915428613713216e-05, "loss": 0.8527, "step": 3277 }, { "epoch": 0.39, "learning_rate": 1.3911873953696253e-05, "loss": 0.7506, "step": 3278 }, { "epoch": 0.39, "learning_rate": 1.3908318709988222e-05, "loss": 0.808, "step": 3279 }, { "epoch": 0.39, "learning_rate": 1.3904762883119602e-05, "loss": 0.8103, "step": 3280 }, { "epoch": 0.39, "learning_rate": 1.390120647362096e-05, "loss": 0.7645, "step": 3281 }, { "epoch": 0.39, "learning_rate": 1.3897649482022941e-05, "loss": 0.7913, "step": 3282 }, { "epoch": 0.39, "learning_rate": 1.3894091908856288e-05, "loss": 0.8192, "step": 3283 }, { "epoch": 0.39, "learning_rate": 1.3890533754651826e-05, "loss": 0.7706, "step": 3284 }, { "epoch": 0.39, "learning_rate": 1.388697501994047e-05, "loss": 0.7801, "step": 3285 }, { "epoch": 0.39, "learning_rate": 1.3883415705253216e-05, "loss": 0.8052, "step": 3286 }, { "epoch": 0.39, "learning_rate": 1.3879855811121152e-05, "loss": 0.7941, "step": 3287 }, { "epoch": 0.39, "learning_rate": 1.387629533807545e-05, "loss": 0.7879, "step": 3288 }, { "epoch": 0.39, "learning_rate": 1.3872734286647367e-05, "loss": 0.7433, "step": 3289 }, { "epoch": 0.39, "learning_rate": 1.3869172657368248e-05, "loss": 0.8103, "step": 3290 }, { "epoch": 0.39, "learning_rate": 1.3865610450769524e-05, "loss": 0.7746, "step": 3291 }, { "epoch": 0.39, "learning_rate": 1.3862047667382715e-05, "loss": 0.8298, "step": 3292 }, { "epoch": 0.39, "learning_rate": 1.3858484307739417e-05, "loss": 0.7991, "step": 3293 }, { "epoch": 0.39, "learning_rate": 1.3854920372371328e-05, "loss": 0.7974, "step": 3294 }, { "epoch": 0.39, "learning_rate": 1.385135586181022e-05, "loss": 0.798, "step": 3295 }, { "epoch": 0.39, "learning_rate": 1.384779077658795e-05, "loss": 0.8192, "step": 3296 }, { "epoch": 0.39, "learning_rate": 1.3844225117236472e-05, "loss": 0.7857, "step": 3297 }, { "epoch": 0.39, "learning_rate": 1.384065888428781e-05, "loss": 0.7662, "step": 3298 }, { "epoch": 0.39, "learning_rate": 1.3837092078274086e-05, "loss": 0.7584, "step": 3299 }, { "epoch": 0.39, "learning_rate": 1.383352469972751e-05, "loss": 0.7935, "step": 3300 }, { "epoch": 0.39, "learning_rate": 1.3829956749180358e-05, "loss": 0.745, "step": 3301 }, { "epoch": 0.39, "learning_rate": 1.3826388227165013e-05, "loss": 0.7941, "step": 3302 }, { "epoch": 0.39, "learning_rate": 1.3822819134213932e-05, "loss": 0.7785, "step": 3303 }, { "epoch": 0.39, "learning_rate": 1.381924947085966e-05, "loss": 0.7355, "step": 3304 }, { "epoch": 0.39, "learning_rate": 1.3815679237634827e-05, "loss": 0.7695, "step": 3305 }, { "epoch": 0.39, "learning_rate": 1.3812108435072147e-05, "loss": 0.7807, "step": 3306 }, { "epoch": 0.39, "learning_rate": 1.3808537063704421e-05, "loss": 0.8103, "step": 3307 }, { "epoch": 0.39, "learning_rate": 1.3804965124064533e-05, "loss": 0.7879, "step": 3308 }, { "epoch": 0.39, "learning_rate": 1.3801392616685449e-05, "loss": 0.7857, "step": 3309 }, { "epoch": 0.39, "learning_rate": 1.379781954210023e-05, "loss": 0.8237, "step": 3310 }, { "epoch": 0.39, "learning_rate": 1.379424590084201e-05, "loss": 0.7249, "step": 3311 }, { "epoch": 0.39, "learning_rate": 1.3790671693444016e-05, "loss": 0.8019, "step": 3312 }, { "epoch": 0.4, "learning_rate": 1.3787096920439553e-05, "loss": 0.7997, "step": 3313 }, { "epoch": 0.4, "learning_rate": 1.3783521582362011e-05, "loss": 0.7065, "step": 3314 }, { "epoch": 0.4, "learning_rate": 1.3779945679744873e-05, "loss": 0.832, "step": 3315 }, { "epoch": 0.4, "learning_rate": 1.3776369213121691e-05, "loss": 0.779, "step": 3316 }, { "epoch": 0.4, "learning_rate": 1.3772792183026118e-05, "loss": 0.7706, "step": 3317 }, { "epoch": 0.4, "learning_rate": 1.3769214589991879e-05, "loss": 0.7712, "step": 3318 }, { "epoch": 0.4, "learning_rate": 1.3765636434552789e-05, "loss": 0.8069, "step": 3319 }, { "epoch": 0.4, "learning_rate": 1.3762057717242745e-05, "loss": 0.7734, "step": 3320 }, { "epoch": 0.4, "learning_rate": 1.3758478438595722e-05, "loss": 0.8203, "step": 3321 }, { "epoch": 0.4, "learning_rate": 1.3754898599145791e-05, "loss": 0.8019, "step": 3322 }, { "epoch": 0.4, "learning_rate": 1.37513181994271e-05, "loss": 0.7863, "step": 3323 }, { "epoch": 0.4, "learning_rate": 1.3747737239973875e-05, "loss": 0.8086, "step": 3324 }, { "epoch": 0.4, "learning_rate": 1.3744155721320439e-05, "loss": 0.7578, "step": 3325 }, { "epoch": 0.4, "learning_rate": 1.3740573644001187e-05, "loss": 0.8186, "step": 3326 }, { "epoch": 0.4, "learning_rate": 1.3736991008550597e-05, "loss": 0.8119, "step": 3327 }, { "epoch": 0.4, "learning_rate": 1.3733407815503244e-05, "loss": 0.8281, "step": 3328 }, { "epoch": 0.4, "learning_rate": 1.3729824065393765e-05, "loss": 0.8008, "step": 3329 }, { "epoch": 0.4, "learning_rate": 1.37262397587569e-05, "loss": 0.8052, "step": 3330 }, { "epoch": 0.4, "learning_rate": 1.3722654896127464e-05, "loss": 0.827, "step": 3331 }, { "epoch": 0.4, "learning_rate": 1.3719069478040348e-05, "loss": 0.8097, "step": 3332 }, { "epoch": 0.4, "learning_rate": 1.371548350503054e-05, "loss": 0.8404, "step": 3333 }, { "epoch": 0.4, "learning_rate": 1.3711896977633097e-05, "loss": 0.8348, "step": 3334 }, { "epoch": 0.4, "learning_rate": 1.3708309896383169e-05, "loss": 0.8047, "step": 3335 }, { "epoch": 0.4, "learning_rate": 1.3704722261815983e-05, "loss": 0.7935, "step": 3336 }, { "epoch": 0.4, "learning_rate": 1.3701134074466854e-05, "loss": 0.8142, "step": 3337 }, { "epoch": 0.4, "learning_rate": 1.3697545334871173e-05, "loss": 0.798, "step": 3338 }, { "epoch": 0.4, "learning_rate": 1.369395604356441e-05, "loss": 0.7679, "step": 3339 }, { "epoch": 0.4, "learning_rate": 1.3690366201082132e-05, "loss": 0.8644, "step": 3340 }, { "epoch": 0.4, "learning_rate": 1.368677580795998e-05, "loss": 0.7963, "step": 3341 }, { "epoch": 0.4, "learning_rate": 1.368318486473367e-05, "loss": 0.7461, "step": 3342 }, { "epoch": 0.4, "learning_rate": 1.3679593371939012e-05, "loss": 0.7941, "step": 3343 }, { "epoch": 0.4, "learning_rate": 1.3676001330111896e-05, "loss": 0.7673, "step": 3344 }, { "epoch": 0.4, "learning_rate": 1.3672408739788283e-05, "loss": 0.7723, "step": 3345 }, { "epoch": 0.4, "learning_rate": 1.3668815601504228e-05, "loss": 0.7762, "step": 3346 }, { "epoch": 0.4, "learning_rate": 1.3665221915795863e-05, "loss": 0.8025, "step": 3347 }, { "epoch": 0.4, "learning_rate": 1.3661627683199403e-05, "loss": 0.7729, "step": 3348 }, { "epoch": 0.4, "learning_rate": 1.3658032904251142e-05, "loss": 0.7807, "step": 3349 }, { "epoch": 0.4, "learning_rate": 1.365443757948746e-05, "loss": 0.74, "step": 3350 }, { "epoch": 0.4, "learning_rate": 1.3650841709444814e-05, "loss": 0.7109, "step": 3351 }, { "epoch": 0.4, "learning_rate": 1.3647245294659742e-05, "loss": 0.7919, "step": 3352 }, { "epoch": 0.4, "learning_rate": 1.364364833566887e-05, "loss": 0.7528, "step": 3353 }, { "epoch": 0.4, "learning_rate": 1.3640050833008894e-05, "loss": 0.764, "step": 3354 }, { "epoch": 0.4, "learning_rate": 1.3636452787216605e-05, "loss": 0.7288, "step": 3355 }, { "epoch": 0.4, "learning_rate": 1.3632854198828862e-05, "loss": 0.7762, "step": 3356 }, { "epoch": 0.4, "learning_rate": 1.3629255068382617e-05, "loss": 0.7885, "step": 3357 }, { "epoch": 0.4, "learning_rate": 1.3625655396414891e-05, "loss": 0.7405, "step": 3358 }, { "epoch": 0.4, "learning_rate": 1.3622055183462793e-05, "loss": 0.7919, "step": 3359 }, { "epoch": 0.4, "learning_rate": 1.3618454430063512e-05, "loss": 0.798, "step": 3360 }, { "epoch": 0.4, "learning_rate": 1.3614853136754313e-05, "loss": 0.7969, "step": 3361 }, { "epoch": 0.4, "learning_rate": 1.3611251304072552e-05, "loss": 0.7768, "step": 3362 }, { "epoch": 0.4, "learning_rate": 1.3607648932555654e-05, "loss": 0.7902, "step": 3363 }, { "epoch": 0.4, "learning_rate": 1.360404602274113e-05, "loss": 0.7913, "step": 3364 }, { "epoch": 0.4, "learning_rate": 1.3600442575166572e-05, "loss": 0.7651, "step": 3365 }, { "epoch": 0.4, "learning_rate": 1.3596838590369647e-05, "loss": 0.8231, "step": 3366 }, { "epoch": 0.4, "learning_rate": 1.359323406888811e-05, "loss": 0.7891, "step": 3367 }, { "epoch": 0.4, "learning_rate": 1.358962901125979e-05, "loss": 0.8131, "step": 3368 }, { "epoch": 0.4, "learning_rate": 1.35860234180226e-05, "loss": 0.8209, "step": 3369 }, { "epoch": 0.4, "learning_rate": 1.3582417289714528e-05, "loss": 0.7695, "step": 3370 }, { "epoch": 0.4, "learning_rate": 1.3578810626873646e-05, "loss": 0.7718, "step": 3371 }, { "epoch": 0.4, "learning_rate": 1.3575203430038104e-05, "loss": 0.7919, "step": 3372 }, { "epoch": 0.4, "learning_rate": 1.3571595699746134e-05, "loss": 0.8544, "step": 3373 }, { "epoch": 0.4, "learning_rate": 1.3567987436536042e-05, "loss": 0.7941, "step": 3374 }, { "epoch": 0.4, "learning_rate": 1.3564378640946223e-05, "loss": 0.8041, "step": 3375 }, { "epoch": 0.4, "learning_rate": 1.3560769313515142e-05, "loss": 0.8036, "step": 3376 }, { "epoch": 0.4, "learning_rate": 1.3557159454781343e-05, "loss": 0.7701, "step": 3377 }, { "epoch": 0.4, "learning_rate": 1.3553549065283462e-05, "loss": 0.745, "step": 3378 }, { "epoch": 0.4, "learning_rate": 1.3549938145560199e-05, "loss": 0.7628, "step": 3379 }, { "epoch": 0.4, "learning_rate": 1.3546326696150347e-05, "loss": 0.8616, "step": 3380 }, { "epoch": 0.4, "learning_rate": 1.354271471759276e-05, "loss": 0.7109, "step": 3381 }, { "epoch": 0.4, "learning_rate": 1.3539102210426392e-05, "loss": 0.7098, "step": 3382 }, { "epoch": 0.4, "learning_rate": 1.3535489175190257e-05, "loss": 0.7606, "step": 3383 }, { "epoch": 0.4, "learning_rate": 1.3531875612423462e-05, "loss": 0.75, "step": 3384 }, { "epoch": 0.4, "learning_rate": 1.3528261522665187e-05, "loss": 0.7868, "step": 3385 }, { "epoch": 0.4, "learning_rate": 1.3524646906454685e-05, "loss": 0.7154, "step": 3386 }, { "epoch": 0.4, "learning_rate": 1.3521031764331298e-05, "loss": 0.7612, "step": 3387 }, { "epoch": 0.4, "learning_rate": 1.3517416096834446e-05, "loss": 0.8382, "step": 3388 }, { "epoch": 0.4, "learning_rate": 1.3513799904503613e-05, "loss": 0.8359, "step": 3389 }, { "epoch": 0.4, "learning_rate": 1.3510183187878379e-05, "loss": 0.7885, "step": 3390 }, { "epoch": 0.4, "learning_rate": 1.350656594749839e-05, "loss": 0.7907, "step": 3391 }, { "epoch": 0.4, "learning_rate": 1.3502948183903374e-05, "loss": 0.7461, "step": 3392 }, { "epoch": 0.4, "learning_rate": 1.3499329897633144e-05, "loss": 0.8198, "step": 3393 }, { "epoch": 0.4, "learning_rate": 1.3495711089227583e-05, "loss": 0.8052, "step": 3394 }, { "epoch": 0.4, "learning_rate": 1.349209175922665e-05, "loss": 0.793, "step": 3395 }, { "epoch": 0.41, "learning_rate": 1.3488471908170388e-05, "loss": 0.7148, "step": 3396 }, { "epoch": 0.41, "learning_rate": 1.3484851536598912e-05, "loss": 0.7941, "step": 3397 }, { "epoch": 0.41, "learning_rate": 1.3481230645052426e-05, "loss": 0.7701, "step": 3398 }, { "epoch": 0.41, "learning_rate": 1.3477609234071195e-05, "loss": 0.7478, "step": 3399 }, { "epoch": 0.41, "learning_rate": 1.3473987304195575e-05, "loss": 0.7835, "step": 3400 }, { "epoch": 0.41, "learning_rate": 1.3470364855965994e-05, "loss": 0.8013, "step": 3401 }, { "epoch": 0.41, "learning_rate": 1.3466741889922953e-05, "loss": 0.8019, "step": 3402 }, { "epoch": 0.41, "learning_rate": 1.3463118406607042e-05, "loss": 0.8225, "step": 3403 }, { "epoch": 0.41, "learning_rate": 1.3459494406558919e-05, "loss": 0.8075, "step": 3404 }, { "epoch": 0.41, "learning_rate": 1.345586989031932e-05, "loss": 0.7779, "step": 3405 }, { "epoch": 0.41, "learning_rate": 1.3452244858429057e-05, "loss": 0.7489, "step": 3406 }, { "epoch": 0.41, "learning_rate": 1.3448619311429028e-05, "loss": 0.7656, "step": 3407 }, { "epoch": 0.41, "learning_rate": 1.3444993249860198e-05, "loss": 0.7729, "step": 3408 }, { "epoch": 0.41, "learning_rate": 1.3441366674263607e-05, "loss": 0.8281, "step": 3409 }, { "epoch": 0.41, "learning_rate": 1.3437739585180384e-05, "loss": 0.7667, "step": 3410 }, { "epoch": 0.41, "learning_rate": 1.3434111983151725e-05, "loss": 0.7662, "step": 3411 }, { "epoch": 0.41, "learning_rate": 1.3430483868718901e-05, "loss": 0.8376, "step": 3412 }, { "epoch": 0.41, "learning_rate": 1.3426855242423271e-05, "loss": 0.7941, "step": 3413 }, { "epoch": 0.41, "learning_rate": 1.342322610480626e-05, "loss": 0.8058, "step": 3414 }, { "epoch": 0.41, "learning_rate": 1.3419596456409365e-05, "loss": 0.7868, "step": 3415 }, { "epoch": 0.41, "learning_rate": 1.3415966297774172e-05, "loss": 0.8516, "step": 3416 }, { "epoch": 0.41, "learning_rate": 1.3412335629442337e-05, "loss": 0.803, "step": 3417 }, { "epoch": 0.41, "learning_rate": 1.3408704451955595e-05, "loss": 0.7879, "step": 3418 }, { "epoch": 0.41, "learning_rate": 1.3405072765855749e-05, "loss": 0.7333, "step": 3419 }, { "epoch": 0.41, "learning_rate": 1.3401440571684687e-05, "loss": 0.8326, "step": 3420 }, { "epoch": 0.41, "learning_rate": 1.3397807869984365e-05, "loss": 0.7567, "step": 3421 }, { "epoch": 0.41, "learning_rate": 1.3394174661296821e-05, "loss": 0.7924, "step": 3422 }, { "epoch": 0.41, "learning_rate": 1.339054094616417e-05, "loss": 0.7701, "step": 3423 }, { "epoch": 0.41, "learning_rate": 1.3386906725128594e-05, "loss": 0.8359, "step": 3424 }, { "epoch": 0.41, "learning_rate": 1.3383271998732357e-05, "loss": 0.7746, "step": 3425 }, { "epoch": 0.41, "learning_rate": 1.3379636767517799e-05, "loss": 0.8532, "step": 3426 }, { "epoch": 0.41, "learning_rate": 1.3376001032027329e-05, "loss": 0.8231, "step": 3427 }, { "epoch": 0.41, "learning_rate": 1.3372364792803439e-05, "loss": 0.8867, "step": 3428 }, { "epoch": 0.41, "learning_rate": 1.3368728050388688e-05, "loss": 0.7684, "step": 3429 }, { "epoch": 0.41, "learning_rate": 1.336509080532572e-05, "loss": 0.7584, "step": 3430 }, { "epoch": 0.41, "learning_rate": 1.3361453058157247e-05, "loss": 0.8052, "step": 3431 }, { "epoch": 0.41, "learning_rate": 1.3357814809426058e-05, "loss": 0.7969, "step": 3432 }, { "epoch": 0.41, "learning_rate": 1.3354176059675015e-05, "loss": 0.832, "step": 3433 }, { "epoch": 0.41, "learning_rate": 1.3350536809447055e-05, "loss": 0.8019, "step": 3434 }, { "epoch": 0.41, "learning_rate": 1.3346897059285194e-05, "loss": 0.7813, "step": 3435 }, { "epoch": 0.41, "learning_rate": 1.334325680973252e-05, "loss": 0.75, "step": 3436 }, { "epoch": 0.41, "learning_rate": 1.3339616061332188e-05, "loss": 0.7913, "step": 3437 }, { "epoch": 0.41, "learning_rate": 1.3335974814627442e-05, "loss": 0.7846, "step": 3438 }, { "epoch": 0.41, "learning_rate": 1.3332333070161592e-05, "loss": 0.8008, "step": 3439 }, { "epoch": 0.41, "learning_rate": 1.3328690828478017e-05, "loss": 0.7656, "step": 3440 }, { "epoch": 0.41, "learning_rate": 1.3325048090120186e-05, "loss": 0.7924, "step": 3441 }, { "epoch": 0.41, "learning_rate": 1.3321404855631621e-05, "loss": 0.8019, "step": 3442 }, { "epoch": 0.41, "learning_rate": 1.331776112555594e-05, "loss": 0.8398, "step": 3443 }, { "epoch": 0.41, "learning_rate": 1.3314116900436815e-05, "loss": 0.7645, "step": 3444 }, { "epoch": 0.41, "learning_rate": 1.3310472180818008e-05, "loss": 0.7779, "step": 3445 }, { "epoch": 0.41, "learning_rate": 1.3306826967243347e-05, "loss": 0.8036, "step": 3446 }, { "epoch": 0.41, "learning_rate": 1.330318126025673e-05, "loss": 0.8499, "step": 3447 }, { "epoch": 0.41, "learning_rate": 1.3299535060402137e-05, "loss": 0.8387, "step": 3448 }, { "epoch": 0.41, "learning_rate": 1.329588836822362e-05, "loss": 0.8058, "step": 3449 }, { "epoch": 0.41, "learning_rate": 1.3292241184265296e-05, "loss": 0.7757, "step": 3450 }, { "epoch": 0.41, "learning_rate": 1.3288593509071368e-05, "loss": 0.7835, "step": 3451 }, { "epoch": 0.41, "learning_rate": 1.32849453431861e-05, "loss": 0.8064, "step": 3452 }, { "epoch": 0.41, "learning_rate": 1.3281296687153842e-05, "loss": 0.74, "step": 3453 }, { "epoch": 0.41, "learning_rate": 1.3277647541519003e-05, "loss": 0.8069, "step": 3454 }, { "epoch": 0.41, "learning_rate": 1.3273997906826074e-05, "loss": 0.7584, "step": 3455 }, { "epoch": 0.41, "learning_rate": 1.3270347783619623e-05, "loss": 0.7723, "step": 3456 }, { "epoch": 0.41, "learning_rate": 1.3266697172444283e-05, "loss": 0.8008, "step": 3457 }, { "epoch": 0.41, "learning_rate": 1.326304607384476e-05, "loss": 0.8365, "step": 3458 }, { "epoch": 0.41, "learning_rate": 1.3259394488365832e-05, "loss": 0.7573, "step": 3459 }, { "epoch": 0.41, "learning_rate": 1.3255742416552356e-05, "loss": 0.7857, "step": 3460 }, { "epoch": 0.41, "learning_rate": 1.325208985894926e-05, "loss": 0.7612, "step": 3461 }, { "epoch": 0.41, "learning_rate": 1.3248436816101537e-05, "loss": 0.8326, "step": 3462 }, { "epoch": 0.41, "learning_rate": 1.3244783288554263e-05, "loss": 0.7712, "step": 3463 }, { "epoch": 0.41, "learning_rate": 1.324112927685258e-05, "loss": 0.7433, "step": 3464 }, { "epoch": 0.41, "learning_rate": 1.3237474781541702e-05, "loss": 0.8504, "step": 3465 }, { "epoch": 0.41, "learning_rate": 1.3233819803166916e-05, "loss": 0.7907, "step": 3466 }, { "epoch": 0.41, "learning_rate": 1.3230164342273582e-05, "loss": 0.7846, "step": 3467 }, { "epoch": 0.41, "learning_rate": 1.3226508399407134e-05, "loss": 0.784, "step": 3468 }, { "epoch": 0.41, "learning_rate": 1.3222851975113073e-05, "loss": 0.7852, "step": 3469 }, { "epoch": 0.41, "learning_rate": 1.3219195069936976e-05, "loss": 0.8259, "step": 3470 }, { "epoch": 0.41, "learning_rate": 1.321553768442449e-05, "loss": 0.8298, "step": 3471 }, { "epoch": 0.41, "learning_rate": 1.3211879819121332e-05, "loss": 0.8114, "step": 3472 }, { "epoch": 0.41, "learning_rate": 1.3208221474573295e-05, "loss": 0.7773, "step": 3473 }, { "epoch": 0.41, "learning_rate": 1.3204562651326239e-05, "loss": 0.7612, "step": 3474 }, { "epoch": 0.41, "learning_rate": 1.3200903349926094e-05, "loss": 0.798, "step": 3475 }, { "epoch": 0.41, "learning_rate": 1.3197243570918879e-05, "loss": 0.8253, "step": 3476 }, { "epoch": 0.41, "learning_rate": 1.3193583314850651e-05, "loss": 0.7679, "step": 3477 }, { "epoch": 0.41, "learning_rate": 1.3189922582267569e-05, "loss": 0.7907, "step": 3478 }, { "epoch": 0.41, "learning_rate": 1.3186261373715845e-05, "loss": 0.7818, "step": 3479 }, { "epoch": 0.42, "learning_rate": 1.3182599689741774e-05, "loss": 0.779, "step": 3480 }, { "epoch": 0.42, "learning_rate": 1.3178937530891713e-05, "loss": 0.7963, "step": 3481 }, { "epoch": 0.42, "learning_rate": 1.3175274897712095e-05, "loss": 0.7584, "step": 3482 }, { "epoch": 0.42, "learning_rate": 1.3171611790749422e-05, "loss": 0.7768, "step": 3483 }, { "epoch": 0.42, "learning_rate": 1.3167948210550259e-05, "loss": 0.7801, "step": 3484 }, { "epoch": 0.42, "learning_rate": 1.3164284157661256e-05, "loss": 0.7695, "step": 3485 }, { "epoch": 0.42, "learning_rate": 1.316061963262913e-05, "loss": 0.8309, "step": 3486 }, { "epoch": 0.42, "learning_rate": 1.3156954636000655e-05, "loss": 0.7991, "step": 3487 }, { "epoch": 0.42, "learning_rate": 1.3153289168322699e-05, "loss": 0.7768, "step": 3488 }, { "epoch": 0.42, "learning_rate": 1.3149623230142174e-05, "loss": 0.7997, "step": 3489 }, { "epoch": 0.42, "learning_rate": 1.314595682200608e-05, "loss": 0.7612, "step": 3490 }, { "epoch": 0.42, "learning_rate": 1.3142289944461483e-05, "loss": 0.7985, "step": 3491 }, { "epoch": 0.42, "learning_rate": 1.3138622598055517e-05, "loss": 0.8292, "step": 3492 }, { "epoch": 0.42, "learning_rate": 1.313495478333539e-05, "loss": 0.7902, "step": 3493 }, { "epoch": 0.42, "learning_rate": 1.313128650084837e-05, "loss": 0.779, "step": 3494 }, { "epoch": 0.42, "learning_rate": 1.312761775114181e-05, "loss": 0.7695, "step": 3495 }, { "epoch": 0.42, "learning_rate": 1.3123948534763117e-05, "loss": 0.7835, "step": 3496 }, { "epoch": 0.42, "learning_rate": 1.312027885225978e-05, "loss": 0.7645, "step": 3497 }, { "epoch": 0.42, "learning_rate": 1.3116608704179354e-05, "loss": 0.8052, "step": 3498 }, { "epoch": 0.42, "learning_rate": 1.3112938091069455e-05, "loss": 0.8097, "step": 3499 }, { "epoch": 0.42, "learning_rate": 1.3109267013477783e-05, "loss": 0.7517, "step": 3500 }, { "epoch": 0.42, "learning_rate": 1.3105595471952098e-05, "loss": 0.7796, "step": 3501 }, { "epoch": 0.42, "learning_rate": 1.3101923467040227e-05, "loss": 0.8075, "step": 3502 }, { "epoch": 0.42, "learning_rate": 1.3098250999290073e-05, "loss": 0.8186, "step": 3503 }, { "epoch": 0.42, "learning_rate": 1.3094578069249609e-05, "loss": 0.7718, "step": 3504 }, { "epoch": 0.42, "learning_rate": 1.3090904677466864e-05, "loss": 0.7623, "step": 3505 }, { "epoch": 0.42, "learning_rate": 1.3087230824489954e-05, "loss": 0.8041, "step": 3506 }, { "epoch": 0.42, "learning_rate": 1.3083556510867052e-05, "loss": 0.7634, "step": 3507 }, { "epoch": 0.42, "learning_rate": 1.3079881737146402e-05, "loss": 0.7773, "step": 3508 }, { "epoch": 0.42, "learning_rate": 1.3076206503876317e-05, "loss": 0.728, "step": 3509 }, { "epoch": 0.42, "learning_rate": 1.3072530811605177e-05, "loss": 0.7868, "step": 3510 }, { "epoch": 0.42, "learning_rate": 1.3068854660881438e-05, "loss": 0.7645, "step": 3511 }, { "epoch": 0.42, "learning_rate": 1.3065178052253615e-05, "loss": 0.822, "step": 3512 }, { "epoch": 0.42, "learning_rate": 1.3061500986270295e-05, "loss": 0.8036, "step": 3513 }, { "epoch": 0.42, "learning_rate": 1.3057823463480137e-05, "loss": 0.7729, "step": 3514 }, { "epoch": 0.42, "learning_rate": 1.3054145484431857e-05, "loss": 0.8253, "step": 3515 }, { "epoch": 0.42, "learning_rate": 1.3050467049674254e-05, "loss": 0.7896, "step": 3516 }, { "epoch": 0.42, "learning_rate": 1.3046788159756183e-05, "loss": 0.8069, "step": 3517 }, { "epoch": 0.42, "learning_rate": 1.3043108815226573e-05, "loss": 0.7919, "step": 3518 }, { "epoch": 0.42, "learning_rate": 1.3039429016634425e-05, "loss": 0.7729, "step": 3519 }, { "epoch": 0.42, "learning_rate": 1.303574876452879e-05, "loss": 0.774, "step": 3520 }, { "epoch": 0.42, "learning_rate": 1.3032068059458812e-05, "loss": 0.798, "step": 3521 }, { "epoch": 0.42, "learning_rate": 1.3028386901973678e-05, "loss": 0.8092, "step": 3522 }, { "epoch": 0.42, "learning_rate": 1.3024705292622657e-05, "loss": 0.8114, "step": 3523 }, { "epoch": 0.42, "learning_rate": 1.3021023231955088e-05, "loss": 0.7729, "step": 3524 }, { "epoch": 0.42, "learning_rate": 1.3017340720520365e-05, "loss": 0.7751, "step": 3525 }, { "epoch": 0.42, "learning_rate": 1.3013657758867959e-05, "loss": 0.7416, "step": 3526 }, { "epoch": 0.42, "learning_rate": 1.3009974347547405e-05, "loss": 0.7573, "step": 3527 }, { "epoch": 0.42, "learning_rate": 1.3006290487108304e-05, "loss": 0.8281, "step": 3528 }, { "epoch": 0.42, "learning_rate": 1.3002606178100327e-05, "loss": 0.7935, "step": 3529 }, { "epoch": 0.42, "learning_rate": 1.2998921421073205e-05, "loss": 0.7773, "step": 3530 }, { "epoch": 0.42, "learning_rate": 1.299523621657675e-05, "loss": 0.7885, "step": 3531 }, { "epoch": 0.42, "learning_rate": 1.2991550565160822e-05, "loss": 0.8058, "step": 3532 }, { "epoch": 0.42, "learning_rate": 1.2987864467375367e-05, "loss": 0.8097, "step": 3533 }, { "epoch": 0.42, "learning_rate": 1.2984177923770379e-05, "loss": 0.7712, "step": 3534 }, { "epoch": 0.42, "learning_rate": 1.2980490934895929e-05, "loss": 0.8158, "step": 3535 }, { "epoch": 0.42, "learning_rate": 1.297680350130216e-05, "loss": 0.75, "step": 3536 }, { "epoch": 0.42, "learning_rate": 1.2973115623539266e-05, "loss": 0.7902, "step": 3537 }, { "epoch": 0.42, "learning_rate": 1.296942730215752e-05, "loss": 0.8047, "step": 3538 }, { "epoch": 0.42, "learning_rate": 1.2965738537707258e-05, "loss": 0.7963, "step": 3539 }, { "epoch": 0.42, "learning_rate": 1.2962049330738876e-05, "loss": 0.817, "step": 3540 }, { "epoch": 0.42, "learning_rate": 1.2958359681802846e-05, "loss": 0.7974, "step": 3541 }, { "epoch": 0.42, "learning_rate": 1.2954669591449695e-05, "loss": 0.8064, "step": 3542 }, { "epoch": 0.42, "learning_rate": 1.2950979060230027e-05, "loss": 0.7489, "step": 3543 }, { "epoch": 0.42, "learning_rate": 1.2947288088694507e-05, "loss": 0.769, "step": 3544 }, { "epoch": 0.42, "learning_rate": 1.294359667739386e-05, "loss": 0.7963, "step": 3545 }, { "epoch": 0.42, "learning_rate": 1.2939904826878888e-05, "loss": 0.8309, "step": 3546 }, { "epoch": 0.42, "learning_rate": 1.2936212537700446e-05, "loss": 0.7578, "step": 3547 }, { "epoch": 0.42, "learning_rate": 1.2932519810409466e-05, "loss": 0.764, "step": 3548 }, { "epoch": 0.42, "learning_rate": 1.2928826645556935e-05, "loss": 0.7796, "step": 3549 }, { "epoch": 0.42, "learning_rate": 1.2925133043693916e-05, "loss": 0.7076, "step": 3550 }, { "epoch": 0.42, "learning_rate": 1.292143900537153e-05, "loss": 0.8142, "step": 3551 }, { "epoch": 0.42, "learning_rate": 1.2917744531140963e-05, "loss": 0.8421, "step": 3552 }, { "epoch": 0.42, "learning_rate": 1.2914049621553469e-05, "loss": 0.7176, "step": 3553 }, { "epoch": 0.42, "learning_rate": 1.2910354277160365e-05, "loss": 0.8181, "step": 3554 }, { "epoch": 0.42, "learning_rate": 1.2906658498513033e-05, "loss": 0.76, "step": 3555 }, { "epoch": 0.42, "learning_rate": 1.2902962286162923e-05, "loss": 0.7667, "step": 3556 }, { "epoch": 0.42, "learning_rate": 1.2899265640661546e-05, "loss": 0.7511, "step": 3557 }, { "epoch": 0.42, "learning_rate": 1.289556856256048e-05, "loss": 0.7656, "step": 3558 }, { "epoch": 0.42, "learning_rate": 1.2891871052411365e-05, "loss": 0.8153, "step": 3559 }, { "epoch": 0.42, "learning_rate": 1.2888173110765906e-05, "loss": 0.8036, "step": 3560 }, { "epoch": 0.42, "learning_rate": 1.2884474738175877e-05, "loss": 0.7718, "step": 3561 }, { "epoch": 0.42, "learning_rate": 1.2880775935193104e-05, "loss": 0.7405, "step": 3562 }, { "epoch": 0.42, "learning_rate": 1.2877076702369493e-05, "loss": 0.798, "step": 3563 }, { "epoch": 0.43, "learning_rate": 1.287337704025701e-05, "loss": 0.7612, "step": 3564 }, { "epoch": 0.43, "learning_rate": 1.2869676949407673e-05, "loss": 0.822, "step": 3565 }, { "epoch": 0.43, "learning_rate": 1.286597643037358e-05, "loss": 0.7667, "step": 3566 }, { "epoch": 0.43, "learning_rate": 1.286227548370688e-05, "loss": 0.7411, "step": 3567 }, { "epoch": 0.43, "learning_rate": 1.285857410995979e-05, "loss": 0.7478, "step": 3568 }, { "epoch": 0.43, "learning_rate": 1.2854872309684605e-05, "loss": 0.8131, "step": 3569 }, { "epoch": 0.43, "learning_rate": 1.2851170083433661e-05, "loss": 0.7478, "step": 3570 }, { "epoch": 0.43, "learning_rate": 1.2847467431759371e-05, "loss": 0.7746, "step": 3571 }, { "epoch": 0.43, "learning_rate": 1.28437643552142e-05, "loss": 0.764, "step": 3572 }, { "epoch": 0.43, "learning_rate": 1.2840060854350693e-05, "loss": 0.8538, "step": 3573 }, { "epoch": 0.43, "learning_rate": 1.283635692972145e-05, "loss": 0.7813, "step": 3574 }, { "epoch": 0.43, "learning_rate": 1.2832652581879128e-05, "loss": 0.8426, "step": 3575 }, { "epoch": 0.43, "learning_rate": 1.282894781137646e-05, "loss": 0.8086, "step": 3576 }, { "epoch": 0.43, "learning_rate": 1.282524261876623e-05, "loss": 0.716, "step": 3577 }, { "epoch": 0.43, "learning_rate": 1.2821537004601288e-05, "loss": 0.7673, "step": 3578 }, { "epoch": 0.43, "learning_rate": 1.2817830969434558e-05, "loss": 0.7344, "step": 3579 }, { "epoch": 0.43, "learning_rate": 1.2814124513819009e-05, "loss": 0.7991, "step": 3580 }, { "epoch": 0.43, "learning_rate": 1.2810417638307686e-05, "loss": 0.7706, "step": 3581 }, { "epoch": 0.43, "learning_rate": 1.2806710343453689e-05, "loss": 0.784, "step": 3582 }, { "epoch": 0.43, "learning_rate": 1.280300262981019e-05, "loss": 0.8036, "step": 3583 }, { "epoch": 0.43, "learning_rate": 1.2799294497930415e-05, "loss": 0.8069, "step": 3584 }, { "epoch": 0.43, "learning_rate": 1.2795585948367648e-05, "loss": 0.8225, "step": 3585 }, { "epoch": 0.43, "learning_rate": 1.2791876981675251e-05, "loss": 0.808, "step": 3586 }, { "epoch": 0.43, "learning_rate": 1.2788167598406631e-05, "loss": 0.7539, "step": 3587 }, { "epoch": 0.43, "learning_rate": 1.278445779911527e-05, "loss": 0.7327, "step": 3588 }, { "epoch": 0.43, "learning_rate": 1.2780747584354711e-05, "loss": 0.8164, "step": 3589 }, { "epoch": 0.43, "learning_rate": 1.2777036954678553e-05, "loss": 0.8265, "step": 3590 }, { "epoch": 0.43, "learning_rate": 1.2773325910640455e-05, "loss": 0.784, "step": 3591 }, { "epoch": 0.43, "learning_rate": 1.2769614452794146e-05, "loss": 0.7567, "step": 3592 }, { "epoch": 0.43, "learning_rate": 1.276590258169341e-05, "loss": 0.7723, "step": 3593 }, { "epoch": 0.43, "learning_rate": 1.2762190297892101e-05, "loss": 0.8047, "step": 3594 }, { "epoch": 0.43, "learning_rate": 1.2758477601944125e-05, "loss": 0.8002, "step": 3595 }, { "epoch": 0.43, "learning_rate": 1.2754764494403458e-05, "loss": 0.7684, "step": 3596 }, { "epoch": 0.43, "learning_rate": 1.2751050975824124e-05, "loss": 0.7656, "step": 3597 }, { "epoch": 0.43, "learning_rate": 1.2747337046760227e-05, "loss": 0.7567, "step": 3598 }, { "epoch": 0.43, "learning_rate": 1.2743622707765919e-05, "loss": 0.7679, "step": 3599 }, { "epoch": 0.43, "learning_rate": 1.2739907959395414e-05, "loss": 0.8175, "step": 3600 }, { "epoch": 0.43, "learning_rate": 1.2736192802202995e-05, "loss": 0.7879, "step": 3601 }, { "epoch": 0.43, "learning_rate": 1.2732477236743001e-05, "loss": 0.8304, "step": 3602 }, { "epoch": 0.43, "learning_rate": 1.2728761263569828e-05, "loss": 0.8761, "step": 3603 }, { "epoch": 0.43, "learning_rate": 1.272504488323794e-05, "loss": 0.7935, "step": 3604 }, { "epoch": 0.43, "learning_rate": 1.2721328096301852e-05, "loss": 0.7706, "step": 3605 }, { "epoch": 0.43, "learning_rate": 1.2717610903316158e-05, "loss": 0.7974, "step": 3606 }, { "epoch": 0.43, "learning_rate": 1.2713893304835487e-05, "loss": 0.7573, "step": 3607 }, { "epoch": 0.43, "learning_rate": 1.2710175301414554e-05, "loss": 0.7221, "step": 3608 }, { "epoch": 0.43, "learning_rate": 1.2706456893608115e-05, "loss": 0.7896, "step": 3609 }, { "epoch": 0.43, "learning_rate": 1.2702738081970995e-05, "loss": 0.832, "step": 3610 }, { "epoch": 0.43, "learning_rate": 1.269901886705808e-05, "loss": 0.7589, "step": 3611 }, { "epoch": 0.43, "learning_rate": 1.2695299249424317e-05, "loss": 0.7238, "step": 3612 }, { "epoch": 0.43, "learning_rate": 1.2691579229624704e-05, "loss": 0.7126, "step": 3613 }, { "epoch": 0.43, "learning_rate": 1.2687858808214313e-05, "loss": 0.7946, "step": 3614 }, { "epoch": 0.43, "learning_rate": 1.2684137985748264e-05, "loss": 0.7372, "step": 3615 }, { "epoch": 0.43, "learning_rate": 1.2680416762781738e-05, "loss": 0.8158, "step": 3616 }, { "epoch": 0.43, "learning_rate": 1.2676695139869986e-05, "loss": 0.7634, "step": 3617 }, { "epoch": 0.43, "learning_rate": 1.2672973117568309e-05, "loss": 0.7718, "step": 3618 }, { "epoch": 0.43, "learning_rate": 1.2669250696432067e-05, "loss": 0.7645, "step": 3619 }, { "epoch": 0.43, "learning_rate": 1.2665527877016685e-05, "loss": 0.769, "step": 3620 }, { "epoch": 0.43, "learning_rate": 1.266180465987765e-05, "loss": 0.7232, "step": 3621 }, { "epoch": 0.43, "learning_rate": 1.2658081045570498e-05, "loss": 0.7684, "step": 3622 }, { "epoch": 0.43, "learning_rate": 1.2654357034650828e-05, "loss": 0.7829, "step": 3623 }, { "epoch": 0.43, "learning_rate": 1.2650632627674305e-05, "loss": 0.7656, "step": 3624 }, { "epoch": 0.43, "learning_rate": 1.2646907825196648e-05, "loss": 0.7963, "step": 3625 }, { "epoch": 0.43, "learning_rate": 1.2643182627773634e-05, "loss": 0.8025, "step": 3626 }, { "epoch": 0.43, "learning_rate": 1.2639457035961098e-05, "loss": 0.8309, "step": 3627 }, { "epoch": 0.43, "learning_rate": 1.2635731050314934e-05, "loss": 0.8432, "step": 3628 }, { "epoch": 0.43, "learning_rate": 1.2632004671391106e-05, "loss": 0.798, "step": 3629 }, { "epoch": 0.43, "learning_rate": 1.2628277899745616e-05, "loss": 0.7271, "step": 3630 }, { "epoch": 0.43, "learning_rate": 1.2624550735934542e-05, "loss": 0.8047, "step": 3631 }, { "epoch": 0.43, "learning_rate": 1.2620823180514016e-05, "loss": 0.7377, "step": 3632 }, { "epoch": 0.43, "learning_rate": 1.2617095234040224e-05, "loss": 0.8186, "step": 3633 }, { "epoch": 0.43, "learning_rate": 1.2613366897069415e-05, "loss": 0.8471, "step": 3634 }, { "epoch": 0.43, "learning_rate": 1.2609638170157892e-05, "loss": 0.7617, "step": 3635 }, { "epoch": 0.43, "learning_rate": 1.2605909053862017e-05, "loss": 0.798, "step": 3636 }, { "epoch": 0.43, "learning_rate": 1.2602179548738218e-05, "loss": 0.7349, "step": 3637 }, { "epoch": 0.43, "learning_rate": 1.2598449655342973e-05, "loss": 0.7835, "step": 3638 }, { "epoch": 0.43, "learning_rate": 1.2594719374232816e-05, "loss": 0.8097, "step": 3639 }, { "epoch": 0.43, "learning_rate": 1.2590988705964347e-05, "loss": 0.8158, "step": 3640 }, { "epoch": 0.43, "learning_rate": 1.2587257651094214e-05, "loss": 0.7974, "step": 3641 }, { "epoch": 0.43, "learning_rate": 1.2583526210179135e-05, "loss": 0.8259, "step": 3642 }, { "epoch": 0.43, "learning_rate": 1.2579794383775871e-05, "loss": 0.8371, "step": 3643 }, { "epoch": 0.43, "learning_rate": 1.2576062172441255e-05, "loss": 0.7383, "step": 3644 }, { "epoch": 0.43, "learning_rate": 1.2572329576732165e-05, "loss": 0.7037, "step": 3645 }, { "epoch": 0.43, "learning_rate": 1.2568596597205549e-05, "loss": 0.798, "step": 3646 }, { "epoch": 0.43, "learning_rate": 1.2564863234418399e-05, "loss": 0.7924, "step": 3647 }, { "epoch": 0.44, "learning_rate": 1.256112948892777e-05, "loss": 0.827, "step": 3648 }, { "epoch": 0.44, "learning_rate": 1.2557395361290781e-05, "loss": 0.745, "step": 3649 }, { "epoch": 0.44, "learning_rate": 1.2553660852064593e-05, "loss": 0.7974, "step": 3650 }, { "epoch": 0.44, "learning_rate": 1.2549925961806437e-05, "loss": 0.7868, "step": 3651 }, { "epoch": 0.44, "learning_rate": 1.2546190691073598e-05, "loss": 0.7824, "step": 3652 }, { "epoch": 0.44, "learning_rate": 1.2542455040423413e-05, "loss": 0.7511, "step": 3653 }, { "epoch": 0.44, "learning_rate": 1.2538719010413284e-05, "loss": 0.7969, "step": 3654 }, { "epoch": 0.44, "learning_rate": 1.2534982601600657e-05, "loss": 0.7807, "step": 3655 }, { "epoch": 0.44, "learning_rate": 1.2531245814543043e-05, "loss": 0.7388, "step": 3656 }, { "epoch": 0.44, "learning_rate": 1.2527508649798012e-05, "loss": 0.6867, "step": 3657 }, { "epoch": 0.44, "learning_rate": 1.2523771107923188e-05, "loss": 0.7489, "step": 3658 }, { "epoch": 0.44, "learning_rate": 1.2520033189476246e-05, "loss": 0.779, "step": 3659 }, { "epoch": 0.44, "learning_rate": 1.251629489501492e-05, "loss": 0.7606, "step": 3660 }, { "epoch": 0.44, "learning_rate": 1.2512556225097004e-05, "loss": 0.76, "step": 3661 }, { "epoch": 0.44, "learning_rate": 1.2508817180280346e-05, "loss": 0.7483, "step": 3662 }, { "epoch": 0.44, "learning_rate": 1.2505077761122848e-05, "loss": 0.7757, "step": 3663 }, { "epoch": 0.44, "learning_rate": 1.250133796818247e-05, "loss": 0.8153, "step": 3664 }, { "epoch": 0.44, "learning_rate": 1.2497597802017224e-05, "loss": 0.7779, "step": 3665 }, { "epoch": 0.44, "learning_rate": 1.2493857263185185e-05, "loss": 0.7779, "step": 3666 }, { "epoch": 0.44, "learning_rate": 1.2490116352244475e-05, "loss": 0.7561, "step": 3667 }, { "epoch": 0.44, "learning_rate": 1.2486375069753276e-05, "loss": 0.774, "step": 3668 }, { "epoch": 0.44, "learning_rate": 1.2482633416269829e-05, "loss": 0.716, "step": 3669 }, { "epoch": 0.44, "learning_rate": 1.2478891392352424e-05, "loss": 0.7757, "step": 3670 }, { "epoch": 0.44, "learning_rate": 1.2475148998559408e-05, "loss": 0.7712, "step": 3671 }, { "epoch": 0.44, "learning_rate": 1.2471406235449185e-05, "loss": 0.7193, "step": 3672 }, { "epoch": 0.44, "learning_rate": 1.246766310358021e-05, "loss": 0.7667, "step": 3673 }, { "epoch": 0.44, "learning_rate": 1.2463919603511002e-05, "loss": 0.8225, "step": 3674 }, { "epoch": 0.44, "learning_rate": 1.2460175735800125e-05, "loss": 0.7612, "step": 3675 }, { "epoch": 0.44, "learning_rate": 1.2456431501006198e-05, "loss": 0.8242, "step": 3676 }, { "epoch": 0.44, "learning_rate": 1.2452686899687909e-05, "loss": 0.7846, "step": 3677 }, { "epoch": 0.44, "learning_rate": 1.2448941932403981e-05, "loss": 0.8298, "step": 3678 }, { "epoch": 0.44, "learning_rate": 1.2445196599713208e-05, "loss": 0.7907, "step": 3679 }, { "epoch": 0.44, "learning_rate": 1.2441450902174424e-05, "loss": 0.8019, "step": 3680 }, { "epoch": 0.44, "learning_rate": 1.2437704840346527e-05, "loss": 0.7093, "step": 3681 }, { "epoch": 0.44, "learning_rate": 1.2433958414788473e-05, "loss": 0.7355, "step": 3682 }, { "epoch": 0.44, "learning_rate": 1.2430211626059261e-05, "loss": 0.7467, "step": 3683 }, { "epoch": 0.44, "learning_rate": 1.2426464474717954e-05, "loss": 0.803, "step": 3684 }, { "epoch": 0.44, "learning_rate": 1.2422716961323656e-05, "loss": 0.8181, "step": 3685 }, { "epoch": 0.44, "learning_rate": 1.2418969086435541e-05, "loss": 0.8343, "step": 3686 }, { "epoch": 0.44, "learning_rate": 1.241522085061283e-05, "loss": 0.7852, "step": 3687 }, { "epoch": 0.44, "learning_rate": 1.2411472254414795e-05, "loss": 0.817, "step": 3688 }, { "epoch": 0.44, "learning_rate": 1.2407723298400767e-05, "loss": 0.8025, "step": 3689 }, { "epoch": 0.44, "learning_rate": 1.2403973983130127e-05, "loss": 0.8376, "step": 3690 }, { "epoch": 0.44, "learning_rate": 1.2400224309162305e-05, "loss": 0.8025, "step": 3691 }, { "epoch": 0.44, "learning_rate": 1.23964742770568e-05, "loss": 0.8315, "step": 3692 }, { "epoch": 0.44, "learning_rate": 1.2392723887373148e-05, "loss": 0.7511, "step": 3693 }, { "epoch": 0.44, "learning_rate": 1.2388973140670948e-05, "loss": 0.8164, "step": 3694 }, { "epoch": 0.44, "learning_rate": 1.2385222037509848e-05, "loss": 0.7746, "step": 3695 }, { "epoch": 0.44, "learning_rate": 1.238147057844955e-05, "loss": 0.8287, "step": 3696 }, { "epoch": 0.44, "learning_rate": 1.2377718764049811e-05, "loss": 0.7511, "step": 3697 }, { "epoch": 0.44, "learning_rate": 1.2373966594870437e-05, "loss": 0.7824, "step": 3698 }, { "epoch": 0.44, "learning_rate": 1.2370214071471294e-05, "loss": 0.6786, "step": 3699 }, { "epoch": 0.44, "learning_rate": 1.2366461194412292e-05, "loss": 0.803, "step": 3700 }, { "epoch": 0.44, "learning_rate": 1.2362707964253398e-05, "loss": 0.7494, "step": 3701 }, { "epoch": 0.44, "learning_rate": 1.2358954381554635e-05, "loss": 0.817, "step": 3702 }, { "epoch": 0.44, "learning_rate": 1.2355200446876077e-05, "loss": 0.8047, "step": 3703 }, { "epoch": 0.44, "learning_rate": 1.235144616077784e-05, "loss": 0.7874, "step": 3704 }, { "epoch": 0.44, "learning_rate": 1.2347691523820112e-05, "loss": 0.7991, "step": 3705 }, { "epoch": 0.44, "learning_rate": 1.2343936536563114e-05, "loss": 0.8348, "step": 3706 }, { "epoch": 0.44, "learning_rate": 1.2340181199567136e-05, "loss": 0.7751, "step": 3707 }, { "epoch": 0.44, "learning_rate": 1.2336425513392505e-05, "loss": 0.7573, "step": 3708 }, { "epoch": 0.44, "learning_rate": 1.2332669478599612e-05, "loss": 0.7506, "step": 3709 }, { "epoch": 0.44, "learning_rate": 1.2328913095748896e-05, "loss": 0.7427, "step": 3710 }, { "epoch": 0.44, "learning_rate": 1.2325156365400842e-05, "loss": 0.7852, "step": 3711 }, { "epoch": 0.44, "learning_rate": 1.2321399288115995e-05, "loss": 0.7958, "step": 3712 }, { "epoch": 0.44, "learning_rate": 1.2317641864454947e-05, "loss": 0.803, "step": 3713 }, { "epoch": 0.44, "learning_rate": 1.2313884094978349e-05, "loss": 0.7589, "step": 3714 }, { "epoch": 0.44, "learning_rate": 1.2310125980246894e-05, "loss": 0.8499, "step": 3715 }, { "epoch": 0.44, "learning_rate": 1.230636752082133e-05, "loss": 0.8158, "step": 3716 }, { "epoch": 0.44, "learning_rate": 1.2302608717262458e-05, "loss": 0.774, "step": 3717 }, { "epoch": 0.44, "learning_rate": 1.2298849570131128e-05, "loss": 0.7729, "step": 3718 }, { "epoch": 0.44, "learning_rate": 1.2295090079988245e-05, "loss": 0.7506, "step": 3719 }, { "epoch": 0.44, "learning_rate": 1.2291330247394765e-05, "loss": 0.808, "step": 3720 }, { "epoch": 0.44, "learning_rate": 1.228757007291169e-05, "loss": 0.7952, "step": 3721 }, { "epoch": 0.44, "learning_rate": 1.2283809557100077e-05, "loss": 0.7807, "step": 3722 }, { "epoch": 0.44, "learning_rate": 1.2280048700521027e-05, "loss": 0.7874, "step": 3723 }, { "epoch": 0.44, "learning_rate": 1.2276287503735707e-05, "loss": 0.8917, "step": 3724 }, { "epoch": 0.44, "learning_rate": 1.227252596730532e-05, "loss": 0.7835, "step": 3725 }, { "epoch": 0.44, "learning_rate": 1.2268764091791126e-05, "loss": 0.7818, "step": 3726 }, { "epoch": 0.44, "learning_rate": 1.2265001877754437e-05, "loss": 0.7617, "step": 3727 }, { "epoch": 0.44, "learning_rate": 1.226123932575661e-05, "loss": 0.769, "step": 3728 }, { "epoch": 0.44, "learning_rate": 1.2257476436359057e-05, "loss": 0.7556, "step": 3729 }, { "epoch": 0.44, "learning_rate": 1.2253713210123241e-05, "loss": 0.764, "step": 3730 }, { "epoch": 0.44, "learning_rate": 1.224994964761067e-05, "loss": 0.8806, "step": 3731 }, { "epoch": 0.45, "learning_rate": 1.2246185749382908e-05, "loss": 0.7946, "step": 3732 }, { "epoch": 0.45, "learning_rate": 1.2242421516001566e-05, "loss": 0.7271, "step": 3733 }, { "epoch": 0.45, "learning_rate": 1.2238656948028304e-05, "loss": 0.8281, "step": 3734 }, { "epoch": 0.45, "learning_rate": 1.2234892046024838e-05, "loss": 0.8209, "step": 3735 }, { "epoch": 0.45, "learning_rate": 1.2231126810552924e-05, "loss": 0.7835, "step": 3736 }, { "epoch": 0.45, "learning_rate": 1.2227361242174376e-05, "loss": 0.7785, "step": 3737 }, { "epoch": 0.45, "learning_rate": 1.2223595341451054e-05, "loss": 0.7427, "step": 3738 }, { "epoch": 0.45, "learning_rate": 1.2219829108944867e-05, "loss": 0.7204, "step": 3739 }, { "epoch": 0.45, "learning_rate": 1.2216062545217779e-05, "loss": 0.7935, "step": 3740 }, { "epoch": 0.45, "learning_rate": 1.2212295650831798e-05, "loss": 0.7946, "step": 3741 }, { "epoch": 0.45, "learning_rate": 1.2208528426348982e-05, "loss": 0.7204, "step": 3742 }, { "epoch": 0.45, "learning_rate": 1.2204760872331434e-05, "loss": 0.76, "step": 3743 }, { "epoch": 0.45, "learning_rate": 1.2200992989341317e-05, "loss": 0.7673, "step": 3744 }, { "epoch": 0.45, "learning_rate": 1.2197224777940837e-05, "loss": 0.793, "step": 3745 }, { "epoch": 0.45, "learning_rate": 1.2193456238692249e-05, "loss": 0.7891, "step": 3746 }, { "epoch": 0.45, "learning_rate": 1.2189687372157855e-05, "loss": 0.7801, "step": 3747 }, { "epoch": 0.45, "learning_rate": 1.2185918178900007e-05, "loss": 0.7528, "step": 3748 }, { "epoch": 0.45, "learning_rate": 1.2182148659481107e-05, "loss": 0.8147, "step": 3749 }, { "epoch": 0.45, "learning_rate": 1.2178378814463612e-05, "loss": 0.7121, "step": 3750 }, { "epoch": 0.45, "learning_rate": 1.217460864441001e-05, "loss": 0.7746, "step": 3751 }, { "epoch": 0.45, "learning_rate": 1.2170838149882857e-05, "loss": 0.8025, "step": 3752 }, { "epoch": 0.45, "learning_rate": 1.2167067331444748e-05, "loss": 0.7773, "step": 3753 }, { "epoch": 0.45, "learning_rate": 1.2163296189658322e-05, "loss": 0.8214, "step": 3754 }, { "epoch": 0.45, "learning_rate": 1.2159524725086278e-05, "loss": 0.7377, "step": 3755 }, { "epoch": 0.45, "learning_rate": 1.215575293829135e-05, "loss": 0.7455, "step": 3756 }, { "epoch": 0.45, "learning_rate": 1.2151980829836332e-05, "loss": 0.8622, "step": 3757 }, { "epoch": 0.45, "learning_rate": 1.2148208400284056e-05, "loss": 0.731, "step": 3758 }, { "epoch": 0.45, "learning_rate": 1.214443565019741e-05, "loss": 0.808, "step": 3759 }, { "epoch": 0.45, "learning_rate": 1.2140662580139327e-05, "loss": 0.7785, "step": 3760 }, { "epoch": 0.45, "learning_rate": 1.2136889190672782e-05, "loss": 0.8214, "step": 3761 }, { "epoch": 0.45, "learning_rate": 1.2133115482360811e-05, "loss": 0.7723, "step": 3762 }, { "epoch": 0.45, "learning_rate": 1.2129341455766479e-05, "loss": 0.8331, "step": 3763 }, { "epoch": 0.45, "learning_rate": 1.2125567111452918e-05, "loss": 0.7321, "step": 3764 }, { "epoch": 0.45, "learning_rate": 1.2121792449983293e-05, "loss": 0.8281, "step": 3765 }, { "epoch": 0.45, "learning_rate": 1.2118017471920827e-05, "loss": 0.7612, "step": 3766 }, { "epoch": 0.45, "learning_rate": 1.2114242177828782e-05, "loss": 0.784, "step": 3767 }, { "epoch": 0.45, "learning_rate": 1.2110466568270463e-05, "loss": 0.7316, "step": 3768 }, { "epoch": 0.45, "learning_rate": 1.2106690643809238e-05, "loss": 0.827, "step": 3769 }, { "epoch": 0.45, "learning_rate": 1.210291440500851e-05, "loss": 0.7807, "step": 3770 }, { "epoch": 0.45, "learning_rate": 1.2099137852431732e-05, "loss": 0.7539, "step": 3771 }, { "epoch": 0.45, "learning_rate": 1.2095360986642408e-05, "loss": 0.803, "step": 3772 }, { "epoch": 0.45, "learning_rate": 1.2091583808204074e-05, "loss": 0.7628, "step": 3773 }, { "epoch": 0.45, "learning_rate": 1.2087806317680333e-05, "loss": 0.7617, "step": 3774 }, { "epoch": 0.45, "learning_rate": 1.208402851563482e-05, "loss": 0.7963, "step": 3775 }, { "epoch": 0.45, "learning_rate": 1.2080250402631225e-05, "loss": 0.7701, "step": 3776 }, { "epoch": 0.45, "learning_rate": 1.2076471979233275e-05, "loss": 0.8175, "step": 3777 }, { "epoch": 0.45, "learning_rate": 1.2072693246004754e-05, "loss": 0.7879, "step": 3778 }, { "epoch": 0.45, "learning_rate": 1.2068914203509483e-05, "loss": 0.75, "step": 3779 }, { "epoch": 0.45, "learning_rate": 1.2065134852311337e-05, "loss": 0.8376, "step": 3780 }, { "epoch": 0.45, "learning_rate": 1.2061355192974229e-05, "loss": 0.8052, "step": 3781 }, { "epoch": 0.45, "learning_rate": 1.2057575226062127e-05, "loss": 0.7773, "step": 3782 }, { "epoch": 0.45, "learning_rate": 1.205379495213904e-05, "loss": 0.7907, "step": 3783 }, { "epoch": 0.45, "learning_rate": 1.2050014371769018e-05, "loss": 0.7846, "step": 3784 }, { "epoch": 0.45, "learning_rate": 1.2046233485516169e-05, "loss": 0.7874, "step": 3785 }, { "epoch": 0.45, "learning_rate": 1.2042452293944631e-05, "loss": 0.716, "step": 3786 }, { "epoch": 0.45, "learning_rate": 1.2038670797618602e-05, "loss": 0.7874, "step": 3787 }, { "epoch": 0.45, "learning_rate": 1.2034888997102316e-05, "loss": 0.7489, "step": 3788 }, { "epoch": 0.45, "learning_rate": 1.2031106892960058e-05, "loss": 0.7879, "step": 3789 }, { "epoch": 0.45, "learning_rate": 1.2027324485756158e-05, "loss": 0.7533, "step": 3790 }, { "epoch": 0.45, "learning_rate": 1.2023541776054986e-05, "loss": 0.7617, "step": 3791 }, { "epoch": 0.45, "learning_rate": 1.2019758764420961e-05, "loss": 0.7941, "step": 3792 }, { "epoch": 0.45, "learning_rate": 1.2015975451418547e-05, "loss": 0.7734, "step": 3793 }, { "epoch": 0.45, "learning_rate": 1.201219183761225e-05, "loss": 0.7522, "step": 3794 }, { "epoch": 0.45, "learning_rate": 1.2008407923566629e-05, "loss": 0.7506, "step": 3795 }, { "epoch": 0.45, "learning_rate": 1.2004623709846275e-05, "loss": 0.7673, "step": 3796 }, { "epoch": 0.45, "learning_rate": 1.2000839197015839e-05, "loss": 0.7969, "step": 3797 }, { "epoch": 0.45, "learning_rate": 1.1997054385640003e-05, "loss": 0.7249, "step": 3798 }, { "epoch": 0.45, "learning_rate": 1.1993269276283498e-05, "loss": 0.851, "step": 3799 }, { "epoch": 0.45, "learning_rate": 1.1989483869511107e-05, "loss": 0.7969, "step": 3800 }, { "epoch": 0.45, "learning_rate": 1.1985698165887643e-05, "loss": 0.7679, "step": 3801 }, { "epoch": 0.45, "learning_rate": 1.1981912165977975e-05, "loss": 0.7617, "step": 3802 }, { "epoch": 0.45, "learning_rate": 1.1978125870347017e-05, "loss": 0.7662, "step": 3803 }, { "epoch": 0.45, "learning_rate": 1.1974339279559712e-05, "loss": 0.7606, "step": 3804 }, { "epoch": 0.45, "learning_rate": 1.1970552394181065e-05, "loss": 0.7461, "step": 3805 }, { "epoch": 0.45, "learning_rate": 1.1966765214776117e-05, "loss": 0.7098, "step": 3806 }, { "epoch": 0.45, "learning_rate": 1.1962977741909949e-05, "loss": 0.8036, "step": 3807 }, { "epoch": 0.45, "learning_rate": 1.1959189976147698e-05, "loss": 0.7316, "step": 3808 }, { "epoch": 0.45, "learning_rate": 1.195540191805453e-05, "loss": 0.7545, "step": 3809 }, { "epoch": 0.45, "learning_rate": 1.1951613568195666e-05, "loss": 0.8622, "step": 3810 }, { "epoch": 0.45, "learning_rate": 1.194782492713636e-05, "loss": 0.7656, "step": 3811 }, { "epoch": 0.45, "learning_rate": 1.194403599544192e-05, "loss": 0.7679, "step": 3812 }, { "epoch": 0.45, "learning_rate": 1.1940246773677696e-05, "loss": 0.7349, "step": 3813 }, { "epoch": 0.45, "learning_rate": 1.193645726240907e-05, "loss": 0.7294, "step": 3814 }, { "epoch": 0.45, "learning_rate": 1.193266746220148e-05, "loss": 0.7907, "step": 3815 }, { "epoch": 0.46, "learning_rate": 1.1928877373620404e-05, "loss": 0.7573, "step": 3816 }, { "epoch": 0.46, "learning_rate": 1.1925086997231356e-05, "loss": 0.8237, "step": 3817 }, { "epoch": 0.46, "learning_rate": 1.1921296333599908e-05, "loss": 0.7612, "step": 3818 }, { "epoch": 0.46, "learning_rate": 1.1917505383291652e-05, "loss": 0.7651, "step": 3819 }, { "epoch": 0.46, "learning_rate": 1.1913714146872248e-05, "loss": 0.7874, "step": 3820 }, { "epoch": 0.46, "learning_rate": 1.1909922624907379e-05, "loss": 0.755, "step": 3821 }, { "epoch": 0.46, "learning_rate": 1.1906130817962785e-05, "loss": 0.8504, "step": 3822 }, { "epoch": 0.46, "learning_rate": 1.1902338726604237e-05, "loss": 0.8008, "step": 3823 }, { "epoch": 0.46, "learning_rate": 1.1898546351397551e-05, "loss": 0.8013, "step": 3824 }, { "epoch": 0.46, "learning_rate": 1.1894753692908594e-05, "loss": 0.7768, "step": 3825 }, { "epoch": 0.46, "learning_rate": 1.1890960751703264e-05, "loss": 0.8298, "step": 3826 }, { "epoch": 0.46, "learning_rate": 1.1887167528347507e-05, "loss": 0.8622, "step": 3827 }, { "epoch": 0.46, "learning_rate": 1.1883374023407314e-05, "loss": 0.7506, "step": 3828 }, { "epoch": 0.46, "learning_rate": 1.1879580237448713e-05, "loss": 0.7455, "step": 3829 }, { "epoch": 0.46, "learning_rate": 1.1875786171037772e-05, "loss": 0.7974, "step": 3830 }, { "epoch": 0.46, "learning_rate": 1.1871991824740605e-05, "loss": 0.7634, "step": 3831 }, { "epoch": 0.46, "learning_rate": 1.1868197199123366e-05, "loss": 0.7204, "step": 3832 }, { "epoch": 0.46, "learning_rate": 1.1864402294752255e-05, "loss": 0.7204, "step": 3833 }, { "epoch": 0.46, "learning_rate": 1.1860607112193509e-05, "loss": 0.832, "step": 3834 }, { "epoch": 0.46, "learning_rate": 1.1856811652013404e-05, "loss": 0.7824, "step": 3835 }, { "epoch": 0.46, "learning_rate": 1.1853015914778264e-05, "loss": 0.7556, "step": 3836 }, { "epoch": 0.46, "learning_rate": 1.1849219901054449e-05, "loss": 0.7249, "step": 3837 }, { "epoch": 0.46, "learning_rate": 1.1845423611408366e-05, "loss": 0.7779, "step": 3838 }, { "epoch": 0.46, "learning_rate": 1.184162704640646e-05, "loss": 0.7182, "step": 3839 }, { "epoch": 0.46, "learning_rate": 1.1837830206615211e-05, "loss": 0.6925, "step": 3840 }, { "epoch": 0.46, "learning_rate": 1.1834033092601151e-05, "loss": 0.8538, "step": 3841 }, { "epoch": 0.46, "learning_rate": 1.1830235704930846e-05, "loss": 0.846, "step": 3842 }, { "epoch": 0.46, "learning_rate": 1.1826438044170908e-05, "loss": 0.8125, "step": 3843 }, { "epoch": 0.46, "learning_rate": 1.1822640110887977e-05, "loss": 0.7773, "step": 3844 }, { "epoch": 0.46, "learning_rate": 1.1818841905648752e-05, "loss": 0.7824, "step": 3845 }, { "epoch": 0.46, "learning_rate": 1.181504342901996e-05, "loss": 0.8354, "step": 3846 }, { "epoch": 0.46, "learning_rate": 1.1811244681568376e-05, "loss": 0.7679, "step": 3847 }, { "epoch": 0.46, "learning_rate": 1.1807445663860807e-05, "loss": 0.7612, "step": 3848 }, { "epoch": 0.46, "learning_rate": 1.1803646376464104e-05, "loss": 0.7762, "step": 3849 }, { "epoch": 0.46, "learning_rate": 1.1799846819945161e-05, "loss": 0.8438, "step": 3850 }, { "epoch": 0.46, "learning_rate": 1.1796046994870911e-05, "loss": 0.8052, "step": 3851 }, { "epoch": 0.46, "learning_rate": 1.1792246901808325e-05, "loss": 0.7768, "step": 3852 }, { "epoch": 0.46, "learning_rate": 1.1788446541324414e-05, "loss": 0.8343, "step": 3853 }, { "epoch": 0.46, "learning_rate": 1.1784645913986235e-05, "loss": 0.7824, "step": 3854 }, { "epoch": 0.46, "learning_rate": 1.1780845020360875e-05, "loss": 0.7913, "step": 3855 }, { "epoch": 0.46, "learning_rate": 1.1777043861015467e-05, "loss": 0.7891, "step": 3856 }, { "epoch": 0.46, "learning_rate": 1.1773242436517183e-05, "loss": 0.798, "step": 3857 }, { "epoch": 0.46, "learning_rate": 1.1769440747433234e-05, "loss": 0.7807, "step": 3858 }, { "epoch": 0.46, "learning_rate": 1.176563879433087e-05, "loss": 0.7645, "step": 3859 }, { "epoch": 0.46, "learning_rate": 1.1761836577777382e-05, "loss": 0.7969, "step": 3860 }, { "epoch": 0.46, "learning_rate": 1.1758034098340096e-05, "loss": 0.7718, "step": 3861 }, { "epoch": 0.46, "learning_rate": 1.1754231356586381e-05, "loss": 0.7907, "step": 3862 }, { "epoch": 0.46, "learning_rate": 1.1750428353083648e-05, "loss": 0.8097, "step": 3863 }, { "epoch": 0.46, "learning_rate": 1.1746625088399339e-05, "loss": 0.7104, "step": 3864 }, { "epoch": 0.46, "learning_rate": 1.1742821563100943e-05, "loss": 0.808, "step": 3865 }, { "epoch": 0.46, "learning_rate": 1.1739017777755983e-05, "loss": 0.8393, "step": 3866 }, { "epoch": 0.46, "learning_rate": 1.173521373293202e-05, "loss": 0.798, "step": 3867 }, { "epoch": 0.46, "learning_rate": 1.173140942919666e-05, "loss": 0.76, "step": 3868 }, { "epoch": 0.46, "learning_rate": 1.1727604867117542e-05, "loss": 0.7511, "step": 3869 }, { "epoch": 0.46, "learning_rate": 1.1723800047262344e-05, "loss": 0.8008, "step": 3870 }, { "epoch": 0.46, "learning_rate": 1.171999497019878e-05, "loss": 0.8175, "step": 3871 }, { "epoch": 0.46, "learning_rate": 1.1716189636494615e-05, "loss": 0.8622, "step": 3872 }, { "epoch": 0.46, "learning_rate": 1.1712384046717637e-05, "loss": 0.7796, "step": 3873 }, { "epoch": 0.46, "learning_rate": 1.1708578201435677e-05, "loss": 0.8186, "step": 3874 }, { "epoch": 0.46, "learning_rate": 1.170477210121661e-05, "loss": 0.7818, "step": 3875 }, { "epoch": 0.46, "learning_rate": 1.1700965746628343e-05, "loss": 0.7852, "step": 3876 }, { "epoch": 0.46, "learning_rate": 1.1697159138238821e-05, "loss": 0.731, "step": 3877 }, { "epoch": 0.46, "learning_rate": 1.1693352276616028e-05, "loss": 0.7896, "step": 3878 }, { "epoch": 0.46, "learning_rate": 1.1689545162327991e-05, "loss": 0.7863, "step": 3879 }, { "epoch": 0.46, "learning_rate": 1.1685737795942766e-05, "loss": 0.7773, "step": 3880 }, { "epoch": 0.46, "learning_rate": 1.168193017802845e-05, "loss": 0.7723, "step": 3881 }, { "epoch": 0.46, "learning_rate": 1.1678122309153178e-05, "loss": 0.7182, "step": 3882 }, { "epoch": 0.46, "learning_rate": 1.1674314189885123e-05, "loss": 0.793, "step": 3883 }, { "epoch": 0.46, "learning_rate": 1.1670505820792497e-05, "loss": 0.7623, "step": 3884 }, { "epoch": 0.46, "learning_rate": 1.1666697202443547e-05, "loss": 0.8532, "step": 3885 }, { "epoch": 0.46, "learning_rate": 1.1662888335406553e-05, "loss": 0.7525, "step": 3886 }, { "epoch": 0.46, "learning_rate": 1.1659079220249838e-05, "loss": 0.7924, "step": 3887 }, { "epoch": 0.46, "learning_rate": 1.1655269857541765e-05, "loss": 0.7874, "step": 3888 }, { "epoch": 0.46, "learning_rate": 1.1651460247850723e-05, "loss": 0.8025, "step": 3889 }, { "epoch": 0.46, "learning_rate": 1.1647650391745149e-05, "loss": 0.7829, "step": 3890 }, { "epoch": 0.46, "learning_rate": 1.1643840289793508e-05, "loss": 0.7388, "step": 3891 }, { "epoch": 0.46, "learning_rate": 1.1640029942564308e-05, "loss": 0.7394, "step": 3892 }, { "epoch": 0.46, "learning_rate": 1.1636219350626094e-05, "loss": 0.7785, "step": 3893 }, { "epoch": 0.46, "learning_rate": 1.1632408514547437e-05, "loss": 0.7612, "step": 3894 }, { "epoch": 0.46, "learning_rate": 1.162859743489696e-05, "loss": 0.7327, "step": 3895 }, { "epoch": 0.46, "learning_rate": 1.1624786112243312e-05, "loss": 0.8493, "step": 3896 }, { "epoch": 0.46, "learning_rate": 1.162097454715518e-05, "loss": 0.7567, "step": 3897 }, { "epoch": 0.46, "learning_rate": 1.1617162740201287e-05, "loss": 0.7606, "step": 3898 }, { "epoch": 0.46, "learning_rate": 1.1613350691950394e-05, "loss": 0.7807, "step": 3899 }, { "epoch": 0.47, "learning_rate": 1.1609538402971297e-05, "loss": 0.8019, "step": 3900 }, { "epoch": 0.47, "learning_rate": 1.1605725873832829e-05, "loss": 0.7751, "step": 3901 }, { "epoch": 0.47, "learning_rate": 1.1601913105103857e-05, "loss": 0.8036, "step": 3902 }, { "epoch": 0.47, "learning_rate": 1.1598100097353286e-05, "loss": 0.7584, "step": 3903 }, { "epoch": 0.47, "learning_rate": 1.1594286851150054e-05, "loss": 0.7673, "step": 3904 }, { "epoch": 0.47, "learning_rate": 1.1590473367063133e-05, "loss": 0.7835, "step": 3905 }, { "epoch": 0.47, "learning_rate": 1.158665964566154e-05, "loss": 0.7941, "step": 3906 }, { "epoch": 0.47, "learning_rate": 1.1582845687514312e-05, "loss": 0.7913, "step": 3907 }, { "epoch": 0.47, "learning_rate": 1.157903149319054e-05, "loss": 0.7913, "step": 3908 }, { "epoch": 0.47, "learning_rate": 1.1575217063259331e-05, "loss": 0.8164, "step": 3909 }, { "epoch": 0.47, "learning_rate": 1.1571402398289843e-05, "loss": 0.7868, "step": 3910 }, { "epoch": 0.47, "learning_rate": 1.156758749885126e-05, "loss": 0.7589, "step": 3911 }, { "epoch": 0.47, "learning_rate": 1.1563772365512802e-05, "loss": 0.7751, "step": 3912 }, { "epoch": 0.47, "learning_rate": 1.155995699884373e-05, "loss": 0.7734, "step": 3913 }, { "epoch": 0.47, "learning_rate": 1.1556141399413328e-05, "loss": 0.8153, "step": 3914 }, { "epoch": 0.47, "learning_rate": 1.1552325567790928e-05, "loss": 0.8119, "step": 3915 }, { "epoch": 0.47, "learning_rate": 1.1548509504545891e-05, "loss": 0.7695, "step": 3916 }, { "epoch": 0.47, "learning_rate": 1.1544693210247608e-05, "loss": 0.8198, "step": 3917 }, { "epoch": 0.47, "learning_rate": 1.154087668546551e-05, "loss": 0.8136, "step": 3918 }, { "epoch": 0.47, "learning_rate": 1.153705993076906e-05, "loss": 0.7249, "step": 3919 }, { "epoch": 0.47, "learning_rate": 1.1533242946727758e-05, "loss": 0.7667, "step": 3920 }, { "epoch": 0.47, "learning_rate": 1.152942573391114e-05, "loss": 0.7467, "step": 3921 }, { "epoch": 0.47, "learning_rate": 1.1525608292888767e-05, "loss": 0.8583, "step": 3922 }, { "epoch": 0.47, "learning_rate": 1.1521790624230242e-05, "loss": 0.7746, "step": 3923 }, { "epoch": 0.47, "learning_rate": 1.1517972728505198e-05, "loss": 0.6903, "step": 3924 }, { "epoch": 0.47, "learning_rate": 1.1514154606283305e-05, "loss": 0.7935, "step": 3925 }, { "epoch": 0.47, "learning_rate": 1.1510336258134267e-05, "loss": 0.7494, "step": 3926 }, { "epoch": 0.47, "learning_rate": 1.1506517684627816e-05, "loss": 0.803, "step": 3927 }, { "epoch": 0.47, "learning_rate": 1.1502698886333728e-05, "loss": 0.7528, "step": 3928 }, { "epoch": 0.47, "learning_rate": 1.14988798638218e-05, "loss": 0.7539, "step": 3929 }, { "epoch": 0.47, "learning_rate": 1.149506061766187e-05, "loss": 0.7662, "step": 3930 }, { "epoch": 0.47, "learning_rate": 1.1491241148423811e-05, "loss": 0.7383, "step": 3931 }, { "epoch": 0.47, "learning_rate": 1.148742145667752e-05, "loss": 0.7667, "step": 3932 }, { "epoch": 0.47, "learning_rate": 1.1483601542992947e-05, "loss": 0.8304, "step": 3933 }, { "epoch": 0.47, "learning_rate": 1.1479781407940042e-05, "loss": 0.8661, "step": 3934 }, { "epoch": 0.47, "learning_rate": 1.1475961052088826e-05, "loss": 0.7556, "step": 3935 }, { "epoch": 0.47, "learning_rate": 1.1472140476009326e-05, "loss": 0.8432, "step": 3936 }, { "epoch": 0.47, "learning_rate": 1.146831968027161e-05, "loss": 0.7941, "step": 3937 }, { "epoch": 0.47, "learning_rate": 1.146449866544578e-05, "loss": 0.7695, "step": 3938 }, { "epoch": 0.47, "learning_rate": 1.1460677432101971e-05, "loss": 0.7835, "step": 3939 }, { "epoch": 0.47, "learning_rate": 1.1456855980810348e-05, "loss": 0.808, "step": 3940 }, { "epoch": 0.47, "learning_rate": 1.1453034312141116e-05, "loss": 0.6814, "step": 3941 }, { "epoch": 0.47, "learning_rate": 1.1449212426664502e-05, "loss": 0.774, "step": 3942 }, { "epoch": 0.47, "learning_rate": 1.1445390324950766e-05, "loss": 0.7254, "step": 3943 }, { "epoch": 0.47, "learning_rate": 1.144156800757021e-05, "loss": 0.7489, "step": 3944 }, { "epoch": 0.47, "learning_rate": 1.1437745475093159e-05, "loss": 0.7545, "step": 3945 }, { "epoch": 0.47, "learning_rate": 1.1433922728089976e-05, "loss": 0.76, "step": 3946 }, { "epoch": 0.47, "learning_rate": 1.143009976713105e-05, "loss": 0.7416, "step": 3947 }, { "epoch": 0.47, "learning_rate": 1.1426276592786813e-05, "loss": 0.7427, "step": 3948 }, { "epoch": 0.47, "learning_rate": 1.142245320562771e-05, "loss": 0.7902, "step": 3949 }, { "epoch": 0.47, "learning_rate": 1.1418629606224237e-05, "loss": 0.8019, "step": 3950 }, { "epoch": 0.47, "learning_rate": 1.141480579514691e-05, "loss": 0.779, "step": 3951 }, { "epoch": 0.47, "learning_rate": 1.1410981772966283e-05, "loss": 0.7517, "step": 3952 }, { "epoch": 0.47, "learning_rate": 1.1407157540252937e-05, "loss": 0.7651, "step": 3953 }, { "epoch": 0.47, "learning_rate": 1.1403333097577487e-05, "loss": 0.7818, "step": 3954 }, { "epoch": 0.47, "learning_rate": 1.1399508445510577e-05, "loss": 0.7829, "step": 3955 }, { "epoch": 0.47, "learning_rate": 1.1395683584622882e-05, "loss": 0.7813, "step": 3956 }, { "epoch": 0.47, "learning_rate": 1.1391858515485114e-05, "loss": 0.784, "step": 3957 }, { "epoch": 0.47, "learning_rate": 1.1388033238668013e-05, "loss": 0.7483, "step": 3958 }, { "epoch": 0.47, "learning_rate": 1.1384207754742342e-05, "loss": 0.7461, "step": 3959 }, { "epoch": 0.47, "learning_rate": 1.1380382064278907e-05, "loss": 0.7879, "step": 3960 }, { "epoch": 0.47, "learning_rate": 1.137655616784854e-05, "loss": 0.798, "step": 3961 }, { "epoch": 0.47, "learning_rate": 1.1372730066022099e-05, "loss": 0.7667, "step": 3962 }, { "epoch": 0.47, "learning_rate": 1.1368903759370484e-05, "loss": 0.7919, "step": 3963 }, { "epoch": 0.47, "learning_rate": 1.136507724846461e-05, "loss": 0.7952, "step": 3964 }, { "epoch": 0.47, "learning_rate": 1.1361250533875438e-05, "loss": 0.8114, "step": 3965 }, { "epoch": 0.47, "learning_rate": 1.135742361617395e-05, "loss": 0.8209, "step": 3966 }, { "epoch": 0.47, "learning_rate": 1.135359649593116e-05, "loss": 0.7734, "step": 3967 }, { "epoch": 0.47, "learning_rate": 1.1349769173718115e-05, "loss": 0.7567, "step": 3968 }, { "epoch": 0.47, "learning_rate": 1.1345941650105888e-05, "loss": 0.7327, "step": 3969 }, { "epoch": 0.47, "learning_rate": 1.1342113925665584e-05, "loss": 0.7706, "step": 3970 }, { "epoch": 0.47, "learning_rate": 1.133828600096834e-05, "loss": 0.7779, "step": 3971 }, { "epoch": 0.47, "learning_rate": 1.1334457876585316e-05, "loss": 0.8398, "step": 3972 }, { "epoch": 0.47, "learning_rate": 1.1330629553087716e-05, "loss": 0.7405, "step": 3973 }, { "epoch": 0.47, "learning_rate": 1.1326801031046757e-05, "loss": 0.7316, "step": 3974 }, { "epoch": 0.47, "learning_rate": 1.1322972311033695e-05, "loss": 0.7188, "step": 3975 }, { "epoch": 0.47, "learning_rate": 1.1319143393619816e-05, "loss": 0.7411, "step": 3976 }, { "epoch": 0.47, "learning_rate": 1.1315314279376428e-05, "loss": 0.846, "step": 3977 }, { "epoch": 0.47, "learning_rate": 1.1311484968874877e-05, "loss": 0.7857, "step": 3978 }, { "epoch": 0.47, "learning_rate": 1.1307655462686537e-05, "loss": 0.7935, "step": 3979 }, { "epoch": 0.47, "learning_rate": 1.1303825761382805e-05, "loss": 0.8119, "step": 3980 }, { "epoch": 0.47, "learning_rate": 1.1299995865535113e-05, "loss": 0.7879, "step": 3981 }, { "epoch": 0.47, "learning_rate": 1.1296165775714917e-05, "loss": 0.8097, "step": 3982 }, { "epoch": 0.48, "learning_rate": 1.1292335492493712e-05, "loss": 0.784, "step": 3983 }, { "epoch": 0.48, "learning_rate": 1.1288505016443006e-05, "loss": 0.7193, "step": 3984 }, { "epoch": 0.48, "learning_rate": 1.1284674348134352e-05, "loss": 0.7863, "step": 3985 }, { "epoch": 0.48, "learning_rate": 1.128084348813932e-05, "loss": 0.8259, "step": 3986 }, { "epoch": 0.48, "learning_rate": 1.1277012437029516e-05, "loss": 0.8097, "step": 3987 }, { "epoch": 0.48, "learning_rate": 1.1273181195376568e-05, "loss": 0.7422, "step": 3988 }, { "epoch": 0.48, "learning_rate": 1.1269349763752139e-05, "loss": 0.7176, "step": 3989 }, { "epoch": 0.48, "learning_rate": 1.1265518142727916e-05, "loss": 0.7634, "step": 3990 }, { "epoch": 0.48, "learning_rate": 1.1261686332875616e-05, "loss": 0.7193, "step": 3991 }, { "epoch": 0.48, "learning_rate": 1.1257854334766984e-05, "loss": 0.8086, "step": 3992 }, { "epoch": 0.48, "learning_rate": 1.1254022148973791e-05, "loss": 0.7857, "step": 3993 }, { "epoch": 0.48, "learning_rate": 1.1250189776067842e-05, "loss": 0.7751, "step": 3994 }, { "epoch": 0.48, "learning_rate": 1.1246357216620958e-05, "loss": 0.793, "step": 3995 }, { "epoch": 0.48, "learning_rate": 1.1242524471205003e-05, "loss": 0.7282, "step": 3996 }, { "epoch": 0.48, "learning_rate": 1.1238691540391857e-05, "loss": 0.7617, "step": 3997 }, { "epoch": 0.48, "learning_rate": 1.1234858424753436e-05, "loss": 0.74, "step": 3998 }, { "epoch": 0.48, "learning_rate": 1.1231025124861677e-05, "loss": 0.76, "step": 3999 }, { "epoch": 0.48, "learning_rate": 1.1227191641288545e-05, "loss": 0.7494, "step": 4000 }, { "epoch": 0.48, "learning_rate": 1.1223357974606037e-05, "loss": 0.7913, "step": 4001 }, { "epoch": 0.48, "learning_rate": 1.1219524125386173e-05, "loss": 0.7606, "step": 4002 }, { "epoch": 0.48, "learning_rate": 1.1215690094201002e-05, "loss": 0.7684, "step": 4003 }, { "epoch": 0.48, "learning_rate": 1.1211855881622604e-05, "loss": 0.7919, "step": 4004 }, { "epoch": 0.48, "learning_rate": 1.1208021488223081e-05, "loss": 0.7606, "step": 4005 }, { "epoch": 0.48, "learning_rate": 1.1204186914574562e-05, "loss": 0.8008, "step": 4006 }, { "epoch": 0.48, "learning_rate": 1.1200352161249199e-05, "loss": 0.7506, "step": 4007 }, { "epoch": 0.48, "learning_rate": 1.1196517228819183e-05, "loss": 0.7807, "step": 4008 }, { "epoch": 0.48, "learning_rate": 1.1192682117856723e-05, "loss": 0.7215, "step": 4009 }, { "epoch": 0.48, "learning_rate": 1.1188846828934058e-05, "loss": 0.7673, "step": 4010 }, { "epoch": 0.48, "learning_rate": 1.1185011362623448e-05, "loss": 0.8326, "step": 4011 }, { "epoch": 0.48, "learning_rate": 1.118117571949718e-05, "loss": 0.7824, "step": 4012 }, { "epoch": 0.48, "learning_rate": 1.117733990012758e-05, "loss": 0.8181, "step": 4013 }, { "epoch": 0.48, "learning_rate": 1.1173503905086987e-05, "loss": 0.7997, "step": 4014 }, { "epoch": 0.48, "learning_rate": 1.1169667734947766e-05, "loss": 0.7807, "step": 4015 }, { "epoch": 0.48, "learning_rate": 1.1165831390282318e-05, "loss": 0.8203, "step": 4016 }, { "epoch": 0.48, "learning_rate": 1.1161994871663062e-05, "loss": 0.7796, "step": 4017 }, { "epoch": 0.48, "learning_rate": 1.1158158179662443e-05, "loss": 0.7193, "step": 4018 }, { "epoch": 0.48, "learning_rate": 1.1154321314852941e-05, "loss": 0.8387, "step": 4019 }, { "epoch": 0.48, "learning_rate": 1.1150484277807048e-05, "loss": 0.7695, "step": 4020 }, { "epoch": 0.48, "learning_rate": 1.1146647069097292e-05, "loss": 0.8315, "step": 4021 }, { "epoch": 0.48, "learning_rate": 1.114280968929622e-05, "loss": 0.7729, "step": 4022 }, { "epoch": 0.48, "learning_rate": 1.1138972138976412e-05, "loss": 0.7439, "step": 4023 }, { "epoch": 0.48, "learning_rate": 1.1135134418710469e-05, "loss": 0.7913, "step": 4024 }, { "epoch": 0.48, "learning_rate": 1.1131296529071014e-05, "loss": 0.7935, "step": 4025 }, { "epoch": 0.48, "learning_rate": 1.11274584706307e-05, "loss": 0.7958, "step": 4026 }, { "epoch": 0.48, "learning_rate": 1.1123620243962205e-05, "loss": 0.7316, "step": 4027 }, { "epoch": 0.48, "learning_rate": 1.1119781849638232e-05, "loss": 0.7573, "step": 4028 }, { "epoch": 0.48, "learning_rate": 1.1115943288231508e-05, "loss": 0.7427, "step": 4029 }, { "epoch": 0.48, "learning_rate": 1.1112104560314784e-05, "loss": 0.7645, "step": 4030 }, { "epoch": 0.48, "learning_rate": 1.110826566646084e-05, "loss": 0.7746, "step": 4031 }, { "epoch": 0.48, "learning_rate": 1.1104426607242471e-05, "loss": 0.7533, "step": 4032 }, { "epoch": 0.48, "learning_rate": 1.1100587383232506e-05, "loss": 0.7829, "step": 4033 }, { "epoch": 0.48, "learning_rate": 1.1096747995003803e-05, "loss": 0.7712, "step": 4034 }, { "epoch": 0.48, "learning_rate": 1.1092908443129227e-05, "loss": 0.7835, "step": 4035 }, { "epoch": 0.48, "learning_rate": 1.1089068728181686e-05, "loss": 0.8382, "step": 4036 }, { "epoch": 0.48, "learning_rate": 1.10852288507341e-05, "loss": 0.779, "step": 4037 }, { "epoch": 0.48, "learning_rate": 1.1081388811359415e-05, "loss": 0.7684, "step": 4038 }, { "epoch": 0.48, "learning_rate": 1.107754861063061e-05, "loss": 0.75, "step": 4039 }, { "epoch": 0.48, "learning_rate": 1.1073708249120678e-05, "loss": 0.7835, "step": 4040 }, { "epoch": 0.48, "learning_rate": 1.106986772740264e-05, "loss": 0.7444, "step": 4041 }, { "epoch": 0.48, "learning_rate": 1.1066027046049543e-05, "loss": 0.774, "step": 4042 }, { "epoch": 0.48, "learning_rate": 1.1062186205634453e-05, "loss": 0.769, "step": 4043 }, { "epoch": 0.48, "learning_rate": 1.1058345206730461e-05, "loss": 0.7768, "step": 4044 }, { "epoch": 0.48, "learning_rate": 1.1054504049910684e-05, "loss": 0.8209, "step": 4045 }, { "epoch": 0.48, "learning_rate": 1.1050662735748263e-05, "loss": 0.7327, "step": 4046 }, { "epoch": 0.48, "learning_rate": 1.1046821264816358e-05, "loss": 0.7662, "step": 4047 }, { "epoch": 0.48, "learning_rate": 1.104297963768816e-05, "loss": 0.8192, "step": 4048 }, { "epoch": 0.48, "learning_rate": 1.1039137854936875e-05, "loss": 0.7762, "step": 4049 }, { "epoch": 0.48, "learning_rate": 1.1035295917135734e-05, "loss": 0.7796, "step": 4050 }, { "epoch": 0.48, "learning_rate": 1.1031453824857993e-05, "loss": 0.8147, "step": 4051 }, { "epoch": 0.48, "learning_rate": 1.1027611578676936e-05, "loss": 0.7467, "step": 4052 }, { "epoch": 0.48, "learning_rate": 1.102376917916586e-05, "loss": 0.7852, "step": 4053 }, { "epoch": 0.48, "learning_rate": 1.1019926626898092e-05, "loss": 0.764, "step": 4054 }, { "epoch": 0.48, "learning_rate": 1.101608392244698e-05, "loss": 0.7461, "step": 4055 }, { "epoch": 0.48, "learning_rate": 1.1012241066385895e-05, "loss": 0.7896, "step": 4056 }, { "epoch": 0.48, "learning_rate": 1.1008398059288226e-05, "loss": 0.7472, "step": 4057 }, { "epoch": 0.48, "learning_rate": 1.1004554901727388e-05, "loss": 0.8164, "step": 4058 }, { "epoch": 0.48, "learning_rate": 1.1000711594276828e-05, "loss": 0.8186, "step": 4059 }, { "epoch": 0.48, "learning_rate": 1.0996868137509996e-05, "loss": 0.7215, "step": 4060 }, { "epoch": 0.48, "learning_rate": 1.0993024532000378e-05, "loss": 0.8108, "step": 4061 }, { "epoch": 0.48, "learning_rate": 1.0989180778321482e-05, "loss": 0.7545, "step": 4062 }, { "epoch": 0.48, "learning_rate": 1.0985336877046828e-05, "loss": 0.7271, "step": 4063 }, { "epoch": 0.48, "learning_rate": 1.0981492828749973e-05, "loss": 0.8069, "step": 4064 }, { "epoch": 0.48, "learning_rate": 1.097764863400448e-05, "loss": 0.8354, "step": 4065 }, { "epoch": 0.48, "learning_rate": 1.097380429338395e-05, "loss": 0.7969, "step": 4066 }, { "epoch": 0.49, "learning_rate": 1.096995980746199e-05, "loss": 0.7433, "step": 4067 }, { "epoch": 0.49, "learning_rate": 1.0966115176812237e-05, "loss": 0.7673, "step": 4068 }, { "epoch": 0.49, "learning_rate": 1.0962270402008352e-05, "loss": 0.7215, "step": 4069 }, { "epoch": 0.49, "learning_rate": 1.0958425483624012e-05, "loss": 0.7768, "step": 4070 }, { "epoch": 0.49, "learning_rate": 1.0954580422232921e-05, "loss": 0.7924, "step": 4071 }, { "epoch": 0.49, "learning_rate": 1.0950735218408795e-05, "loss": 0.7852, "step": 4072 }, { "epoch": 0.49, "learning_rate": 1.0946889872725381e-05, "loss": 0.7628, "step": 4073 }, { "epoch": 0.49, "learning_rate": 1.0943044385756445e-05, "loss": 0.8331, "step": 4074 }, { "epoch": 0.49, "learning_rate": 1.0939198758075768e-05, "loss": 0.7651, "step": 4075 }, { "epoch": 0.49, "learning_rate": 1.0935352990257161e-05, "loss": 0.7734, "step": 4076 }, { "epoch": 0.49, "learning_rate": 1.0931507082874448e-05, "loss": 0.7991, "step": 4077 }, { "epoch": 0.49, "learning_rate": 1.0927661036501477e-05, "loss": 0.7857, "step": 4078 }, { "epoch": 0.49, "learning_rate": 1.092381485171212e-05, "loss": 0.8136, "step": 4079 }, { "epoch": 0.49, "learning_rate": 1.0919968529080267e-05, "loss": 0.7712, "step": 4080 }, { "epoch": 0.49, "learning_rate": 1.0916122069179824e-05, "loss": 0.7818, "step": 4081 }, { "epoch": 0.49, "learning_rate": 1.0912275472584722e-05, "loss": 0.7478, "step": 4082 }, { "epoch": 0.49, "learning_rate": 1.0908428739868912e-05, "loss": 0.75, "step": 4083 }, { "epoch": 0.49, "learning_rate": 1.0904581871606373e-05, "loss": 0.7238, "step": 4084 }, { "epoch": 0.49, "learning_rate": 1.0900734868371086e-05, "loss": 0.7349, "step": 4085 }, { "epoch": 0.49, "learning_rate": 1.0896887730737069e-05, "loss": 0.7863, "step": 4086 }, { "epoch": 0.49, "learning_rate": 1.0893040459278352e-05, "loss": 0.8131, "step": 4087 }, { "epoch": 0.49, "learning_rate": 1.0889193054568988e-05, "loss": 0.7383, "step": 4088 }, { "epoch": 0.49, "learning_rate": 1.0885345517183046e-05, "loss": 0.76, "step": 4089 }, { "epoch": 0.49, "learning_rate": 1.0881497847694615e-05, "loss": 0.7935, "step": 4090 }, { "epoch": 0.49, "learning_rate": 1.0877650046677815e-05, "loss": 0.726, "step": 4091 }, { "epoch": 0.49, "learning_rate": 1.087380211470677e-05, "loss": 0.7701, "step": 4092 }, { "epoch": 0.49, "learning_rate": 1.0869954052355633e-05, "loss": 0.7673, "step": 4093 }, { "epoch": 0.49, "learning_rate": 1.0866105860198573e-05, "loss": 0.8331, "step": 4094 }, { "epoch": 0.49, "learning_rate": 1.0862257538809775e-05, "loss": 0.7902, "step": 4095 }, { "epoch": 0.49, "learning_rate": 1.0858409088763453e-05, "loss": 0.7455, "step": 4096 }, { "epoch": 0.49, "learning_rate": 1.0854560510633834e-05, "loss": 0.7533, "step": 4097 }, { "epoch": 0.49, "learning_rate": 1.0850711804995164e-05, "loss": 0.7723, "step": 4098 }, { "epoch": 0.49, "learning_rate": 1.0846862972421708e-05, "loss": 0.7835, "step": 4099 }, { "epoch": 0.49, "learning_rate": 1.0843014013487747e-05, "loss": 0.8125, "step": 4100 }, { "epoch": 0.49, "learning_rate": 1.083916492876759e-05, "loss": 0.7165, "step": 4101 }, { "epoch": 0.49, "learning_rate": 1.083531571883556e-05, "loss": 0.7439, "step": 4102 }, { "epoch": 0.49, "learning_rate": 1.0831466384265993e-05, "loss": 0.7388, "step": 4103 }, { "epoch": 0.49, "learning_rate": 1.0827616925633253e-05, "loss": 0.7919, "step": 4104 }, { "epoch": 0.49, "learning_rate": 1.0823767343511716e-05, "loss": 0.7472, "step": 4105 }, { "epoch": 0.49, "learning_rate": 1.0819917638475776e-05, "loss": 0.774, "step": 4106 }, { "epoch": 0.49, "learning_rate": 1.0816067811099856e-05, "loss": 0.7706, "step": 4107 }, { "epoch": 0.49, "learning_rate": 1.0812217861958377e-05, "loss": 0.7673, "step": 4108 }, { "epoch": 0.49, "learning_rate": 1.08083677916258e-05, "loss": 0.784, "step": 4109 }, { "epoch": 0.49, "learning_rate": 1.0804517600676592e-05, "loss": 0.7416, "step": 4110 }, { "epoch": 0.49, "learning_rate": 1.0800667289685239e-05, "loss": 0.8036, "step": 4111 }, { "epoch": 0.49, "learning_rate": 1.0796816859226248e-05, "loss": 0.7215, "step": 4112 }, { "epoch": 0.49, "learning_rate": 1.0792966309874137e-05, "loss": 0.7695, "step": 4113 }, { "epoch": 0.49, "learning_rate": 1.0789115642203454e-05, "loss": 0.793, "step": 4114 }, { "epoch": 0.49, "learning_rate": 1.078526485678875e-05, "loss": 0.7734, "step": 4115 }, { "epoch": 0.49, "learning_rate": 1.078141395420461e-05, "loss": 0.8136, "step": 4116 }, { "epoch": 0.49, "learning_rate": 1.0777562935025621e-05, "loss": 0.7349, "step": 4117 }, { "epoch": 0.49, "learning_rate": 1.0773711799826397e-05, "loss": 0.7829, "step": 4118 }, { "epoch": 0.49, "learning_rate": 1.0769860549181566e-05, "loss": 0.7528, "step": 4119 }, { "epoch": 0.49, "learning_rate": 1.0766009183665767e-05, "loss": 0.7182, "step": 4120 }, { "epoch": 0.49, "learning_rate": 1.076215770385367e-05, "loss": 0.8387, "step": 4121 }, { "epoch": 0.49, "learning_rate": 1.0758306110319956e-05, "loss": 0.7673, "step": 4122 }, { "epoch": 0.49, "learning_rate": 1.0754454403639313e-05, "loss": 0.7768, "step": 4123 }, { "epoch": 0.49, "learning_rate": 1.0750602584386464e-05, "loss": 0.7935, "step": 4124 }, { "epoch": 0.49, "learning_rate": 1.0746750653136135e-05, "loss": 0.7584, "step": 4125 }, { "epoch": 0.49, "learning_rate": 1.074289861046307e-05, "loss": 0.7785, "step": 4126 }, { "epoch": 0.49, "learning_rate": 1.073904645694204e-05, "loss": 0.74, "step": 4127 }, { "epoch": 0.49, "learning_rate": 1.0735194193147815e-05, "loss": 0.7974, "step": 4128 }, { "epoch": 0.49, "learning_rate": 1.0731341819655203e-05, "loss": 0.7494, "step": 4129 }, { "epoch": 0.49, "learning_rate": 1.072748933703901e-05, "loss": 0.832, "step": 4130 }, { "epoch": 0.49, "learning_rate": 1.0723636745874064e-05, "loss": 0.7405, "step": 4131 }, { "epoch": 0.49, "learning_rate": 1.0719784046735217e-05, "loss": 0.798, "step": 4132 }, { "epoch": 0.49, "learning_rate": 1.0715931240197324e-05, "loss": 0.7673, "step": 4133 }, { "epoch": 0.49, "learning_rate": 1.0712078326835267e-05, "loss": 0.7349, "step": 4134 }, { "epoch": 0.49, "learning_rate": 1.0708225307223936e-05, "loss": 0.7796, "step": 4135 }, { "epoch": 0.49, "learning_rate": 1.0704372181938246e-05, "loss": 0.8225, "step": 4136 }, { "epoch": 0.49, "learning_rate": 1.0700518951553118e-05, "loss": 0.7567, "step": 4137 }, { "epoch": 0.49, "learning_rate": 1.0696665616643492e-05, "loss": 0.7494, "step": 4138 }, { "epoch": 0.49, "learning_rate": 1.0692812177784326e-05, "loss": 0.7132, "step": 4139 }, { "epoch": 0.49, "learning_rate": 1.068895863555059e-05, "loss": 0.7634, "step": 4140 }, { "epoch": 0.49, "learning_rate": 1.0685104990517274e-05, "loss": 0.7807, "step": 4141 }, { "epoch": 0.49, "learning_rate": 1.0681251243259383e-05, "loss": 0.7584, "step": 4142 }, { "epoch": 0.49, "learning_rate": 1.0677397394351932e-05, "loss": 0.7606, "step": 4143 }, { "epoch": 0.49, "learning_rate": 1.0673543444369952e-05, "loss": 0.779, "step": 4144 }, { "epoch": 0.49, "learning_rate": 1.0669689393888491e-05, "loss": 0.7941, "step": 4145 }, { "epoch": 0.49, "learning_rate": 1.0665835243482617e-05, "loss": 0.8058, "step": 4146 }, { "epoch": 0.49, "learning_rate": 1.0661980993727408e-05, "loss": 0.8002, "step": 4147 }, { "epoch": 0.49, "learning_rate": 1.065812664519795e-05, "loss": 0.7746, "step": 4148 }, { "epoch": 0.49, "learning_rate": 1.065427219846936e-05, "loss": 0.7991, "step": 4149 }, { "epoch": 0.49, "learning_rate": 1.0650417654116754e-05, "loss": 0.7857, "step": 4150 }, { "epoch": 0.5, "learning_rate": 1.0646563012715267e-05, "loss": 0.7919, "step": 4151 }, { "epoch": 0.5, "learning_rate": 1.064270827484006e-05, "loss": 0.784, "step": 4152 }, { "epoch": 0.5, "learning_rate": 1.0638853441066289e-05, "loss": 0.8019, "step": 4153 }, { "epoch": 0.5, "learning_rate": 1.063499851196914e-05, "loss": 0.7634, "step": 4154 }, { "epoch": 0.5, "learning_rate": 1.0631143488123801e-05, "loss": 0.7344, "step": 4155 }, { "epoch": 0.5, "learning_rate": 1.062728837010549e-05, "loss": 0.7974, "step": 4156 }, { "epoch": 0.5, "learning_rate": 1.0623433158489422e-05, "loss": 0.7344, "step": 4157 }, { "epoch": 0.5, "learning_rate": 1.0619577853850835e-05, "loss": 0.7835, "step": 4158 }, { "epoch": 0.5, "learning_rate": 1.0615722456764981e-05, "loss": 0.7344, "step": 4159 }, { "epoch": 0.5, "learning_rate": 1.0611866967807121e-05, "loss": 0.774, "step": 4160 }, { "epoch": 0.5, "learning_rate": 1.0608011387552536e-05, "loss": 0.7807, "step": 4161 }, { "epoch": 0.5, "learning_rate": 1.060415571657652e-05, "loss": 0.7712, "step": 4162 }, { "epoch": 0.5, "learning_rate": 1.0600299955454372e-05, "loss": 0.7958, "step": 4163 }, { "epoch": 0.5, "learning_rate": 1.0596444104761412e-05, "loss": 0.7355, "step": 4164 }, { "epoch": 0.5, "learning_rate": 1.0592588165072972e-05, "loss": 0.7651, "step": 4165 }, { "epoch": 0.5, "learning_rate": 1.0588732136964399e-05, "loss": 0.8253, "step": 4166 }, { "epoch": 0.5, "learning_rate": 1.0584876021011052e-05, "loss": 0.7467, "step": 4167 }, { "epoch": 0.5, "learning_rate": 1.05810198177883e-05, "loss": 0.7941, "step": 4168 }, { "epoch": 0.5, "learning_rate": 1.0577163527871527e-05, "loss": 0.7573, "step": 4169 }, { "epoch": 0.5, "learning_rate": 1.0573307151836131e-05, "loss": 0.7829, "step": 4170 }, { "epoch": 0.5, "learning_rate": 1.0569450690257524e-05, "loss": 0.774, "step": 4171 }, { "epoch": 0.5, "learning_rate": 1.0565594143711128e-05, "loss": 0.7974, "step": 4172 }, { "epoch": 0.5, "learning_rate": 1.0561737512772376e-05, "loss": 0.827, "step": 4173 }, { "epoch": 0.5, "learning_rate": 1.0557880798016722e-05, "loss": 0.8265, "step": 4174 }, { "epoch": 0.5, "learning_rate": 1.0554024000019622e-05, "loss": 0.7539, "step": 4175 }, { "epoch": 0.5, "learning_rate": 1.0550167119356548e-05, "loss": 0.7963, "step": 4176 }, { "epoch": 0.5, "learning_rate": 1.0546310156602992e-05, "loss": 0.8092, "step": 4177 }, { "epoch": 0.5, "learning_rate": 1.0542453112334444e-05, "loss": 0.7773, "step": 4178 }, { "epoch": 0.5, "learning_rate": 1.0538595987126419e-05, "loss": 0.7623, "step": 4179 }, { "epoch": 0.5, "learning_rate": 1.0534738781554439e-05, "loss": 0.7723, "step": 4180 }, { "epoch": 0.5, "learning_rate": 1.0530881496194036e-05, "loss": 0.755, "step": 4181 }, { "epoch": 0.5, "learning_rate": 1.0527024131620758e-05, "loss": 0.7651, "step": 4182 }, { "epoch": 0.5, "learning_rate": 1.0523166688410158e-05, "loss": 0.6869, "step": 4183 }, { "epoch": 0.5, "learning_rate": 1.051930916713781e-05, "loss": 0.7718, "step": 4184 }, { "epoch": 0.5, "learning_rate": 1.0515451568379296e-05, "loss": 0.745, "step": 4185 }, { "epoch": 0.5, "learning_rate": 1.0511593892710204e-05, "loss": 0.7483, "step": 4186 }, { "epoch": 0.5, "learning_rate": 1.0507736140706145e-05, "loss": 0.7606, "step": 4187 }, { "epoch": 0.5, "learning_rate": 1.0503878312942725e-05, "loss": 0.7751, "step": 4188 }, { "epoch": 0.5, "learning_rate": 1.0500020409995577e-05, "loss": 0.8158, "step": 4189 }, { "epoch": 0.5, "learning_rate": 1.049616243244034e-05, "loss": 0.8365, "step": 4190 }, { "epoch": 0.5, "learning_rate": 1.0492304380852661e-05, "loss": 0.7422, "step": 4191 }, { "epoch": 0.5, "learning_rate": 1.04884462558082e-05, "loss": 0.74, "step": 4192 }, { "epoch": 0.5, "learning_rate": 1.048458805788263e-05, "loss": 0.7718, "step": 4193 }, { "epoch": 0.5, "learning_rate": 1.0480729787651628e-05, "loss": 0.7422, "step": 4194 }, { "epoch": 0.5, "learning_rate": 1.0476871445690895e-05, "loss": 0.7606, "step": 4195 }, { "epoch": 0.5, "learning_rate": 1.0473013032576127e-05, "loss": 0.76, "step": 4196 }, { "epoch": 0.5, "learning_rate": 1.0469154548883042e-05, "loss": 0.7294, "step": 4197 }, { "epoch": 0.5, "learning_rate": 1.0465295995187364e-05, "loss": 0.8097, "step": 4198 }, { "epoch": 0.5, "learning_rate": 1.0461437372064832e-05, "loss": 0.7439, "step": 4199 }, { "epoch": 0.5, "learning_rate": 1.0457578680091182e-05, "loss": 0.7634, "step": 4200 }, { "epoch": 0.5, "learning_rate": 1.0453719919842178e-05, "loss": 0.7706, "step": 4201 }, { "epoch": 0.5, "learning_rate": 1.0449861091893584e-05, "loss": 0.8025, "step": 4202 }, { "epoch": 0.5, "learning_rate": 1.0446002196821175e-05, "loss": 0.716, "step": 4203 }, { "epoch": 0.5, "learning_rate": 1.0442143235200736e-05, "loss": 0.7946, "step": 4204 }, { "epoch": 0.5, "learning_rate": 1.0438284207608068e-05, "loss": 0.8008, "step": 4205 }, { "epoch": 0.5, "learning_rate": 1.0434425114618972e-05, "loss": 0.7137, "step": 4206 }, { "epoch": 0.5, "learning_rate": 1.0430565956809265e-05, "loss": 0.7913, "step": 4207 }, { "epoch": 0.5, "learning_rate": 1.042670673475477e-05, "loss": 0.7623, "step": 4208 }, { "epoch": 0.5, "learning_rate": 1.0422847449031325e-05, "loss": 0.7171, "step": 4209 }, { "epoch": 0.5, "learning_rate": 1.0418988100214777e-05, "loss": 0.7768, "step": 4210 }, { "epoch": 0.5, "learning_rate": 1.0415128688880974e-05, "loss": 0.7305, "step": 4211 }, { "epoch": 0.5, "learning_rate": 1.0411269215605782e-05, "loss": 0.7081, "step": 4212 }, { "epoch": 0.5, "learning_rate": 1.0407409680965075e-05, "loss": 0.7997, "step": 4213 }, { "epoch": 0.5, "learning_rate": 1.0403550085534728e-05, "loss": 0.7372, "step": 4214 }, { "epoch": 0.5, "learning_rate": 1.039969042989064e-05, "loss": 0.8214, "step": 4215 }, { "epoch": 0.5, "learning_rate": 1.0395830714608704e-05, "loss": 0.7829, "step": 4216 }, { "epoch": 0.5, "learning_rate": 1.039197094026483e-05, "loss": 0.731, "step": 4217 }, { "epoch": 0.5, "learning_rate": 1.0388111107434942e-05, "loss": 0.7277, "step": 4218 }, { "epoch": 0.5, "learning_rate": 1.0384251216694954e-05, "loss": 0.8186, "step": 4219 }, { "epoch": 0.5, "learning_rate": 1.038039126862081e-05, "loss": 0.7919, "step": 4220 }, { "epoch": 0.5, "learning_rate": 1.037653126378845e-05, "loss": 0.7422, "step": 4221 }, { "epoch": 0.5, "learning_rate": 1.0372671202773825e-05, "loss": 0.7472, "step": 4222 }, { "epoch": 0.5, "learning_rate": 1.0368811086152895e-05, "loss": 0.779, "step": 4223 }, { "epoch": 0.5, "learning_rate": 1.0364950914501632e-05, "loss": 0.7969, "step": 4224 }, { "epoch": 0.5, "learning_rate": 1.036109068839601e-05, "loss": 0.721, "step": 4225 }, { "epoch": 0.5, "learning_rate": 1.035723040841201e-05, "loss": 0.7584, "step": 4226 }, { "epoch": 0.5, "learning_rate": 1.035337007512563e-05, "loss": 0.7796, "step": 4227 }, { "epoch": 0.5, "learning_rate": 1.034950968911287e-05, "loss": 0.7706, "step": 4228 }, { "epoch": 0.5, "learning_rate": 1.0345649250949733e-05, "loss": 0.7958, "step": 4229 }, { "epoch": 0.5, "learning_rate": 1.0341788761212245e-05, "loss": 0.8192, "step": 4230 }, { "epoch": 0.5, "learning_rate": 1.0337928220476425e-05, "loss": 0.7427, "step": 4231 }, { "epoch": 0.5, "learning_rate": 1.0334067629318303e-05, "loss": 0.7472, "step": 4232 }, { "epoch": 0.5, "learning_rate": 1.0330206988313917e-05, "loss": 0.8203, "step": 4233 }, { "epoch": 0.5, "learning_rate": 1.0326346298039317e-05, "loss": 0.7768, "step": 4234 }, { "epoch": 0.51, "learning_rate": 1.032248555907056e-05, "loss": 0.76, "step": 4235 }, { "epoch": 0.51, "learning_rate": 1.03186247719837e-05, "loss": 0.755, "step": 4236 }, { "epoch": 0.51, "learning_rate": 1.031476393735481e-05, "loss": 0.769, "step": 4237 }, { "epoch": 0.51, "learning_rate": 1.0310903055759963e-05, "loss": 0.7729, "step": 4238 }, { "epoch": 0.51, "learning_rate": 1.0307042127775245e-05, "loss": 0.7913, "step": 4239 }, { "epoch": 0.51, "learning_rate": 1.0303181153976742e-05, "loss": 0.8002, "step": 4240 }, { "epoch": 0.51, "learning_rate": 1.029932013494055e-05, "loss": 0.7796, "step": 4241 }, { "epoch": 0.51, "learning_rate": 1.0295459071242777e-05, "loss": 0.7712, "step": 4242 }, { "epoch": 0.51, "learning_rate": 1.0291597963459525e-05, "loss": 0.7617, "step": 4243 }, { "epoch": 0.51, "learning_rate": 1.0287736812166918e-05, "loss": 0.7455, "step": 4244 }, { "epoch": 0.51, "learning_rate": 1.0283875617941072e-05, "loss": 0.774, "step": 4245 }, { "epoch": 0.51, "learning_rate": 1.028001438135812e-05, "loss": 0.7723, "step": 4246 }, { "epoch": 0.51, "learning_rate": 1.0276153102994197e-05, "loss": 0.8136, "step": 4247 }, { "epoch": 0.51, "learning_rate": 1.0272291783425444e-05, "loss": 0.7785, "step": 4248 }, { "epoch": 0.51, "learning_rate": 1.026843042322801e-05, "loss": 0.7824, "step": 4249 }, { "epoch": 0.51, "learning_rate": 1.026456902297805e-05, "loss": 0.7958, "step": 4250 }, { "epoch": 0.51, "learning_rate": 1.026070758325172e-05, "loss": 0.7667, "step": 4251 }, { "epoch": 0.51, "learning_rate": 1.0256846104625187e-05, "loss": 0.7729, "step": 4252 }, { "epoch": 0.51, "learning_rate": 1.0252984587674621e-05, "loss": 0.7729, "step": 4253 }, { "epoch": 0.51, "learning_rate": 1.0249123032976205e-05, "loss": 0.7065, "step": 4254 }, { "epoch": 0.51, "learning_rate": 1.0245261441106117e-05, "loss": 0.7907, "step": 4255 }, { "epoch": 0.51, "learning_rate": 1.0241399812640549e-05, "loss": 0.7734, "step": 4256 }, { "epoch": 0.51, "learning_rate": 1.0237538148155695e-05, "loss": 0.8136, "step": 4257 }, { "epoch": 0.51, "learning_rate": 1.0233676448227748e-05, "loss": 0.8164, "step": 4258 }, { "epoch": 0.51, "learning_rate": 1.0229814713432915e-05, "loss": 0.7573, "step": 4259 }, { "epoch": 0.51, "learning_rate": 1.0225952944347413e-05, "loss": 0.7394, "step": 4260 }, { "epoch": 0.51, "learning_rate": 1.0222091141547447e-05, "loss": 0.8131, "step": 4261 }, { "epoch": 0.51, "learning_rate": 1.0218229305609246e-05, "loss": 0.7807, "step": 4262 }, { "epoch": 0.51, "learning_rate": 1.021436743710903e-05, "loss": 0.7785, "step": 4263 }, { "epoch": 0.51, "learning_rate": 1.0210505536623026e-05, "loss": 0.7483, "step": 4264 }, { "epoch": 0.51, "learning_rate": 1.0206643604727473e-05, "loss": 0.7773, "step": 4265 }, { "epoch": 0.51, "learning_rate": 1.0202781641998608e-05, "loss": 0.7779, "step": 4266 }, { "epoch": 0.51, "learning_rate": 1.019891964901268e-05, "loss": 0.7924, "step": 4267 }, { "epoch": 0.51, "learning_rate": 1.0195057626345929e-05, "loss": 0.7807, "step": 4268 }, { "epoch": 0.51, "learning_rate": 1.0191195574574613e-05, "loss": 0.7143, "step": 4269 }, { "epoch": 0.51, "learning_rate": 1.0187333494274989e-05, "loss": 0.7796, "step": 4270 }, { "epoch": 0.51, "learning_rate": 1.0183471386023313e-05, "loss": 0.7974, "step": 4271 }, { "epoch": 0.51, "learning_rate": 1.017960925039586e-05, "loss": 0.7439, "step": 4272 }, { "epoch": 0.51, "learning_rate": 1.017574708796889e-05, "loss": 0.7768, "step": 4273 }, { "epoch": 0.51, "learning_rate": 1.0171884899318683e-05, "loss": 0.7232, "step": 4274 }, { "epoch": 0.51, "learning_rate": 1.0168022685021516e-05, "loss": 0.7511, "step": 4275 }, { "epoch": 0.51, "learning_rate": 1.0164160445653668e-05, "loss": 0.7706, "step": 4276 }, { "epoch": 0.51, "learning_rate": 1.0160298181791424e-05, "loss": 0.7846, "step": 4277 }, { "epoch": 0.51, "learning_rate": 1.0156435894011074e-05, "loss": 0.8075, "step": 4278 }, { "epoch": 0.51, "learning_rate": 1.0152573582888909e-05, "loss": 0.7143, "step": 4279 }, { "epoch": 0.51, "learning_rate": 1.0148711249001229e-05, "loss": 0.6953, "step": 4280 }, { "epoch": 0.51, "learning_rate": 1.0144848892924328e-05, "loss": 0.7561, "step": 4281 }, { "epoch": 0.51, "learning_rate": 1.014098651523451e-05, "loss": 0.7779, "step": 4282 }, { "epoch": 0.51, "learning_rate": 1.0137124116508083e-05, "loss": 0.7372, "step": 4283 }, { "epoch": 0.51, "learning_rate": 1.0133261697321353e-05, "loss": 0.808, "step": 4284 }, { "epoch": 0.51, "learning_rate": 1.0129399258250632e-05, "loss": 0.7221, "step": 4285 }, { "epoch": 0.51, "learning_rate": 1.0125536799872235e-05, "loss": 0.7913, "step": 4286 }, { "epoch": 0.51, "learning_rate": 1.0121674322762484e-05, "loss": 0.8131, "step": 4287 }, { "epoch": 0.51, "learning_rate": 1.0117811827497696e-05, "loss": 0.7288, "step": 4288 }, { "epoch": 0.51, "learning_rate": 1.0113949314654192e-05, "loss": 0.7807, "step": 4289 }, { "epoch": 0.51, "learning_rate": 1.0110086784808301e-05, "loss": 0.7907, "step": 4290 }, { "epoch": 0.51, "learning_rate": 1.0106224238536352e-05, "loss": 0.7567, "step": 4291 }, { "epoch": 0.51, "learning_rate": 1.0102361676414674e-05, "loss": 0.7846, "step": 4292 }, { "epoch": 0.51, "learning_rate": 1.00984990990196e-05, "loss": 0.7974, "step": 4293 }, { "epoch": 0.51, "learning_rate": 1.0094636506927469e-05, "loss": 0.7227, "step": 4294 }, { "epoch": 0.51, "learning_rate": 1.0090773900714617e-05, "loss": 0.6752, "step": 4295 }, { "epoch": 0.51, "learning_rate": 1.008691128095738e-05, "loss": 0.7405, "step": 4296 }, { "epoch": 0.51, "learning_rate": 1.0083048648232102e-05, "loss": 0.808, "step": 4297 }, { "epoch": 0.51, "learning_rate": 1.007918600311513e-05, "loss": 0.769, "step": 4298 }, { "epoch": 0.51, "learning_rate": 1.0075323346182804e-05, "loss": 0.8136, "step": 4299 }, { "epoch": 0.51, "learning_rate": 1.0071460678011477e-05, "loss": 0.726, "step": 4300 }, { "epoch": 0.51, "learning_rate": 1.0067597999177498e-05, "loss": 0.8298, "step": 4301 }, { "epoch": 0.51, "learning_rate": 1.0063735310257212e-05, "loss": 0.7333, "step": 4302 }, { "epoch": 0.51, "learning_rate": 1.0059872611826977e-05, "loss": 0.7729, "step": 4303 }, { "epoch": 0.51, "learning_rate": 1.0056009904463143e-05, "loss": 0.719, "step": 4304 }, { "epoch": 0.51, "learning_rate": 1.0052147188742065e-05, "loss": 0.76, "step": 4305 }, { "epoch": 0.51, "learning_rate": 1.0048284465240102e-05, "loss": 0.7723, "step": 4306 }, { "epoch": 0.51, "learning_rate": 1.0044421734533606e-05, "loss": 0.8465, "step": 4307 }, { "epoch": 0.51, "learning_rate": 1.0040558997198943e-05, "loss": 0.7316, "step": 4308 }, { "epoch": 0.51, "learning_rate": 1.0036696253812468e-05, "loss": 0.7773, "step": 4309 }, { "epoch": 0.51, "learning_rate": 1.0032833504950542e-05, "loss": 0.7667, "step": 4310 }, { "epoch": 0.51, "learning_rate": 1.0028970751189522e-05, "loss": 0.7974, "step": 4311 }, { "epoch": 0.51, "learning_rate": 1.0025107993105775e-05, "loss": 0.7327, "step": 4312 }, { "epoch": 0.51, "learning_rate": 1.0021245231275664e-05, "loss": 0.8158, "step": 4313 }, { "epoch": 0.51, "learning_rate": 1.001738246627555e-05, "loss": 0.7483, "step": 4314 }, { "epoch": 0.51, "learning_rate": 1.0013519698681795e-05, "loss": 0.7701, "step": 4315 }, { "epoch": 0.51, "learning_rate": 1.0009656929070766e-05, "loss": 0.736, "step": 4316 }, { "epoch": 0.51, "learning_rate": 1.0005794158018823e-05, "loss": 0.6934, "step": 4317 }, { "epoch": 0.51, "learning_rate": 1.0001931386102337e-05, "loss": 0.8114, "step": 4318 }, { "epoch": 0.52, "learning_rate": 9.998068613897666e-06, "loss": 0.7673, "step": 4319 }, { "epoch": 0.52, "learning_rate": 9.994205841981179e-06, "loss": 0.7394, "step": 4320 }, { "epoch": 0.52, "learning_rate": 9.990343070929235e-06, "loss": 0.7924, "step": 4321 }, { "epoch": 0.52, "learning_rate": 9.986480301318209e-06, "loss": 0.7154, "step": 4322 }, { "epoch": 0.52, "learning_rate": 9.982617533724454e-06, "loss": 0.7305, "step": 4323 }, { "epoch": 0.52, "learning_rate": 9.978754768724337e-06, "loss": 0.7422, "step": 4324 }, { "epoch": 0.52, "learning_rate": 9.974892006894226e-06, "loss": 0.7584, "step": 4325 }, { "epoch": 0.52, "learning_rate": 9.97102924881048e-06, "loss": 0.7227, "step": 4326 }, { "epoch": 0.52, "learning_rate": 9.967166495049463e-06, "loss": 0.7628, "step": 4327 }, { "epoch": 0.52, "learning_rate": 9.963303746187535e-06, "loss": 0.7969, "step": 4328 }, { "epoch": 0.52, "learning_rate": 9.959441002801059e-06, "loss": 0.7573, "step": 4329 }, { "epoch": 0.52, "learning_rate": 9.955578265466394e-06, "loss": 0.7852, "step": 4330 }, { "epoch": 0.52, "learning_rate": 9.9517155347599e-06, "loss": 0.7684, "step": 4331 }, { "epoch": 0.52, "learning_rate": 9.94785281125794e-06, "loss": 0.7913, "step": 4332 }, { "epoch": 0.52, "learning_rate": 9.943990095536862e-06, "loss": 0.7165, "step": 4333 }, { "epoch": 0.52, "learning_rate": 9.940127388173027e-06, "loss": 0.8013, "step": 4334 }, { "epoch": 0.52, "learning_rate": 9.93626468974279e-06, "loss": 0.7667, "step": 4335 }, { "epoch": 0.52, "learning_rate": 9.932402000822503e-06, "loss": 0.7896, "step": 4336 }, { "epoch": 0.52, "learning_rate": 9.928539321988524e-06, "loss": 0.7612, "step": 4337 }, { "epoch": 0.52, "learning_rate": 9.9246766538172e-06, "loss": 0.8086, "step": 4338 }, { "epoch": 0.52, "learning_rate": 9.920813996884874e-06, "loss": 0.8131, "step": 4339 }, { "epoch": 0.52, "learning_rate": 9.9169513517679e-06, "loss": 0.7969, "step": 4340 }, { "epoch": 0.52, "learning_rate": 9.913088719042622e-06, "loss": 0.7667, "step": 4341 }, { "epoch": 0.52, "learning_rate": 9.90922609928539e-06, "loss": 0.7868, "step": 4342 }, { "epoch": 0.52, "learning_rate": 9.905363493072534e-06, "loss": 0.7958, "step": 4343 }, { "epoch": 0.52, "learning_rate": 9.901500900980401e-06, "loss": 0.779, "step": 4344 }, { "epoch": 0.52, "learning_rate": 9.897638323585328e-06, "loss": 0.7701, "step": 4345 }, { "epoch": 0.52, "learning_rate": 9.89377576146365e-06, "loss": 0.8237, "step": 4346 }, { "epoch": 0.52, "learning_rate": 9.889913215191702e-06, "loss": 0.7885, "step": 4347 }, { "epoch": 0.52, "learning_rate": 9.886050685345811e-06, "loss": 0.7349, "step": 4348 }, { "epoch": 0.52, "learning_rate": 9.882188172502306e-06, "loss": 0.7852, "step": 4349 }, { "epoch": 0.52, "learning_rate": 9.878325677237519e-06, "loss": 0.8052, "step": 4350 }, { "epoch": 0.52, "learning_rate": 9.874463200127763e-06, "loss": 0.8181, "step": 4351 }, { "epoch": 0.52, "learning_rate": 9.870600741749373e-06, "loss": 0.6842, "step": 4352 }, { "epoch": 0.52, "learning_rate": 9.86673830267865e-06, "loss": 0.8382, "step": 4353 }, { "epoch": 0.52, "learning_rate": 9.86287588349192e-06, "loss": 0.8214, "step": 4354 }, { "epoch": 0.52, "learning_rate": 9.859013484765491e-06, "loss": 0.8114, "step": 4355 }, { "epoch": 0.52, "learning_rate": 9.855151107075674e-06, "loss": 0.7768, "step": 4356 }, { "epoch": 0.52, "learning_rate": 9.851288750998775e-06, "loss": 0.7985, "step": 4357 }, { "epoch": 0.52, "learning_rate": 9.847426417111093e-06, "loss": 0.7807, "step": 4358 }, { "epoch": 0.52, "learning_rate": 9.843564105988928e-06, "loss": 0.817, "step": 4359 }, { "epoch": 0.52, "learning_rate": 9.839701818208576e-06, "loss": 0.7561, "step": 4360 }, { "epoch": 0.52, "learning_rate": 9.835839554346333e-06, "loss": 0.7383, "step": 4361 }, { "epoch": 0.52, "learning_rate": 9.831977314978487e-06, "loss": 0.8058, "step": 4362 }, { "epoch": 0.52, "learning_rate": 9.82811510068132e-06, "loss": 0.7653, "step": 4363 }, { "epoch": 0.52, "learning_rate": 9.824252912031112e-06, "loss": 0.7667, "step": 4364 }, { "epoch": 0.52, "learning_rate": 9.820390749604142e-06, "loss": 0.798, "step": 4365 }, { "epoch": 0.52, "learning_rate": 9.816528613976687e-06, "loss": 0.7695, "step": 4366 }, { "epoch": 0.52, "learning_rate": 9.812666505725016e-06, "loss": 0.6981, "step": 4367 }, { "epoch": 0.52, "learning_rate": 9.80880442542539e-06, "loss": 0.7695, "step": 4368 }, { "epoch": 0.52, "learning_rate": 9.804942373654075e-06, "loss": 0.697, "step": 4369 }, { "epoch": 0.52, "learning_rate": 9.801080350987325e-06, "loss": 0.8359, "step": 4370 }, { "epoch": 0.52, "learning_rate": 9.797218358001392e-06, "loss": 0.7422, "step": 4371 }, { "epoch": 0.52, "learning_rate": 9.79335639527253e-06, "loss": 0.7556, "step": 4372 }, { "epoch": 0.52, "learning_rate": 9.789494463376977e-06, "loss": 0.784, "step": 4373 }, { "epoch": 0.52, "learning_rate": 9.785632562890974e-06, "loss": 0.7539, "step": 4374 }, { "epoch": 0.52, "learning_rate": 9.781770694390757e-06, "loss": 0.7835, "step": 4375 }, { "epoch": 0.52, "learning_rate": 9.777908858452553e-06, "loss": 0.779, "step": 4376 }, { "epoch": 0.52, "learning_rate": 9.774047055652592e-06, "loss": 0.8142, "step": 4377 }, { "epoch": 0.52, "learning_rate": 9.770185286567086e-06, "loss": 0.7718, "step": 4378 }, { "epoch": 0.52, "learning_rate": 9.766323551772257e-06, "loss": 0.8086, "step": 4379 }, { "epoch": 0.52, "learning_rate": 9.76246185184431e-06, "loss": 0.7779, "step": 4380 }, { "epoch": 0.52, "learning_rate": 9.758600187359453e-06, "loss": 0.8287, "step": 4381 }, { "epoch": 0.52, "learning_rate": 9.754738558893884e-06, "loss": 0.7243, "step": 4382 }, { "epoch": 0.52, "learning_rate": 9.750876967023798e-06, "loss": 0.8025, "step": 4383 }, { "epoch": 0.52, "learning_rate": 9.74701541232538e-06, "loss": 0.7991, "step": 4384 }, { "epoch": 0.52, "learning_rate": 9.743153895374817e-06, "loss": 0.7963, "step": 4385 }, { "epoch": 0.52, "learning_rate": 9.739292416748282e-06, "loss": 0.7478, "step": 4386 }, { "epoch": 0.52, "learning_rate": 9.735430977021956e-06, "loss": 0.7517, "step": 4387 }, { "epoch": 0.52, "learning_rate": 9.731569576771992e-06, "loss": 0.7288, "step": 4388 }, { "epoch": 0.52, "learning_rate": 9.727708216574558e-06, "loss": 0.8002, "step": 4389 }, { "epoch": 0.52, "learning_rate": 9.723846897005805e-06, "loss": 0.7941, "step": 4390 }, { "epoch": 0.52, "learning_rate": 9.719985618641881e-06, "loss": 0.7171, "step": 4391 }, { "epoch": 0.52, "learning_rate": 9.716124382058933e-06, "loss": 0.774, "step": 4392 }, { "epoch": 0.52, "learning_rate": 9.712263187833087e-06, "loss": 0.7394, "step": 4393 }, { "epoch": 0.52, "learning_rate": 9.708402036540478e-06, "loss": 0.8292, "step": 4394 }, { "epoch": 0.52, "learning_rate": 9.704540928757227e-06, "loss": 0.7985, "step": 4395 }, { "epoch": 0.52, "learning_rate": 9.700679865059451e-06, "loss": 0.7963, "step": 4396 }, { "epoch": 0.52, "learning_rate": 9.696818846023263e-06, "loss": 0.7243, "step": 4397 }, { "epoch": 0.52, "learning_rate": 9.692957872224758e-06, "loss": 0.755, "step": 4398 }, { "epoch": 0.52, "learning_rate": 9.689096944240038e-06, "loss": 0.7958, "step": 4399 }, { "epoch": 0.52, "learning_rate": 9.685236062645193e-06, "loss": 0.7846, "step": 4400 }, { "epoch": 0.52, "learning_rate": 9.6813752280163e-06, "loss": 0.7801, "step": 4401 }, { "epoch": 0.52, "learning_rate": 9.677514440929445e-06, "loss": 0.7411, "step": 4402 }, { "epoch": 0.53, "learning_rate": 9.673653701960684e-06, "loss": 0.7556, "step": 4403 }, { "epoch": 0.53, "learning_rate": 9.669793011686084e-06, "loss": 0.731, "step": 4404 }, { "epoch": 0.53, "learning_rate": 9.6659323706817e-06, "loss": 0.7785, "step": 4405 }, { "epoch": 0.53, "learning_rate": 9.662071779523579e-06, "loss": 0.7679, "step": 4406 }, { "epoch": 0.53, "learning_rate": 9.658211238787758e-06, "loss": 0.7589, "step": 4407 }, { "epoch": 0.53, "learning_rate": 9.654350749050268e-06, "loss": 0.8326, "step": 4408 }, { "epoch": 0.53, "learning_rate": 9.650490310887134e-06, "loss": 0.6903, "step": 4409 }, { "epoch": 0.53, "learning_rate": 9.646629924874372e-06, "loss": 0.7054, "step": 4410 }, { "epoch": 0.53, "learning_rate": 9.64276959158799e-06, "loss": 0.8203, "step": 4411 }, { "epoch": 0.53, "learning_rate": 9.638909311603995e-06, "loss": 0.7919, "step": 4412 }, { "epoch": 0.53, "learning_rate": 9.635049085498371e-06, "loss": 0.7785, "step": 4413 }, { "epoch": 0.53, "learning_rate": 9.631188913847108e-06, "loss": 0.7779, "step": 4414 }, { "epoch": 0.53, "learning_rate": 9.627328797226177e-06, "loss": 0.7985, "step": 4415 }, { "epoch": 0.53, "learning_rate": 9.623468736211552e-06, "loss": 0.7098, "step": 4416 }, { "epoch": 0.53, "learning_rate": 9.619608731379196e-06, "loss": 0.7623, "step": 4417 }, { "epoch": 0.53, "learning_rate": 9.61574878330505e-06, "loss": 0.817, "step": 4418 }, { "epoch": 0.53, "learning_rate": 9.611888892565062e-06, "loss": 0.7857, "step": 4419 }, { "epoch": 0.53, "learning_rate": 9.608029059735172e-06, "loss": 0.774, "step": 4420 }, { "epoch": 0.53, "learning_rate": 9.604169285391298e-06, "loss": 0.7483, "step": 4421 }, { "epoch": 0.53, "learning_rate": 9.600309570109366e-06, "loss": 0.7969, "step": 4422 }, { "epoch": 0.53, "learning_rate": 9.596449914465275e-06, "loss": 0.7952, "step": 4423 }, { "epoch": 0.53, "learning_rate": 9.592590319034929e-06, "loss": 0.7394, "step": 4424 }, { "epoch": 0.53, "learning_rate": 9.588730784394221e-06, "loss": 0.7623, "step": 4425 }, { "epoch": 0.53, "learning_rate": 9.584871311119028e-06, "loss": 0.784, "step": 4426 }, { "epoch": 0.53, "learning_rate": 9.581011899785228e-06, "loss": 0.7366, "step": 4427 }, { "epoch": 0.53, "learning_rate": 9.577152550968677e-06, "loss": 0.7098, "step": 4428 }, { "epoch": 0.53, "learning_rate": 9.573293265245231e-06, "loss": 0.7383, "step": 4429 }, { "epoch": 0.53, "learning_rate": 9.569434043190737e-06, "loss": 0.7779, "step": 4430 }, { "epoch": 0.53, "learning_rate": 9.565574885381032e-06, "loss": 0.7729, "step": 4431 }, { "epoch": 0.53, "learning_rate": 9.561715792391936e-06, "loss": 0.7494, "step": 4432 }, { "epoch": 0.53, "learning_rate": 9.557856764799267e-06, "loss": 0.7868, "step": 4433 }, { "epoch": 0.53, "learning_rate": 9.553997803178828e-06, "loss": 0.7919, "step": 4434 }, { "epoch": 0.53, "learning_rate": 9.550138908106417e-06, "loss": 0.7729, "step": 4435 }, { "epoch": 0.53, "learning_rate": 9.546280080157822e-06, "loss": 0.7902, "step": 4436 }, { "epoch": 0.53, "learning_rate": 9.542421319908821e-06, "loss": 0.7718, "step": 4437 }, { "epoch": 0.53, "learning_rate": 9.538562627935173e-06, "loss": 0.74, "step": 4438 }, { "epoch": 0.53, "learning_rate": 9.534704004812638e-06, "loss": 0.7762, "step": 4439 }, { "epoch": 0.53, "learning_rate": 9.530845451116961e-06, "loss": 0.7673, "step": 4440 }, { "epoch": 0.53, "learning_rate": 9.526986967423875e-06, "loss": 0.7277, "step": 4441 }, { "epoch": 0.53, "learning_rate": 9.52312855430911e-06, "loss": 0.7857, "step": 4442 }, { "epoch": 0.53, "learning_rate": 9.519270212348375e-06, "loss": 0.7199, "step": 4443 }, { "epoch": 0.53, "learning_rate": 9.515411942117373e-06, "loss": 0.7701, "step": 4444 }, { "epoch": 0.53, "learning_rate": 9.511553744191804e-06, "loss": 0.7835, "step": 4445 }, { "epoch": 0.53, "learning_rate": 9.50769561914734e-06, "loss": 0.7773, "step": 4446 }, { "epoch": 0.53, "learning_rate": 9.503837567559664e-06, "loss": 0.7706, "step": 4447 }, { "epoch": 0.53, "learning_rate": 9.499979590004426e-06, "loss": 0.7093, "step": 4448 }, { "epoch": 0.53, "learning_rate": 9.496121687057276e-06, "loss": 0.7455, "step": 4449 }, { "epoch": 0.53, "learning_rate": 9.492263859293857e-06, "loss": 0.7902, "step": 4450 }, { "epoch": 0.53, "learning_rate": 9.488406107289798e-06, "loss": 0.7511, "step": 4451 }, { "epoch": 0.53, "learning_rate": 9.484548431620709e-06, "loss": 0.7695, "step": 4452 }, { "epoch": 0.53, "learning_rate": 9.480690832862193e-06, "loss": 0.7773, "step": 4453 }, { "epoch": 0.53, "learning_rate": 9.476833311589844e-06, "loss": 0.8013, "step": 4454 }, { "epoch": 0.53, "learning_rate": 9.472975868379245e-06, "loss": 0.7734, "step": 4455 }, { "epoch": 0.53, "learning_rate": 9.469118503805966e-06, "loss": 0.7974, "step": 4456 }, { "epoch": 0.53, "learning_rate": 9.465261218445564e-06, "loss": 0.8304, "step": 4457 }, { "epoch": 0.53, "learning_rate": 9.461404012873584e-06, "loss": 0.7785, "step": 4458 }, { "epoch": 0.53, "learning_rate": 9.457546887665558e-06, "loss": 0.8426, "step": 4459 }, { "epoch": 0.53, "learning_rate": 9.453689843397011e-06, "loss": 0.7857, "step": 4460 }, { "epoch": 0.53, "learning_rate": 9.449832880643453e-06, "loss": 0.6998, "step": 4461 }, { "epoch": 0.53, "learning_rate": 9.445975999980383e-06, "loss": 0.7009, "step": 4462 }, { "epoch": 0.53, "learning_rate": 9.442119201983283e-06, "loss": 0.7494, "step": 4463 }, { "epoch": 0.53, "learning_rate": 9.438262487227626e-06, "loss": 0.7679, "step": 4464 }, { "epoch": 0.53, "learning_rate": 9.434405856288875e-06, "loss": 0.7946, "step": 4465 }, { "epoch": 0.53, "learning_rate": 9.430549309742478e-06, "loss": 0.7779, "step": 4466 }, { "epoch": 0.53, "learning_rate": 9.426692848163872e-06, "loss": 0.7712, "step": 4467 }, { "epoch": 0.53, "learning_rate": 9.422836472128476e-06, "loss": 0.7723, "step": 4468 }, { "epoch": 0.53, "learning_rate": 9.418980182211703e-06, "loss": 0.7913, "step": 4469 }, { "epoch": 0.53, "learning_rate": 9.415123978988951e-06, "loss": 0.7857, "step": 4470 }, { "epoch": 0.53, "learning_rate": 9.4112678630356e-06, "loss": 0.7857, "step": 4471 }, { "epoch": 0.53, "learning_rate": 9.407411834927033e-06, "loss": 0.7483, "step": 4472 }, { "epoch": 0.53, "learning_rate": 9.403555895238593e-06, "loss": 0.7695, "step": 4473 }, { "epoch": 0.53, "learning_rate": 9.399700044545633e-06, "loss": 0.7461, "step": 4474 }, { "epoch": 0.53, "learning_rate": 9.395844283423483e-06, "loss": 0.8052, "step": 4475 }, { "epoch": 0.53, "learning_rate": 9.391988612447465e-06, "loss": 0.7238, "step": 4476 }, { "epoch": 0.53, "learning_rate": 9.38813303219288e-06, "loss": 0.7154, "step": 4477 }, { "epoch": 0.53, "learning_rate": 9.384277543235024e-06, "loss": 0.7913, "step": 4478 }, { "epoch": 0.53, "learning_rate": 9.380422146149168e-06, "loss": 0.7227, "step": 4479 }, { "epoch": 0.53, "learning_rate": 9.37656684151058e-06, "loss": 0.7344, "step": 4480 }, { "epoch": 0.53, "learning_rate": 9.37271162989451e-06, "loss": 0.8119, "step": 4481 }, { "epoch": 0.53, "learning_rate": 9.3688565118762e-06, "loss": 0.7528, "step": 4482 }, { "epoch": 0.53, "learning_rate": 9.365001488030865e-06, "loss": 0.7461, "step": 4483 }, { "epoch": 0.53, "learning_rate": 9.361146558933715e-06, "loss": 0.7232, "step": 4484 }, { "epoch": 0.53, "learning_rate": 9.357291725159944e-06, "loss": 0.7762, "step": 4485 }, { "epoch": 0.54, "learning_rate": 9.353436987284732e-06, "loss": 0.7919, "step": 4486 }, { "epoch": 0.54, "learning_rate": 9.349582345883253e-06, "loss": 0.7288, "step": 4487 }, { "epoch": 0.54, "learning_rate": 9.345727801530644e-06, "loss": 0.76, "step": 4488 }, { "epoch": 0.54, "learning_rate": 9.341873354802053e-06, "loss": 0.8047, "step": 4489 }, { "epoch": 0.54, "learning_rate": 9.338019006272595e-06, "loss": 0.7349, "step": 4490 }, { "epoch": 0.54, "learning_rate": 9.334164756517383e-06, "loss": 0.7132, "step": 4491 }, { "epoch": 0.54, "learning_rate": 9.330310606111514e-06, "loss": 0.7885, "step": 4492 }, { "epoch": 0.54, "learning_rate": 9.326456555630053e-06, "loss": 0.8315, "step": 4493 }, { "epoch": 0.54, "learning_rate": 9.322602605648073e-06, "loss": 0.832, "step": 4494 }, { "epoch": 0.54, "learning_rate": 9.318748756740622e-06, "loss": 0.7868, "step": 4495 }, { "epoch": 0.54, "learning_rate": 9.314895009482726e-06, "loss": 0.8092, "step": 4496 }, { "epoch": 0.54, "learning_rate": 9.311041364449415e-06, "loss": 0.7472, "step": 4497 }, { "epoch": 0.54, "learning_rate": 9.30718782221568e-06, "loss": 0.7221, "step": 4498 }, { "epoch": 0.54, "learning_rate": 9.303334383356513e-06, "loss": 0.7344, "step": 4499 }, { "epoch": 0.54, "learning_rate": 9.299481048446886e-06, "loss": 0.7896, "step": 4500 }, { "epoch": 0.54, "learning_rate": 9.295627818061756e-06, "loss": 0.7433, "step": 4501 }, { "epoch": 0.54, "learning_rate": 9.291774692776066e-06, "loss": 0.7762, "step": 4502 }, { "epoch": 0.54, "learning_rate": 9.287921673164738e-06, "loss": 0.7941, "step": 4503 }, { "epoch": 0.54, "learning_rate": 9.28406875980268e-06, "loss": 0.7852, "step": 4504 }, { "epoch": 0.54, "learning_rate": 9.280215953264786e-06, "loss": 0.7221, "step": 4505 }, { "epoch": 0.54, "learning_rate": 9.276363254125936e-06, "loss": 0.7511, "step": 4506 }, { "epoch": 0.54, "learning_rate": 9.272510662960996e-06, "loss": 0.7316, "step": 4507 }, { "epoch": 0.54, "learning_rate": 9.2686581803448e-06, "loss": 0.774, "step": 4508 }, { "epoch": 0.54, "learning_rate": 9.264805806852188e-06, "loss": 0.7885, "step": 4509 }, { "epoch": 0.54, "learning_rate": 9.260953543057964e-06, "loss": 0.8398, "step": 4510 }, { "epoch": 0.54, "learning_rate": 9.25710138953693e-06, "loss": 0.7215, "step": 4511 }, { "epoch": 0.54, "learning_rate": 9.253249346863867e-06, "loss": 0.7433, "step": 4512 }, { "epoch": 0.54, "learning_rate": 9.24939741561354e-06, "loss": 0.755, "step": 4513 }, { "epoch": 0.54, "learning_rate": 9.245545596360688e-06, "loss": 0.7963, "step": 4514 }, { "epoch": 0.54, "learning_rate": 9.241693889680047e-06, "loss": 0.8181, "step": 4515 }, { "epoch": 0.54, "learning_rate": 9.23784229614633e-06, "loss": 0.7785, "step": 4516 }, { "epoch": 0.54, "learning_rate": 9.233990816334233e-06, "loss": 0.8348, "step": 4517 }, { "epoch": 0.54, "learning_rate": 9.230139450818441e-06, "loss": 0.7606, "step": 4518 }, { "epoch": 0.54, "learning_rate": 9.226288200173605e-06, "loss": 0.779, "step": 4519 }, { "epoch": 0.54, "learning_rate": 9.222437064974382e-06, "loss": 0.7807, "step": 4520 }, { "epoch": 0.54, "learning_rate": 9.218586045795392e-06, "loss": 0.74, "step": 4521 }, { "epoch": 0.54, "learning_rate": 9.21473514321125e-06, "loss": 0.7383, "step": 4522 }, { "epoch": 0.54, "learning_rate": 9.21088435779655e-06, "loss": 0.7042, "step": 4523 }, { "epoch": 0.54, "learning_rate": 9.207033690125866e-06, "loss": 0.7494, "step": 4524 }, { "epoch": 0.54, "learning_rate": 9.203183140773756e-06, "loss": 0.7388, "step": 4525 }, { "epoch": 0.54, "learning_rate": 9.199332710314765e-06, "loss": 0.7522, "step": 4526 }, { "epoch": 0.54, "learning_rate": 9.19548239932341e-06, "loss": 0.7366, "step": 4527 }, { "epoch": 0.54, "learning_rate": 9.191632208374204e-06, "loss": 0.7673, "step": 4528 }, { "epoch": 0.54, "learning_rate": 9.187782138041625e-06, "loss": 0.7997, "step": 4529 }, { "epoch": 0.54, "learning_rate": 9.18393218890015e-06, "loss": 0.7221, "step": 4530 }, { "epoch": 0.54, "learning_rate": 9.180082361524224e-06, "loss": 0.769, "step": 4531 }, { "epoch": 0.54, "learning_rate": 9.176232656488286e-06, "loss": 0.7628, "step": 4532 }, { "epoch": 0.54, "learning_rate": 9.172383074366749e-06, "loss": 0.8013, "step": 4533 }, { "epoch": 0.54, "learning_rate": 9.16853361573401e-06, "loss": 0.7773, "step": 4534 }, { "epoch": 0.54, "learning_rate": 9.164684281164442e-06, "loss": 0.7762, "step": 4535 }, { "epoch": 0.54, "learning_rate": 9.160835071232411e-06, "loss": 0.8002, "step": 4536 }, { "epoch": 0.54, "learning_rate": 9.156985986512253e-06, "loss": 0.76, "step": 4537 }, { "epoch": 0.54, "learning_rate": 9.153137027578297e-06, "loss": 0.736, "step": 4538 }, { "epoch": 0.54, "learning_rate": 9.149288195004838e-06, "loss": 0.7232, "step": 4539 }, { "epoch": 0.54, "learning_rate": 9.145439489366167e-06, "loss": 0.7422, "step": 4540 }, { "epoch": 0.54, "learning_rate": 9.141590911236547e-06, "loss": 0.7533, "step": 4541 }, { "epoch": 0.54, "learning_rate": 9.137742461190224e-06, "loss": 0.7589, "step": 4542 }, { "epoch": 0.54, "learning_rate": 9.133894139801432e-06, "loss": 0.7662, "step": 4543 }, { "epoch": 0.54, "learning_rate": 9.13004594764437e-06, "loss": 0.7533, "step": 4544 }, { "epoch": 0.54, "learning_rate": 9.126197885293233e-06, "loss": 0.7617, "step": 4545 }, { "epoch": 0.54, "learning_rate": 9.122349953322187e-06, "loss": 0.75, "step": 4546 }, { "epoch": 0.54, "learning_rate": 9.118502152305384e-06, "loss": 0.755, "step": 4547 }, { "epoch": 0.54, "learning_rate": 9.11465448281696e-06, "loss": 0.7321, "step": 4548 }, { "epoch": 0.54, "learning_rate": 9.110806945431017e-06, "loss": 0.7411, "step": 4549 }, { "epoch": 0.54, "learning_rate": 9.10695954072165e-06, "loss": 0.7656, "step": 4550 }, { "epoch": 0.54, "learning_rate": 9.103112269262933e-06, "loss": 0.7578, "step": 4551 }, { "epoch": 0.54, "learning_rate": 9.099265131628915e-06, "loss": 0.74, "step": 4552 }, { "epoch": 0.54, "learning_rate": 9.095418128393632e-06, "loss": 0.7595, "step": 4553 }, { "epoch": 0.54, "learning_rate": 9.09157126013109e-06, "loss": 0.7857, "step": 4554 }, { "epoch": 0.54, "learning_rate": 9.087724527415282e-06, "loss": 0.7528, "step": 4555 }, { "epoch": 0.54, "learning_rate": 9.08387793082018e-06, "loss": 0.8287, "step": 4556 }, { "epoch": 0.54, "learning_rate": 9.080031470919737e-06, "loss": 0.7952, "step": 4557 }, { "epoch": 0.54, "learning_rate": 9.076185148287883e-06, "loss": 0.7801, "step": 4558 }, { "epoch": 0.54, "learning_rate": 9.072338963498526e-06, "loss": 0.6964, "step": 4559 }, { "epoch": 0.54, "learning_rate": 9.068492917125555e-06, "loss": 0.8142, "step": 4560 }, { "epoch": 0.54, "learning_rate": 9.06464700974284e-06, "loss": 0.7662, "step": 4561 }, { "epoch": 0.54, "learning_rate": 9.060801241924232e-06, "loss": 0.7958, "step": 4562 }, { "epoch": 0.54, "learning_rate": 9.056955614243558e-06, "loss": 0.7589, "step": 4563 }, { "epoch": 0.54, "learning_rate": 9.05311012727462e-06, "loss": 0.7935, "step": 4564 }, { "epoch": 0.54, "learning_rate": 9.049264781591209e-06, "loss": 0.7126, "step": 4565 }, { "epoch": 0.54, "learning_rate": 9.045419577767082e-06, "loss": 0.7701, "step": 4566 }, { "epoch": 0.54, "learning_rate": 9.041574516375988e-06, "loss": 0.7852, "step": 4567 }, { "epoch": 0.54, "learning_rate": 9.037729597991653e-06, "loss": 0.7695, "step": 4568 }, { "epoch": 0.54, "learning_rate": 9.033884823187767e-06, "loss": 0.7232, "step": 4569 }, { "epoch": 0.55, "learning_rate": 9.030040192538013e-06, "loss": 0.7829, "step": 4570 }, { "epoch": 0.55, "learning_rate": 9.026195706616055e-06, "loss": 0.7528, "step": 4571 }, { "epoch": 0.55, "learning_rate": 9.022351365995521e-06, "loss": 0.8119, "step": 4572 }, { "epoch": 0.55, "learning_rate": 9.018507171250032e-06, "loss": 0.7578, "step": 4573 }, { "epoch": 0.55, "learning_rate": 9.014663122953174e-06, "loss": 0.8013, "step": 4574 }, { "epoch": 0.55, "learning_rate": 9.010819221678521e-06, "loss": 0.779, "step": 4575 }, { "epoch": 0.55, "learning_rate": 9.006975467999625e-06, "loss": 0.7556, "step": 4576 }, { "epoch": 0.55, "learning_rate": 9.003131862490006e-06, "loss": 0.7584, "step": 4577 }, { "epoch": 0.55, "learning_rate": 8.999288405723177e-06, "loss": 0.7857, "step": 4578 }, { "epoch": 0.55, "learning_rate": 8.995445098272614e-06, "loss": 0.7924, "step": 4579 }, { "epoch": 0.55, "learning_rate": 8.991601940711777e-06, "loss": 0.7199, "step": 4580 }, { "epoch": 0.55, "learning_rate": 8.987758933614108e-06, "loss": 0.7985, "step": 4581 }, { "epoch": 0.55, "learning_rate": 8.983916077553021e-06, "loss": 0.8415, "step": 4582 }, { "epoch": 0.55, "learning_rate": 8.98007337310191e-06, "loss": 0.7695, "step": 4583 }, { "epoch": 0.55, "learning_rate": 8.976230820834143e-06, "loss": 0.7679, "step": 4584 }, { "epoch": 0.55, "learning_rate": 8.972388421323068e-06, "loss": 0.7706, "step": 4585 }, { "epoch": 0.55, "learning_rate": 8.968546175142009e-06, "loss": 0.8147, "step": 4586 }, { "epoch": 0.55, "learning_rate": 8.964704082864268e-06, "loss": 0.7511, "step": 4587 }, { "epoch": 0.55, "learning_rate": 8.96086214506313e-06, "loss": 0.7288, "step": 4588 }, { "epoch": 0.55, "learning_rate": 8.957020362311842e-06, "loss": 0.7829, "step": 4589 }, { "epoch": 0.55, "learning_rate": 8.953178735183645e-06, "loss": 0.7455, "step": 4590 }, { "epoch": 0.55, "learning_rate": 8.949337264251739e-06, "loss": 0.7349, "step": 4591 }, { "epoch": 0.55, "learning_rate": 8.945495950089315e-06, "loss": 0.7539, "step": 4592 }, { "epoch": 0.55, "learning_rate": 8.941654793269544e-06, "loss": 0.7483, "step": 4593 }, { "epoch": 0.55, "learning_rate": 8.937813794365552e-06, "loss": 0.7768, "step": 4594 }, { "epoch": 0.55, "learning_rate": 8.933972953950458e-06, "loss": 0.7751, "step": 4595 }, { "epoch": 0.55, "learning_rate": 8.930132272597361e-06, "loss": 0.7545, "step": 4596 }, { "epoch": 0.55, "learning_rate": 8.926291750879322e-06, "loss": 0.7578, "step": 4597 }, { "epoch": 0.55, "learning_rate": 8.922451389369395e-06, "loss": 0.7148, "step": 4598 }, { "epoch": 0.55, "learning_rate": 8.918611188640588e-06, "loss": 0.7852, "step": 4599 }, { "epoch": 0.55, "learning_rate": 8.914771149265903e-06, "loss": 0.7645, "step": 4600 }, { "epoch": 0.55, "learning_rate": 8.910931271818315e-06, "loss": 0.7662, "step": 4601 }, { "epoch": 0.55, "learning_rate": 8.907091556870775e-06, "loss": 0.7662, "step": 4602 }, { "epoch": 0.55, "learning_rate": 8.903252004996204e-06, "loss": 0.7584, "step": 4603 }, { "epoch": 0.55, "learning_rate": 8.899412616767496e-06, "loss": 0.8064, "step": 4604 }, { "epoch": 0.55, "learning_rate": 8.895573392757532e-06, "loss": 0.7455, "step": 4605 }, { "epoch": 0.55, "learning_rate": 8.891734333539163e-06, "loss": 0.8002, "step": 4606 }, { "epoch": 0.55, "learning_rate": 8.887895439685218e-06, "loss": 0.7545, "step": 4607 }, { "epoch": 0.55, "learning_rate": 8.884056711768494e-06, "loss": 0.7706, "step": 4608 }, { "epoch": 0.55, "learning_rate": 8.88021815036177e-06, "loss": 0.7969, "step": 4609 }, { "epoch": 0.55, "learning_rate": 8.876379756037796e-06, "loss": 0.6886, "step": 4610 }, { "epoch": 0.55, "learning_rate": 8.872541529369302e-06, "loss": 0.769, "step": 4611 }, { "epoch": 0.55, "learning_rate": 8.868703470928987e-06, "loss": 0.7902, "step": 4612 }, { "epoch": 0.55, "learning_rate": 8.864865581289536e-06, "loss": 0.7305, "step": 4613 }, { "epoch": 0.55, "learning_rate": 8.86102786102359e-06, "loss": 0.7941, "step": 4614 }, { "epoch": 0.55, "learning_rate": 8.857190310703782e-06, "loss": 0.8069, "step": 4615 }, { "epoch": 0.55, "learning_rate": 8.853352930902712e-06, "loss": 0.7483, "step": 4616 }, { "epoch": 0.55, "learning_rate": 8.849515722192954e-06, "loss": 0.7729, "step": 4617 }, { "epoch": 0.55, "learning_rate": 8.845678685147064e-06, "loss": 0.7388, "step": 4618 }, { "epoch": 0.55, "learning_rate": 8.841841820337558e-06, "loss": 0.7355, "step": 4619 }, { "epoch": 0.55, "learning_rate": 8.83800512833694e-06, "loss": 0.7277, "step": 4620 }, { "epoch": 0.55, "learning_rate": 8.834168609717685e-06, "loss": 0.7679, "step": 4621 }, { "epoch": 0.55, "learning_rate": 8.830332265052235e-06, "loss": 0.7294, "step": 4622 }, { "epoch": 0.55, "learning_rate": 8.826496094913018e-06, "loss": 0.7824, "step": 4623 }, { "epoch": 0.55, "learning_rate": 8.822660099872423e-06, "loss": 0.7913, "step": 4624 }, { "epoch": 0.55, "learning_rate": 8.818824280502821e-06, "loss": 0.8544, "step": 4625 }, { "epoch": 0.55, "learning_rate": 8.814988637376555e-06, "loss": 0.7561, "step": 4626 }, { "epoch": 0.55, "learning_rate": 8.811153171065945e-06, "loss": 0.8092, "step": 4627 }, { "epoch": 0.55, "learning_rate": 8.80731788214328e-06, "loss": 0.7958, "step": 4628 }, { "epoch": 0.55, "learning_rate": 8.803482771180819e-06, "loss": 0.7813, "step": 4629 }, { "epoch": 0.55, "learning_rate": 8.799647838750803e-06, "loss": 0.7974, "step": 4630 }, { "epoch": 0.55, "learning_rate": 8.795813085425441e-06, "loss": 0.769, "step": 4631 }, { "epoch": 0.55, "learning_rate": 8.79197851177692e-06, "loss": 0.7757, "step": 4632 }, { "epoch": 0.55, "learning_rate": 8.788144118377398e-06, "loss": 0.7863, "step": 4633 }, { "epoch": 0.55, "learning_rate": 8.784309905799e-06, "loss": 0.779, "step": 4634 }, { "epoch": 0.55, "learning_rate": 8.78047587461383e-06, "loss": 0.7193, "step": 4635 }, { "epoch": 0.55, "learning_rate": 8.776642025393966e-06, "loss": 0.74, "step": 4636 }, { "epoch": 0.55, "learning_rate": 8.772808358711457e-06, "loss": 0.7896, "step": 4637 }, { "epoch": 0.55, "learning_rate": 8.768974875138328e-06, "loss": 0.7785, "step": 4638 }, { "epoch": 0.55, "learning_rate": 8.765141575246567e-06, "loss": 0.7132, "step": 4639 }, { "epoch": 0.55, "learning_rate": 8.761308459608145e-06, "loss": 0.817, "step": 4640 }, { "epoch": 0.55, "learning_rate": 8.757475528794999e-06, "loss": 0.7796, "step": 4641 }, { "epoch": 0.55, "learning_rate": 8.753642783379043e-06, "loss": 0.7813, "step": 4642 }, { "epoch": 0.55, "learning_rate": 8.749810223932163e-06, "loss": 0.7813, "step": 4643 }, { "epoch": 0.55, "learning_rate": 8.74597785102621e-06, "loss": 0.7623, "step": 4644 }, { "epoch": 0.55, "learning_rate": 8.742145665233018e-06, "loss": 0.7087, "step": 4645 }, { "epoch": 0.55, "learning_rate": 8.738313667124385e-06, "loss": 0.7148, "step": 4646 }, { "epoch": 0.55, "learning_rate": 8.734481857272085e-06, "loss": 0.774, "step": 4647 }, { "epoch": 0.55, "learning_rate": 8.730650236247864e-06, "loss": 0.7232, "step": 4648 }, { "epoch": 0.55, "learning_rate": 8.726818804623434e-06, "loss": 0.8058, "step": 4649 }, { "epoch": 0.55, "learning_rate": 8.722987562970486e-06, "loss": 0.8298, "step": 4650 }, { "epoch": 0.55, "learning_rate": 8.719156511860681e-06, "loss": 0.7935, "step": 4651 }, { "epoch": 0.55, "learning_rate": 8.715325651865651e-06, "loss": 0.7411, "step": 4652 }, { "epoch": 0.55, "learning_rate": 8.711494983556996e-06, "loss": 0.7589, "step": 4653 }, { "epoch": 0.56, "learning_rate": 8.707664507506293e-06, "loss": 0.7433, "step": 4654 }, { "epoch": 0.56, "learning_rate": 8.703834224285084e-06, "loss": 0.7294, "step": 4655 }, { "epoch": 0.56, "learning_rate": 8.70000413446489e-06, "loss": 0.7617, "step": 4656 }, { "epoch": 0.56, "learning_rate": 8.696174238617196e-06, "loss": 0.7517, "step": 4657 }, { "epoch": 0.56, "learning_rate": 8.692344537313466e-06, "loss": 0.6942, "step": 4658 }, { "epoch": 0.56, "learning_rate": 8.688515031125126e-06, "loss": 0.7645, "step": 4659 }, { "epoch": 0.56, "learning_rate": 8.684685720623575e-06, "loss": 0.7372, "step": 4660 }, { "epoch": 0.56, "learning_rate": 8.680856606380189e-06, "loss": 0.7762, "step": 4661 }, { "epoch": 0.56, "learning_rate": 8.677027688966307e-06, "loss": 0.7595, "step": 4662 }, { "epoch": 0.56, "learning_rate": 8.673198968953248e-06, "loss": 0.7271, "step": 4663 }, { "epoch": 0.56, "learning_rate": 8.669370446912288e-06, "loss": 0.7779, "step": 4664 }, { "epoch": 0.56, "learning_rate": 8.665542123414686e-06, "loss": 0.7779, "step": 4665 }, { "epoch": 0.56, "learning_rate": 8.661713999031664e-06, "loss": 0.7416, "step": 4666 }, { "epoch": 0.56, "learning_rate": 8.657886074334418e-06, "loss": 0.8036, "step": 4667 }, { "epoch": 0.56, "learning_rate": 8.654058349894117e-06, "loss": 0.7701, "step": 4668 }, { "epoch": 0.56, "learning_rate": 8.65023082628189e-06, "loss": 0.7746, "step": 4669 }, { "epoch": 0.56, "learning_rate": 8.646403504068842e-06, "loss": 0.8577, "step": 4670 }, { "epoch": 0.56, "learning_rate": 8.642576383826052e-06, "loss": 0.76, "step": 4671 }, { "epoch": 0.56, "learning_rate": 8.638749466124563e-06, "loss": 0.7913, "step": 4672 }, { "epoch": 0.56, "learning_rate": 8.634922751535394e-06, "loss": 0.7818, "step": 4673 }, { "epoch": 0.56, "learning_rate": 8.631096240629521e-06, "loss": 0.7372, "step": 4674 }, { "epoch": 0.56, "learning_rate": 8.627269933977903e-06, "loss": 0.7506, "step": 4675 }, { "epoch": 0.56, "learning_rate": 8.623443832151461e-06, "loss": 0.7416, "step": 4676 }, { "epoch": 0.56, "learning_rate": 8.619617935721094e-06, "loss": 0.8075, "step": 4677 }, { "epoch": 0.56, "learning_rate": 8.615792245257661e-06, "loss": 0.8114, "step": 4678 }, { "epoch": 0.56, "learning_rate": 8.611966761331992e-06, "loss": 0.7483, "step": 4679 }, { "epoch": 0.56, "learning_rate": 8.608141484514888e-06, "loss": 0.76, "step": 4680 }, { "epoch": 0.56, "learning_rate": 8.60431641537712e-06, "loss": 0.7511, "step": 4681 }, { "epoch": 0.56, "learning_rate": 8.600491554489425e-06, "loss": 0.7494, "step": 4682 }, { "epoch": 0.56, "learning_rate": 8.596666902422518e-06, "loss": 0.7327, "step": 4683 }, { "epoch": 0.56, "learning_rate": 8.592842459747066e-06, "loss": 0.7751, "step": 4684 }, { "epoch": 0.56, "learning_rate": 8.58901822703372e-06, "loss": 0.7824, "step": 4685 }, { "epoch": 0.56, "learning_rate": 8.585194204853091e-06, "loss": 0.7372, "step": 4686 }, { "epoch": 0.56, "learning_rate": 8.581370393775765e-06, "loss": 0.7539, "step": 4687 }, { "epoch": 0.56, "learning_rate": 8.577546794372295e-06, "loss": 0.7489, "step": 4688 }, { "epoch": 0.56, "learning_rate": 8.573723407213192e-06, "loss": 0.7846, "step": 4689 }, { "epoch": 0.56, "learning_rate": 8.569900232868953e-06, "loss": 0.8287, "step": 4690 }, { "epoch": 0.56, "learning_rate": 8.566077271910027e-06, "loss": 0.7573, "step": 4691 }, { "epoch": 0.56, "learning_rate": 8.562254524906843e-06, "loss": 0.7545, "step": 4692 }, { "epoch": 0.56, "learning_rate": 8.558431992429796e-06, "loss": 0.7617, "step": 4693 }, { "epoch": 0.56, "learning_rate": 8.554609675049237e-06, "loss": 0.7355, "step": 4694 }, { "epoch": 0.56, "learning_rate": 8.550787573335501e-06, "loss": 0.7718, "step": 4695 }, { "epoch": 0.56, "learning_rate": 8.546965687858886e-06, "loss": 0.7383, "step": 4696 }, { "epoch": 0.56, "learning_rate": 8.543144019189652e-06, "loss": 0.7439, "step": 4697 }, { "epoch": 0.56, "learning_rate": 8.539322567898029e-06, "loss": 0.7377, "step": 4698 }, { "epoch": 0.56, "learning_rate": 8.535501334554224e-06, "loss": 0.7896, "step": 4699 }, { "epoch": 0.56, "learning_rate": 8.531680319728394e-06, "loss": 0.7885, "step": 4700 }, { "epoch": 0.56, "learning_rate": 8.527859523990676e-06, "loss": 0.7093, "step": 4701 }, { "epoch": 0.56, "learning_rate": 8.524038947911177e-06, "loss": 0.7533, "step": 4702 }, { "epoch": 0.56, "learning_rate": 8.520218592059956e-06, "loss": 0.7567, "step": 4703 }, { "epoch": 0.56, "learning_rate": 8.51639845700706e-06, "loss": 0.736, "step": 4704 }, { "epoch": 0.56, "learning_rate": 8.512578543322481e-06, "loss": 0.7829, "step": 4705 }, { "epoch": 0.56, "learning_rate": 8.508758851576192e-06, "loss": 0.7662, "step": 4706 }, { "epoch": 0.56, "learning_rate": 8.504939382338132e-06, "loss": 0.7985, "step": 4707 }, { "epoch": 0.56, "learning_rate": 8.501120136178202e-06, "loss": 0.7617, "step": 4708 }, { "epoch": 0.56, "learning_rate": 8.497301113666277e-06, "loss": 0.7048, "step": 4709 }, { "epoch": 0.56, "learning_rate": 8.493482315372188e-06, "loss": 0.7388, "step": 4710 }, { "epoch": 0.56, "learning_rate": 8.489663741865736e-06, "loss": 0.8119, "step": 4711 }, { "epoch": 0.56, "learning_rate": 8.485845393716697e-06, "loss": 0.803, "step": 4712 }, { "epoch": 0.56, "learning_rate": 8.482027271494803e-06, "loss": 0.7472, "step": 4713 }, { "epoch": 0.56, "learning_rate": 8.478209375769763e-06, "loss": 0.7656, "step": 4714 }, { "epoch": 0.56, "learning_rate": 8.474391707111236e-06, "loss": 0.8052, "step": 4715 }, { "epoch": 0.56, "learning_rate": 8.470574266088863e-06, "loss": 0.7997, "step": 4716 }, { "epoch": 0.56, "learning_rate": 8.466757053272242e-06, "loss": 0.769, "step": 4717 }, { "epoch": 0.56, "learning_rate": 8.462940069230941e-06, "loss": 0.726, "step": 4718 }, { "epoch": 0.56, "learning_rate": 8.459123314534494e-06, "loss": 0.7411, "step": 4719 }, { "epoch": 0.56, "learning_rate": 8.455306789752395e-06, "loss": 0.7679, "step": 4720 }, { "epoch": 0.56, "learning_rate": 8.451490495454114e-06, "loss": 0.7193, "step": 4721 }, { "epoch": 0.56, "learning_rate": 8.447674432209072e-06, "loss": 0.7427, "step": 4722 }, { "epoch": 0.56, "learning_rate": 8.443858600586672e-06, "loss": 0.7723, "step": 4723 }, { "epoch": 0.56, "learning_rate": 8.440043001156274e-06, "loss": 0.7985, "step": 4724 }, { "epoch": 0.56, "learning_rate": 8.4362276344872e-06, "loss": 0.7813, "step": 4725 }, { "epoch": 0.56, "learning_rate": 8.432412501148741e-06, "loss": 0.7807, "step": 4726 }, { "epoch": 0.56, "learning_rate": 8.428597601710159e-06, "loss": 0.8103, "step": 4727 }, { "epoch": 0.56, "learning_rate": 8.42478293674067e-06, "loss": 0.7807, "step": 4728 }, { "epoch": 0.56, "learning_rate": 8.420968506809466e-06, "loss": 0.8058, "step": 4729 }, { "epoch": 0.56, "learning_rate": 8.41715431248569e-06, "loss": 0.8008, "step": 4730 }, { "epoch": 0.56, "learning_rate": 8.413340354338463e-06, "loss": 0.7734, "step": 4731 }, { "epoch": 0.56, "learning_rate": 8.409526632936866e-06, "loss": 0.8181, "step": 4732 }, { "epoch": 0.56, "learning_rate": 8.405713148849949e-06, "loss": 0.7059, "step": 4733 }, { "epoch": 0.56, "learning_rate": 8.401899902646717e-06, "loss": 0.7969, "step": 4734 }, { "epoch": 0.56, "learning_rate": 8.398086894896145e-06, "loss": 0.793, "step": 4735 }, { "epoch": 0.56, "learning_rate": 8.394274126167173e-06, "loss": 0.7907, "step": 4736 }, { "epoch": 0.56, "learning_rate": 8.390461597028703e-06, "loss": 0.7383, "step": 4737 }, { "epoch": 0.57, "learning_rate": 8.386649308049607e-06, "loss": 0.7104, "step": 4738 }, { "epoch": 0.57, "learning_rate": 8.382837259798717e-06, "loss": 0.8008, "step": 4739 }, { "epoch": 0.57, "learning_rate": 8.379025452844824e-06, "loss": 0.7941, "step": 4740 }, { "epoch": 0.57, "learning_rate": 8.375213887756692e-06, "loss": 0.769, "step": 4741 }, { "epoch": 0.57, "learning_rate": 8.371402565103041e-06, "loss": 0.7545, "step": 4742 }, { "epoch": 0.57, "learning_rate": 8.367591485452563e-06, "loss": 0.7924, "step": 4743 }, { "epoch": 0.57, "learning_rate": 8.36378064937391e-06, "loss": 0.8064, "step": 4744 }, { "epoch": 0.57, "learning_rate": 8.359970057435694e-06, "loss": 0.7762, "step": 4745 }, { "epoch": 0.57, "learning_rate": 8.356159710206493e-06, "loss": 0.7651, "step": 4746 }, { "epoch": 0.57, "learning_rate": 8.352349608254854e-06, "loss": 0.7891, "step": 4747 }, { "epoch": 0.57, "learning_rate": 8.348539752149279e-06, "loss": 0.7439, "step": 4748 }, { "epoch": 0.57, "learning_rate": 8.34473014245824e-06, "loss": 0.7896, "step": 4749 }, { "epoch": 0.57, "learning_rate": 8.340920779750164e-06, "loss": 0.7455, "step": 4750 }, { "epoch": 0.57, "learning_rate": 8.33711166459345e-06, "loss": 0.7422, "step": 4751 }, { "epoch": 0.57, "learning_rate": 8.333302797556458e-06, "loss": 0.7706, "step": 4752 }, { "epoch": 0.57, "learning_rate": 8.329494179207505e-06, "loss": 0.7813, "step": 4753 }, { "epoch": 0.57, "learning_rate": 8.32568581011488e-06, "loss": 0.7511, "step": 4754 }, { "epoch": 0.57, "learning_rate": 8.321877690846827e-06, "loss": 0.8371, "step": 4755 }, { "epoch": 0.57, "learning_rate": 8.318069821971554e-06, "loss": 0.8008, "step": 4756 }, { "epoch": 0.57, "learning_rate": 8.314262204057236e-06, "loss": 0.7684, "step": 4757 }, { "epoch": 0.57, "learning_rate": 8.31045483767201e-06, "loss": 0.7623, "step": 4758 }, { "epoch": 0.57, "learning_rate": 8.306647723383973e-06, "loss": 0.7684, "step": 4759 }, { "epoch": 0.57, "learning_rate": 8.302840861761184e-06, "loss": 0.7673, "step": 4760 }, { "epoch": 0.57, "learning_rate": 8.29903425337166e-06, "loss": 0.7567, "step": 4761 }, { "epoch": 0.57, "learning_rate": 8.295227898783391e-06, "loss": 0.7377, "step": 4762 }, { "epoch": 0.57, "learning_rate": 8.291421798564323e-06, "loss": 0.764, "step": 4763 }, { "epoch": 0.57, "learning_rate": 8.28761595328237e-06, "loss": 0.7907, "step": 4764 }, { "epoch": 0.57, "learning_rate": 8.283810363505388e-06, "loss": 0.7606, "step": 4765 }, { "epoch": 0.57, "learning_rate": 8.280005029801222e-06, "loss": 0.7333, "step": 4766 }, { "epoch": 0.57, "learning_rate": 8.276199952737661e-06, "loss": 0.7891, "step": 4767 }, { "epoch": 0.57, "learning_rate": 8.27239513288246e-06, "loss": 0.7489, "step": 4768 }, { "epoch": 0.57, "learning_rate": 8.268590570803345e-06, "loss": 0.7193, "step": 4769 }, { "epoch": 0.57, "learning_rate": 8.264786267067983e-06, "loss": 0.76, "step": 4770 }, { "epoch": 0.57, "learning_rate": 8.26098222224402e-06, "loss": 0.784, "step": 4771 }, { "epoch": 0.57, "learning_rate": 8.25717843689906e-06, "loss": 0.7667, "step": 4772 }, { "epoch": 0.57, "learning_rate": 8.253374911600663e-06, "loss": 0.7372, "step": 4773 }, { "epoch": 0.57, "learning_rate": 8.249571646916357e-06, "loss": 0.7204, "step": 4774 }, { "epoch": 0.57, "learning_rate": 8.245768643413622e-06, "loss": 0.7517, "step": 4775 }, { "epoch": 0.57, "learning_rate": 8.241965901659907e-06, "loss": 0.7567, "step": 4776 }, { "epoch": 0.57, "learning_rate": 8.23816342222262e-06, "loss": 0.8008, "step": 4777 }, { "epoch": 0.57, "learning_rate": 8.234361205669132e-06, "loss": 0.8064, "step": 4778 }, { "epoch": 0.57, "learning_rate": 8.230559252566771e-06, "loss": 0.7952, "step": 4779 }, { "epoch": 0.57, "learning_rate": 8.22675756348282e-06, "loss": 0.7768, "step": 4780 }, { "epoch": 0.57, "learning_rate": 8.222956138984534e-06, "loss": 0.7422, "step": 4781 }, { "epoch": 0.57, "learning_rate": 8.219154979639126e-06, "loss": 0.7706, "step": 4782 }, { "epoch": 0.57, "learning_rate": 8.215354086013767e-06, "loss": 0.7907, "step": 4783 }, { "epoch": 0.57, "learning_rate": 8.211553458675587e-06, "loss": 0.7684, "step": 4784 }, { "epoch": 0.57, "learning_rate": 8.20775309819168e-06, "loss": 0.8555, "step": 4785 }, { "epoch": 0.57, "learning_rate": 8.203953005129092e-06, "loss": 0.7048, "step": 4786 }, { "epoch": 0.57, "learning_rate": 8.200153180054842e-06, "loss": 0.7695, "step": 4787 }, { "epoch": 0.57, "learning_rate": 8.196353623535897e-06, "loss": 0.7656, "step": 4788 }, { "epoch": 0.57, "learning_rate": 8.192554336139199e-06, "loss": 0.7857, "step": 4789 }, { "epoch": 0.57, "learning_rate": 8.188755318431627e-06, "loss": 0.6948, "step": 4790 }, { "epoch": 0.57, "learning_rate": 8.184956570980041e-06, "loss": 0.7768, "step": 4791 }, { "epoch": 0.57, "learning_rate": 8.18115809435125e-06, "loss": 0.7372, "step": 4792 }, { "epoch": 0.57, "learning_rate": 8.177359889112023e-06, "loss": 0.7461, "step": 4793 }, { "epoch": 0.57, "learning_rate": 8.173561955829099e-06, "loss": 0.7712, "step": 4794 }, { "epoch": 0.57, "learning_rate": 8.169764295069158e-06, "loss": 0.7427, "step": 4795 }, { "epoch": 0.57, "learning_rate": 8.16596690739885e-06, "loss": 0.8119, "step": 4796 }, { "epoch": 0.57, "learning_rate": 8.16216979338479e-06, "loss": 0.7785, "step": 4797 }, { "epoch": 0.57, "learning_rate": 8.158372953593542e-06, "loss": 0.7517, "step": 4798 }, { "epoch": 0.57, "learning_rate": 8.154576388591637e-06, "loss": 0.7126, "step": 4799 }, { "epoch": 0.57, "learning_rate": 8.150780098945553e-06, "loss": 0.7645, "step": 4800 }, { "epoch": 0.57, "learning_rate": 8.146984085221738e-06, "loss": 0.7377, "step": 4801 }, { "epoch": 0.57, "learning_rate": 8.143188347986597e-06, "loss": 0.7333, "step": 4802 }, { "epoch": 0.57, "learning_rate": 8.139392887806494e-06, "loss": 0.76, "step": 4803 }, { "epoch": 0.57, "learning_rate": 8.13559770524775e-06, "loss": 0.7573, "step": 4804 }, { "epoch": 0.57, "learning_rate": 8.131802800876636e-06, "loss": 0.7695, "step": 4805 }, { "epoch": 0.57, "learning_rate": 8.128008175259398e-06, "loss": 0.7299, "step": 4806 }, { "epoch": 0.57, "learning_rate": 8.12421382896223e-06, "loss": 0.7422, "step": 4807 }, { "epoch": 0.57, "learning_rate": 8.120419762551287e-06, "loss": 0.7701, "step": 4808 }, { "epoch": 0.57, "learning_rate": 8.116625976592687e-06, "loss": 0.7299, "step": 4809 }, { "epoch": 0.57, "learning_rate": 8.112832471652494e-06, "loss": 0.736, "step": 4810 }, { "epoch": 0.57, "learning_rate": 8.10903924829674e-06, "loss": 0.7584, "step": 4811 }, { "epoch": 0.57, "learning_rate": 8.10524630709141e-06, "loss": 0.726, "step": 4812 }, { "epoch": 0.57, "learning_rate": 8.10145364860245e-06, "loss": 0.7606, "step": 4813 }, { "epoch": 0.57, "learning_rate": 8.09766127339577e-06, "loss": 0.7645, "step": 4814 }, { "epoch": 0.57, "learning_rate": 8.093869182037219e-06, "loss": 0.7104, "step": 4815 }, { "epoch": 0.57, "learning_rate": 8.090077375092623e-06, "loss": 0.7768, "step": 4816 }, { "epoch": 0.57, "learning_rate": 8.086285853127754e-06, "loss": 0.731, "step": 4817 }, { "epoch": 0.57, "learning_rate": 8.082494616708347e-06, "loss": 0.7439, "step": 4818 }, { "epoch": 0.57, "learning_rate": 8.0787036664001e-06, "loss": 0.76, "step": 4819 }, { "epoch": 0.57, "learning_rate": 8.074913002768646e-06, "loss": 0.7355, "step": 4820 }, { "epoch": 0.57, "learning_rate": 8.071122626379599e-06, "loss": 0.7645, "step": 4821 }, { "epoch": 0.58, "learning_rate": 8.067332537798522e-06, "loss": 0.7645, "step": 4822 }, { "epoch": 0.58, "learning_rate": 8.063542737590932e-06, "loss": 0.7762, "step": 4823 }, { "epoch": 0.58, "learning_rate": 8.059753226322311e-06, "loss": 0.7673, "step": 4824 }, { "epoch": 0.58, "learning_rate": 8.055964004558083e-06, "loss": 0.7645, "step": 4825 }, { "epoch": 0.58, "learning_rate": 8.052175072863643e-06, "loss": 0.7366, "step": 4826 }, { "epoch": 0.58, "learning_rate": 8.048386431804338e-06, "loss": 0.7416, "step": 4827 }, { "epoch": 0.58, "learning_rate": 8.044598081945471e-06, "loss": 0.7299, "step": 4828 }, { "epoch": 0.58, "learning_rate": 8.040810023852306e-06, "loss": 0.8008, "step": 4829 }, { "epoch": 0.58, "learning_rate": 8.037022258090053e-06, "loss": 0.7723, "step": 4830 }, { "epoch": 0.58, "learning_rate": 8.033234785223887e-06, "loss": 0.8047, "step": 4831 }, { "epoch": 0.58, "learning_rate": 8.029447605818936e-06, "loss": 0.7857, "step": 4832 }, { "epoch": 0.58, "learning_rate": 8.02566072044029e-06, "loss": 0.7561, "step": 4833 }, { "epoch": 0.58, "learning_rate": 8.02187412965299e-06, "loss": 0.8281, "step": 4834 }, { "epoch": 0.58, "learning_rate": 8.018087834022028e-06, "loss": 0.74, "step": 4835 }, { "epoch": 0.58, "learning_rate": 8.01430183411236e-06, "loss": 0.7902, "step": 4836 }, { "epoch": 0.58, "learning_rate": 8.010516130488896e-06, "loss": 0.731, "step": 4837 }, { "epoch": 0.58, "learning_rate": 8.006730723716501e-06, "loss": 0.7132, "step": 4838 }, { "epoch": 0.58, "learning_rate": 8.002945614360002e-06, "loss": 0.774, "step": 4839 }, { "epoch": 0.58, "learning_rate": 7.999160802984165e-06, "loss": 0.7612, "step": 4840 }, { "epoch": 0.58, "learning_rate": 7.995376290153727e-06, "loss": 0.7734, "step": 4841 }, { "epoch": 0.58, "learning_rate": 7.991592076433375e-06, "loss": 0.7539, "step": 4842 }, { "epoch": 0.58, "learning_rate": 7.98780816238775e-06, "loss": 0.7773, "step": 4843 }, { "epoch": 0.58, "learning_rate": 7.984024548581458e-06, "loss": 0.6819, "step": 4844 }, { "epoch": 0.58, "learning_rate": 7.980241235579042e-06, "loss": 0.793, "step": 4845 }, { "epoch": 0.58, "learning_rate": 7.976458223945016e-06, "loss": 0.7919, "step": 4846 }, { "epoch": 0.58, "learning_rate": 7.972675514243845e-06, "loss": 0.7667, "step": 4847 }, { "epoch": 0.58, "learning_rate": 7.968893107039942e-06, "loss": 0.7254, "step": 4848 }, { "epoch": 0.58, "learning_rate": 7.965111002897689e-06, "loss": 0.7891, "step": 4849 }, { "epoch": 0.58, "learning_rate": 7.961329202381403e-06, "loss": 0.7684, "step": 4850 }, { "epoch": 0.58, "learning_rate": 7.957547706055374e-06, "loss": 0.7874, "step": 4851 }, { "epoch": 0.58, "learning_rate": 7.953766514483835e-06, "loss": 0.7561, "step": 4852 }, { "epoch": 0.58, "learning_rate": 7.949985628230983e-06, "loss": 0.7271, "step": 4853 }, { "epoch": 0.58, "learning_rate": 7.946205047860964e-06, "loss": 0.7879, "step": 4854 }, { "epoch": 0.58, "learning_rate": 7.942424773937876e-06, "loss": 0.7796, "step": 4855 }, { "epoch": 0.58, "learning_rate": 7.938644807025773e-06, "loss": 0.7595, "step": 4856 }, { "epoch": 0.58, "learning_rate": 7.934865147688667e-06, "loss": 0.7589, "step": 4857 }, { "epoch": 0.58, "learning_rate": 7.931085796490518e-06, "loss": 0.731, "step": 4858 }, { "epoch": 0.58, "learning_rate": 7.92730675399525e-06, "loss": 0.8136, "step": 4859 }, { "epoch": 0.58, "learning_rate": 7.923528020766728e-06, "loss": 0.774, "step": 4860 }, { "epoch": 0.58, "learning_rate": 7.91974959736878e-06, "loss": 0.7388, "step": 4861 }, { "epoch": 0.58, "learning_rate": 7.915971484365182e-06, "loss": 0.7042, "step": 4862 }, { "epoch": 0.58, "learning_rate": 7.912193682319669e-06, "loss": 0.7706, "step": 4863 }, { "epoch": 0.58, "learning_rate": 7.908416191795931e-06, "loss": 0.8047, "step": 4864 }, { "epoch": 0.58, "learning_rate": 7.904639013357598e-06, "loss": 0.7271, "step": 4865 }, { "epoch": 0.58, "learning_rate": 7.900862147568271e-06, "loss": 0.7394, "step": 4866 }, { "epoch": 0.58, "learning_rate": 7.897085594991492e-06, "loss": 0.7439, "step": 4867 }, { "epoch": 0.58, "learning_rate": 7.893309356190764e-06, "loss": 0.7115, "step": 4868 }, { "epoch": 0.58, "learning_rate": 7.889533431729542e-06, "loss": 0.769, "step": 4869 }, { "epoch": 0.58, "learning_rate": 7.885757822171225e-06, "loss": 0.7762, "step": 4870 }, { "epoch": 0.58, "learning_rate": 7.881982528079175e-06, "loss": 0.7388, "step": 4871 }, { "epoch": 0.58, "learning_rate": 7.878207550016708e-06, "loss": 0.7595, "step": 4872 }, { "epoch": 0.58, "learning_rate": 7.874432888547084e-06, "loss": 0.7924, "step": 4873 }, { "epoch": 0.58, "learning_rate": 7.870658544233525e-06, "loss": 0.7628, "step": 4874 }, { "epoch": 0.58, "learning_rate": 7.866884517639195e-06, "loss": 0.7874, "step": 4875 }, { "epoch": 0.58, "learning_rate": 7.86311080932722e-06, "loss": 0.817, "step": 4876 }, { "epoch": 0.58, "learning_rate": 7.859337419860675e-06, "loss": 0.7578, "step": 4877 }, { "epoch": 0.58, "learning_rate": 7.855564349802592e-06, "loss": 0.7137, "step": 4878 }, { "epoch": 0.58, "learning_rate": 7.851791599715947e-06, "loss": 0.7667, "step": 4879 }, { "epoch": 0.58, "learning_rate": 7.848019170163675e-06, "loss": 0.8008, "step": 4880 }, { "epoch": 0.58, "learning_rate": 7.844247061708655e-06, "loss": 0.7282, "step": 4881 }, { "epoch": 0.58, "learning_rate": 7.840475274913725e-06, "loss": 0.7768, "step": 4882 }, { "epoch": 0.58, "learning_rate": 7.836703810341678e-06, "loss": 0.7511, "step": 4883 }, { "epoch": 0.58, "learning_rate": 7.832932668555257e-06, "loss": 0.7969, "step": 4884 }, { "epoch": 0.58, "learning_rate": 7.829161850117144e-06, "loss": 0.7528, "step": 4885 }, { "epoch": 0.58, "learning_rate": 7.825391355589993e-06, "loss": 0.7405, "step": 4886 }, { "epoch": 0.58, "learning_rate": 7.821621185536393e-06, "loss": 0.7573, "step": 4887 }, { "epoch": 0.58, "learning_rate": 7.817851340518894e-06, "loss": 0.7444, "step": 4888 }, { "epoch": 0.58, "learning_rate": 7.814081821099995e-06, "loss": 0.7773, "step": 4889 }, { "epoch": 0.58, "learning_rate": 7.81031262784215e-06, "loss": 0.7623, "step": 4890 }, { "epoch": 0.58, "learning_rate": 7.806543761307755e-06, "loss": 0.7299, "step": 4891 }, { "epoch": 0.58, "learning_rate": 7.802775222059166e-06, "loss": 0.7768, "step": 4892 }, { "epoch": 0.58, "learning_rate": 7.799007010658683e-06, "loss": 0.7355, "step": 4893 }, { "epoch": 0.58, "learning_rate": 7.795239127668566e-06, "loss": 0.7344, "step": 4894 }, { "epoch": 0.58, "learning_rate": 7.791471573651024e-06, "loss": 0.7349, "step": 4895 }, { "epoch": 0.58, "learning_rate": 7.787704349168203e-06, "loss": 0.7545, "step": 4896 }, { "epoch": 0.58, "learning_rate": 7.783937454782223e-06, "loss": 0.7891, "step": 4897 }, { "epoch": 0.58, "learning_rate": 7.780170891055132e-06, "loss": 0.7701, "step": 4898 }, { "epoch": 0.58, "learning_rate": 7.776404658548946e-06, "loss": 0.7048, "step": 4899 }, { "epoch": 0.58, "learning_rate": 7.772638757825627e-06, "loss": 0.6959, "step": 4900 }, { "epoch": 0.58, "learning_rate": 7.76887318944708e-06, "loss": 0.7388, "step": 4901 }, { "epoch": 0.58, "learning_rate": 7.765107953975164e-06, "loss": 0.7813, "step": 4902 }, { "epoch": 0.58, "learning_rate": 7.761343051971698e-06, "loss": 0.7199, "step": 4903 }, { "epoch": 0.58, "learning_rate": 7.757578483998436e-06, "loss": 0.7545, "step": 4904 }, { "epoch": 0.58, "learning_rate": 7.753814250617097e-06, "loss": 0.7349, "step": 4905 }, { "epoch": 0.59, "learning_rate": 7.750050352389334e-06, "loss": 0.7545, "step": 4906 }, { "epoch": 0.59, "learning_rate": 7.746286789876762e-06, "loss": 0.7461, "step": 4907 }, { "epoch": 0.59, "learning_rate": 7.742523563640943e-06, "loss": 0.7796, "step": 4908 }, { "epoch": 0.59, "learning_rate": 7.738760674243393e-06, "loss": 0.7439, "step": 4909 }, { "epoch": 0.59, "learning_rate": 7.734998122245568e-06, "loss": 0.7679, "step": 4910 }, { "epoch": 0.59, "learning_rate": 7.731235908208877e-06, "loss": 0.7706, "step": 4911 }, { "epoch": 0.59, "learning_rate": 7.727474032694683e-06, "loss": 0.7517, "step": 4912 }, { "epoch": 0.59, "learning_rate": 7.723712496264294e-06, "loss": 0.7294, "step": 4913 }, { "epoch": 0.59, "learning_rate": 7.719951299478973e-06, "loss": 0.7355, "step": 4914 }, { "epoch": 0.59, "learning_rate": 7.716190442899928e-06, "loss": 0.7701, "step": 4915 }, { "epoch": 0.59, "learning_rate": 7.712429927088312e-06, "loss": 0.7913, "step": 4916 }, { "epoch": 0.59, "learning_rate": 7.708669752605236e-06, "loss": 0.7612, "step": 4917 }, { "epoch": 0.59, "learning_rate": 7.704909920011754e-06, "loss": 0.726, "step": 4918 }, { "epoch": 0.59, "learning_rate": 7.701150429868872e-06, "loss": 0.6864, "step": 4919 }, { "epoch": 0.59, "learning_rate": 7.697391282737547e-06, "loss": 0.7193, "step": 4920 }, { "epoch": 0.59, "learning_rate": 7.693632479178674e-06, "loss": 0.7266, "step": 4921 }, { "epoch": 0.59, "learning_rate": 7.68987401975311e-06, "loss": 0.7372, "step": 4922 }, { "epoch": 0.59, "learning_rate": 7.686115905021653e-06, "loss": 0.7606, "step": 4923 }, { "epoch": 0.59, "learning_rate": 7.682358135545054e-06, "loss": 0.7667, "step": 4924 }, { "epoch": 0.59, "learning_rate": 7.67860071188401e-06, "loss": 0.7427, "step": 4925 }, { "epoch": 0.59, "learning_rate": 7.674843634599163e-06, "loss": 0.7344, "step": 4926 }, { "epoch": 0.59, "learning_rate": 7.671086904251109e-06, "loss": 0.7662, "step": 4927 }, { "epoch": 0.59, "learning_rate": 7.66733052140039e-06, "loss": 0.7372, "step": 4928 }, { "epoch": 0.59, "learning_rate": 7.663574486607495e-06, "loss": 0.7327, "step": 4929 }, { "epoch": 0.59, "learning_rate": 7.65981880043287e-06, "loss": 0.7511, "step": 4930 }, { "epoch": 0.59, "learning_rate": 7.656063463436887e-06, "loss": 0.8164, "step": 4931 }, { "epoch": 0.59, "learning_rate": 7.652308476179891e-06, "loss": 0.7879, "step": 4932 }, { "epoch": 0.59, "learning_rate": 7.64855383922216e-06, "loss": 0.764, "step": 4933 }, { "epoch": 0.59, "learning_rate": 7.644799553123926e-06, "loss": 0.7115, "step": 4934 }, { "epoch": 0.59, "learning_rate": 7.641045618445367e-06, "loss": 0.7606, "step": 4935 }, { "epoch": 0.59, "learning_rate": 7.637292035746607e-06, "loss": 0.7349, "step": 4936 }, { "epoch": 0.59, "learning_rate": 7.633538805587713e-06, "loss": 0.7852, "step": 4937 }, { "epoch": 0.59, "learning_rate": 7.62978592852871e-06, "loss": 0.7824, "step": 4938 }, { "epoch": 0.59, "learning_rate": 7.6260334051295624e-06, "loss": 0.7455, "step": 4939 }, { "epoch": 0.59, "learning_rate": 7.622281235950193e-06, "loss": 0.7182, "step": 4940 }, { "epoch": 0.59, "learning_rate": 7.618529421550453e-06, "loss": 0.7623, "step": 4941 }, { "epoch": 0.59, "learning_rate": 7.614777962490155e-06, "loss": 0.7472, "step": 4942 }, { "epoch": 0.59, "learning_rate": 7.6110268593290534e-06, "loss": 0.7472, "step": 4943 }, { "epoch": 0.59, "learning_rate": 7.607276112626852e-06, "loss": 0.808, "step": 4944 }, { "epoch": 0.59, "learning_rate": 7.6035257229432034e-06, "loss": 0.7478, "step": 4945 }, { "epoch": 0.59, "learning_rate": 7.599775690837696e-06, "loss": 0.7645, "step": 4946 }, { "epoch": 0.59, "learning_rate": 7.596026016869876e-06, "loss": 0.7785, "step": 4947 }, { "epoch": 0.59, "learning_rate": 7.592276701599236e-06, "loss": 0.716, "step": 4948 }, { "epoch": 0.59, "learning_rate": 7.588527745585206e-06, "loss": 0.7695, "step": 4949 }, { "epoch": 0.59, "learning_rate": 7.584779149387174e-06, "loss": 0.7539, "step": 4950 }, { "epoch": 0.59, "learning_rate": 7.5810309135644625e-06, "loss": 0.7422, "step": 4951 }, { "epoch": 0.59, "learning_rate": 7.5772830386763464e-06, "loss": 0.8019, "step": 4952 }, { "epoch": 0.59, "learning_rate": 7.57353552528205e-06, "loss": 0.6908, "step": 4953 }, { "epoch": 0.59, "learning_rate": 7.569788373940741e-06, "loss": 0.7294, "step": 4954 }, { "epoch": 0.59, "learning_rate": 7.566041585211532e-06, "loss": 0.7857, "step": 4955 }, { "epoch": 0.59, "learning_rate": 7.562295159653474e-06, "loss": 0.7645, "step": 4956 }, { "epoch": 0.59, "learning_rate": 7.5585490978255796e-06, "loss": 0.7545, "step": 4957 }, { "epoch": 0.59, "learning_rate": 7.554803400286796e-06, "loss": 0.8119, "step": 4958 }, { "epoch": 0.59, "learning_rate": 7.55105806759602e-06, "loss": 0.7494, "step": 4959 }, { "epoch": 0.59, "learning_rate": 7.547313100312095e-06, "loss": 0.8058, "step": 4960 }, { "epoch": 0.59, "learning_rate": 7.543568498993804e-06, "loss": 0.7143, "step": 4961 }, { "epoch": 0.59, "learning_rate": 7.53982426419988e-06, "loss": 0.7857, "step": 4962 }, { "epoch": 0.59, "learning_rate": 7.536080396489001e-06, "loss": 0.7807, "step": 4963 }, { "epoch": 0.59, "learning_rate": 7.532336896419789e-06, "loss": 0.7165, "step": 4964 }, { "epoch": 0.59, "learning_rate": 7.52859376455082e-06, "loss": 0.721, "step": 4965 }, { "epoch": 0.59, "learning_rate": 7.524851001440595e-06, "loss": 0.6987, "step": 4966 }, { "epoch": 0.59, "learning_rate": 7.521108607647581e-06, "loss": 0.7467, "step": 4967 }, { "epoch": 0.59, "learning_rate": 7.517366583730173e-06, "loss": 0.7271, "step": 4968 }, { "epoch": 0.59, "learning_rate": 7.513624930246724e-06, "loss": 0.7846, "step": 4969 }, { "epoch": 0.59, "learning_rate": 7.509883647755529e-06, "loss": 0.7651, "step": 4970 }, { "epoch": 0.59, "learning_rate": 7.506142736814819e-06, "loss": 0.7366, "step": 4971 }, { "epoch": 0.59, "learning_rate": 7.502402197982777e-06, "loss": 0.7612, "step": 4972 }, { "epoch": 0.59, "learning_rate": 7.498662031817534e-06, "loss": 0.721, "step": 4973 }, { "epoch": 0.59, "learning_rate": 7.494922238877154e-06, "loss": 0.8036, "step": 4974 }, { "epoch": 0.59, "learning_rate": 7.491182819719658e-06, "loss": 0.6975, "step": 4975 }, { "epoch": 0.59, "learning_rate": 7.487443774902999e-06, "loss": 0.7427, "step": 4976 }, { "epoch": 0.59, "learning_rate": 7.483705104985083e-06, "loss": 0.7573, "step": 4977 }, { "epoch": 0.59, "learning_rate": 7.479966810523758e-06, "loss": 0.8583, "step": 4978 }, { "epoch": 0.59, "learning_rate": 7.476228892076816e-06, "loss": 0.6828, "step": 4979 }, { "epoch": 0.59, "learning_rate": 7.4724913502019905e-06, "loss": 0.8147, "step": 4980 }, { "epoch": 0.59, "learning_rate": 7.468754185456961e-06, "loss": 0.7461, "step": 4981 }, { "epoch": 0.59, "learning_rate": 7.4650173983993476e-06, "loss": 0.7824, "step": 4982 }, { "epoch": 0.59, "learning_rate": 7.461280989586719e-06, "loss": 0.7785, "step": 4983 }, { "epoch": 0.59, "learning_rate": 7.457544959576586e-06, "loss": 0.8097, "step": 4984 }, { "epoch": 0.59, "learning_rate": 7.453809308926405e-06, "loss": 0.6638, "step": 4985 }, { "epoch": 0.59, "learning_rate": 7.450074038193567e-06, "loss": 0.7662, "step": 4986 }, { "epoch": 0.59, "learning_rate": 7.446339147935411e-06, "loss": 0.7137, "step": 4987 }, { "epoch": 0.59, "learning_rate": 7.442604638709223e-06, "loss": 0.7712, "step": 4988 }, { "epoch": 0.59, "learning_rate": 7.438870511072229e-06, "loss": 0.7695, "step": 4989 }, { "epoch": 0.6, "learning_rate": 7.4351367655816055e-06, "loss": 0.7355, "step": 4990 }, { "epoch": 0.6, "learning_rate": 7.431403402794455e-06, "loss": 0.7355, "step": 4991 }, { "epoch": 0.6, "learning_rate": 7.427670423267837e-06, "loss": 0.7506, "step": 4992 }, { "epoch": 0.6, "learning_rate": 7.423937827558747e-06, "loss": 0.7902, "step": 4993 }, { "epoch": 0.6, "learning_rate": 7.42020561622413e-06, "loss": 0.7606, "step": 4994 }, { "epoch": 0.6, "learning_rate": 7.41647378982087e-06, "loss": 0.7824, "step": 4995 }, { "epoch": 0.6, "learning_rate": 7.412742348905788e-06, "loss": 0.7243, "step": 4996 }, { "epoch": 0.6, "learning_rate": 7.409011294035656e-06, "loss": 0.7204, "step": 4997 }, { "epoch": 0.6, "learning_rate": 7.405280625767186e-06, "loss": 0.7193, "step": 4998 }, { "epoch": 0.6, "learning_rate": 7.401550344657029e-06, "loss": 0.7232, "step": 4999 }, { "epoch": 0.6, "learning_rate": 7.397820451261786e-06, "loss": 0.774, "step": 5000 }, { "epoch": 0.6, "learning_rate": 7.394090946137985e-06, "loss": 0.7651, "step": 5001 }, { "epoch": 0.6, "learning_rate": 7.3903618298421125e-06, "loss": 0.7985, "step": 5002 }, { "epoch": 0.6, "learning_rate": 7.386633102930587e-06, "loss": 0.8147, "step": 5003 }, { "epoch": 0.6, "learning_rate": 7.382904765959778e-06, "loss": 0.731, "step": 5004 }, { "epoch": 0.6, "learning_rate": 7.379176819485987e-06, "loss": 0.7054, "step": 5005 }, { "epoch": 0.6, "learning_rate": 7.375449264065462e-06, "loss": 0.7243, "step": 5006 }, { "epoch": 0.6, "learning_rate": 7.371722100254387e-06, "loss": 0.7533, "step": 5007 }, { "epoch": 0.6, "learning_rate": 7.367995328608899e-06, "loss": 0.6931, "step": 5008 }, { "epoch": 0.6, "learning_rate": 7.364268949685066e-06, "loss": 0.8008, "step": 5009 }, { "epoch": 0.6, "learning_rate": 7.360542964038908e-06, "loss": 0.8136, "step": 5010 }, { "epoch": 0.6, "learning_rate": 7.35681737222637e-06, "loss": 0.7617, "step": 5011 }, { "epoch": 0.6, "learning_rate": 7.353092174803355e-06, "loss": 0.7321, "step": 5012 }, { "epoch": 0.6, "learning_rate": 7.349367372325695e-06, "loss": 0.7349, "step": 5013 }, { "epoch": 0.6, "learning_rate": 7.345642965349171e-06, "loss": 0.7009, "step": 5014 }, { "epoch": 0.6, "learning_rate": 7.3419189544295074e-06, "loss": 0.7467, "step": 5015 }, { "epoch": 0.6, "learning_rate": 7.338195340122353e-06, "loss": 0.7433, "step": 5016 }, { "epoch": 0.6, "learning_rate": 7.334472122983316e-06, "loss": 0.7372, "step": 5017 }, { "epoch": 0.6, "learning_rate": 7.3307493035679345e-06, "loss": 0.7679, "step": 5018 }, { "epoch": 0.6, "learning_rate": 7.327026882431694e-06, "loss": 0.817, "step": 5019 }, { "epoch": 0.6, "learning_rate": 7.323304860130018e-06, "loss": 0.6802, "step": 5020 }, { "epoch": 0.6, "learning_rate": 7.319583237218264e-06, "loss": 0.7383, "step": 5021 }, { "epoch": 0.6, "learning_rate": 7.31586201425174e-06, "loss": 0.7991, "step": 5022 }, { "epoch": 0.6, "learning_rate": 7.31214119178569e-06, "loss": 0.7232, "step": 5023 }, { "epoch": 0.6, "learning_rate": 7.308420770375295e-06, "loss": 0.7422, "step": 5024 }, { "epoch": 0.6, "learning_rate": 7.304700750575689e-06, "loss": 0.7472, "step": 5025 }, { "epoch": 0.6, "learning_rate": 7.3009811329419225e-06, "loss": 0.7852, "step": 5026 }, { "epoch": 0.6, "learning_rate": 7.297261918029008e-06, "loss": 0.7182, "step": 5027 }, { "epoch": 0.6, "learning_rate": 7.293543106391888e-06, "loss": 0.7204, "step": 5028 }, { "epoch": 0.6, "learning_rate": 7.28982469858545e-06, "loss": 0.7762, "step": 5029 }, { "epoch": 0.6, "learning_rate": 7.2861066951645165e-06, "loss": 0.7734, "step": 5030 }, { "epoch": 0.6, "learning_rate": 7.282389096683848e-06, "loss": 0.7299, "step": 5031 }, { "epoch": 0.6, "learning_rate": 7.278671903698149e-06, "loss": 0.7573, "step": 5032 }, { "epoch": 0.6, "learning_rate": 7.274955116762064e-06, "loss": 0.7193, "step": 5033 }, { "epoch": 0.6, "learning_rate": 7.271238736430173e-06, "loss": 0.7065, "step": 5034 }, { "epoch": 0.6, "learning_rate": 7.2675227632570025e-06, "loss": 0.76, "step": 5035 }, { "epoch": 0.6, "learning_rate": 7.263807197797006e-06, "loss": 0.7645, "step": 5036 }, { "epoch": 0.6, "learning_rate": 7.2600920406045885e-06, "loss": 0.7829, "step": 5037 }, { "epoch": 0.6, "learning_rate": 7.256377292234085e-06, "loss": 0.7282, "step": 5038 }, { "epoch": 0.6, "learning_rate": 7.252662953239775e-06, "loss": 0.7941, "step": 5039 }, { "epoch": 0.6, "learning_rate": 7.24894902417588e-06, "loss": 0.7388, "step": 5040 }, { "epoch": 0.6, "learning_rate": 7.245235505596548e-06, "loss": 0.7115, "step": 5041 }, { "epoch": 0.6, "learning_rate": 7.241522398055877e-06, "loss": 0.7433, "step": 5042 }, { "epoch": 0.6, "learning_rate": 7.237809702107902e-06, "loss": 0.7857, "step": 5043 }, { "epoch": 0.6, "learning_rate": 7.234097418306592e-06, "loss": 0.7522, "step": 5044 }, { "epoch": 0.6, "learning_rate": 7.230385547205861e-06, "loss": 0.7422, "step": 5045 }, { "epoch": 0.6, "learning_rate": 7.226674089359549e-06, "loss": 0.764, "step": 5046 }, { "epoch": 0.6, "learning_rate": 7.222963045321451e-06, "loss": 0.7779, "step": 5047 }, { "epoch": 0.6, "learning_rate": 7.21925241564529e-06, "loss": 0.7338, "step": 5048 }, { "epoch": 0.6, "learning_rate": 7.215542200884729e-06, "loss": 0.7667, "step": 5049 }, { "epoch": 0.6, "learning_rate": 7.211832401593374e-06, "loss": 0.7388, "step": 5050 }, { "epoch": 0.6, "learning_rate": 7.208123018324755e-06, "loss": 0.7472, "step": 5051 }, { "epoch": 0.6, "learning_rate": 7.204414051632356e-06, "loss": 0.7757, "step": 5052 }, { "epoch": 0.6, "learning_rate": 7.200705502069589e-06, "loss": 0.784, "step": 5053 }, { "epoch": 0.6, "learning_rate": 7.196997370189811e-06, "loss": 0.736, "step": 5054 }, { "epoch": 0.6, "learning_rate": 7.193289656546312e-06, "loss": 0.8237, "step": 5055 }, { "epoch": 0.6, "learning_rate": 7.189582361692319e-06, "loss": 0.7533, "step": 5056 }, { "epoch": 0.6, "learning_rate": 7.185875486180995e-06, "loss": 0.7115, "step": 5057 }, { "epoch": 0.6, "learning_rate": 7.1821690305654454e-06, "loss": 0.7757, "step": 5058 }, { "epoch": 0.6, "learning_rate": 7.178462995398712e-06, "loss": 0.7271, "step": 5059 }, { "epoch": 0.6, "learning_rate": 7.174757381233777e-06, "loss": 0.8181, "step": 5060 }, { "epoch": 0.6, "learning_rate": 7.171052188623544e-06, "loss": 0.7377, "step": 5061 }, { "epoch": 0.6, "learning_rate": 7.167347418120876e-06, "loss": 0.7656, "step": 5062 }, { "epoch": 0.6, "learning_rate": 7.1636430702785545e-06, "loss": 0.8125, "step": 5063 }, { "epoch": 0.6, "learning_rate": 7.159939145649307e-06, "loss": 0.7684, "step": 5064 }, { "epoch": 0.6, "learning_rate": 7.156235644785805e-06, "loss": 0.7522, "step": 5065 }, { "epoch": 0.6, "learning_rate": 7.152532568240635e-06, "loss": 0.7818, "step": 5066 }, { "epoch": 0.6, "learning_rate": 7.148829916566342e-06, "loss": 0.7394, "step": 5067 }, { "epoch": 0.6, "learning_rate": 7.145127690315397e-06, "loss": 0.7868, "step": 5068 }, { "epoch": 0.6, "learning_rate": 7.141425890040207e-06, "loss": 0.7221, "step": 5069 }, { "epoch": 0.6, "learning_rate": 7.1377245162931275e-06, "loss": 0.7472, "step": 5070 }, { "epoch": 0.6, "learning_rate": 7.134023569626427e-06, "loss": 0.7171, "step": 5071 }, { "epoch": 0.6, "learning_rate": 7.130323050592331e-06, "loss": 0.7768, "step": 5072 }, { "epoch": 0.61, "learning_rate": 7.126622959742992e-06, "loss": 0.6953, "step": 5073 }, { "epoch": 0.61, "learning_rate": 7.122923297630508e-06, "loss": 0.8025, "step": 5074 }, { "epoch": 0.61, "learning_rate": 7.119224064806901e-06, "loss": 0.7494, "step": 5075 }, { "epoch": 0.61, "learning_rate": 7.11552526182413e-06, "loss": 0.774, "step": 5076 }, { "epoch": 0.61, "learning_rate": 7.111826889234097e-06, "loss": 0.7193, "step": 5077 }, { "epoch": 0.61, "learning_rate": 7.108128947588637e-06, "loss": 0.7606, "step": 5078 }, { "epoch": 0.61, "learning_rate": 7.1044314374395226e-06, "loss": 0.7746, "step": 5079 }, { "epoch": 0.61, "learning_rate": 7.100734359338455e-06, "loss": 0.7506, "step": 5080 }, { "epoch": 0.61, "learning_rate": 7.09703771383708e-06, "loss": 0.7333, "step": 5081 }, { "epoch": 0.61, "learning_rate": 7.09334150148697e-06, "loss": 0.7628, "step": 5082 }, { "epoch": 0.61, "learning_rate": 7.089645722839638e-06, "loss": 0.7461, "step": 5083 }, { "epoch": 0.61, "learning_rate": 7.0859503784465335e-06, "loss": 0.7444, "step": 5084 }, { "epoch": 0.61, "learning_rate": 7.082255468859039e-06, "loss": 0.7215, "step": 5085 }, { "epoch": 0.61, "learning_rate": 7.078560994628474e-06, "loss": 0.6747, "step": 5086 }, { "epoch": 0.61, "learning_rate": 7.074866956306088e-06, "loss": 0.745, "step": 5087 }, { "epoch": 0.61, "learning_rate": 7.071173354443066e-06, "loss": 0.7974, "step": 5088 }, { "epoch": 0.61, "learning_rate": 7.067480189590537e-06, "loss": 0.75, "step": 5089 }, { "epoch": 0.61, "learning_rate": 7.063787462299554e-06, "loss": 0.7115, "step": 5090 }, { "epoch": 0.61, "learning_rate": 7.060095173121116e-06, "loss": 0.822, "step": 5091 }, { "epoch": 0.61, "learning_rate": 7.05640332260614e-06, "loss": 0.7941, "step": 5092 }, { "epoch": 0.61, "learning_rate": 7.052711911305497e-06, "loss": 0.745, "step": 5093 }, { "epoch": 0.61, "learning_rate": 7.049020939769973e-06, "loss": 0.7109, "step": 5094 }, { "epoch": 0.61, "learning_rate": 7.045330408550304e-06, "loss": 0.6825, "step": 5095 }, { "epoch": 0.61, "learning_rate": 7.041640318197158e-06, "loss": 0.7288, "step": 5096 }, { "epoch": 0.61, "learning_rate": 7.037950669261127e-06, "loss": 0.7433, "step": 5097 }, { "epoch": 0.61, "learning_rate": 7.034261462292744e-06, "loss": 0.841, "step": 5098 }, { "epoch": 0.61, "learning_rate": 7.0305726978424814e-06, "loss": 0.7472, "step": 5099 }, { "epoch": 0.61, "learning_rate": 7.026884376460736e-06, "loss": 0.7768, "step": 5100 }, { "epoch": 0.61, "learning_rate": 7.0231964986978465e-06, "loss": 0.7818, "step": 5101 }, { "epoch": 0.61, "learning_rate": 7.019509065104073e-06, "loss": 0.7673, "step": 5102 }, { "epoch": 0.61, "learning_rate": 7.0158220762296246e-06, "loss": 0.7746, "step": 5103 }, { "epoch": 0.61, "learning_rate": 7.012135532624635e-06, "loss": 0.7712, "step": 5104 }, { "epoch": 0.61, "learning_rate": 7.0084494348391785e-06, "loss": 0.7517, "step": 5105 }, { "epoch": 0.61, "learning_rate": 7.0047637834232554e-06, "loss": 0.7545, "step": 5106 }, { "epoch": 0.61, "learning_rate": 7.001078578926797e-06, "loss": 0.7031, "step": 5107 }, { "epoch": 0.61, "learning_rate": 6.9973938218996765e-06, "loss": 0.7818, "step": 5108 }, { "epoch": 0.61, "learning_rate": 6.993709512891696e-06, "loss": 0.798, "step": 5109 }, { "epoch": 0.61, "learning_rate": 6.990025652452596e-06, "loss": 0.7963, "step": 5110 }, { "epoch": 0.61, "learning_rate": 6.986342241132044e-06, "loss": 0.7132, "step": 5111 }, { "epoch": 0.61, "learning_rate": 6.982659279479639e-06, "loss": 0.7645, "step": 5112 }, { "epoch": 0.61, "learning_rate": 6.9789767680449165e-06, "loss": 0.7455, "step": 5113 }, { "epoch": 0.61, "learning_rate": 6.975294707377343e-06, "loss": 0.7455, "step": 5114 }, { "epoch": 0.61, "learning_rate": 6.971613098026324e-06, "loss": 0.7723, "step": 5115 }, { "epoch": 0.61, "learning_rate": 6.967931940541194e-06, "loss": 0.7528, "step": 5116 }, { "epoch": 0.61, "learning_rate": 6.964251235471211e-06, "loss": 0.7846, "step": 5117 }, { "epoch": 0.61, "learning_rate": 6.96057098336558e-06, "loss": 0.7143, "step": 5118 }, { "epoch": 0.61, "learning_rate": 6.956891184773426e-06, "loss": 0.7243, "step": 5119 }, { "epoch": 0.61, "learning_rate": 6.953211840243816e-06, "loss": 0.7266, "step": 5120 }, { "epoch": 0.61, "learning_rate": 6.949532950325751e-06, "loss": 0.7461, "step": 5121 }, { "epoch": 0.61, "learning_rate": 6.945854515568144e-06, "loss": 0.7478, "step": 5122 }, { "epoch": 0.61, "learning_rate": 6.942176536519867e-06, "loss": 0.7573, "step": 5123 }, { "epoch": 0.61, "learning_rate": 6.938499013729707e-06, "loss": 0.7483, "step": 5124 }, { "epoch": 0.61, "learning_rate": 6.934821947746386e-06, "loss": 0.7723, "step": 5125 }, { "epoch": 0.61, "learning_rate": 6.931145339118566e-06, "loss": 0.7444, "step": 5126 }, { "epoch": 0.61, "learning_rate": 6.9274691883948256e-06, "loss": 0.7729, "step": 5127 }, { "epoch": 0.61, "learning_rate": 6.923793496123686e-06, "loss": 0.7506, "step": 5128 }, { "epoch": 0.61, "learning_rate": 6.9201182628536e-06, "loss": 0.7603, "step": 5129 }, { "epoch": 0.61, "learning_rate": 6.91644348913295e-06, "loss": 0.7667, "step": 5130 }, { "epoch": 0.61, "learning_rate": 6.91276917551005e-06, "loss": 0.7773, "step": 5131 }, { "epoch": 0.61, "learning_rate": 6.909095322533139e-06, "loss": 0.7997, "step": 5132 }, { "epoch": 0.61, "learning_rate": 6.9054219307503955e-06, "loss": 0.7796, "step": 5133 }, { "epoch": 0.61, "learning_rate": 6.901749000709927e-06, "loss": 0.7232, "step": 5134 }, { "epoch": 0.61, "learning_rate": 6.898076532959773e-06, "loss": 0.6942, "step": 5135 }, { "epoch": 0.61, "learning_rate": 6.894404528047906e-06, "loss": 0.7394, "step": 5136 }, { "epoch": 0.61, "learning_rate": 6.89073298652222e-06, "loss": 0.769, "step": 5137 }, { "epoch": 0.61, "learning_rate": 6.887061908930547e-06, "loss": 0.7751, "step": 5138 }, { "epoch": 0.61, "learning_rate": 6.88339129582065e-06, "loss": 0.7271, "step": 5139 }, { "epoch": 0.61, "learning_rate": 6.87972114774022e-06, "loss": 0.7266, "step": 5140 }, { "epoch": 0.61, "learning_rate": 6.876051465236886e-06, "loss": 0.7578, "step": 5141 }, { "epoch": 0.61, "learning_rate": 6.872382248858194e-06, "loss": 0.7137, "step": 5142 }, { "epoch": 0.61, "learning_rate": 6.868713499151633e-06, "loss": 0.7545, "step": 5143 }, { "epoch": 0.61, "learning_rate": 6.865045216664614e-06, "loss": 0.7232, "step": 5144 }, { "epoch": 0.61, "learning_rate": 6.861377401944484e-06, "loss": 0.7729, "step": 5145 }, { "epoch": 0.61, "learning_rate": 6.85771005553852e-06, "loss": 0.7048, "step": 5146 }, { "epoch": 0.61, "learning_rate": 6.854043177993923e-06, "loss": 0.7372, "step": 5147 }, { "epoch": 0.61, "learning_rate": 6.85037676985783e-06, "loss": 0.7416, "step": 5148 }, { "epoch": 0.61, "learning_rate": 6.846710831677305e-06, "loss": 0.7985, "step": 5149 }, { "epoch": 0.61, "learning_rate": 6.843045363999345e-06, "loss": 0.7037, "step": 5150 }, { "epoch": 0.61, "learning_rate": 6.839380367370876e-06, "loss": 0.7729, "step": 5151 }, { "epoch": 0.61, "learning_rate": 6.835715842338746e-06, "loss": 0.769, "step": 5152 }, { "epoch": 0.61, "learning_rate": 6.832051789449744e-06, "loss": 0.7729, "step": 5153 }, { "epoch": 0.61, "learning_rate": 6.8283882092505824e-06, "loss": 0.7327, "step": 5154 }, { "epoch": 0.61, "learning_rate": 6.824725102287908e-06, "loss": 0.764, "step": 5155 }, { "epoch": 0.61, "learning_rate": 6.82106246910829e-06, "loss": 0.7902, "step": 5156 }, { "epoch": 0.62, "learning_rate": 6.817400310258229e-06, "loss": 0.6931, "step": 5157 }, { "epoch": 0.62, "learning_rate": 6.8137386262841565e-06, "loss": 0.7706, "step": 5158 }, { "epoch": 0.62, "learning_rate": 6.810077417732434e-06, "loss": 0.7132, "step": 5159 }, { "epoch": 0.62, "learning_rate": 6.80641668514935e-06, "loss": 0.7478, "step": 5160 }, { "epoch": 0.62, "learning_rate": 6.802756429081128e-06, "loss": 0.784, "step": 5161 }, { "epoch": 0.62, "learning_rate": 6.799096650073906e-06, "loss": 0.7829, "step": 5162 }, { "epoch": 0.62, "learning_rate": 6.7954373486737645e-06, "loss": 0.7171, "step": 5163 }, { "epoch": 0.62, "learning_rate": 6.791778525426708e-06, "loss": 0.7796, "step": 5164 }, { "epoch": 0.62, "learning_rate": 6.788120180878668e-06, "loss": 0.7494, "step": 5165 }, { "epoch": 0.62, "learning_rate": 6.784462315575514e-06, "loss": 0.7271, "step": 5166 }, { "epoch": 0.62, "learning_rate": 6.780804930063026e-06, "loss": 0.7561, "step": 5167 }, { "epoch": 0.62, "learning_rate": 6.77714802488693e-06, "loss": 0.7584, "step": 5168 }, { "epoch": 0.62, "learning_rate": 6.773491600592868e-06, "loss": 0.7065, "step": 5169 }, { "epoch": 0.62, "learning_rate": 6.769835657726418e-06, "loss": 0.6948, "step": 5170 }, { "epoch": 0.62, "learning_rate": 6.7661801968330885e-06, "loss": 0.6914, "step": 5171 }, { "epoch": 0.62, "learning_rate": 6.762525218458302e-06, "loss": 0.7444, "step": 5172 }, { "epoch": 0.62, "learning_rate": 6.758870723147421e-06, "loss": 0.7277, "step": 5173 }, { "epoch": 0.62, "learning_rate": 6.755216711445738e-06, "loss": 0.7489, "step": 5174 }, { "epoch": 0.62, "learning_rate": 6.751563183898463e-06, "loss": 0.8036, "step": 5175 }, { "epoch": 0.62, "learning_rate": 6.7479101410507445e-06, "loss": 0.74, "step": 5176 }, { "epoch": 0.62, "learning_rate": 6.744257583447647e-06, "loss": 0.7277, "step": 5177 }, { "epoch": 0.62, "learning_rate": 6.740605511634171e-06, "loss": 0.7545, "step": 5178 }, { "epoch": 0.62, "learning_rate": 6.736953926155243e-06, "loss": 0.6892, "step": 5179 }, { "epoch": 0.62, "learning_rate": 6.733302827555719e-06, "loss": 0.7059, "step": 5180 }, { "epoch": 0.62, "learning_rate": 6.7296522163803775e-06, "loss": 0.7656, "step": 5181 }, { "epoch": 0.62, "learning_rate": 6.726002093173927e-06, "loss": 0.7294, "step": 5182 }, { "epoch": 0.62, "learning_rate": 6.722352458481001e-06, "loss": 0.7232, "step": 5183 }, { "epoch": 0.62, "learning_rate": 6.718703312846162e-06, "loss": 0.7773, "step": 5184 }, { "epoch": 0.62, "learning_rate": 6.7150546568139e-06, "loss": 0.6858, "step": 5185 }, { "epoch": 0.62, "learning_rate": 6.711406490928637e-06, "loss": 0.726, "step": 5186 }, { "epoch": 0.62, "learning_rate": 6.707758815734706e-06, "loss": 0.7879, "step": 5187 }, { "epoch": 0.62, "learning_rate": 6.704111631776385e-06, "loss": 0.7511, "step": 5188 }, { "epoch": 0.62, "learning_rate": 6.700464939597863e-06, "loss": 0.7383, "step": 5189 }, { "epoch": 0.62, "learning_rate": 6.696818739743272e-06, "loss": 0.7935, "step": 5190 }, { "epoch": 0.62, "learning_rate": 6.693173032756658e-06, "loss": 0.7946, "step": 5191 }, { "epoch": 0.62, "learning_rate": 6.689527819181994e-06, "loss": 0.7913, "step": 5192 }, { "epoch": 0.62, "learning_rate": 6.685883099563188e-06, "loss": 0.7048, "step": 5193 }, { "epoch": 0.62, "learning_rate": 6.682238874444063e-06, "loss": 0.736, "step": 5194 }, { "epoch": 0.62, "learning_rate": 6.67859514436838e-06, "loss": 0.7349, "step": 5195 }, { "epoch": 0.62, "learning_rate": 6.67495190987982e-06, "loss": 0.8298, "step": 5196 }, { "epoch": 0.62, "learning_rate": 6.671309171521984e-06, "loss": 0.7589, "step": 5197 }, { "epoch": 0.62, "learning_rate": 6.667666929838411e-06, "loss": 0.7171, "step": 5198 }, { "epoch": 0.62, "learning_rate": 6.66402518537256e-06, "loss": 0.7199, "step": 5199 }, { "epoch": 0.62, "learning_rate": 6.660383938667814e-06, "loss": 0.7969, "step": 5200 }, { "epoch": 0.62, "learning_rate": 6.656743190267487e-06, "loss": 0.764, "step": 5201 }, { "epoch": 0.62, "learning_rate": 6.653102940714811e-06, "loss": 0.7924, "step": 5202 }, { "epoch": 0.62, "learning_rate": 6.6494631905529475e-06, "loss": 0.784, "step": 5203 }, { "epoch": 0.62, "learning_rate": 6.645823940324987e-06, "loss": 0.7734, "step": 5204 }, { "epoch": 0.62, "learning_rate": 6.642185190573944e-06, "loss": 0.7667, "step": 5205 }, { "epoch": 0.62, "learning_rate": 6.638546941842756e-06, "loss": 0.7528, "step": 5206 }, { "epoch": 0.62, "learning_rate": 6.634909194674284e-06, "loss": 0.7667, "step": 5207 }, { "epoch": 0.62, "learning_rate": 6.631271949611316e-06, "loss": 0.6948, "step": 5208 }, { "epoch": 0.62, "learning_rate": 6.627635207196565e-06, "loss": 0.7617, "step": 5209 }, { "epoch": 0.62, "learning_rate": 6.623998967972673e-06, "loss": 0.75, "step": 5210 }, { "epoch": 0.62, "learning_rate": 6.620363232482206e-06, "loss": 0.6814, "step": 5211 }, { "epoch": 0.62, "learning_rate": 6.6167280012676446e-06, "loss": 0.7249, "step": 5212 }, { "epoch": 0.62, "learning_rate": 6.613093274871409e-06, "loss": 0.7377, "step": 5213 }, { "epoch": 0.62, "learning_rate": 6.609459053835833e-06, "loss": 0.7651, "step": 5214 }, { "epoch": 0.62, "learning_rate": 6.605825338703179e-06, "loss": 0.7645, "step": 5215 }, { "epoch": 0.62, "learning_rate": 6.602192130015639e-06, "loss": 0.7835, "step": 5216 }, { "epoch": 0.62, "learning_rate": 6.598559428315318e-06, "loss": 0.8482, "step": 5217 }, { "epoch": 0.62, "learning_rate": 6.594927234144253e-06, "loss": 0.7316, "step": 5218 }, { "epoch": 0.62, "learning_rate": 6.5912955480444085e-06, "loss": 0.7522, "step": 5219 }, { "epoch": 0.62, "learning_rate": 6.5876643705576625e-06, "loss": 0.7522, "step": 5220 }, { "epoch": 0.62, "learning_rate": 6.584033702225831e-06, "loss": 0.7679, "step": 5221 }, { "epoch": 0.62, "learning_rate": 6.580403543590639e-06, "loss": 0.7299, "step": 5222 }, { "epoch": 0.62, "learning_rate": 6.5767738951937445e-06, "loss": 0.8292, "step": 5223 }, { "epoch": 0.62, "learning_rate": 6.573144757576731e-06, "loss": 0.7081, "step": 5224 }, { "epoch": 0.62, "learning_rate": 6.569516131281099e-06, "loss": 0.7394, "step": 5225 }, { "epoch": 0.62, "learning_rate": 6.56588801684828e-06, "loss": 0.7762, "step": 5226 }, { "epoch": 0.62, "learning_rate": 6.562260414819619e-06, "loss": 0.7595, "step": 5227 }, { "epoch": 0.62, "learning_rate": 6.558633325736394e-06, "loss": 0.7171, "step": 5228 }, { "epoch": 0.62, "learning_rate": 6.555006750139805e-06, "loss": 0.7405, "step": 5229 }, { "epoch": 0.62, "learning_rate": 6.551380688570974e-06, "loss": 0.7048, "step": 5230 }, { "epoch": 0.62, "learning_rate": 6.547755141570945e-06, "loss": 0.7165, "step": 5231 }, { "epoch": 0.62, "learning_rate": 6.5441301096806854e-06, "loss": 0.7366, "step": 5232 }, { "epoch": 0.62, "learning_rate": 6.5405055934410845e-06, "loss": 0.6719, "step": 5233 }, { "epoch": 0.62, "learning_rate": 6.5368815933929586e-06, "loss": 0.6886, "step": 5234 }, { "epoch": 0.62, "learning_rate": 6.533258110077047e-06, "loss": 0.7595, "step": 5235 }, { "epoch": 0.62, "learning_rate": 6.52963514403401e-06, "loss": 0.7076, "step": 5236 }, { "epoch": 0.62, "learning_rate": 6.526012695804427e-06, "loss": 0.8008, "step": 5237 }, { "epoch": 0.62, "learning_rate": 6.522390765928808e-06, "loss": 0.7221, "step": 5238 }, { "epoch": 0.62, "learning_rate": 6.518769354947576e-06, "loss": 0.7489, "step": 5239 }, { "epoch": 0.62, "learning_rate": 6.515148463401086e-06, "loss": 0.7182, "step": 5240 }, { "epoch": 0.63, "learning_rate": 6.511528091829618e-06, "loss": 0.7779, "step": 5241 }, { "epoch": 0.63, "learning_rate": 6.507908240773353e-06, "loss": 0.76, "step": 5242 }, { "epoch": 0.63, "learning_rate": 6.504288910772419e-06, "loss": 0.7612, "step": 5243 }, { "epoch": 0.63, "learning_rate": 6.500670102366857e-06, "loss": 0.803, "step": 5244 }, { "epoch": 0.63, "learning_rate": 6.497051816096626e-06, "loss": 0.7266, "step": 5245 }, { "epoch": 0.63, "learning_rate": 6.493434052501616e-06, "loss": 0.7813, "step": 5246 }, { "epoch": 0.63, "learning_rate": 6.489816812121625e-06, "loss": 0.7472, "step": 5247 }, { "epoch": 0.63, "learning_rate": 6.486200095496389e-06, "loss": 0.7355, "step": 5248 }, { "epoch": 0.63, "learning_rate": 6.482583903165556e-06, "loss": 0.7176, "step": 5249 }, { "epoch": 0.63, "learning_rate": 6.478968235668701e-06, "loss": 0.7349, "step": 5250 }, { "epoch": 0.63, "learning_rate": 6.475353093545319e-06, "loss": 0.7383, "step": 5251 }, { "epoch": 0.63, "learning_rate": 6.471738477334818e-06, "loss": 0.7383, "step": 5252 }, { "epoch": 0.63, "learning_rate": 6.46812438757654e-06, "loss": 0.7372, "step": 5253 }, { "epoch": 0.63, "learning_rate": 6.464510824809744e-06, "loss": 0.7294, "step": 5254 }, { "epoch": 0.63, "learning_rate": 6.460897789573612e-06, "loss": 0.769, "step": 5255 }, { "epoch": 0.63, "learning_rate": 6.457285282407242e-06, "loss": 0.7556, "step": 5256 }, { "epoch": 0.63, "learning_rate": 6.453673303849659e-06, "loss": 0.7288, "step": 5257 }, { "epoch": 0.63, "learning_rate": 6.450061854439802e-06, "loss": 0.7121, "step": 5258 }, { "epoch": 0.63, "learning_rate": 6.446450934716539e-06, "loss": 0.7439, "step": 5259 }, { "epoch": 0.63, "learning_rate": 6.442840545218657e-06, "loss": 0.7383, "step": 5260 }, { "epoch": 0.63, "learning_rate": 6.439230686484864e-06, "loss": 0.7405, "step": 5261 }, { "epoch": 0.63, "learning_rate": 6.435621359053781e-06, "loss": 0.7946, "step": 5262 }, { "epoch": 0.63, "learning_rate": 6.432012563463961e-06, "loss": 0.7087, "step": 5263 }, { "epoch": 0.63, "learning_rate": 6.42840430025387e-06, "loss": 0.7679, "step": 5264 }, { "epoch": 0.63, "learning_rate": 6.424796569961898e-06, "loss": 0.6635, "step": 5265 }, { "epoch": 0.63, "learning_rate": 6.421189373126355e-06, "loss": 0.7087, "step": 5266 }, { "epoch": 0.63, "learning_rate": 6.417582710285475e-06, "loss": 0.7204, "step": 5267 }, { "epoch": 0.63, "learning_rate": 6.413976581977403e-06, "loss": 0.7455, "step": 5268 }, { "epoch": 0.63, "learning_rate": 6.410370988740212e-06, "loss": 0.7746, "step": 5269 }, { "epoch": 0.63, "learning_rate": 6.406765931111891e-06, "loss": 0.7746, "step": 5270 }, { "epoch": 0.63, "learning_rate": 6.403161409630353e-06, "loss": 0.7427, "step": 5271 }, { "epoch": 0.63, "learning_rate": 6.399557424833432e-06, "loss": 0.7785, "step": 5272 }, { "epoch": 0.63, "learning_rate": 6.3959539772588715e-06, "loss": 0.75, "step": 5273 }, { "epoch": 0.63, "learning_rate": 6.392351067444346e-06, "loss": 0.7522, "step": 5274 }, { "epoch": 0.63, "learning_rate": 6.388748695927449e-06, "loss": 0.7037, "step": 5275 }, { "epoch": 0.63, "learning_rate": 6.385146863245686e-06, "loss": 0.7439, "step": 5276 }, { "epoch": 0.63, "learning_rate": 6.381545569936493e-06, "loss": 0.7271, "step": 5277 }, { "epoch": 0.63, "learning_rate": 6.377944816537209e-06, "loss": 0.6903, "step": 5278 }, { "epoch": 0.63, "learning_rate": 6.374344603585111e-06, "loss": 0.7706, "step": 5279 }, { "epoch": 0.63, "learning_rate": 6.370744931617383e-06, "loss": 0.7338, "step": 5280 }, { "epoch": 0.63, "learning_rate": 6.367145801171137e-06, "loss": 0.7026, "step": 5281 }, { "epoch": 0.63, "learning_rate": 6.3635472127833995e-06, "loss": 0.7048, "step": 5282 }, { "epoch": 0.63, "learning_rate": 6.359949166991109e-06, "loss": 0.7863, "step": 5283 }, { "epoch": 0.63, "learning_rate": 6.356351664331134e-06, "loss": 0.764, "step": 5284 }, { "epoch": 0.63, "learning_rate": 6.35275470534026e-06, "loss": 0.7919, "step": 5285 }, { "epoch": 0.63, "learning_rate": 6.34915829055519e-06, "loss": 0.7779, "step": 5286 }, { "epoch": 0.63, "learning_rate": 6.345562420512543e-06, "loss": 0.7813, "step": 5287 }, { "epoch": 0.63, "learning_rate": 6.341967095748861e-06, "loss": 0.7294, "step": 5288 }, { "epoch": 0.63, "learning_rate": 6.3383723168005996e-06, "loss": 0.7394, "step": 5289 }, { "epoch": 0.63, "learning_rate": 6.334778084204139e-06, "loss": 0.7706, "step": 5290 }, { "epoch": 0.63, "learning_rate": 6.331184398495772e-06, "loss": 0.7539, "step": 5291 }, { "epoch": 0.63, "learning_rate": 6.32759126021172e-06, "loss": 0.7651, "step": 5292 }, { "epoch": 0.63, "learning_rate": 6.323998669888107e-06, "loss": 0.7405, "step": 5293 }, { "epoch": 0.63, "learning_rate": 6.3204066280609885e-06, "loss": 0.7316, "step": 5294 }, { "epoch": 0.63, "learning_rate": 6.316815135266331e-06, "loss": 0.7299, "step": 5295 }, { "epoch": 0.63, "learning_rate": 6.313224192040022e-06, "loss": 0.7617, "step": 5296 }, { "epoch": 0.63, "learning_rate": 6.309633798917872e-06, "loss": 0.7439, "step": 5297 }, { "epoch": 0.63, "learning_rate": 6.306043956435593e-06, "loss": 0.6903, "step": 5298 }, { "epoch": 0.63, "learning_rate": 6.3024546651288324e-06, "loss": 0.74, "step": 5299 }, { "epoch": 0.63, "learning_rate": 6.2988659255331495e-06, "loss": 0.6981, "step": 5300 }, { "epoch": 0.63, "learning_rate": 6.295277738184018e-06, "loss": 0.7305, "step": 5301 }, { "epoch": 0.63, "learning_rate": 6.291690103616835e-06, "loss": 0.7042, "step": 5302 }, { "epoch": 0.63, "learning_rate": 6.288103022366907e-06, "loss": 0.7154, "step": 5303 }, { "epoch": 0.63, "learning_rate": 6.2845164949694636e-06, "loss": 0.8052, "step": 5304 }, { "epoch": 0.63, "learning_rate": 6.280930521959651e-06, "loss": 0.7522, "step": 5305 }, { "epoch": 0.63, "learning_rate": 6.277345103872539e-06, "loss": 0.7277, "step": 5306 }, { "epoch": 0.63, "learning_rate": 6.273760241243103e-06, "loss": 0.7461, "step": 5307 }, { "epoch": 0.63, "learning_rate": 6.2701759346062374e-06, "loss": 0.7321, "step": 5308 }, { "epoch": 0.63, "learning_rate": 6.26659218449676e-06, "loss": 0.7567, "step": 5309 }, { "epoch": 0.63, "learning_rate": 6.263008991449403e-06, "loss": 0.7204, "step": 5310 }, { "epoch": 0.63, "learning_rate": 6.259426355998814e-06, "loss": 0.7193, "step": 5311 }, { "epoch": 0.63, "learning_rate": 6.255844278679564e-06, "loss": 0.7455, "step": 5312 }, { "epoch": 0.63, "learning_rate": 6.2522627600261274e-06, "loss": 0.7807, "step": 5313 }, { "epoch": 0.63, "learning_rate": 6.248681800572904e-06, "loss": 0.764, "step": 5314 }, { "epoch": 0.63, "learning_rate": 6.2451014008542096e-06, "loss": 0.7522, "step": 5315 }, { "epoch": 0.63, "learning_rate": 6.241521561404278e-06, "loss": 0.7623, "step": 5316 }, { "epoch": 0.63, "learning_rate": 6.237942282757261e-06, "loss": 0.7478, "step": 5317 }, { "epoch": 0.63, "learning_rate": 6.234363565447215e-06, "loss": 0.7494, "step": 5318 }, { "epoch": 0.63, "learning_rate": 6.230785410008125e-06, "loss": 0.774, "step": 5319 }, { "epoch": 0.63, "learning_rate": 6.227207816973884e-06, "loss": 0.769, "step": 5320 }, { "epoch": 0.63, "learning_rate": 6.223630786878309e-06, "loss": 0.7879, "step": 5321 }, { "epoch": 0.63, "learning_rate": 6.220054320255133e-06, "loss": 0.7305, "step": 5322 }, { "epoch": 0.63, "learning_rate": 6.2164784176379925e-06, "loss": 0.707, "step": 5323 }, { "epoch": 0.63, "learning_rate": 6.2129030795604505e-06, "loss": 0.7561, "step": 5324 }, { "epoch": 0.64, "learning_rate": 6.2093283065559865e-06, "loss": 0.7578, "step": 5325 }, { "epoch": 0.64, "learning_rate": 6.20575409915799e-06, "loss": 0.7919, "step": 5326 }, { "epoch": 0.64, "learning_rate": 6.202180457899774e-06, "loss": 0.7628, "step": 5327 }, { "epoch": 0.64, "learning_rate": 6.198607383314553e-06, "loss": 0.7483, "step": 5328 }, { "epoch": 0.64, "learning_rate": 6.19503487593547e-06, "loss": 0.6987, "step": 5329 }, { "epoch": 0.64, "learning_rate": 6.191462936295582e-06, "loss": 0.6881, "step": 5330 }, { "epoch": 0.64, "learning_rate": 6.187891564927855e-06, "loss": 0.7388, "step": 5331 }, { "epoch": 0.64, "learning_rate": 6.184320762365177e-06, "loss": 0.7997, "step": 5332 }, { "epoch": 0.64, "learning_rate": 6.180750529140345e-06, "loss": 0.7316, "step": 5333 }, { "epoch": 0.64, "learning_rate": 6.177180865786071e-06, "loss": 0.7584, "step": 5334 }, { "epoch": 0.64, "learning_rate": 6.1736117728349886e-06, "loss": 0.7829, "step": 5335 }, { "epoch": 0.64, "learning_rate": 6.170043250819643e-06, "loss": 0.7333, "step": 5336 }, { "epoch": 0.64, "learning_rate": 6.166475300272496e-06, "loss": 0.6669, "step": 5337 }, { "epoch": 0.64, "learning_rate": 6.162907921725916e-06, "loss": 0.7215, "step": 5338 }, { "epoch": 0.64, "learning_rate": 6.159341115712193e-06, "loss": 0.7584, "step": 5339 }, { "epoch": 0.64, "learning_rate": 6.155774882763532e-06, "loss": 0.7818, "step": 5340 }, { "epoch": 0.64, "learning_rate": 6.1522092234120504e-06, "loss": 0.7249, "step": 5341 }, { "epoch": 0.64, "learning_rate": 6.148644138189785e-06, "loss": 0.7282, "step": 5342 }, { "epoch": 0.64, "learning_rate": 6.145079627628674e-06, "loss": 0.7054, "step": 5343 }, { "epoch": 0.64, "learning_rate": 6.141515692260585e-06, "loss": 0.7416, "step": 5344 }, { "epoch": 0.64, "learning_rate": 6.1379523326172895e-06, "loss": 0.7813, "step": 5345 }, { "epoch": 0.64, "learning_rate": 6.134389549230477e-06, "loss": 0.7199, "step": 5346 }, { "epoch": 0.64, "learning_rate": 6.130827342631756e-06, "loss": 0.7545, "step": 5347 }, { "epoch": 0.64, "learning_rate": 6.127265713352637e-06, "loss": 0.7115, "step": 5348 }, { "epoch": 0.64, "learning_rate": 6.123704661924552e-06, "loss": 0.7913, "step": 5349 }, { "epoch": 0.64, "learning_rate": 6.120144188878849e-06, "loss": 0.7852, "step": 5350 }, { "epoch": 0.64, "learning_rate": 6.116584294746785e-06, "loss": 0.7907, "step": 5351 }, { "epoch": 0.64, "learning_rate": 6.113024980059534e-06, "loss": 0.7746, "step": 5352 }, { "epoch": 0.64, "learning_rate": 6.109466245348177e-06, "loss": 0.8013, "step": 5353 }, { "epoch": 0.64, "learning_rate": 6.105908091143715e-06, "loss": 0.7405, "step": 5354 }, { "epoch": 0.64, "learning_rate": 6.10235051797706e-06, "loss": 0.7143, "step": 5355 }, { "epoch": 0.64, "learning_rate": 6.098793526379043e-06, "loss": 0.7405, "step": 5356 }, { "epoch": 0.64, "learning_rate": 6.095237116880399e-06, "loss": 0.736, "step": 5357 }, { "epoch": 0.64, "learning_rate": 6.09168129001178e-06, "loss": 0.697, "step": 5358 }, { "epoch": 0.64, "learning_rate": 6.0881260463037494e-06, "loss": 0.7098, "step": 5359 }, { "epoch": 0.64, "learning_rate": 6.084571386286789e-06, "loss": 0.774, "step": 5360 }, { "epoch": 0.64, "learning_rate": 6.081017310491286e-06, "loss": 0.7436, "step": 5361 }, { "epoch": 0.64, "learning_rate": 6.077463819447552e-06, "loss": 0.7305, "step": 5362 }, { "epoch": 0.64, "learning_rate": 6.073910913685794e-06, "loss": 0.7176, "step": 5363 }, { "epoch": 0.64, "learning_rate": 6.07035859373615e-06, "loss": 0.7478, "step": 5364 }, { "epoch": 0.64, "learning_rate": 6.066806860128654e-06, "loss": 0.7472, "step": 5365 }, { "epoch": 0.64, "learning_rate": 6.063255713393265e-06, "loss": 0.7366, "step": 5366 }, { "epoch": 0.64, "learning_rate": 6.059705154059855e-06, "loss": 0.7154, "step": 5367 }, { "epoch": 0.64, "learning_rate": 6.056155182658192e-06, "loss": 0.7757, "step": 5368 }, { "epoch": 0.64, "learning_rate": 6.052605799717976e-06, "loss": 0.7349, "step": 5369 }, { "epoch": 0.64, "learning_rate": 6.049057005768806e-06, "loss": 0.7266, "step": 5370 }, { "epoch": 0.64, "learning_rate": 6.045508801340201e-06, "loss": 0.6987, "step": 5371 }, { "epoch": 0.64, "learning_rate": 6.04196118696159e-06, "loss": 0.7612, "step": 5372 }, { "epoch": 0.64, "learning_rate": 6.038414163162307e-06, "loss": 0.7271, "step": 5373 }, { "epoch": 0.64, "learning_rate": 6.034867730471608e-06, "loss": 0.769, "step": 5374 }, { "epoch": 0.64, "learning_rate": 6.031321889418657e-06, "loss": 0.7706, "step": 5375 }, { "epoch": 0.64, "learning_rate": 6.027776640532528e-06, "loss": 0.692, "step": 5376 }, { "epoch": 0.64, "learning_rate": 6.0242319843422105e-06, "loss": 0.7573, "step": 5377 }, { "epoch": 0.64, "learning_rate": 6.020687921376598e-06, "loss": 0.764, "step": 5378 }, { "epoch": 0.64, "learning_rate": 6.0171444521645025e-06, "loss": 0.7467, "step": 5379 }, { "epoch": 0.64, "learning_rate": 6.013601577234645e-06, "loss": 0.7935, "step": 5380 }, { "epoch": 0.64, "learning_rate": 6.010059297115663e-06, "loss": 0.7115, "step": 5381 }, { "epoch": 0.64, "learning_rate": 6.006517612336095e-06, "loss": 0.74, "step": 5382 }, { "epoch": 0.64, "learning_rate": 6.002976523424398e-06, "loss": 0.7238, "step": 5383 }, { "epoch": 0.64, "learning_rate": 5.999436030908936e-06, "loss": 0.6948, "step": 5384 }, { "epoch": 0.64, "learning_rate": 5.995896135317988e-06, "loss": 0.8164, "step": 5385 }, { "epoch": 0.64, "learning_rate": 5.9923568371797425e-06, "loss": 0.7701, "step": 5386 }, { "epoch": 0.64, "learning_rate": 5.988818137022302e-06, "loss": 0.7701, "step": 5387 }, { "epoch": 0.64, "learning_rate": 5.985280035373668e-06, "loss": 0.7606, "step": 5388 }, { "epoch": 0.64, "learning_rate": 5.9817425327617685e-06, "loss": 0.7573, "step": 5389 }, { "epoch": 0.64, "learning_rate": 5.978205629714429e-06, "loss": 0.7896, "step": 5390 }, { "epoch": 0.64, "learning_rate": 5.9746693267593935e-06, "loss": 0.7137, "step": 5391 }, { "epoch": 0.64, "learning_rate": 5.971133624424319e-06, "loss": 0.7305, "step": 5392 }, { "epoch": 0.64, "learning_rate": 5.9675985232367585e-06, "loss": 0.7706, "step": 5393 }, { "epoch": 0.64, "learning_rate": 5.96406402372419e-06, "loss": 0.8331, "step": 5394 }, { "epoch": 0.64, "learning_rate": 5.960530126413997e-06, "loss": 0.6948, "step": 5395 }, { "epoch": 0.64, "learning_rate": 5.95699683183347e-06, "loss": 0.7349, "step": 5396 }, { "epoch": 0.64, "learning_rate": 5.95346414050982e-06, "loss": 0.7584, "step": 5397 }, { "epoch": 0.64, "learning_rate": 5.949932052970147e-06, "loss": 0.7634, "step": 5398 }, { "epoch": 0.64, "learning_rate": 5.946400569741483e-06, "loss": 0.7321, "step": 5399 }, { "epoch": 0.64, "learning_rate": 5.94286969135076e-06, "loss": 0.7952, "step": 5400 }, { "epoch": 0.64, "learning_rate": 5.939339418324819e-06, "loss": 0.7517, "step": 5401 }, { "epoch": 0.64, "learning_rate": 5.935809751190416e-06, "loss": 0.7846, "step": 5402 }, { "epoch": 0.64, "learning_rate": 5.9322806904742054e-06, "loss": 0.7762, "step": 5403 }, { "epoch": 0.64, "learning_rate": 5.928752236702766e-06, "loss": 0.7394, "step": 5404 }, { "epoch": 0.64, "learning_rate": 5.925224390402573e-06, "loss": 0.7333, "step": 5405 }, { "epoch": 0.64, "learning_rate": 5.921697152100023e-06, "loss": 0.7282, "step": 5406 }, { "epoch": 0.64, "learning_rate": 5.918170522321413e-06, "loss": 0.7561, "step": 5407 }, { "epoch": 0.64, "learning_rate": 5.914644501592951e-06, "loss": 0.7288, "step": 5408 }, { "epoch": 0.65, "learning_rate": 5.911119090440752e-06, "loss": 0.7254, "step": 5409 }, { "epoch": 0.65, "learning_rate": 5.907594289390846e-06, "loss": 0.6931, "step": 5410 }, { "epoch": 0.65, "learning_rate": 5.904070098969169e-06, "loss": 0.7824, "step": 5411 }, { "epoch": 0.65, "learning_rate": 5.90054651970157e-06, "loss": 0.7377, "step": 5412 }, { "epoch": 0.65, "learning_rate": 5.897023552113793e-06, "loss": 0.7662, "step": 5413 }, { "epoch": 0.65, "learning_rate": 5.893501196731508e-06, "loss": 0.7824, "step": 5414 }, { "epoch": 0.65, "learning_rate": 5.8899794540802815e-06, "loss": 0.7818, "step": 5415 }, { "epoch": 0.65, "learning_rate": 5.886458324685593e-06, "loss": 0.7628, "step": 5416 }, { "epoch": 0.65, "learning_rate": 5.882937809072839e-06, "loss": 0.7455, "step": 5417 }, { "epoch": 0.65, "learning_rate": 5.879417907767304e-06, "loss": 0.7634, "step": 5418 }, { "epoch": 0.65, "learning_rate": 5.875898621294198e-06, "loss": 0.7472, "step": 5419 }, { "epoch": 0.65, "learning_rate": 5.872379950178637e-06, "loss": 0.7483, "step": 5420 }, { "epoch": 0.65, "learning_rate": 5.868861894945638e-06, "loss": 0.7238, "step": 5421 }, { "epoch": 0.65, "learning_rate": 5.8653444561201346e-06, "loss": 0.673, "step": 5422 }, { "epoch": 0.65, "learning_rate": 5.861827634226958e-06, "loss": 0.7679, "step": 5423 }, { "epoch": 0.65, "learning_rate": 5.858311429790856e-06, "loss": 0.6808, "step": 5424 }, { "epoch": 0.65, "learning_rate": 5.8547958433364835e-06, "loss": 0.7573, "step": 5425 }, { "epoch": 0.65, "learning_rate": 5.851280875388403e-06, "loss": 0.7645, "step": 5426 }, { "epoch": 0.65, "learning_rate": 5.847766526471082e-06, "loss": 0.7773, "step": 5427 }, { "epoch": 0.65, "learning_rate": 5.844252797108891e-06, "loss": 0.7148, "step": 5428 }, { "epoch": 0.65, "learning_rate": 5.84073968782612e-06, "loss": 0.7913, "step": 5429 }, { "epoch": 0.65, "learning_rate": 5.83722719914696e-06, "loss": 0.7751, "step": 5430 }, { "epoch": 0.65, "learning_rate": 5.833715331595505e-06, "loss": 0.7165, "step": 5431 }, { "epoch": 0.65, "learning_rate": 5.830204085695773e-06, "loss": 0.7952, "step": 5432 }, { "epoch": 0.65, "learning_rate": 5.826693461971661e-06, "loss": 0.7489, "step": 5433 }, { "epoch": 0.65, "learning_rate": 5.823183460947002e-06, "loss": 0.76, "step": 5434 }, { "epoch": 0.65, "learning_rate": 5.8196740831455165e-06, "loss": 0.6959, "step": 5435 }, { "epoch": 0.65, "learning_rate": 5.81616532909084e-06, "loss": 0.7969, "step": 5436 }, { "epoch": 0.65, "learning_rate": 5.812657199306524e-06, "loss": 0.7606, "step": 5437 }, { "epoch": 0.65, "learning_rate": 5.809149694316e-06, "loss": 0.7846, "step": 5438 }, { "epoch": 0.65, "learning_rate": 5.805642814642636e-06, "loss": 0.7115, "step": 5439 }, { "epoch": 0.65, "learning_rate": 5.802136560809683e-06, "loss": 0.7785, "step": 5440 }, { "epoch": 0.65, "learning_rate": 5.798630933340324e-06, "loss": 0.7723, "step": 5441 }, { "epoch": 0.65, "learning_rate": 5.795125932757624e-06, "loss": 0.6713, "step": 5442 }, { "epoch": 0.65, "learning_rate": 5.791621559584566e-06, "loss": 0.7377, "step": 5443 }, { "epoch": 0.65, "learning_rate": 5.788117814344039e-06, "loss": 0.7857, "step": 5444 }, { "epoch": 0.65, "learning_rate": 5.784614697558832e-06, "loss": 0.7388, "step": 5445 }, { "epoch": 0.65, "learning_rate": 5.781112209751654e-06, "loss": 0.7522, "step": 5446 }, { "epoch": 0.65, "learning_rate": 5.777610351445107e-06, "loss": 0.7645, "step": 5447 }, { "epoch": 0.65, "learning_rate": 5.774109123161704e-06, "loss": 0.769, "step": 5448 }, { "epoch": 0.65, "learning_rate": 5.770608525423863e-06, "loss": 0.7148, "step": 5449 }, { "epoch": 0.65, "learning_rate": 5.767108558753907e-06, "loss": 0.803, "step": 5450 }, { "epoch": 0.65, "learning_rate": 5.763609223674069e-06, "loss": 0.7595, "step": 5451 }, { "epoch": 0.65, "learning_rate": 5.7601105207064875e-06, "loss": 0.7868, "step": 5452 }, { "epoch": 0.65, "learning_rate": 5.7566124503732e-06, "loss": 0.7991, "step": 5453 }, { "epoch": 0.65, "learning_rate": 5.753115013196151e-06, "loss": 0.7405, "step": 5454 }, { "epoch": 0.65, "learning_rate": 5.749618209697203e-06, "loss": 0.7405, "step": 5455 }, { "epoch": 0.65, "learning_rate": 5.7461220403981074e-06, "loss": 0.7511, "step": 5456 }, { "epoch": 0.65, "learning_rate": 5.742626505820526e-06, "loss": 0.7344, "step": 5457 }, { "epoch": 0.65, "learning_rate": 5.739131606486039e-06, "loss": 0.7411, "step": 5458 }, { "epoch": 0.65, "learning_rate": 5.735637342916105e-06, "loss": 0.6942, "step": 5459 }, { "epoch": 0.65, "learning_rate": 5.732143715632116e-06, "loss": 0.7584, "step": 5460 }, { "epoch": 0.65, "learning_rate": 5.7286507251553515e-06, "loss": 0.7377, "step": 5461 }, { "epoch": 0.65, "learning_rate": 5.725158372006997e-06, "loss": 0.76, "step": 5462 }, { "epoch": 0.65, "learning_rate": 5.721666656708159e-06, "loss": 0.7768, "step": 5463 }, { "epoch": 0.65, "learning_rate": 5.718175579779821e-06, "loss": 0.7517, "step": 5464 }, { "epoch": 0.65, "learning_rate": 5.714685141742899e-06, "loss": 0.7048, "step": 5465 }, { "epoch": 0.65, "learning_rate": 5.711195343118197e-06, "loss": 0.7444, "step": 5466 }, { "epoch": 0.65, "learning_rate": 5.707706184426423e-06, "loss": 0.7427, "step": 5467 }, { "epoch": 0.65, "learning_rate": 5.704217666188209e-06, "loss": 0.822, "step": 5468 }, { "epoch": 0.65, "learning_rate": 5.70072978892406e-06, "loss": 0.7294, "step": 5469 }, { "epoch": 0.65, "learning_rate": 5.697242553154414e-06, "loss": 0.7506, "step": 5470 }, { "epoch": 0.65, "learning_rate": 5.693755959399596e-06, "loss": 0.7785, "step": 5471 }, { "epoch": 0.65, "learning_rate": 5.690270008179847e-06, "loss": 0.6931, "step": 5472 }, { "epoch": 0.65, "learning_rate": 5.686784700015302e-06, "loss": 0.7221, "step": 5473 }, { "epoch": 0.65, "learning_rate": 5.683300035426005e-06, "loss": 0.6987, "step": 5474 }, { "epoch": 0.65, "learning_rate": 5.679816014931902e-06, "loss": 0.7734, "step": 5475 }, { "epoch": 0.65, "learning_rate": 5.676332639052842e-06, "loss": 0.7377, "step": 5476 }, { "epoch": 0.65, "learning_rate": 5.6728499083085854e-06, "loss": 0.774, "step": 5477 }, { "epoch": 0.65, "learning_rate": 5.669367823218788e-06, "loss": 0.6775, "step": 5478 }, { "epoch": 0.65, "learning_rate": 5.6658863843030125e-06, "loss": 0.7243, "step": 5479 }, { "epoch": 0.65, "learning_rate": 5.662405592080724e-06, "loss": 0.7673, "step": 5480 }, { "epoch": 0.65, "learning_rate": 5.658925447071289e-06, "loss": 0.7539, "step": 5481 }, { "epoch": 0.65, "learning_rate": 5.6554459497939865e-06, "loss": 0.7439, "step": 5482 }, { "epoch": 0.65, "learning_rate": 5.65196710076799e-06, "loss": 0.7193, "step": 5483 }, { "epoch": 0.65, "learning_rate": 5.648488900512376e-06, "loss": 0.7065, "step": 5484 }, { "epoch": 0.65, "learning_rate": 5.645011349546128e-06, "loss": 0.7299, "step": 5485 }, { "epoch": 0.65, "learning_rate": 5.6415344483881365e-06, "loss": 0.7349, "step": 5486 }, { "epoch": 0.65, "learning_rate": 5.638058197557186e-06, "loss": 0.7405, "step": 5487 }, { "epoch": 0.65, "learning_rate": 5.634582597571969e-06, "loss": 0.7779, "step": 5488 }, { "epoch": 0.65, "learning_rate": 5.631107648951082e-06, "loss": 0.7824, "step": 5489 }, { "epoch": 0.65, "learning_rate": 5.627633352213014e-06, "loss": 0.7517, "step": 5490 }, { "epoch": 0.65, "learning_rate": 5.624159707876178e-06, "loss": 0.7282, "step": 5491 }, { "epoch": 0.65, "learning_rate": 5.620686716458868e-06, "loss": 0.7561, "step": 5492 }, { "epoch": 0.66, "learning_rate": 5.617214378479293e-06, "loss": 0.7176, "step": 5493 }, { "epoch": 0.66, "learning_rate": 5.61374269445556e-06, "loss": 0.7193, "step": 5494 }, { "epoch": 0.66, "learning_rate": 5.610271664905674e-06, "loss": 0.779, "step": 5495 }, { "epoch": 0.66, "learning_rate": 5.606801290347557e-06, "loss": 0.7679, "step": 5496 }, { "epoch": 0.66, "learning_rate": 5.60333157129902e-06, "loss": 0.7059, "step": 5497 }, { "epoch": 0.66, "learning_rate": 5.599862508277779e-06, "loss": 0.7489, "step": 5498 }, { "epoch": 0.66, "learning_rate": 5.596394101801454e-06, "loss": 0.7193, "step": 5499 }, { "epoch": 0.66, "learning_rate": 5.592926352387562e-06, "loss": 0.784, "step": 5500 }, { "epoch": 0.66, "learning_rate": 5.589459260553534e-06, "loss": 0.755, "step": 5501 }, { "epoch": 0.66, "learning_rate": 5.5859928268166876e-06, "loss": 0.7249, "step": 5502 }, { "epoch": 0.66, "learning_rate": 5.582527051694261e-06, "loss": 0.7366, "step": 5503 }, { "epoch": 0.66, "learning_rate": 5.579061935703367e-06, "loss": 0.7422, "step": 5504 }, { "epoch": 0.66, "learning_rate": 5.57559747936105e-06, "loss": 0.7651, "step": 5505 }, { "epoch": 0.66, "learning_rate": 5.572133683184233e-06, "loss": 0.7109, "step": 5506 }, { "epoch": 0.66, "learning_rate": 5.5686705476897505e-06, "loss": 0.7026, "step": 5507 }, { "epoch": 0.66, "learning_rate": 5.565208073394347e-06, "loss": 0.7411, "step": 5508 }, { "epoch": 0.66, "learning_rate": 5.5617462608146425e-06, "loss": 0.7651, "step": 5509 }, { "epoch": 0.66, "learning_rate": 5.5582851104671855e-06, "loss": 0.707, "step": 5510 }, { "epoch": 0.66, "learning_rate": 5.554824622868412e-06, "loss": 0.7467, "step": 5511 }, { "epoch": 0.66, "learning_rate": 5.551364798534658e-06, "loss": 0.7143, "step": 5512 }, { "epoch": 0.66, "learning_rate": 5.5479056379821735e-06, "loss": 0.8064, "step": 5513 }, { "epoch": 0.66, "learning_rate": 5.544447141727089e-06, "loss": 0.721, "step": 5514 }, { "epoch": 0.66, "learning_rate": 5.540989310285454e-06, "loss": 0.7171, "step": 5515 }, { "epoch": 0.66, "learning_rate": 5.537532144173208e-06, "loss": 0.798, "step": 5516 }, { "epoch": 0.66, "learning_rate": 5.534075643906199e-06, "loss": 0.7846, "step": 5517 }, { "epoch": 0.66, "learning_rate": 5.530619810000175e-06, "loss": 0.7076, "step": 5518 }, { "epoch": 0.66, "learning_rate": 5.527164642970768e-06, "loss": 0.7299, "step": 5519 }, { "epoch": 0.66, "learning_rate": 5.523710143333535e-06, "loss": 0.7589, "step": 5520 }, { "epoch": 0.66, "learning_rate": 5.520256311603916e-06, "loss": 0.7344, "step": 5521 }, { "epoch": 0.66, "learning_rate": 5.516803148297265e-06, "loss": 0.7651, "step": 5522 }, { "epoch": 0.66, "learning_rate": 5.5133506539288225e-06, "loss": 0.7907, "step": 5523 }, { "epoch": 0.66, "learning_rate": 5.50989882901374e-06, "loss": 0.8075, "step": 5524 }, { "epoch": 0.66, "learning_rate": 5.50644767406706e-06, "loss": 0.6864, "step": 5525 }, { "epoch": 0.66, "learning_rate": 5.502997189603729e-06, "loss": 0.7372, "step": 5526 }, { "epoch": 0.66, "learning_rate": 5.4995473761385995e-06, "loss": 0.7494, "step": 5527 }, { "epoch": 0.66, "learning_rate": 5.4960982341864175e-06, "loss": 0.7578, "step": 5528 }, { "epoch": 0.66, "learning_rate": 5.492649764261826e-06, "loss": 0.6797, "step": 5529 }, { "epoch": 0.66, "learning_rate": 5.489201966879375e-06, "loss": 0.7171, "step": 5530 }, { "epoch": 0.66, "learning_rate": 5.485754842553506e-06, "loss": 0.7785, "step": 5531 }, { "epoch": 0.66, "learning_rate": 5.48230839179857e-06, "loss": 0.8164, "step": 5532 }, { "epoch": 0.66, "learning_rate": 5.478862615128811e-06, "loss": 0.7427, "step": 5533 }, { "epoch": 0.66, "learning_rate": 5.475417513058373e-06, "loss": 0.6869, "step": 5534 }, { "epoch": 0.66, "learning_rate": 5.471973086101296e-06, "loss": 0.7706, "step": 5535 }, { "epoch": 0.66, "learning_rate": 5.468529334771531e-06, "loss": 0.7718, "step": 5536 }, { "epoch": 0.66, "learning_rate": 5.465086259582917e-06, "loss": 0.7204, "step": 5537 }, { "epoch": 0.66, "learning_rate": 5.461643861049194e-06, "loss": 0.7388, "step": 5538 }, { "epoch": 0.66, "learning_rate": 5.4582021396840044e-06, "loss": 0.7684, "step": 5539 }, { "epoch": 0.66, "learning_rate": 5.454761096000882e-06, "loss": 0.7807, "step": 5540 }, { "epoch": 0.66, "learning_rate": 5.451320730513277e-06, "loss": 0.7762, "step": 5541 }, { "epoch": 0.66, "learning_rate": 5.447881043734517e-06, "loss": 0.7561, "step": 5542 }, { "epoch": 0.66, "learning_rate": 5.4444420361778425e-06, "loss": 0.7243, "step": 5543 }, { "epoch": 0.66, "learning_rate": 5.441003708356387e-06, "loss": 0.7706, "step": 5544 }, { "epoch": 0.66, "learning_rate": 5.437566060783178e-06, "loss": 0.7857, "step": 5545 }, { "epoch": 0.66, "learning_rate": 5.434129093971157e-06, "loss": 0.7054, "step": 5546 }, { "epoch": 0.66, "learning_rate": 5.430692808433147e-06, "loss": 0.7087, "step": 5547 }, { "epoch": 0.66, "learning_rate": 5.427257204681885e-06, "loss": 0.7723, "step": 5548 }, { "epoch": 0.66, "learning_rate": 5.423822283229989e-06, "loss": 0.7422, "step": 5549 }, { "epoch": 0.66, "learning_rate": 5.420388044589981e-06, "loss": 0.7327, "step": 5550 }, { "epoch": 0.66, "learning_rate": 5.416954489274297e-06, "loss": 0.7556, "step": 5551 }, { "epoch": 0.66, "learning_rate": 5.413521617795244e-06, "loss": 0.6903, "step": 5552 }, { "epoch": 0.66, "learning_rate": 5.410089430665057e-06, "loss": 0.7338, "step": 5553 }, { "epoch": 0.66, "learning_rate": 5.406657928395837e-06, "loss": 0.7439, "step": 5554 }, { "epoch": 0.66, "learning_rate": 5.40322711149961e-06, "loss": 0.74, "step": 5555 }, { "epoch": 0.66, "learning_rate": 5.399796980488282e-06, "loss": 0.7221, "step": 5556 }, { "epoch": 0.66, "learning_rate": 5.396367535873663e-06, "loss": 0.7422, "step": 5557 }, { "epoch": 0.66, "learning_rate": 5.392938778167471e-06, "loss": 0.745, "step": 5558 }, { "epoch": 0.66, "learning_rate": 5.389510707881294e-06, "loss": 0.7494, "step": 5559 }, { "epoch": 0.66, "learning_rate": 5.38608332552665e-06, "loss": 0.7193, "step": 5560 }, { "epoch": 0.66, "learning_rate": 5.3826566316149324e-06, "loss": 0.7321, "step": 5561 }, { "epoch": 0.66, "learning_rate": 5.379230626657435e-06, "loss": 0.8025, "step": 5562 }, { "epoch": 0.66, "learning_rate": 5.375805311165364e-06, "loss": 0.7148, "step": 5563 }, { "epoch": 0.66, "learning_rate": 5.372380685649796e-06, "loss": 0.7327, "step": 5564 }, { "epoch": 0.66, "learning_rate": 5.368956750621732e-06, "loss": 0.7511, "step": 5565 }, { "epoch": 0.66, "learning_rate": 5.365533506592049e-06, "loss": 0.8019, "step": 5566 }, { "epoch": 0.66, "learning_rate": 5.362110954071536e-06, "loss": 0.7461, "step": 5567 }, { "epoch": 0.66, "learning_rate": 5.35868909357087e-06, "loss": 0.7294, "step": 5568 }, { "epoch": 0.66, "learning_rate": 5.355267925600628e-06, "loss": 0.7706, "step": 5569 }, { "epoch": 0.66, "learning_rate": 5.351847450671281e-06, "loss": 0.7277, "step": 5570 }, { "epoch": 0.66, "learning_rate": 5.348427669293196e-06, "loss": 0.7444, "step": 5571 }, { "epoch": 0.66, "learning_rate": 5.345008581976645e-06, "loss": 0.6975, "step": 5572 }, { "epoch": 0.66, "learning_rate": 5.341590189231788e-06, "loss": 0.7383, "step": 5573 }, { "epoch": 0.66, "learning_rate": 5.338172491568683e-06, "loss": 0.6775, "step": 5574 }, { "epoch": 0.66, "learning_rate": 5.334755489497285e-06, "loss": 0.7076, "step": 5575 }, { "epoch": 0.66, "learning_rate": 5.331339183527439e-06, "loss": 0.7288, "step": 5576 }, { "epoch": 0.67, "learning_rate": 5.3279235741689064e-06, "loss": 0.7902, "step": 5577 }, { "epoch": 0.67, "learning_rate": 5.32450866193132e-06, "loss": 0.7757, "step": 5578 }, { "epoch": 0.67, "learning_rate": 5.3210944473242235e-06, "loss": 0.7294, "step": 5579 }, { "epoch": 0.67, "learning_rate": 5.31768093085705e-06, "loss": 0.7589, "step": 5580 }, { "epoch": 0.67, "learning_rate": 5.314268113039126e-06, "loss": 0.7098, "step": 5581 }, { "epoch": 0.67, "learning_rate": 5.310855994379689e-06, "loss": 0.6975, "step": 5582 }, { "epoch": 0.67, "learning_rate": 5.3074445753878545e-06, "loss": 0.76, "step": 5583 }, { "epoch": 0.67, "learning_rate": 5.304033856572644e-06, "loss": 0.745, "step": 5584 }, { "epoch": 0.67, "learning_rate": 5.300623838442964e-06, "loss": 0.7807, "step": 5585 }, { "epoch": 0.67, "learning_rate": 5.297214521507632e-06, "loss": 0.7188, "step": 5586 }, { "epoch": 0.67, "learning_rate": 5.293805906275351e-06, "loss": 0.7299, "step": 5587 }, { "epoch": 0.67, "learning_rate": 5.290397993254719e-06, "loss": 0.7327, "step": 5588 }, { "epoch": 0.67, "learning_rate": 5.286990782954231e-06, "loss": 0.7165, "step": 5589 }, { "epoch": 0.67, "learning_rate": 5.283584275882274e-06, "loss": 0.7333, "step": 5590 }, { "epoch": 0.67, "learning_rate": 5.280178472547141e-06, "loss": 0.6953, "step": 5591 }, { "epoch": 0.67, "learning_rate": 5.276773373457007e-06, "loss": 0.7746, "step": 5592 }, { "epoch": 0.67, "learning_rate": 5.273368979119948e-06, "loss": 0.8337, "step": 5593 }, { "epoch": 0.67, "learning_rate": 5.269965290043934e-06, "loss": 0.7254, "step": 5594 }, { "epoch": 0.67, "learning_rate": 5.266562306736826e-06, "loss": 0.7645, "step": 5595 }, { "epoch": 0.67, "learning_rate": 5.263160029706391e-06, "loss": 0.7411, "step": 5596 }, { "epoch": 0.67, "learning_rate": 5.259758459460275e-06, "loss": 0.6908, "step": 5597 }, { "epoch": 0.67, "learning_rate": 5.256357596506039e-06, "loss": 0.7243, "step": 5598 }, { "epoch": 0.67, "learning_rate": 5.25295744135111e-06, "loss": 0.7143, "step": 5599 }, { "epoch": 0.67, "learning_rate": 5.249557994502838e-06, "loss": 0.7645, "step": 5600 }, { "epoch": 0.67, "learning_rate": 5.24615925646845e-06, "loss": 0.7137, "step": 5601 }, { "epoch": 0.67, "learning_rate": 5.242761227755067e-06, "loss": 0.7852, "step": 5602 }, { "epoch": 0.67, "learning_rate": 5.239363908869723e-06, "loss": 0.7098, "step": 5603 }, { "epoch": 0.67, "learning_rate": 5.235967300319317e-06, "loss": 0.7193, "step": 5604 }, { "epoch": 0.67, "learning_rate": 5.232571402610667e-06, "loss": 0.7271, "step": 5605 }, { "epoch": 0.67, "learning_rate": 5.229176216250471e-06, "loss": 0.7528, "step": 5606 }, { "epoch": 0.67, "learning_rate": 5.2257817417453235e-06, "loss": 0.716, "step": 5607 }, { "epoch": 0.67, "learning_rate": 5.2223879796017245e-06, "loss": 0.7779, "step": 5608 }, { "epoch": 0.67, "learning_rate": 5.218994930326042e-06, "loss": 0.726, "step": 5609 }, { "epoch": 0.67, "learning_rate": 5.215602594424565e-06, "loss": 0.7076, "step": 5610 }, { "epoch": 0.67, "learning_rate": 5.212210972403462e-06, "loss": 0.7321, "step": 5611 }, { "epoch": 0.67, "learning_rate": 5.20882006476879e-06, "loss": 0.6953, "step": 5612 }, { "epoch": 0.67, "learning_rate": 5.2054298720265216e-06, "loss": 0.7723, "step": 5613 }, { "epoch": 0.67, "learning_rate": 5.202040394682489e-06, "loss": 0.6945, "step": 5614 }, { "epoch": 0.67, "learning_rate": 5.1986516332424506e-06, "loss": 0.7824, "step": 5615 }, { "epoch": 0.67, "learning_rate": 5.195263588212036e-06, "loss": 0.7863, "step": 5616 }, { "epoch": 0.67, "learning_rate": 5.191876260096783e-06, "loss": 0.7439, "step": 5617 }, { "epoch": 0.67, "learning_rate": 5.188489649402111e-06, "loss": 0.7338, "step": 5618 }, { "epoch": 0.67, "learning_rate": 5.185103756633335e-06, "loss": 0.7271, "step": 5619 }, { "epoch": 0.67, "learning_rate": 5.181718582295668e-06, "loss": 0.7667, "step": 5620 }, { "epoch": 0.67, "learning_rate": 5.178334126894205e-06, "loss": 0.7249, "step": 5621 }, { "epoch": 0.67, "learning_rate": 5.174950390933948e-06, "loss": 0.803, "step": 5622 }, { "epoch": 0.67, "learning_rate": 5.171567374919785e-06, "loss": 0.7098, "step": 5623 }, { "epoch": 0.67, "learning_rate": 5.168185079356494e-06, "loss": 0.7221, "step": 5624 }, { "epoch": 0.67, "learning_rate": 5.164803504748746e-06, "loss": 0.745, "step": 5625 }, { "epoch": 0.67, "learning_rate": 5.161422651601102e-06, "loss": 0.7182, "step": 5626 }, { "epoch": 0.67, "learning_rate": 5.158042520418031e-06, "loss": 0.7048, "step": 5627 }, { "epoch": 0.67, "learning_rate": 5.154663111703875e-06, "loss": 0.7863, "step": 5628 }, { "epoch": 0.67, "learning_rate": 5.151284425962879e-06, "loss": 0.7762, "step": 5629 }, { "epoch": 0.67, "learning_rate": 5.1479064636991695e-06, "loss": 0.745, "step": 5630 }, { "epoch": 0.67, "learning_rate": 5.1445292254167835e-06, "loss": 0.7087, "step": 5631 }, { "epoch": 0.67, "learning_rate": 5.141152711619633e-06, "loss": 0.7221, "step": 5632 }, { "epoch": 0.67, "learning_rate": 5.13777692281153e-06, "loss": 0.7081, "step": 5633 }, { "epoch": 0.67, "learning_rate": 5.1344018594961745e-06, "loss": 0.6869, "step": 5634 }, { "epoch": 0.67, "learning_rate": 5.1310275221771554e-06, "loss": 0.7249, "step": 5635 }, { "epoch": 0.67, "learning_rate": 5.127653911357968e-06, "loss": 0.7595, "step": 5636 }, { "epoch": 0.67, "learning_rate": 5.124281027541984e-06, "loss": 0.7455, "step": 5637 }, { "epoch": 0.67, "learning_rate": 5.120908871232472e-06, "loss": 0.6802, "step": 5638 }, { "epoch": 0.67, "learning_rate": 5.1175374429325915e-06, "loss": 0.7137, "step": 5639 }, { "epoch": 0.67, "learning_rate": 5.11416674314539e-06, "loss": 0.7684, "step": 5640 }, { "epoch": 0.67, "learning_rate": 5.110796772373816e-06, "loss": 0.8225, "step": 5641 }, { "epoch": 0.67, "learning_rate": 5.1074275311207035e-06, "loss": 0.7874, "step": 5642 }, { "epoch": 0.67, "learning_rate": 5.1040590198887685e-06, "loss": 0.7528, "step": 5643 }, { "epoch": 0.67, "learning_rate": 5.100691239180642e-06, "loss": 0.731, "step": 5644 }, { "epoch": 0.67, "learning_rate": 5.097324189498813e-06, "loss": 0.7009, "step": 5645 }, { "epoch": 0.67, "learning_rate": 5.093957871345692e-06, "loss": 0.7254, "step": 5646 }, { "epoch": 0.67, "learning_rate": 5.0905922852235615e-06, "loss": 0.7266, "step": 5647 }, { "epoch": 0.67, "learning_rate": 5.087227431634605e-06, "loss": 0.7288, "step": 5648 }, { "epoch": 0.67, "learning_rate": 5.083863311080892e-06, "loss": 0.7796, "step": 5649 }, { "epoch": 0.67, "learning_rate": 5.080499924064381e-06, "loss": 0.7154, "step": 5650 }, { "epoch": 0.67, "learning_rate": 5.0771372710869245e-06, "loss": 0.7394, "step": 5651 }, { "epoch": 0.67, "learning_rate": 5.073775352650261e-06, "loss": 0.7478, "step": 5652 }, { "epoch": 0.67, "learning_rate": 5.070414169256028e-06, "loss": 0.7667, "step": 5653 }, { "epoch": 0.67, "learning_rate": 5.067053721405747e-06, "loss": 0.7015, "step": 5654 }, { "epoch": 0.67, "learning_rate": 5.063694009600829e-06, "loss": 0.7394, "step": 5655 }, { "epoch": 0.67, "learning_rate": 5.060335034342577e-06, "loss": 0.7232, "step": 5656 }, { "epoch": 0.67, "learning_rate": 5.0569767961321805e-06, "loss": 0.6998, "step": 5657 }, { "epoch": 0.67, "learning_rate": 5.0536192954707305e-06, "loss": 0.7517, "step": 5658 }, { "epoch": 0.67, "learning_rate": 5.050262532859196e-06, "loss": 0.7405, "step": 5659 }, { "epoch": 0.68, "learning_rate": 5.046906508798439e-06, "loss": 0.716, "step": 5660 }, { "epoch": 0.68, "learning_rate": 5.0435512237892095e-06, "loss": 0.6401, "step": 5661 }, { "epoch": 0.68, "learning_rate": 5.040196678332157e-06, "loss": 0.7405, "step": 5662 }, { "epoch": 0.68, "learning_rate": 5.03684287292781e-06, "loss": 0.7087, "step": 5663 }, { "epoch": 0.68, "learning_rate": 5.033489808076588e-06, "loss": 0.7589, "step": 5664 }, { "epoch": 0.68, "learning_rate": 5.0301374842788055e-06, "loss": 0.7768, "step": 5665 }, { "epoch": 0.68, "learning_rate": 5.026785902034658e-06, "loss": 0.7478, "step": 5666 }, { "epoch": 0.68, "learning_rate": 5.023435061844242e-06, "loss": 0.721, "step": 5667 }, { "epoch": 0.68, "learning_rate": 5.020084964207535e-06, "loss": 0.7483, "step": 5668 }, { "epoch": 0.68, "learning_rate": 5.016735609624401e-06, "loss": 0.7667, "step": 5669 }, { "epoch": 0.68, "learning_rate": 5.0133869985946025e-06, "loss": 0.673, "step": 5670 }, { "epoch": 0.68, "learning_rate": 5.0100391316177785e-06, "loss": 0.7483, "step": 5671 }, { "epoch": 0.68, "learning_rate": 5.006692009193477e-06, "loss": 0.7517, "step": 5672 }, { "epoch": 0.68, "learning_rate": 5.003345631821113e-06, "loss": 0.7757, "step": 5673 }, { "epoch": 0.68, "learning_rate": 5.000000000000003e-06, "loss": 0.7388, "step": 5674 }, { "epoch": 0.68, "learning_rate": 4.996655114229347e-06, "loss": 0.7416, "step": 5675 }, { "epoch": 0.68, "learning_rate": 4.993310975008235e-06, "loss": 0.7433, "step": 5676 }, { "epoch": 0.68, "learning_rate": 4.9899675828356505e-06, "loss": 0.7277, "step": 5677 }, { "epoch": 0.68, "learning_rate": 4.986624938210456e-06, "loss": 0.7667, "step": 5678 }, { "epoch": 0.68, "learning_rate": 4.983283041631419e-06, "loss": 0.7857, "step": 5679 }, { "epoch": 0.68, "learning_rate": 4.979941893597167e-06, "loss": 0.7623, "step": 5680 }, { "epoch": 0.68, "learning_rate": 4.976601494606248e-06, "loss": 0.7394, "step": 5681 }, { "epoch": 0.68, "learning_rate": 4.973261845157077e-06, "loss": 0.7394, "step": 5682 }, { "epoch": 0.68, "learning_rate": 4.969922945747959e-06, "loss": 0.7974, "step": 5683 }, { "epoch": 0.68, "learning_rate": 4.966584796877104e-06, "loss": 0.7411, "step": 5684 }, { "epoch": 0.68, "learning_rate": 4.963247399042584e-06, "loss": 0.7042, "step": 5685 }, { "epoch": 0.68, "learning_rate": 4.959910752742379e-06, "loss": 0.7204, "step": 5686 }, { "epoch": 0.68, "learning_rate": 4.956574858474351e-06, "loss": 0.7165, "step": 5687 }, { "epoch": 0.68, "learning_rate": 4.953239716736244e-06, "loss": 0.7467, "step": 5688 }, { "epoch": 0.68, "learning_rate": 4.949905328025706e-06, "loss": 0.793, "step": 5689 }, { "epoch": 0.68, "learning_rate": 4.946571692840246e-06, "loss": 0.6964, "step": 5690 }, { "epoch": 0.68, "learning_rate": 4.943238811677288e-06, "loss": 0.7874, "step": 5691 }, { "epoch": 0.68, "learning_rate": 4.939906685034122e-06, "loss": 0.6987, "step": 5692 }, { "epoch": 0.68, "learning_rate": 4.936575313407946e-06, "loss": 0.7517, "step": 5693 }, { "epoch": 0.68, "learning_rate": 4.933244697295832e-06, "loss": 0.7595, "step": 5694 }, { "epoch": 0.68, "learning_rate": 4.929914837194729e-06, "loss": 0.7411, "step": 5695 }, { "epoch": 0.68, "learning_rate": 4.9265857336015e-06, "loss": 0.7221, "step": 5696 }, { "epoch": 0.68, "learning_rate": 4.923257387012871e-06, "loss": 0.7042, "step": 5697 }, { "epoch": 0.68, "learning_rate": 4.919929797925474e-06, "loss": 0.7561, "step": 5698 }, { "epoch": 0.68, "learning_rate": 4.916602966835814e-06, "loss": 0.7478, "step": 5699 }, { "epoch": 0.68, "learning_rate": 4.913276894240288e-06, "loss": 0.7729, "step": 5700 }, { "epoch": 0.68, "learning_rate": 4.90995158063518e-06, "loss": 0.7743, "step": 5701 }, { "epoch": 0.68, "learning_rate": 4.906627026516657e-06, "loss": 0.7132, "step": 5702 }, { "epoch": 0.68, "learning_rate": 4.903303232380782e-06, "loss": 0.7617, "step": 5703 }, { "epoch": 0.68, "learning_rate": 4.899980198723497e-06, "loss": 0.6992, "step": 5704 }, { "epoch": 0.68, "learning_rate": 4.896657926040629e-06, "loss": 0.7249, "step": 5705 }, { "epoch": 0.68, "learning_rate": 4.893336414827897e-06, "loss": 0.7807, "step": 5706 }, { "epoch": 0.68, "learning_rate": 4.8900156655809004e-06, "loss": 0.7561, "step": 5707 }, { "epoch": 0.68, "learning_rate": 4.886695678795136e-06, "loss": 0.7506, "step": 5708 }, { "epoch": 0.68, "learning_rate": 4.883376454965973e-06, "loss": 0.7684, "step": 5709 }, { "epoch": 0.68, "learning_rate": 4.880057994588677e-06, "loss": 0.721, "step": 5710 }, { "epoch": 0.68, "learning_rate": 4.876740298158389e-06, "loss": 0.6836, "step": 5711 }, { "epoch": 0.68, "learning_rate": 4.873423366170151e-06, "loss": 0.7522, "step": 5712 }, { "epoch": 0.68, "learning_rate": 4.870107199118881e-06, "loss": 0.7785, "step": 5713 }, { "epoch": 0.68, "learning_rate": 4.866791797499381e-06, "loss": 0.7215, "step": 5714 }, { "epoch": 0.68, "learning_rate": 4.863477161806346e-06, "loss": 0.7539, "step": 5715 }, { "epoch": 0.68, "learning_rate": 4.8601632925343455e-06, "loss": 0.7012, "step": 5716 }, { "epoch": 0.68, "learning_rate": 4.856850190177854e-06, "loss": 0.755, "step": 5717 }, { "epoch": 0.68, "learning_rate": 4.853537855231213e-06, "loss": 0.7506, "step": 5718 }, { "epoch": 0.68, "learning_rate": 4.8502262881886565e-06, "loss": 0.7628, "step": 5719 }, { "epoch": 0.68, "learning_rate": 4.846915489544306e-06, "loss": 0.7031, "step": 5720 }, { "epoch": 0.68, "learning_rate": 4.843605459792159e-06, "loss": 0.7718, "step": 5721 }, { "epoch": 0.68, "learning_rate": 4.8402961994261155e-06, "loss": 0.7517, "step": 5722 }, { "epoch": 0.68, "learning_rate": 4.836987708939942e-06, "loss": 0.7377, "step": 5723 }, { "epoch": 0.68, "learning_rate": 4.833679988827311e-06, "loss": 0.8147, "step": 5724 }, { "epoch": 0.68, "learning_rate": 4.830373039581754e-06, "loss": 0.6931, "step": 5725 }, { "epoch": 0.68, "learning_rate": 4.827066861696703e-06, "loss": 0.7266, "step": 5726 }, { "epoch": 0.68, "learning_rate": 4.823761455665481e-06, "loss": 0.7372, "step": 5727 }, { "epoch": 0.68, "learning_rate": 4.82045682198128e-06, "loss": 0.6998, "step": 5728 }, { "epoch": 0.68, "learning_rate": 4.817152961137195e-06, "loss": 0.6931, "step": 5729 }, { "epoch": 0.68, "learning_rate": 4.813849873626182e-06, "loss": 0.764, "step": 5730 }, { "epoch": 0.68, "learning_rate": 4.810547559941103e-06, "loss": 0.6741, "step": 5731 }, { "epoch": 0.68, "learning_rate": 4.8072460205746974e-06, "loss": 0.7829, "step": 5732 }, { "epoch": 0.68, "learning_rate": 4.8039452560195806e-06, "loss": 0.6621, "step": 5733 }, { "epoch": 0.68, "learning_rate": 4.800645266768275e-06, "loss": 0.7427, "step": 5734 }, { "epoch": 0.68, "learning_rate": 4.797346053313153e-06, "loss": 0.7182, "step": 5735 }, { "epoch": 0.68, "learning_rate": 4.794047616146505e-06, "loss": 0.7673, "step": 5736 }, { "epoch": 0.68, "learning_rate": 4.7907499557604854e-06, "loss": 0.7199, "step": 5737 }, { "epoch": 0.68, "learning_rate": 4.787453072647136e-06, "loss": 0.75, "step": 5738 }, { "epoch": 0.68, "learning_rate": 4.784156967298395e-06, "loss": 0.7093, "step": 5739 }, { "epoch": 0.68, "learning_rate": 4.78086164020606e-06, "loss": 0.7037, "step": 5740 }, { "epoch": 0.68, "learning_rate": 4.77756709186184e-06, "loss": 0.7154, "step": 5741 }, { "epoch": 0.68, "learning_rate": 4.774273322757306e-06, "loss": 0.7059, "step": 5742 }, { "epoch": 0.68, "learning_rate": 4.770980333383928e-06, "loss": 0.7137, "step": 5743 }, { "epoch": 0.69, "learning_rate": 4.767688124233051e-06, "loss": 0.7612, "step": 5744 }, { "epoch": 0.69, "learning_rate": 4.764396695795905e-06, "loss": 0.7556, "step": 5745 }, { "epoch": 0.69, "learning_rate": 4.7611060485636055e-06, "loss": 0.7623, "step": 5746 }, { "epoch": 0.69, "learning_rate": 4.757816183027145e-06, "loss": 0.7706, "step": 5747 }, { "epoch": 0.69, "learning_rate": 4.754527099677414e-06, "loss": 0.6892, "step": 5748 }, { "epoch": 0.69, "learning_rate": 4.751238799005171e-06, "loss": 0.7578, "step": 5749 }, { "epoch": 0.69, "learning_rate": 4.747951281501066e-06, "loss": 0.8008, "step": 5750 }, { "epoch": 0.69, "learning_rate": 4.744664547655626e-06, "loss": 0.7528, "step": 5751 }, { "epoch": 0.69, "learning_rate": 4.741378597959267e-06, "loss": 0.7087, "step": 5752 }, { "epoch": 0.69, "learning_rate": 4.738093432902287e-06, "loss": 0.7729, "step": 5753 }, { "epoch": 0.69, "learning_rate": 4.734809052974866e-06, "loss": 0.6987, "step": 5754 }, { "epoch": 0.69, "learning_rate": 4.731525458667066e-06, "loss": 0.7427, "step": 5755 }, { "epoch": 0.69, "learning_rate": 4.728242650468831e-06, "loss": 0.7852, "step": 5756 }, { "epoch": 0.69, "learning_rate": 4.724960628869988e-06, "loss": 0.7282, "step": 5757 }, { "epoch": 0.69, "learning_rate": 4.721679394360252e-06, "loss": 0.7282, "step": 5758 }, { "epoch": 0.69, "learning_rate": 4.718398947429215e-06, "loss": 0.7026, "step": 5759 }, { "epoch": 0.69, "learning_rate": 4.715119288566352e-06, "loss": 0.7589, "step": 5760 }, { "epoch": 0.69, "learning_rate": 4.711840418261018e-06, "loss": 0.7679, "step": 5761 }, { "epoch": 0.69, "learning_rate": 4.708562337002459e-06, "loss": 0.7188, "step": 5762 }, { "epoch": 0.69, "learning_rate": 4.705285045279796e-06, "loss": 0.6959, "step": 5763 }, { "epoch": 0.69, "learning_rate": 4.702008543582034e-06, "loss": 0.7461, "step": 5764 }, { "epoch": 0.69, "learning_rate": 4.69873283239806e-06, "loss": 0.7522, "step": 5765 }, { "epoch": 0.69, "learning_rate": 4.695457912216638e-06, "loss": 0.6998, "step": 5766 }, { "epoch": 0.69, "learning_rate": 4.6921837835264275e-06, "loss": 0.6981, "step": 5767 }, { "epoch": 0.69, "learning_rate": 4.688910446815959e-06, "loss": 0.7472, "step": 5768 }, { "epoch": 0.69, "learning_rate": 4.685637902573646e-06, "loss": 0.7121, "step": 5769 }, { "epoch": 0.69, "learning_rate": 4.682366151287784e-06, "loss": 0.7701, "step": 5770 }, { "epoch": 0.69, "learning_rate": 4.67909519344655e-06, "loss": 0.7985, "step": 5771 }, { "epoch": 0.69, "learning_rate": 4.67582502953801e-06, "loss": 0.7282, "step": 5772 }, { "epoch": 0.69, "learning_rate": 4.6725556600501e-06, "loss": 0.7656, "step": 5773 }, { "epoch": 0.69, "learning_rate": 4.6692870854706504e-06, "loss": 0.731, "step": 5774 }, { "epoch": 0.69, "learning_rate": 4.6660193062873545e-06, "loss": 0.7969, "step": 5775 }, { "epoch": 0.69, "learning_rate": 4.6627523229878066e-06, "loss": 0.7461, "step": 5776 }, { "epoch": 0.69, "learning_rate": 4.65948613605947e-06, "loss": 0.7294, "step": 5777 }, { "epoch": 0.69, "learning_rate": 4.65622074598969e-06, "loss": 0.6864, "step": 5778 }, { "epoch": 0.69, "learning_rate": 4.6529561532657064e-06, "loss": 0.7243, "step": 5779 }, { "epoch": 0.69, "learning_rate": 4.649692358374616e-06, "loss": 0.7673, "step": 5780 }, { "epoch": 0.69, "learning_rate": 4.646429361803418e-06, "loss": 0.7042, "step": 5781 }, { "epoch": 0.69, "learning_rate": 4.643167164038982e-06, "loss": 0.7712, "step": 5782 }, { "epoch": 0.69, "learning_rate": 4.639905765568059e-06, "loss": 0.6984, "step": 5783 }, { "epoch": 0.69, "learning_rate": 4.636645166877292e-06, "loss": 0.764, "step": 5784 }, { "epoch": 0.69, "learning_rate": 4.633385368453179e-06, "loss": 0.7985, "step": 5785 }, { "epoch": 0.69, "learning_rate": 4.630126370782129e-06, "loss": 0.7667, "step": 5786 }, { "epoch": 0.69, "learning_rate": 4.626868174350412e-06, "loss": 0.7316, "step": 5787 }, { "epoch": 0.69, "learning_rate": 4.62361077964418e-06, "loss": 0.7126, "step": 5788 }, { "epoch": 0.69, "learning_rate": 4.620354187149479e-06, "loss": 0.7294, "step": 5789 }, { "epoch": 0.69, "learning_rate": 4.617098397352214e-06, "loss": 0.7411, "step": 5790 }, { "epoch": 0.69, "learning_rate": 4.613843410738191e-06, "loss": 0.7154, "step": 5791 }, { "epoch": 0.69, "learning_rate": 4.610589227793079e-06, "loss": 0.731, "step": 5792 }, { "epoch": 0.69, "learning_rate": 4.607335849002442e-06, "loss": 0.7115, "step": 5793 }, { "epoch": 0.69, "learning_rate": 4.604083274851715e-06, "loss": 0.6853, "step": 5794 }, { "epoch": 0.69, "learning_rate": 4.600831505826214e-06, "loss": 0.7427, "step": 5795 }, { "epoch": 0.69, "learning_rate": 4.597580542411135e-06, "loss": 0.774, "step": 5796 }, { "epoch": 0.69, "learning_rate": 4.594330385091552e-06, "loss": 0.7461, "step": 5797 }, { "epoch": 0.69, "learning_rate": 4.591081034352427e-06, "loss": 0.7143, "step": 5798 }, { "epoch": 0.69, "learning_rate": 4.587832490678594e-06, "loss": 0.7545, "step": 5799 }, { "epoch": 0.69, "learning_rate": 4.584584754554768e-06, "loss": 0.7271, "step": 5800 }, { "epoch": 0.69, "learning_rate": 4.581337826465545e-06, "loss": 0.784, "step": 5801 }, { "epoch": 0.69, "learning_rate": 4.578091706895393e-06, "loss": 0.7545, "step": 5802 }, { "epoch": 0.69, "learning_rate": 4.574846396328675e-06, "loss": 0.7377, "step": 5803 }, { "epoch": 0.69, "learning_rate": 4.571601895249621e-06, "loss": 0.7584, "step": 5804 }, { "epoch": 0.69, "learning_rate": 4.568358204142341e-06, "loss": 0.8248, "step": 5805 }, { "epoch": 0.69, "learning_rate": 4.5651153234908254e-06, "loss": 0.7321, "step": 5806 }, { "epoch": 0.69, "learning_rate": 4.5618732537789516e-06, "loss": 0.7355, "step": 5807 }, { "epoch": 0.69, "learning_rate": 4.558631995490463e-06, "loss": 0.7612, "step": 5808 }, { "epoch": 0.69, "learning_rate": 4.5553915491089905e-06, "loss": 0.7327, "step": 5809 }, { "epoch": 0.69, "learning_rate": 4.55215191511804e-06, "loss": 0.7104, "step": 5810 }, { "epoch": 0.69, "learning_rate": 4.548913094000996e-06, "loss": 0.7467, "step": 5811 }, { "epoch": 0.69, "learning_rate": 4.545675086241129e-06, "loss": 0.7388, "step": 5812 }, { "epoch": 0.69, "learning_rate": 4.542437892321578e-06, "loss": 0.7366, "step": 5813 }, { "epoch": 0.69, "learning_rate": 4.539201512725368e-06, "loss": 0.7405, "step": 5814 }, { "epoch": 0.69, "learning_rate": 4.535965947935396e-06, "loss": 0.7628, "step": 5815 }, { "epoch": 0.69, "learning_rate": 4.532731198434438e-06, "loss": 0.7154, "step": 5816 }, { "epoch": 0.69, "learning_rate": 4.529497264705161e-06, "loss": 0.76, "step": 5817 }, { "epoch": 0.69, "learning_rate": 4.526264147230094e-06, "loss": 0.7154, "step": 5818 }, { "epoch": 0.69, "learning_rate": 4.523031846491652e-06, "loss": 0.7985, "step": 5819 }, { "epoch": 0.69, "learning_rate": 4.519800362972128e-06, "loss": 0.75, "step": 5820 }, { "epoch": 0.69, "learning_rate": 4.516569697153686e-06, "loss": 0.7411, "step": 5821 }, { "epoch": 0.69, "learning_rate": 4.513339849518383e-06, "loss": 0.6925, "step": 5822 }, { "epoch": 0.69, "learning_rate": 4.510110820548137e-06, "loss": 0.7076, "step": 5823 }, { "epoch": 0.69, "learning_rate": 4.506882610724762e-06, "loss": 0.7305, "step": 5824 }, { "epoch": 0.69, "learning_rate": 4.503655220529927e-06, "loss": 0.736, "step": 5825 }, { "epoch": 0.69, "learning_rate": 4.5004286504451985e-06, "loss": 0.76, "step": 5826 }, { "epoch": 0.69, "learning_rate": 4.497202900952013e-06, "loss": 0.7483, "step": 5827 }, { "epoch": 0.7, "learning_rate": 4.49397797253168e-06, "loss": 0.7324, "step": 5828 }, { "epoch": 0.7, "learning_rate": 4.490753865665403e-06, "loss": 0.7065, "step": 5829 }, { "epoch": 0.7, "learning_rate": 4.487530580834235e-06, "loss": 0.7612, "step": 5830 }, { "epoch": 0.7, "learning_rate": 4.484308118519135e-06, "loss": 0.7483, "step": 5831 }, { "epoch": 0.7, "learning_rate": 4.481086479200924e-06, "loss": 0.7321, "step": 5832 }, { "epoch": 0.7, "learning_rate": 4.477865663360297e-06, "loss": 0.7985, "step": 5833 }, { "epoch": 0.7, "learning_rate": 4.474645671477841e-06, "loss": 0.7422, "step": 5834 }, { "epoch": 0.7, "learning_rate": 4.471426504034006e-06, "loss": 0.7366, "step": 5835 }, { "epoch": 0.7, "learning_rate": 4.468208161509128e-06, "loss": 0.7684, "step": 5836 }, { "epoch": 0.7, "learning_rate": 4.4649906443834094e-06, "loss": 0.7037, "step": 5837 }, { "epoch": 0.7, "learning_rate": 4.461773953136944e-06, "loss": 0.755, "step": 5838 }, { "epoch": 0.7, "learning_rate": 4.458558088249691e-06, "loss": 0.6775, "step": 5839 }, { "epoch": 0.7, "learning_rate": 4.455343050201492e-06, "loss": 0.7958, "step": 5840 }, { "epoch": 0.7, "learning_rate": 4.452128839472059e-06, "loss": 0.6925, "step": 5841 }, { "epoch": 0.7, "learning_rate": 4.448915456540986e-06, "loss": 0.7494, "step": 5842 }, { "epoch": 0.7, "learning_rate": 4.4457029018877455e-06, "loss": 0.7081, "step": 5843 }, { "epoch": 0.7, "learning_rate": 4.44249117599168e-06, "loss": 0.736, "step": 5844 }, { "epoch": 0.7, "learning_rate": 4.439280279332013e-06, "loss": 0.7779, "step": 5845 }, { "epoch": 0.7, "learning_rate": 4.436070212387842e-06, "loss": 0.7617, "step": 5846 }, { "epoch": 0.7, "learning_rate": 4.432860975638137e-06, "loss": 0.7377, "step": 5847 }, { "epoch": 0.7, "learning_rate": 4.429652569561757e-06, "loss": 0.7294, "step": 5848 }, { "epoch": 0.7, "learning_rate": 4.426444994637424e-06, "loss": 0.7734, "step": 5849 }, { "epoch": 0.7, "learning_rate": 4.42323825134374e-06, "loss": 0.7277, "step": 5850 }, { "epoch": 0.7, "learning_rate": 4.420032340159185e-06, "loss": 0.7031, "step": 5851 }, { "epoch": 0.7, "learning_rate": 4.416827261562109e-06, "loss": 0.7059, "step": 5852 }, { "epoch": 0.7, "learning_rate": 4.413623016030749e-06, "loss": 0.7673, "step": 5853 }, { "epoch": 0.7, "learning_rate": 4.4104196040432035e-06, "loss": 0.7444, "step": 5854 }, { "epoch": 0.7, "learning_rate": 4.407217026077466e-06, "loss": 0.7561, "step": 5855 }, { "epoch": 0.7, "learning_rate": 4.404015282611378e-06, "loss": 0.7277, "step": 5856 }, { "epoch": 0.7, "learning_rate": 4.400814374122682e-06, "loss": 0.764, "step": 5857 }, { "epoch": 0.7, "learning_rate": 4.3976143010889835e-06, "loss": 0.6998, "step": 5858 }, { "epoch": 0.7, "learning_rate": 4.3944150639877615e-06, "loss": 0.7734, "step": 5859 }, { "epoch": 0.7, "learning_rate": 4.391216663296386e-06, "loss": 0.7991, "step": 5860 }, { "epoch": 0.7, "learning_rate": 4.3880190994920746e-06, "loss": 0.7852, "step": 5861 }, { "epoch": 0.7, "learning_rate": 4.384822373051949e-06, "loss": 0.774, "step": 5862 }, { "epoch": 0.7, "learning_rate": 4.381626484452988e-06, "loss": 0.7009, "step": 5863 }, { "epoch": 0.7, "learning_rate": 4.3784314341720466e-06, "loss": 0.6473, "step": 5864 }, { "epoch": 0.7, "learning_rate": 4.375237222685871e-06, "loss": 0.7617, "step": 5865 }, { "epoch": 0.7, "learning_rate": 4.372043850471054e-06, "loss": 0.7472, "step": 5866 }, { "epoch": 0.7, "learning_rate": 4.368851318004089e-06, "loss": 0.7093, "step": 5867 }, { "epoch": 0.7, "learning_rate": 4.365659625761329e-06, "loss": 0.7511, "step": 5868 }, { "epoch": 0.7, "learning_rate": 4.362468774219013e-06, "loss": 0.7874, "step": 5869 }, { "epoch": 0.7, "learning_rate": 4.3592787638532485e-06, "loss": 0.7104, "step": 5870 }, { "epoch": 0.7, "learning_rate": 4.356089595140005e-06, "loss": 0.7891, "step": 5871 }, { "epoch": 0.7, "learning_rate": 4.352901268555151e-06, "loss": 0.6886, "step": 5872 }, { "epoch": 0.7, "learning_rate": 4.3497137845744095e-06, "loss": 0.76, "step": 5873 }, { "epoch": 0.7, "learning_rate": 4.346527143673392e-06, "loss": 0.7645, "step": 5874 }, { "epoch": 0.7, "learning_rate": 4.343341346327574e-06, "loss": 0.7427, "step": 5875 }, { "epoch": 0.7, "learning_rate": 4.340156393012309e-06, "loss": 0.7305, "step": 5876 }, { "epoch": 0.7, "learning_rate": 4.336972284202824e-06, "loss": 0.7366, "step": 5877 }, { "epoch": 0.7, "learning_rate": 4.333789020374216e-06, "loss": 0.7612, "step": 5878 }, { "epoch": 0.7, "learning_rate": 4.3306066020014684e-06, "loss": 0.7383, "step": 5879 }, { "epoch": 0.7, "learning_rate": 4.327425029559426e-06, "loss": 0.7416, "step": 5880 }, { "epoch": 0.7, "learning_rate": 4.324244303522811e-06, "loss": 0.7517, "step": 5881 }, { "epoch": 0.7, "learning_rate": 4.32106442436622e-06, "loss": 0.7718, "step": 5882 }, { "epoch": 0.7, "learning_rate": 4.31788539256412e-06, "loss": 0.7785, "step": 5883 }, { "epoch": 0.7, "learning_rate": 4.314707208590862e-06, "loss": 0.7656, "step": 5884 }, { "epoch": 0.7, "learning_rate": 4.311529872920658e-06, "loss": 0.7584, "step": 5885 }, { "epoch": 0.7, "learning_rate": 4.308353386027601e-06, "loss": 0.7026, "step": 5886 }, { "epoch": 0.7, "learning_rate": 4.305177748385648e-06, "loss": 0.7148, "step": 5887 }, { "epoch": 0.7, "learning_rate": 4.3020029604686474e-06, "loss": 0.6903, "step": 5888 }, { "epoch": 0.7, "learning_rate": 4.2988290227503025e-06, "loss": 0.6585, "step": 5889 }, { "epoch": 0.7, "learning_rate": 4.2956559357042e-06, "loss": 0.7606, "step": 5890 }, { "epoch": 0.7, "learning_rate": 4.292483699803792e-06, "loss": 0.6925, "step": 5891 }, { "epoch": 0.7, "learning_rate": 4.289312315522409e-06, "loss": 0.7193, "step": 5892 }, { "epoch": 0.7, "learning_rate": 4.286141783333258e-06, "loss": 0.7461, "step": 5893 }, { "epoch": 0.7, "learning_rate": 4.2829721037094126e-06, "loss": 0.6964, "step": 5894 }, { "epoch": 0.7, "learning_rate": 4.279803277123821e-06, "loss": 0.7316, "step": 5895 }, { "epoch": 0.7, "learning_rate": 4.2766353040493016e-06, "loss": 0.7394, "step": 5896 }, { "epoch": 0.7, "learning_rate": 4.273468184958546e-06, "loss": 0.7433, "step": 5897 }, { "epoch": 0.7, "learning_rate": 4.270301920324128e-06, "loss": 0.6875, "step": 5898 }, { "epoch": 0.7, "learning_rate": 4.26713651061848e-06, "loss": 0.7489, "step": 5899 }, { "epoch": 0.7, "learning_rate": 4.26397195631392e-06, "loss": 0.7818, "step": 5900 }, { "epoch": 0.7, "learning_rate": 4.260808257882625e-06, "loss": 0.7321, "step": 5901 }, { "epoch": 0.7, "learning_rate": 4.257645415796647e-06, "loss": 0.6953, "step": 5902 }, { "epoch": 0.7, "learning_rate": 4.254483430527925e-06, "loss": 0.7388, "step": 5903 }, { "epoch": 0.7, "learning_rate": 4.251322302548247e-06, "loss": 0.7545, "step": 5904 }, { "epoch": 0.7, "learning_rate": 4.248162032329302e-06, "loss": 0.7394, "step": 5905 }, { "epoch": 0.7, "learning_rate": 4.245002620342615e-06, "loss": 0.7667, "step": 5906 }, { "epoch": 0.7, "learning_rate": 4.241844067059615e-06, "loss": 0.7143, "step": 5907 }, { "epoch": 0.7, "learning_rate": 4.238686372951586e-06, "loss": 0.7271, "step": 5908 }, { "epoch": 0.7, "learning_rate": 4.235529538489685e-06, "loss": 0.7344, "step": 5909 }, { "epoch": 0.7, "learning_rate": 4.2323735641449525e-06, "loss": 0.697, "step": 5910 }, { "epoch": 0.7, "learning_rate": 4.229218450388278e-06, "loss": 0.7818, "step": 5911 }, { "epoch": 0.71, "learning_rate": 4.226064197690449e-06, "loss": 0.7679, "step": 5912 }, { "epoch": 0.71, "learning_rate": 4.2229108065221055e-06, "loss": 0.7344, "step": 5913 }, { "epoch": 0.71, "learning_rate": 4.219758277353765e-06, "loss": 0.7695, "step": 5914 }, { "epoch": 0.71, "learning_rate": 4.216606610655823e-06, "loss": 0.7249, "step": 5915 }, { "epoch": 0.71, "learning_rate": 4.2134558068985296e-06, "loss": 0.7807, "step": 5916 }, { "epoch": 0.71, "learning_rate": 4.210305866552026e-06, "loss": 0.7472, "step": 5917 }, { "epoch": 0.71, "learning_rate": 4.207156790086306e-06, "loss": 0.7706, "step": 5918 }, { "epoch": 0.71, "learning_rate": 4.204008577971254e-06, "loss": 0.7221, "step": 5919 }, { "epoch": 0.71, "learning_rate": 4.200861230676608e-06, "loss": 0.697, "step": 5920 }, { "epoch": 0.71, "learning_rate": 4.197714748671987e-06, "loss": 0.7132, "step": 5921 }, { "epoch": 0.71, "learning_rate": 4.1945691324268765e-06, "loss": 0.7645, "step": 5922 }, { "epoch": 0.71, "learning_rate": 4.191424382410631e-06, "loss": 0.7461, "step": 5923 }, { "epoch": 0.71, "learning_rate": 4.1882804990924866e-06, "loss": 0.7377, "step": 5924 }, { "epoch": 0.71, "learning_rate": 4.185137482941537e-06, "loss": 0.7377, "step": 5925 }, { "epoch": 0.71, "learning_rate": 4.181995334426753e-06, "loss": 0.7935, "step": 5926 }, { "epoch": 0.71, "learning_rate": 4.178854054016974e-06, "loss": 0.7662, "step": 5927 }, { "epoch": 0.71, "learning_rate": 4.17571364218091e-06, "loss": 0.7121, "step": 5928 }, { "epoch": 0.71, "learning_rate": 4.172574099387146e-06, "loss": 0.6875, "step": 5929 }, { "epoch": 0.71, "learning_rate": 4.1694354261041315e-06, "loss": 0.6959, "step": 5930 }, { "epoch": 0.71, "learning_rate": 4.166297622800188e-06, "loss": 0.673, "step": 5931 }, { "epoch": 0.71, "learning_rate": 4.1631606899435085e-06, "loss": 0.7573, "step": 5932 }, { "epoch": 0.71, "learning_rate": 4.160024628002148e-06, "loss": 0.7388, "step": 5933 }, { "epoch": 0.71, "learning_rate": 4.156889437444051e-06, "loss": 0.7729, "step": 5934 }, { "epoch": 0.71, "learning_rate": 4.153755118737011e-06, "loss": 0.7254, "step": 5935 }, { "epoch": 0.71, "learning_rate": 4.150621672348703e-06, "loss": 0.7584, "step": 5936 }, { "epoch": 0.71, "learning_rate": 4.1474890987466635e-06, "loss": 0.7405, "step": 5937 }, { "epoch": 0.71, "learning_rate": 4.1443573983983125e-06, "loss": 0.7121, "step": 5938 }, { "epoch": 0.71, "learning_rate": 4.141226571770926e-06, "loss": 0.7461, "step": 5939 }, { "epoch": 0.71, "learning_rate": 4.138096619331657e-06, "loss": 0.7478, "step": 5940 }, { "epoch": 0.71, "learning_rate": 4.1349675415475264e-06, "loss": 0.745, "step": 5941 }, { "epoch": 0.71, "learning_rate": 4.131839338885418e-06, "loss": 0.7037, "step": 5942 }, { "epoch": 0.71, "learning_rate": 4.1287120118121e-06, "loss": 0.736, "step": 5943 }, { "epoch": 0.71, "learning_rate": 4.125585560794198e-06, "loss": 0.7026, "step": 5944 }, { "epoch": 0.71, "learning_rate": 4.122459986298208e-06, "loss": 0.7254, "step": 5945 }, { "epoch": 0.71, "learning_rate": 4.1193352887905e-06, "loss": 0.7204, "step": 5946 }, { "epoch": 0.71, "learning_rate": 4.116211468737304e-06, "loss": 0.7132, "step": 5947 }, { "epoch": 0.71, "learning_rate": 4.113088526604736e-06, "loss": 0.7199, "step": 5948 }, { "epoch": 0.71, "learning_rate": 4.10996646285876e-06, "loss": 0.7171, "step": 5949 }, { "epoch": 0.71, "learning_rate": 4.106845277965231e-06, "loss": 0.7277, "step": 5950 }, { "epoch": 0.71, "learning_rate": 4.103724972389848e-06, "loss": 0.702, "step": 5951 }, { "epoch": 0.71, "learning_rate": 4.100605546598203e-06, "loss": 0.7182, "step": 5952 }, { "epoch": 0.71, "learning_rate": 4.097487001055742e-06, "loss": 0.7813, "step": 5953 }, { "epoch": 0.71, "learning_rate": 4.094369336227778e-06, "loss": 0.8019, "step": 5954 }, { "epoch": 0.71, "learning_rate": 4.091252552579511e-06, "loss": 0.7628, "step": 5955 }, { "epoch": 0.71, "learning_rate": 4.088136650575981e-06, "loss": 0.7266, "step": 5956 }, { "epoch": 0.71, "learning_rate": 4.085021630682123e-06, "loss": 0.76, "step": 5957 }, { "epoch": 0.71, "learning_rate": 4.081907493362728e-06, "loss": 0.7093, "step": 5958 }, { "epoch": 0.71, "learning_rate": 4.078794239082448e-06, "loss": 0.7533, "step": 5959 }, { "epoch": 0.71, "learning_rate": 4.0756818683058285e-06, "loss": 0.76, "step": 5960 }, { "epoch": 0.71, "learning_rate": 4.07257038149725e-06, "loss": 0.8103, "step": 5961 }, { "epoch": 0.71, "learning_rate": 4.069459779120986e-06, "loss": 0.7143, "step": 5962 }, { "epoch": 0.71, "learning_rate": 4.066350061641169e-06, "loss": 0.7268, "step": 5963 }, { "epoch": 0.71, "learning_rate": 4.063241229521797e-06, "loss": 0.7913, "step": 5964 }, { "epoch": 0.71, "learning_rate": 4.060133283226748e-06, "loss": 0.7712, "step": 5965 }, { "epoch": 0.71, "learning_rate": 4.057026223219745e-06, "loss": 0.7595, "step": 5966 }, { "epoch": 0.71, "learning_rate": 4.053920049964405e-06, "loss": 0.6942, "step": 5967 }, { "epoch": 0.71, "learning_rate": 4.050814763924191e-06, "loss": 0.803, "step": 5968 }, { "epoch": 0.71, "learning_rate": 4.047710365562453e-06, "loss": 0.8008, "step": 5969 }, { "epoch": 0.71, "learning_rate": 4.044606855342392e-06, "loss": 0.7344, "step": 5970 }, { "epoch": 0.71, "learning_rate": 4.041504233727085e-06, "loss": 0.7076, "step": 5971 }, { "epoch": 0.71, "learning_rate": 4.038402501179473e-06, "loss": 0.7595, "step": 5972 }, { "epoch": 0.71, "learning_rate": 4.0353016581623635e-06, "loss": 0.7221, "step": 5973 }, { "epoch": 0.71, "learning_rate": 4.032201705138441e-06, "loss": 0.7751, "step": 5974 }, { "epoch": 0.71, "learning_rate": 4.029102642570245e-06, "loss": 0.7651, "step": 5975 }, { "epoch": 0.71, "learning_rate": 4.026004470920187e-06, "loss": 0.7065, "step": 5976 }, { "epoch": 0.71, "learning_rate": 4.022907190650546e-06, "loss": 0.7522, "step": 5977 }, { "epoch": 0.71, "learning_rate": 4.019810802223464e-06, "loss": 0.7517, "step": 5978 }, { "epoch": 0.71, "learning_rate": 4.01671530610096e-06, "loss": 0.7204, "step": 5979 }, { "epoch": 0.71, "learning_rate": 4.01362070274491e-06, "loss": 0.6819, "step": 5980 }, { "epoch": 0.71, "learning_rate": 4.01052699261706e-06, "loss": 0.7249, "step": 5981 }, { "epoch": 0.71, "learning_rate": 4.007434176179019e-06, "loss": 0.755, "step": 5982 }, { "epoch": 0.71, "learning_rate": 4.004342253892274e-06, "loss": 0.7628, "step": 5983 }, { "epoch": 0.71, "learning_rate": 4.001251226218167e-06, "loss": 0.7221, "step": 5984 }, { "epoch": 0.71, "learning_rate": 3.998161093617912e-06, "loss": 0.7037, "step": 5985 }, { "epoch": 0.71, "learning_rate": 3.9950718565525845e-06, "loss": 0.7054, "step": 5986 }, { "epoch": 0.71, "learning_rate": 3.99198351548313e-06, "loss": 0.6869, "step": 5987 }, { "epoch": 0.71, "learning_rate": 3.988896070870365e-06, "loss": 0.7461, "step": 5988 }, { "epoch": 0.71, "learning_rate": 3.985809523174965e-06, "loss": 0.731, "step": 5989 }, { "epoch": 0.71, "learning_rate": 3.9827238728574745e-06, "loss": 0.6669, "step": 5990 }, { "epoch": 0.71, "learning_rate": 3.9796391203783014e-06, "loss": 0.6931, "step": 5991 }, { "epoch": 0.71, "learning_rate": 3.97655526619772e-06, "loss": 0.7467, "step": 5992 }, { "epoch": 0.71, "learning_rate": 3.9734723107758795e-06, "loss": 0.8125, "step": 5993 }, { "epoch": 0.71, "learning_rate": 3.970390254572785e-06, "loss": 0.7662, "step": 5994 }, { "epoch": 0.71, "learning_rate": 3.967309098048309e-06, "loss": 0.75, "step": 5995 }, { "epoch": 0.72, "learning_rate": 3.964228841662192e-06, "loss": 0.7109, "step": 5996 }, { "epoch": 0.72, "learning_rate": 3.961149485874035e-06, "loss": 0.7176, "step": 5997 }, { "epoch": 0.72, "learning_rate": 3.958071031143317e-06, "loss": 0.7299, "step": 5998 }, { "epoch": 0.72, "learning_rate": 3.9549934779293664e-06, "loss": 0.7645, "step": 5999 }, { "epoch": 0.72, "learning_rate": 3.9519168266913975e-06, "loss": 0.7589, "step": 6000 }, { "epoch": 0.72, "learning_rate": 3.948841077888462e-06, "loss": 0.7109, "step": 6001 }, { "epoch": 0.72, "learning_rate": 3.945766231979503e-06, "loss": 0.7461, "step": 6002 }, { "epoch": 0.72, "learning_rate": 3.942692289423318e-06, "loss": 0.764, "step": 6003 }, { "epoch": 0.72, "learning_rate": 3.939619250678563e-06, "loss": 0.7411, "step": 6004 }, { "epoch": 0.72, "learning_rate": 3.936547116203777e-06, "loss": 0.7277, "step": 6005 }, { "epoch": 0.72, "learning_rate": 3.933475886457343e-06, "loss": 0.6696, "step": 6006 }, { "epoch": 0.72, "learning_rate": 3.930405561897527e-06, "loss": 0.76, "step": 6007 }, { "epoch": 0.72, "learning_rate": 3.9273361429824495e-06, "loss": 0.6791, "step": 6008 }, { "epoch": 0.72, "learning_rate": 3.9242676301700965e-06, "loss": 0.6936, "step": 6009 }, { "epoch": 0.72, "learning_rate": 3.92120002391833e-06, "loss": 0.6959, "step": 6010 }, { "epoch": 0.72, "learning_rate": 3.918133324684855e-06, "loss": 0.7768, "step": 6011 }, { "epoch": 0.72, "learning_rate": 3.9150675329272634e-06, "loss": 0.7919, "step": 6012 }, { "epoch": 0.72, "learning_rate": 3.912002649102995e-06, "loss": 0.779, "step": 6013 }, { "epoch": 0.72, "learning_rate": 3.90893867366937e-06, "loss": 0.6925, "step": 6014 }, { "epoch": 0.72, "learning_rate": 3.9058756070835635e-06, "loss": 0.7383, "step": 6015 }, { "epoch": 0.72, "learning_rate": 3.902813449802606e-06, "loss": 0.6786, "step": 6016 }, { "epoch": 0.72, "learning_rate": 3.8997522022834125e-06, "loss": 0.6959, "step": 6017 }, { "epoch": 0.72, "learning_rate": 3.896691864982743e-06, "loss": 0.7455, "step": 6018 }, { "epoch": 0.72, "learning_rate": 3.893632438357241e-06, "loss": 0.7321, "step": 6019 }, { "epoch": 0.72, "learning_rate": 3.890573922863399e-06, "loss": 0.7104, "step": 6020 }, { "epoch": 0.72, "learning_rate": 3.887516318957578e-06, "loss": 0.7388, "step": 6021 }, { "epoch": 0.72, "learning_rate": 3.8844596270960036e-06, "loss": 0.7327, "step": 6022 }, { "epoch": 0.72, "learning_rate": 3.88140384773476e-06, "loss": 0.7768, "step": 6023 }, { "epoch": 0.72, "learning_rate": 3.878348981329811e-06, "loss": 0.7958, "step": 6024 }, { "epoch": 0.72, "learning_rate": 3.875295028336968e-06, "loss": 0.6842, "step": 6025 }, { "epoch": 0.72, "learning_rate": 3.87224198921191e-06, "loss": 0.7773, "step": 6026 }, { "epoch": 0.72, "learning_rate": 3.869189864410183e-06, "loss": 0.7444, "step": 6027 }, { "epoch": 0.72, "learning_rate": 3.866138654387191e-06, "loss": 0.7355, "step": 6028 }, { "epoch": 0.72, "learning_rate": 3.863088359598214e-06, "loss": 0.7969, "step": 6029 }, { "epoch": 0.72, "learning_rate": 3.860038980498377e-06, "loss": 0.7148, "step": 6030 }, { "epoch": 0.72, "learning_rate": 3.856990517542689e-06, "loss": 0.6535, "step": 6031 }, { "epoch": 0.72, "learning_rate": 3.853942971186e-06, "loss": 0.7148, "step": 6032 }, { "epoch": 0.72, "learning_rate": 3.850896341883041e-06, "loss": 0.7388, "step": 6033 }, { "epoch": 0.72, "learning_rate": 3.847850630088401e-06, "loss": 0.7985, "step": 6034 }, { "epoch": 0.72, "learning_rate": 3.844805836256524e-06, "loss": 0.716, "step": 6035 }, { "epoch": 0.72, "learning_rate": 3.841761960841736e-06, "loss": 0.7037, "step": 6036 }, { "epoch": 0.72, "learning_rate": 3.838719004298199e-06, "loss": 0.7991, "step": 6037 }, { "epoch": 0.72, "learning_rate": 3.8356769670799645e-06, "loss": 0.7478, "step": 6038 }, { "epoch": 0.72, "learning_rate": 3.832635849640931e-06, "loss": 0.7355, "step": 6039 }, { "epoch": 0.72, "learning_rate": 3.8295956524348596e-06, "loss": 0.7372, "step": 6040 }, { "epoch": 0.72, "learning_rate": 3.826556375915391e-06, "loss": 0.7249, "step": 6041 }, { "epoch": 0.72, "learning_rate": 3.823518020536e-06, "loss": 0.7623, "step": 6042 }, { "epoch": 0.72, "learning_rate": 3.820480586750051e-06, "loss": 0.7176, "step": 6043 }, { "epoch": 0.72, "learning_rate": 3.817444075010752e-06, "loss": 0.7294, "step": 6044 }, { "epoch": 0.72, "learning_rate": 3.8144084857711905e-06, "loss": 0.7349, "step": 6045 }, { "epoch": 0.72, "learning_rate": 3.8113738194843043e-06, "loss": 0.6669, "step": 6046 }, { "epoch": 0.72, "learning_rate": 3.8083400766028877e-06, "loss": 0.7221, "step": 6047 }, { "epoch": 0.72, "learning_rate": 3.8053072575796155e-06, "loss": 0.6713, "step": 6048 }, { "epoch": 0.72, "learning_rate": 3.8022753628670075e-06, "loss": 0.793, "step": 6049 }, { "epoch": 0.72, "learning_rate": 3.7992443929174604e-06, "loss": 0.731, "step": 6050 }, { "epoch": 0.72, "learning_rate": 3.7962143481832227e-06, "loss": 0.7299, "step": 6051 }, { "epoch": 0.72, "learning_rate": 3.793185229116406e-06, "loss": 0.7327, "step": 6052 }, { "epoch": 0.72, "learning_rate": 3.7901570361689875e-06, "loss": 0.7204, "step": 6053 }, { "epoch": 0.72, "learning_rate": 3.7871297697927987e-06, "loss": 0.7232, "step": 6054 }, { "epoch": 0.72, "learning_rate": 3.7841034304395473e-06, "loss": 0.6925, "step": 6055 }, { "epoch": 0.72, "learning_rate": 3.7810780185607877e-06, "loss": 0.7773, "step": 6056 }, { "epoch": 0.72, "learning_rate": 3.778053534607944e-06, "loss": 0.7282, "step": 6057 }, { "epoch": 0.72, "learning_rate": 3.7750299790322985e-06, "loss": 0.7461, "step": 6058 }, { "epoch": 0.72, "learning_rate": 3.772007352284993e-06, "loss": 0.7288, "step": 6059 }, { "epoch": 0.72, "learning_rate": 3.7689856548170413e-06, "loss": 0.7891, "step": 6060 }, { "epoch": 0.72, "learning_rate": 3.7659648870793075e-06, "loss": 0.7355, "step": 6061 }, { "epoch": 0.72, "learning_rate": 3.7629450495225205e-06, "loss": 0.7171, "step": 6062 }, { "epoch": 0.72, "learning_rate": 3.7599261425972666e-06, "loss": 0.7556, "step": 6063 }, { "epoch": 0.72, "learning_rate": 3.756908166754005e-06, "loss": 0.7109, "step": 6064 }, { "epoch": 0.72, "learning_rate": 3.753891122443044e-06, "loss": 0.755, "step": 6065 }, { "epoch": 0.72, "learning_rate": 3.7508750101145584e-06, "loss": 0.7132, "step": 6066 }, { "epoch": 0.72, "learning_rate": 3.747859830218581e-06, "loss": 0.6892, "step": 6067 }, { "epoch": 0.72, "learning_rate": 3.7448455832050036e-06, "loss": 0.6496, "step": 6068 }, { "epoch": 0.72, "learning_rate": 3.74183226952359e-06, "loss": 0.7416, "step": 6069 }, { "epoch": 0.72, "learning_rate": 3.7388198896239526e-06, "loss": 0.7243, "step": 6070 }, { "epoch": 0.72, "learning_rate": 3.735808443955571e-06, "loss": 0.7751, "step": 6071 }, { "epoch": 0.72, "learning_rate": 3.732797932967781e-06, "loss": 0.7522, "step": 6072 }, { "epoch": 0.72, "learning_rate": 3.7297883571097783e-06, "loss": 0.7478, "step": 6073 }, { "epoch": 0.72, "learning_rate": 3.7267797168306295e-06, "loss": 0.7254, "step": 6074 }, { "epoch": 0.72, "learning_rate": 3.7237720125792477e-06, "loss": 0.7182, "step": 6075 }, { "epoch": 0.72, "learning_rate": 3.7207652448044206e-06, "loss": 0.7824, "step": 6076 }, { "epoch": 0.72, "learning_rate": 3.7177594139547813e-06, "loss": 0.7009, "step": 6077 }, { "epoch": 0.72, "learning_rate": 3.714754520478827e-06, "loss": 0.7165, "step": 6078 }, { "epoch": 0.72, "learning_rate": 3.7117505648249275e-06, "loss": 0.7254, "step": 6079 }, { "epoch": 0.73, "learning_rate": 3.708747547441295e-06, "loss": 0.7539, "step": 6080 }, { "epoch": 0.73, "learning_rate": 3.705745468776021e-06, "loss": 0.7031, "step": 6081 }, { "epoch": 0.73, "learning_rate": 3.7027443292770305e-06, "loss": 0.6696, "step": 6082 }, { "epoch": 0.73, "learning_rate": 3.6997441293921367e-06, "loss": 0.7612, "step": 6083 }, { "epoch": 0.73, "learning_rate": 3.6967448695689945e-06, "loss": 0.7478, "step": 6084 }, { "epoch": 0.73, "learning_rate": 3.693746550255121e-06, "loss": 0.7545, "step": 6085 }, { "epoch": 0.73, "learning_rate": 3.690749171897906e-06, "loss": 0.7115, "step": 6086 }, { "epoch": 0.73, "learning_rate": 3.6877527349445742e-06, "loss": 0.7277, "step": 6087 }, { "epoch": 0.73, "learning_rate": 3.6847572398422348e-06, "loss": 0.7461, "step": 6088 }, { "epoch": 0.73, "learning_rate": 3.6817626870378432e-06, "loss": 0.6646, "step": 6089 }, { "epoch": 0.73, "learning_rate": 3.6787690769782124e-06, "loss": 0.6953, "step": 6090 }, { "epoch": 0.73, "learning_rate": 3.6757764101100315e-06, "loss": 0.7154, "step": 6091 }, { "epoch": 0.73, "learning_rate": 3.67278468687982e-06, "loss": 0.7294, "step": 6092 }, { "epoch": 0.73, "learning_rate": 3.669793907733985e-06, "loss": 0.7227, "step": 6093 }, { "epoch": 0.73, "learning_rate": 3.666804073118775e-06, "loss": 0.7824, "step": 6094 }, { "epoch": 0.73, "learning_rate": 3.663815183480308e-06, "loss": 0.7974, "step": 6095 }, { "epoch": 0.73, "learning_rate": 3.660827239264555e-06, "loss": 0.7171, "step": 6096 }, { "epoch": 0.73, "learning_rate": 3.6578402409173462e-06, "loss": 0.7578, "step": 6097 }, { "epoch": 0.73, "learning_rate": 3.6548541888843737e-06, "loss": 0.7606, "step": 6098 }, { "epoch": 0.73, "learning_rate": 3.6518690836111816e-06, "loss": 0.7612, "step": 6099 }, { "epoch": 0.73, "learning_rate": 3.6488849255431846e-06, "loss": 0.7746, "step": 6100 }, { "epoch": 0.73, "learning_rate": 3.645901715125646e-06, "loss": 0.7718, "step": 6101 }, { "epoch": 0.73, "learning_rate": 3.6429194528036917e-06, "loss": 0.7171, "step": 6102 }, { "epoch": 0.73, "learning_rate": 3.639938139022304e-06, "loss": 0.7009, "step": 6103 }, { "epoch": 0.73, "learning_rate": 3.636957774226323e-06, "loss": 0.7483, "step": 6104 }, { "epoch": 0.73, "learning_rate": 3.6339783588604537e-06, "loss": 0.7567, "step": 6105 }, { "epoch": 0.73, "learning_rate": 3.6309998933692547e-06, "loss": 0.8075, "step": 6106 }, { "epoch": 0.73, "learning_rate": 3.6280223781971413e-06, "loss": 0.7394, "step": 6107 }, { "epoch": 0.73, "learning_rate": 3.6250458137883883e-06, "loss": 0.7383, "step": 6108 }, { "epoch": 0.73, "learning_rate": 3.6220702005871276e-06, "loss": 0.6702, "step": 6109 }, { "epoch": 0.73, "learning_rate": 3.619095539037355e-06, "loss": 0.75, "step": 6110 }, { "epoch": 0.73, "learning_rate": 3.616121829582919e-06, "loss": 0.7712, "step": 6111 }, { "epoch": 0.73, "learning_rate": 3.6131490726675254e-06, "loss": 0.6892, "step": 6112 }, { "epoch": 0.73, "learning_rate": 3.610177268734738e-06, "loss": 0.7294, "step": 6113 }, { "epoch": 0.73, "learning_rate": 3.607206418227984e-06, "loss": 0.7277, "step": 6114 }, { "epoch": 0.73, "learning_rate": 3.604236521590544e-06, "loss": 0.7388, "step": 6115 }, { "epoch": 0.73, "learning_rate": 3.6012675792655537e-06, "loss": 0.76, "step": 6116 }, { "epoch": 0.73, "learning_rate": 3.5982995916960106e-06, "loss": 0.7327, "step": 6117 }, { "epoch": 0.73, "learning_rate": 3.5953325593247657e-06, "loss": 0.7199, "step": 6118 }, { "epoch": 0.73, "learning_rate": 3.592366482594536e-06, "loss": 0.6802, "step": 6119 }, { "epoch": 0.73, "learning_rate": 3.5894013619478863e-06, "loss": 0.7045, "step": 6120 }, { "epoch": 0.73, "learning_rate": 3.586437197827244e-06, "loss": 0.8142, "step": 6121 }, { "epoch": 0.73, "learning_rate": 3.5834739906748904e-06, "loss": 0.7165, "step": 6122 }, { "epoch": 0.73, "learning_rate": 3.5805117409329637e-06, "loss": 0.7405, "step": 6123 }, { "epoch": 0.73, "learning_rate": 3.577550449043469e-06, "loss": 0.7472, "step": 6124 }, { "epoch": 0.73, "learning_rate": 3.5745901154482522e-06, "loss": 0.6858, "step": 6125 }, { "epoch": 0.73, "learning_rate": 3.571630740589036e-06, "loss": 0.7612, "step": 6126 }, { "epoch": 0.73, "learning_rate": 3.568672324907375e-06, "loss": 0.6964, "step": 6127 }, { "epoch": 0.73, "learning_rate": 3.5657148688447063e-06, "loss": 0.6367, "step": 6128 }, { "epoch": 0.73, "learning_rate": 3.5627583728423075e-06, "loss": 0.7388, "step": 6129 }, { "epoch": 0.73, "learning_rate": 3.559802837341315e-06, "loss": 0.7349, "step": 6130 }, { "epoch": 0.73, "learning_rate": 3.556848262782735e-06, "loss": 0.6998, "step": 6131 }, { "epoch": 0.73, "learning_rate": 3.5538946496074043e-06, "loss": 0.7467, "step": 6132 }, { "epoch": 0.73, "learning_rate": 3.5509419982560435e-06, "loss": 0.7054, "step": 6133 }, { "epoch": 0.73, "learning_rate": 3.547990309169215e-06, "loss": 0.6828, "step": 6134 }, { "epoch": 0.73, "learning_rate": 3.5450395827873363e-06, "loss": 0.6512, "step": 6135 }, { "epoch": 0.73, "learning_rate": 3.542089819550696e-06, "loss": 0.7461, "step": 6136 }, { "epoch": 0.73, "learning_rate": 3.5391410198994134e-06, "loss": 0.6869, "step": 6137 }, { "epoch": 0.73, "learning_rate": 3.536193184273493e-06, "loss": 0.7779, "step": 6138 }, { "epoch": 0.73, "learning_rate": 3.533246313112775e-06, "loss": 0.7969, "step": 6139 }, { "epoch": 0.73, "learning_rate": 3.53030040685696e-06, "loss": 0.7026, "step": 6140 }, { "epoch": 0.73, "learning_rate": 3.527355465945618e-06, "loss": 0.7282, "step": 6141 }, { "epoch": 0.73, "learning_rate": 3.524411490818149e-06, "loss": 0.7712, "step": 6142 }, { "epoch": 0.73, "learning_rate": 3.5214684819138346e-06, "loss": 0.7324, "step": 6143 }, { "epoch": 0.73, "learning_rate": 3.5185264396717943e-06, "loss": 0.7818, "step": 6144 }, { "epoch": 0.73, "learning_rate": 3.5155853645310178e-06, "loss": 0.7656, "step": 6145 }, { "epoch": 0.73, "learning_rate": 3.5126452569303394e-06, "loss": 0.6864, "step": 6146 }, { "epoch": 0.73, "learning_rate": 3.5097061173084522e-06, "loss": 0.7573, "step": 6147 }, { "epoch": 0.73, "learning_rate": 3.5067679461039072e-06, "loss": 0.7673, "step": 6148 }, { "epoch": 0.73, "learning_rate": 3.5038307437551032e-06, "loss": 0.7215, "step": 6149 }, { "epoch": 0.73, "learning_rate": 3.50089451070031e-06, "loss": 0.7344, "step": 6150 }, { "epoch": 0.73, "learning_rate": 3.4979592473776394e-06, "loss": 0.7154, "step": 6151 }, { "epoch": 0.73, "learning_rate": 3.49502495422506e-06, "loss": 0.7277, "step": 6152 }, { "epoch": 0.73, "learning_rate": 3.4920916316803998e-06, "loss": 0.7132, "step": 6153 }, { "epoch": 0.73, "learning_rate": 3.4891592801813367e-06, "loss": 0.7165, "step": 6154 }, { "epoch": 0.73, "learning_rate": 3.4862279001654143e-06, "loss": 0.6931, "step": 6155 }, { "epoch": 0.73, "learning_rate": 3.483297492070019e-06, "loss": 0.7176, "step": 6156 }, { "epoch": 0.73, "learning_rate": 3.480368056332398e-06, "loss": 0.726, "step": 6157 }, { "epoch": 0.73, "learning_rate": 3.477439593389651e-06, "loss": 0.7651, "step": 6158 }, { "epoch": 0.73, "learning_rate": 3.474512103678739e-06, "loss": 0.6763, "step": 6159 }, { "epoch": 0.73, "learning_rate": 3.471585587636469e-06, "loss": 0.7054, "step": 6160 }, { "epoch": 0.73, "learning_rate": 3.468660045699509e-06, "loss": 0.7377, "step": 6161 }, { "epoch": 0.73, "learning_rate": 3.4657354783043786e-06, "loss": 0.7026, "step": 6162 }, { "epoch": 0.74, "learning_rate": 3.462811885887448e-06, "loss": 0.731, "step": 6163 }, { "epoch": 0.74, "learning_rate": 3.459889268884955e-06, "loss": 0.7522, "step": 6164 }, { "epoch": 0.74, "learning_rate": 3.45696762773298e-06, "loss": 0.7366, "step": 6165 }, { "epoch": 0.74, "learning_rate": 3.45404696286746e-06, "loss": 0.654, "step": 6166 }, { "epoch": 0.74, "learning_rate": 3.45112727472419e-06, "loss": 0.7712, "step": 6167 }, { "epoch": 0.74, "learning_rate": 3.448208563738812e-06, "loss": 0.726, "step": 6168 }, { "epoch": 0.74, "learning_rate": 3.4452908303468336e-06, "loss": 0.6981, "step": 6169 }, { "epoch": 0.74, "learning_rate": 3.4423740749836065e-06, "loss": 0.7729, "step": 6170 }, { "epoch": 0.74, "learning_rate": 3.4394582980843416e-06, "loss": 0.7243, "step": 6171 }, { "epoch": 0.74, "learning_rate": 3.4365435000841018e-06, "loss": 0.7366, "step": 6172 }, { "epoch": 0.74, "learning_rate": 3.4336296814178003e-06, "loss": 0.7539, "step": 6173 }, { "epoch": 0.74, "learning_rate": 3.4307168425202154e-06, "loss": 0.7533, "step": 6174 }, { "epoch": 0.74, "learning_rate": 3.4278049838259643e-06, "loss": 0.7416, "step": 6175 }, { "epoch": 0.74, "learning_rate": 3.424894105769537e-06, "loss": 0.7093, "step": 6176 }, { "epoch": 0.74, "learning_rate": 3.421984208785253e-06, "loss": 0.7048, "step": 6177 }, { "epoch": 0.74, "learning_rate": 3.419075293307307e-06, "loss": 0.7567, "step": 6178 }, { "epoch": 0.74, "learning_rate": 3.4161673597697364e-06, "loss": 0.6981, "step": 6179 }, { "epoch": 0.74, "learning_rate": 3.413260408606429e-06, "loss": 0.7589, "step": 6180 }, { "epoch": 0.74, "learning_rate": 3.4103544402511435e-06, "loss": 0.6775, "step": 6181 }, { "epoch": 0.74, "learning_rate": 3.4074494551374647e-06, "loss": 0.7026, "step": 6182 }, { "epoch": 0.74, "learning_rate": 3.4045454536988566e-06, "loss": 0.6858, "step": 6183 }, { "epoch": 0.74, "learning_rate": 3.4016424363686206e-06, "loss": 0.7271, "step": 6184 }, { "epoch": 0.74, "learning_rate": 3.3987404035799155e-06, "loss": 0.7299, "step": 6185 }, { "epoch": 0.74, "learning_rate": 3.395839355765762e-06, "loss": 0.7706, "step": 6186 }, { "epoch": 0.74, "learning_rate": 3.392939293359013e-06, "loss": 0.697, "step": 6187 }, { "epoch": 0.74, "learning_rate": 3.3900402167923976e-06, "loss": 0.7015, "step": 6188 }, { "epoch": 0.74, "learning_rate": 3.3871421264984796e-06, "loss": 0.7065, "step": 6189 }, { "epoch": 0.74, "learning_rate": 3.384245022909689e-06, "loss": 0.7037, "step": 6190 }, { "epoch": 0.74, "learning_rate": 3.3813489064583027e-06, "loss": 0.7478, "step": 6191 }, { "epoch": 0.74, "learning_rate": 3.378453777576448e-06, "loss": 0.654, "step": 6192 }, { "epoch": 0.74, "learning_rate": 3.3755596366961074e-06, "loss": 0.7902, "step": 6193 }, { "epoch": 0.74, "learning_rate": 3.372666484249114e-06, "loss": 0.7796, "step": 6194 }, { "epoch": 0.74, "learning_rate": 3.3697743206671616e-06, "loss": 0.7645, "step": 6195 }, { "epoch": 0.74, "learning_rate": 3.3668831463817865e-06, "loss": 0.7115, "step": 6196 }, { "epoch": 0.74, "learning_rate": 3.3639929618243804e-06, "loss": 0.7059, "step": 6197 }, { "epoch": 0.74, "learning_rate": 3.3611037674261894e-06, "loss": 0.7338, "step": 6198 }, { "epoch": 0.74, "learning_rate": 3.358215563618306e-06, "loss": 0.7422, "step": 6199 }, { "epoch": 0.74, "learning_rate": 3.355328350831686e-06, "loss": 0.7037, "step": 6200 }, { "epoch": 0.74, "learning_rate": 3.3524421294971276e-06, "loss": 0.7288, "step": 6201 }, { "epoch": 0.74, "learning_rate": 3.3495569000452854e-06, "loss": 0.7533, "step": 6202 }, { "epoch": 0.74, "learning_rate": 3.3466726629066626e-06, "loss": 0.7263, "step": 6203 }, { "epoch": 0.74, "learning_rate": 3.3437894185116147e-06, "loss": 0.7148, "step": 6204 }, { "epoch": 0.74, "learning_rate": 3.340907167290357e-06, "loss": 0.6847, "step": 6205 }, { "epoch": 0.74, "learning_rate": 3.3380259096729485e-06, "loss": 0.7416, "step": 6206 }, { "epoch": 0.74, "learning_rate": 3.3351456460892983e-06, "loss": 0.7232, "step": 6207 }, { "epoch": 0.74, "learning_rate": 3.332266376969171e-06, "loss": 0.7807, "step": 6208 }, { "epoch": 0.74, "learning_rate": 3.329388102742188e-06, "loss": 0.7294, "step": 6209 }, { "epoch": 0.74, "learning_rate": 3.326510823837814e-06, "loss": 0.7338, "step": 6210 }, { "epoch": 0.74, "learning_rate": 3.323634540685364e-06, "loss": 0.7394, "step": 6211 }, { "epoch": 0.74, "learning_rate": 3.3207592537140186e-06, "loss": 0.7316, "step": 6212 }, { "epoch": 0.74, "learning_rate": 3.3178849633527865e-06, "loss": 0.6981, "step": 6213 }, { "epoch": 0.74, "learning_rate": 3.31501167003055e-06, "loss": 0.7746, "step": 6214 }, { "epoch": 0.74, "learning_rate": 3.312139374176032e-06, "loss": 0.7037, "step": 6215 }, { "epoch": 0.74, "learning_rate": 3.309268076217803e-06, "loss": 0.7182, "step": 6216 }, { "epoch": 0.74, "learning_rate": 3.3063977765843005e-06, "loss": 0.7695, "step": 6217 }, { "epoch": 0.74, "learning_rate": 3.3035284757037877e-06, "loss": 0.7433, "step": 6218 }, { "epoch": 0.74, "learning_rate": 3.300660174004405e-06, "loss": 0.6747, "step": 6219 }, { "epoch": 0.74, "learning_rate": 3.297792871914124e-06, "loss": 0.7589, "step": 6220 }, { "epoch": 0.74, "learning_rate": 3.2949265698607825e-06, "loss": 0.6964, "step": 6221 }, { "epoch": 0.74, "learning_rate": 3.2920612682720576e-06, "loss": 0.7701, "step": 6222 }, { "epoch": 0.74, "learning_rate": 3.289196967575482e-06, "loss": 0.7573, "step": 6223 }, { "epoch": 0.74, "learning_rate": 3.286333668198438e-06, "loss": 0.7048, "step": 6224 }, { "epoch": 0.74, "learning_rate": 3.2834713705681555e-06, "loss": 0.7506, "step": 6225 }, { "epoch": 0.74, "learning_rate": 3.2806100751117243e-06, "loss": 0.7243, "step": 6226 }, { "epoch": 0.74, "learning_rate": 3.2777497822560754e-06, "loss": 0.7137, "step": 6227 }, { "epoch": 0.74, "learning_rate": 3.2748904924279935e-06, "loss": 0.7238, "step": 6228 }, { "epoch": 0.74, "learning_rate": 3.2720322060541143e-06, "loss": 0.7528, "step": 6229 }, { "epoch": 0.74, "learning_rate": 3.269174923560918e-06, "loss": 0.7282, "step": 6230 }, { "epoch": 0.74, "learning_rate": 3.2663186453747487e-06, "loss": 0.6925, "step": 6231 }, { "epoch": 0.74, "learning_rate": 3.2634633719217857e-06, "loss": 0.7656, "step": 6232 }, { "epoch": 0.74, "learning_rate": 3.2606091036280676e-06, "loss": 0.716, "step": 6233 }, { "epoch": 0.74, "learning_rate": 3.2577558409194787e-06, "loss": 0.7087, "step": 6234 }, { "epoch": 0.74, "learning_rate": 3.2549035842217514e-06, "loss": 0.7031, "step": 6235 }, { "epoch": 0.74, "learning_rate": 3.252052333960477e-06, "loss": 0.7511, "step": 6236 }, { "epoch": 0.74, "learning_rate": 3.249202090561089e-06, "loss": 0.7494, "step": 6237 }, { "epoch": 0.74, "learning_rate": 3.2463528544488722e-06, "loss": 0.7662, "step": 6238 }, { "epoch": 0.74, "learning_rate": 3.243504626048957e-06, "loss": 0.7048, "step": 6239 }, { "epoch": 0.74, "learning_rate": 3.240657405786335e-06, "loss": 0.7266, "step": 6240 }, { "epoch": 0.74, "learning_rate": 3.237811194085836e-06, "loss": 0.7327, "step": 6241 }, { "epoch": 0.74, "learning_rate": 3.2349659913721455e-06, "loss": 0.7009, "step": 6242 }, { "epoch": 0.74, "learning_rate": 3.232121798069795e-06, "loss": 0.7416, "step": 6243 }, { "epoch": 0.74, "learning_rate": 3.2292786146031653e-06, "loss": 0.7706, "step": 6244 }, { "epoch": 0.74, "learning_rate": 3.226436441396491e-06, "loss": 0.7427, "step": 6245 }, { "epoch": 0.74, "learning_rate": 3.2235952788738534e-06, "loss": 0.7489, "step": 6246 }, { "epoch": 0.75, "learning_rate": 3.2207551274591817e-06, "loss": 0.7472, "step": 6247 }, { "epoch": 0.75, "learning_rate": 3.2179159875762532e-06, "loss": 0.7333, "step": 6248 }, { "epoch": 0.75, "learning_rate": 3.2150778596486953e-06, "loss": 0.6959, "step": 6249 }, { "epoch": 0.75, "learning_rate": 3.2122407440999913e-06, "loss": 0.7662, "step": 6250 }, { "epoch": 0.75, "learning_rate": 3.209404641353461e-06, "loss": 0.6964, "step": 6251 }, { "epoch": 0.75, "learning_rate": 3.2065695518322883e-06, "loss": 0.7416, "step": 6252 }, { "epoch": 0.75, "learning_rate": 3.203735475959484e-06, "loss": 0.8052, "step": 6253 }, { "epoch": 0.75, "learning_rate": 3.2009024141579325e-06, "loss": 0.7031, "step": 6254 }, { "epoch": 0.75, "learning_rate": 3.198070366850351e-06, "loss": 0.7243, "step": 6255 }, { "epoch": 0.75, "learning_rate": 3.195239334459306e-06, "loss": 0.7227, "step": 6256 }, { "epoch": 0.75, "learning_rate": 3.192409317407226e-06, "loss": 0.7182, "step": 6257 }, { "epoch": 0.75, "learning_rate": 3.189580316116364e-06, "loss": 0.6769, "step": 6258 }, { "epoch": 0.75, "learning_rate": 3.186752331008848e-06, "loss": 0.7874, "step": 6259 }, { "epoch": 0.75, "learning_rate": 3.183925362506636e-06, "loss": 0.7439, "step": 6260 }, { "epoch": 0.75, "learning_rate": 3.1810994110315376e-06, "loss": 0.6373, "step": 6261 }, { "epoch": 0.75, "learning_rate": 3.1782744770052243e-06, "loss": 0.7433, "step": 6262 }, { "epoch": 0.75, "learning_rate": 3.1754505608491905e-06, "loss": 0.7188, "step": 6263 }, { "epoch": 0.75, "learning_rate": 3.1726276629848042e-06, "loss": 0.7076, "step": 6264 }, { "epoch": 0.75, "learning_rate": 3.1698057838332653e-06, "loss": 0.7467, "step": 6265 }, { "epoch": 0.75, "learning_rate": 3.1669849238156237e-06, "loss": 0.7176, "step": 6266 }, { "epoch": 0.75, "learning_rate": 3.1641650833527903e-06, "loss": 0.7338, "step": 6267 }, { "epoch": 0.75, "learning_rate": 3.1613462628655012e-06, "loss": 0.6908, "step": 6268 }, { "epoch": 0.75, "learning_rate": 3.158528462774362e-06, "loss": 0.7199, "step": 6269 }, { "epoch": 0.75, "learning_rate": 3.155711683499809e-06, "loss": 0.6367, "step": 6270 }, { "epoch": 0.75, "learning_rate": 3.152895925462144e-06, "loss": 0.798, "step": 6271 }, { "epoch": 0.75, "learning_rate": 3.1500811890815006e-06, "loss": 0.7461, "step": 6272 }, { "epoch": 0.75, "learning_rate": 3.1472674747778675e-06, "loss": 0.7539, "step": 6273 }, { "epoch": 0.75, "learning_rate": 3.144454782971078e-06, "loss": 0.6987, "step": 6274 }, { "epoch": 0.75, "learning_rate": 3.141643114080811e-06, "loss": 0.702, "step": 6275 }, { "epoch": 0.75, "learning_rate": 3.1388324685266037e-06, "loss": 0.7059, "step": 6276 }, { "epoch": 0.75, "learning_rate": 3.1360228467278277e-06, "loss": 0.7478, "step": 6277 }, { "epoch": 0.75, "learning_rate": 3.1332142491037067e-06, "loss": 0.692, "step": 6278 }, { "epoch": 0.75, "learning_rate": 3.1304066760733143e-06, "loss": 0.7349, "step": 6279 }, { "epoch": 0.75, "learning_rate": 3.1276001280555636e-06, "loss": 0.6869, "step": 6280 }, { "epoch": 0.75, "learning_rate": 3.124794605469227e-06, "loss": 0.7863, "step": 6281 }, { "epoch": 0.75, "learning_rate": 3.121990108732913e-06, "loss": 0.685, "step": 6282 }, { "epoch": 0.75, "learning_rate": 3.1191866382650804e-06, "loss": 0.7439, "step": 6283 }, { "epoch": 0.75, "learning_rate": 3.1163841944840336e-06, "loss": 0.75, "step": 6284 }, { "epoch": 0.75, "learning_rate": 3.1135827778079308e-06, "loss": 0.6652, "step": 6285 }, { "epoch": 0.75, "learning_rate": 3.1107823886547696e-06, "loss": 0.7081, "step": 6286 }, { "epoch": 0.75, "learning_rate": 3.107983027442395e-06, "loss": 0.726, "step": 6287 }, { "epoch": 0.75, "learning_rate": 3.1051846945885e-06, "loss": 0.7511, "step": 6288 }, { "epoch": 0.75, "learning_rate": 3.1023873905106215e-06, "loss": 0.784, "step": 6289 }, { "epoch": 0.75, "learning_rate": 3.0995911156261517e-06, "loss": 0.697, "step": 6290 }, { "epoch": 0.75, "learning_rate": 3.0967958703523206e-06, "loss": 0.6881, "step": 6291 }, { "epoch": 0.75, "learning_rate": 3.0940016551062058e-06, "loss": 0.7578, "step": 6292 }, { "epoch": 0.75, "learning_rate": 3.0912084703047317e-06, "loss": 0.7266, "step": 6293 }, { "epoch": 0.75, "learning_rate": 3.0884163163646687e-06, "loss": 0.7171, "step": 6294 }, { "epoch": 0.75, "learning_rate": 3.085625193702639e-06, "loss": 0.7243, "step": 6295 }, { "epoch": 0.75, "learning_rate": 3.0828351027351043e-06, "loss": 0.7316, "step": 6296 }, { "epoch": 0.75, "learning_rate": 3.080046043878374e-06, "loss": 0.7193, "step": 6297 }, { "epoch": 0.75, "learning_rate": 3.077258017548603e-06, "loss": 0.7098, "step": 6298 }, { "epoch": 0.75, "learning_rate": 3.0744710241617904e-06, "loss": 0.7271, "step": 6299 }, { "epoch": 0.75, "learning_rate": 3.0716850641337903e-06, "loss": 0.7394, "step": 6300 }, { "epoch": 0.75, "learning_rate": 3.0689001378802895e-06, "loss": 0.7656, "step": 6301 }, { "epoch": 0.75, "learning_rate": 3.066116245816836e-06, "loss": 0.7673, "step": 6302 }, { "epoch": 0.75, "learning_rate": 3.0633333883588035e-06, "loss": 0.7355, "step": 6303 }, { "epoch": 0.75, "learning_rate": 3.0605515659214303e-06, "loss": 0.7249, "step": 6304 }, { "epoch": 0.75, "learning_rate": 3.0577707789197895e-06, "loss": 0.7355, "step": 6305 }, { "epoch": 0.75, "learning_rate": 3.0549910277688e-06, "loss": 0.7076, "step": 6306 }, { "epoch": 0.75, "learning_rate": 3.052212312883237e-06, "loss": 0.7121, "step": 6307 }, { "epoch": 0.75, "learning_rate": 3.0494346346777026e-06, "loss": 0.7991, "step": 6308 }, { "epoch": 0.75, "learning_rate": 3.0466579935666616e-06, "loss": 0.7215, "step": 6309 }, { "epoch": 0.75, "learning_rate": 3.0438823899644145e-06, "loss": 0.7087, "step": 6310 }, { "epoch": 0.75, "learning_rate": 3.0411078242851066e-06, "loss": 0.7215, "step": 6311 }, { "epoch": 0.75, "learning_rate": 3.0383342969427397e-06, "loss": 0.7009, "step": 6312 }, { "epoch": 0.75, "learning_rate": 3.0355618083511394e-06, "loss": 0.736, "step": 6313 }, { "epoch": 0.75, "learning_rate": 3.0327903589240003e-06, "loss": 0.7126, "step": 6314 }, { "epoch": 0.75, "learning_rate": 3.0300199490748426e-06, "loss": 0.683, "step": 6315 }, { "epoch": 0.75, "learning_rate": 3.027250579217046e-06, "loss": 0.7026, "step": 6316 }, { "epoch": 0.75, "learning_rate": 3.0244822497638284e-06, "loss": 0.6814, "step": 6317 }, { "epoch": 0.75, "learning_rate": 3.0217149611282427e-06, "loss": 0.7243, "step": 6318 }, { "epoch": 0.75, "learning_rate": 3.0189487137232065e-06, "loss": 0.6931, "step": 6319 }, { "epoch": 0.75, "learning_rate": 3.0161835079614654e-06, "loss": 0.683, "step": 6320 }, { "epoch": 0.75, "learning_rate": 3.0134193442556215e-06, "loss": 0.7377, "step": 6321 }, { "epoch": 0.75, "learning_rate": 3.0106562230181137e-06, "loss": 0.7433, "step": 6322 }, { "epoch": 0.75, "learning_rate": 3.0078941446612273e-06, "loss": 0.8114, "step": 6323 }, { "epoch": 0.75, "learning_rate": 3.0051331095970925e-06, "loss": 0.76, "step": 6324 }, { "epoch": 0.75, "learning_rate": 3.0023731182376803e-06, "loss": 0.7573, "step": 6325 }, { "epoch": 0.75, "learning_rate": 2.9996141709948144e-06, "loss": 0.7411, "step": 6326 }, { "epoch": 0.75, "learning_rate": 2.9968562682801572e-06, "loss": 0.6853, "step": 6327 }, { "epoch": 0.75, "learning_rate": 2.9940994105052124e-06, "loss": 0.7461, "step": 6328 }, { "epoch": 0.75, "learning_rate": 2.9913435980813334e-06, "loss": 0.7494, "step": 6329 }, { "epoch": 0.75, "learning_rate": 2.98858883141971e-06, "loss": 0.7779, "step": 6330 }, { "epoch": 0.76, "learning_rate": 2.985835110931389e-06, "loss": 0.7439, "step": 6331 }, { "epoch": 0.76, "learning_rate": 2.9830824370272503e-06, "loss": 0.7662, "step": 6332 }, { "epoch": 0.76, "learning_rate": 2.9803308101180195e-06, "loss": 0.7372, "step": 6333 }, { "epoch": 0.76, "learning_rate": 2.9775802306142655e-06, "loss": 0.6869, "step": 6334 }, { "epoch": 0.76, "learning_rate": 2.9748306989264063e-06, "loss": 0.7695, "step": 6335 }, { "epoch": 0.76, "learning_rate": 2.972082215464699e-06, "loss": 0.7656, "step": 6336 }, { "epoch": 0.76, "learning_rate": 2.969334780639245e-06, "loss": 0.7288, "step": 6337 }, { "epoch": 0.76, "learning_rate": 2.966588394859987e-06, "loss": 0.7338, "step": 6338 }, { "epoch": 0.76, "learning_rate": 2.9638430585367127e-06, "loss": 0.6484, "step": 6339 }, { "epoch": 0.76, "learning_rate": 2.9610987720790596e-06, "loss": 0.7098, "step": 6340 }, { "epoch": 0.76, "learning_rate": 2.958355535896499e-06, "loss": 0.6953, "step": 6341 }, { "epoch": 0.76, "learning_rate": 2.9556133503983508e-06, "loss": 0.7366, "step": 6342 }, { "epoch": 0.76, "learning_rate": 2.952872215993775e-06, "loss": 0.7154, "step": 6343 }, { "epoch": 0.76, "learning_rate": 2.9501321330917755e-06, "loss": 0.7215, "step": 6344 }, { "epoch": 0.76, "learning_rate": 2.947393102101205e-06, "loss": 0.7037, "step": 6345 }, { "epoch": 0.76, "learning_rate": 2.9446551234307488e-06, "loss": 0.685, "step": 6346 }, { "epoch": 0.76, "learning_rate": 2.9419181974889498e-06, "loss": 0.7193, "step": 6347 }, { "epoch": 0.76, "learning_rate": 2.9391823246841765e-06, "loss": 0.7372, "step": 6348 }, { "epoch": 0.76, "learning_rate": 2.936447505424648e-06, "loss": 0.683, "step": 6349 }, { "epoch": 0.76, "learning_rate": 2.9337137401184337e-06, "loss": 0.7188, "step": 6350 }, { "epoch": 0.76, "learning_rate": 2.930981029173433e-06, "loss": 0.7048, "step": 6351 }, { "epoch": 0.76, "learning_rate": 2.9282493729974013e-06, "loss": 0.6825, "step": 6352 }, { "epoch": 0.76, "learning_rate": 2.9255187719979206e-06, "loss": 0.7227, "step": 6353 }, { "epoch": 0.76, "learning_rate": 2.92278922658243e-06, "loss": 0.7729, "step": 6354 }, { "epoch": 0.76, "learning_rate": 2.9200607371582024e-06, "loss": 0.7143, "step": 6355 }, { "epoch": 0.76, "learning_rate": 2.917333304132355e-06, "loss": 0.7545, "step": 6356 }, { "epoch": 0.76, "learning_rate": 2.9146069279118562e-06, "loss": 0.7528, "step": 6357 }, { "epoch": 0.76, "learning_rate": 2.9118816089034964e-06, "loss": 0.7606, "step": 6358 }, { "epoch": 0.76, "learning_rate": 2.90915734751393e-06, "loss": 0.7455, "step": 6359 }, { "epoch": 0.76, "learning_rate": 2.9064341441496415e-06, "loss": 0.7483, "step": 6360 }, { "epoch": 0.76, "learning_rate": 2.903711999216957e-06, "loss": 0.6373, "step": 6361 }, { "epoch": 0.76, "learning_rate": 2.900990913122058e-06, "loss": 0.6869, "step": 6362 }, { "epoch": 0.76, "learning_rate": 2.8982708862709454e-06, "loss": 0.755, "step": 6363 }, { "epoch": 0.76, "learning_rate": 2.8955519190694826e-06, "loss": 0.7366, "step": 6364 }, { "epoch": 0.76, "learning_rate": 2.8928340119233624e-06, "loss": 0.7048, "step": 6365 }, { "epoch": 0.76, "learning_rate": 2.890117165238129e-06, "loss": 0.7109, "step": 6366 }, { "epoch": 0.76, "learning_rate": 2.8874013794191603e-06, "loss": 0.6819, "step": 6367 }, { "epoch": 0.76, "learning_rate": 2.88468665487168e-06, "loss": 0.7266, "step": 6368 }, { "epoch": 0.76, "learning_rate": 2.881972992000752e-06, "loss": 0.7188, "step": 6369 }, { "epoch": 0.76, "learning_rate": 2.879260391211278e-06, "loss": 0.8019, "step": 6370 }, { "epoch": 0.76, "learning_rate": 2.876548852908013e-06, "loss": 0.7567, "step": 6371 }, { "epoch": 0.76, "learning_rate": 2.8738383774955436e-06, "loss": 0.697, "step": 6372 }, { "epoch": 0.76, "learning_rate": 2.871128965378297e-06, "loss": 0.7773, "step": 6373 }, { "epoch": 0.76, "learning_rate": 2.8684206169605465e-06, "loss": 0.6624, "step": 6374 }, { "epoch": 0.76, "learning_rate": 2.865713332646404e-06, "loss": 0.7455, "step": 6375 }, { "epoch": 0.76, "learning_rate": 2.863007112839825e-06, "loss": 0.7985, "step": 6376 }, { "epoch": 0.76, "learning_rate": 2.8603019579446067e-06, "loss": 0.6964, "step": 6377 }, { "epoch": 0.76, "learning_rate": 2.8575978683643824e-06, "loss": 0.6585, "step": 6378 }, { "epoch": 0.76, "learning_rate": 2.8548948445026305e-06, "loss": 0.6579, "step": 6379 }, { "epoch": 0.76, "learning_rate": 2.852192886762667e-06, "loss": 0.7511, "step": 6380 }, { "epoch": 0.76, "learning_rate": 2.849491995547656e-06, "loss": 0.7026, "step": 6381 }, { "epoch": 0.76, "learning_rate": 2.846792171260596e-06, "loss": 0.7617, "step": 6382 }, { "epoch": 0.76, "learning_rate": 2.8440934143043263e-06, "loss": 0.7321, "step": 6383 }, { "epoch": 0.76, "learning_rate": 2.8413957250815283e-06, "loss": 0.7182, "step": 6384 }, { "epoch": 0.76, "learning_rate": 2.8386991039947274e-06, "loss": 0.7634, "step": 6385 }, { "epoch": 0.76, "learning_rate": 2.8360035514462867e-06, "loss": 0.7483, "step": 6386 }, { "epoch": 0.76, "learning_rate": 2.833309067838408e-06, "loss": 0.7729, "step": 6387 }, { "epoch": 0.76, "learning_rate": 2.8306156535731355e-06, "loss": 0.7059, "step": 6388 }, { "epoch": 0.76, "learning_rate": 2.8279233090523515e-06, "loss": 0.726, "step": 6389 }, { "epoch": 0.76, "learning_rate": 2.825232034677786e-06, "loss": 0.7126, "step": 6390 }, { "epoch": 0.76, "learning_rate": 2.822541830851002e-06, "loss": 0.7729, "step": 6391 }, { "epoch": 0.76, "learning_rate": 2.8198526979734053e-06, "loss": 0.644, "step": 6392 }, { "epoch": 0.76, "learning_rate": 2.8171646364462415e-06, "loss": 0.6797, "step": 6393 }, { "epoch": 0.76, "learning_rate": 2.8144776466705925e-06, "loss": 0.7483, "step": 6394 }, { "epoch": 0.76, "learning_rate": 2.811791729047392e-06, "loss": 0.6574, "step": 6395 }, { "epoch": 0.76, "learning_rate": 2.809106883977398e-06, "loss": 0.7584, "step": 6396 }, { "epoch": 0.76, "learning_rate": 2.806423111861227e-06, "loss": 0.7059, "step": 6397 }, { "epoch": 0.76, "learning_rate": 2.803740413099313e-06, "loss": 0.7651, "step": 6398 }, { "epoch": 0.76, "learning_rate": 2.8010587880919503e-06, "loss": 0.7015, "step": 6399 }, { "epoch": 0.76, "learning_rate": 2.798378237239261e-06, "loss": 0.7316, "step": 6400 }, { "epoch": 0.76, "learning_rate": 2.7956987609412077e-06, "loss": 0.7338, "step": 6401 }, { "epoch": 0.76, "learning_rate": 2.7930203595976013e-06, "loss": 0.7455, "step": 6402 }, { "epoch": 0.76, "learning_rate": 2.7903430336080828e-06, "loss": 0.7545, "step": 6403 }, { "epoch": 0.76, "learning_rate": 2.787666783372137e-06, "loss": 0.7165, "step": 6404 }, { "epoch": 0.76, "learning_rate": 2.7849916092890872e-06, "loss": 0.764, "step": 6405 }, { "epoch": 0.76, "learning_rate": 2.7823175117580925e-06, "loss": 0.7204, "step": 6406 }, { "epoch": 0.76, "learning_rate": 2.779644491178163e-06, "loss": 0.7299, "step": 6407 }, { "epoch": 0.76, "learning_rate": 2.776972547948137e-06, "loss": 0.7126, "step": 6408 }, { "epoch": 0.76, "learning_rate": 2.7743016824666934e-06, "loss": 0.7254, "step": 6409 }, { "epoch": 0.76, "learning_rate": 2.771631895132354e-06, "loss": 0.7087, "step": 6410 }, { "epoch": 0.76, "learning_rate": 2.768963186343475e-06, "loss": 0.7433, "step": 6411 }, { "epoch": 0.76, "learning_rate": 2.766295556498261e-06, "loss": 0.7243, "step": 6412 }, { "epoch": 0.76, "learning_rate": 2.7636290059947447e-06, "loss": 0.7746, "step": 6413 }, { "epoch": 0.76, "learning_rate": 2.760963535230803e-06, "loss": 0.7316, "step": 6414 }, { "epoch": 0.77, "learning_rate": 2.7582991446041486e-06, "loss": 0.7015, "step": 6415 }, { "epoch": 0.77, "learning_rate": 2.755635834512341e-06, "loss": 0.7059, "step": 6416 }, { "epoch": 0.77, "learning_rate": 2.752973605352771e-06, "loss": 0.7282, "step": 6417 }, { "epoch": 0.77, "learning_rate": 2.7503124575226692e-06, "loss": 0.6975, "step": 6418 }, { "epoch": 0.77, "learning_rate": 2.7476523914191057e-06, "loss": 0.7299, "step": 6419 }, { "epoch": 0.77, "learning_rate": 2.744993407438985e-06, "loss": 0.726, "step": 6420 }, { "epoch": 0.77, "learning_rate": 2.7423355059790624e-06, "loss": 0.7573, "step": 6421 }, { "epoch": 0.77, "learning_rate": 2.7396786874359205e-06, "loss": 0.7662, "step": 6422 }, { "epoch": 0.77, "learning_rate": 2.737022952205982e-06, "loss": 0.8097, "step": 6423 }, { "epoch": 0.77, "learning_rate": 2.7343683006855103e-06, "loss": 0.7232, "step": 6424 }, { "epoch": 0.77, "learning_rate": 2.731714733270603e-06, "loss": 0.7617, "step": 6425 }, { "epoch": 0.77, "learning_rate": 2.729062250357204e-06, "loss": 0.6702, "step": 6426 }, { "epoch": 0.77, "learning_rate": 2.726410852341087e-06, "loss": 0.7394, "step": 6427 }, { "epoch": 0.77, "learning_rate": 2.7237605396178747e-06, "loss": 0.7305, "step": 6428 }, { "epoch": 0.77, "learning_rate": 2.721111312583008e-06, "loss": 0.7612, "step": 6429 }, { "epoch": 0.77, "learning_rate": 2.718463171631789e-06, "loss": 0.7835, "step": 6430 }, { "epoch": 0.77, "learning_rate": 2.7158161171593432e-06, "loss": 0.7299, "step": 6431 }, { "epoch": 0.77, "learning_rate": 2.7131701495606343e-06, "loss": 0.7254, "step": 6432 }, { "epoch": 0.77, "learning_rate": 2.7105252692304775e-06, "loss": 0.7121, "step": 6433 }, { "epoch": 0.77, "learning_rate": 2.707881476563502e-06, "loss": 0.6981, "step": 6434 }, { "epoch": 0.77, "learning_rate": 2.7052387719541996e-06, "loss": 0.7042, "step": 6435 }, { "epoch": 0.77, "learning_rate": 2.7025971557968832e-06, "loss": 0.7656, "step": 6436 }, { "epoch": 0.77, "learning_rate": 2.699956628485707e-06, "loss": 0.7321, "step": 6437 }, { "epoch": 0.77, "learning_rate": 2.6973171904146733e-06, "loss": 0.721, "step": 6438 }, { "epoch": 0.77, "learning_rate": 2.6946788419776006e-06, "loss": 0.7098, "step": 6439 }, { "epoch": 0.77, "learning_rate": 2.6920415835681647e-06, "loss": 0.6942, "step": 6440 }, { "epoch": 0.77, "learning_rate": 2.689405415579871e-06, "loss": 0.7098, "step": 6441 }, { "epoch": 0.77, "learning_rate": 2.6867703384060575e-06, "loss": 0.7305, "step": 6442 }, { "epoch": 0.77, "learning_rate": 2.6841363524399133e-06, "loss": 0.774, "step": 6443 }, { "epoch": 0.77, "learning_rate": 2.6815034580744437e-06, "loss": 0.7394, "step": 6444 }, { "epoch": 0.77, "learning_rate": 2.678871655702514e-06, "loss": 0.6992, "step": 6445 }, { "epoch": 0.77, "learning_rate": 2.6762409457168072e-06, "loss": 0.7394, "step": 6446 }, { "epoch": 0.77, "learning_rate": 2.6736113285098585e-06, "loss": 0.7411, "step": 6447 }, { "epoch": 0.77, "learning_rate": 2.6709828044740304e-06, "loss": 0.7372, "step": 6448 }, { "epoch": 0.77, "learning_rate": 2.6683553740015266e-06, "loss": 0.7154, "step": 6449 }, { "epoch": 0.77, "learning_rate": 2.6657290374843838e-06, "loss": 0.7249, "step": 6450 }, { "epoch": 0.77, "learning_rate": 2.6631037953144765e-06, "loss": 0.7031, "step": 6451 }, { "epoch": 0.77, "learning_rate": 2.6604796478835224e-06, "loss": 0.7227, "step": 6452 }, { "epoch": 0.77, "learning_rate": 2.6578565955830693e-06, "loss": 0.7706, "step": 6453 }, { "epoch": 0.77, "learning_rate": 2.6552346388045014e-06, "loss": 0.7316, "step": 6454 }, { "epoch": 0.77, "learning_rate": 2.6526137779390425e-06, "loss": 0.7377, "step": 6455 }, { "epoch": 0.77, "learning_rate": 2.649994013377747e-06, "loss": 0.7561, "step": 6456 }, { "epoch": 0.77, "learning_rate": 2.647375345511517e-06, "loss": 0.7494, "step": 6457 }, { "epoch": 0.77, "learning_rate": 2.6447577747310813e-06, "loss": 0.702, "step": 6458 }, { "epoch": 0.77, "learning_rate": 2.642141301427009e-06, "loss": 0.7249, "step": 6459 }, { "epoch": 0.77, "learning_rate": 2.639525925989699e-06, "loss": 0.76, "step": 6460 }, { "epoch": 0.77, "learning_rate": 2.636911648809398e-06, "loss": 0.7104, "step": 6461 }, { "epoch": 0.77, "learning_rate": 2.634298470276182e-06, "loss": 0.7115, "step": 6462 }, { "epoch": 0.77, "learning_rate": 2.6316863907799608e-06, "loss": 0.7411, "step": 6463 }, { "epoch": 0.77, "learning_rate": 2.6290754107104844e-06, "loss": 0.7662, "step": 6464 }, { "epoch": 0.77, "learning_rate": 2.6264655304573337e-06, "loss": 0.7227, "step": 6465 }, { "epoch": 0.77, "learning_rate": 2.6238567504099356e-06, "loss": 0.7506, "step": 6466 }, { "epoch": 0.77, "learning_rate": 2.621249070957543e-06, "loss": 0.7734, "step": 6467 }, { "epoch": 0.77, "learning_rate": 2.6186424924892494e-06, "loss": 0.7037, "step": 6468 }, { "epoch": 0.77, "learning_rate": 2.616037015393982e-06, "loss": 0.707, "step": 6469 }, { "epoch": 0.77, "learning_rate": 2.6134326400604994e-06, "loss": 0.6981, "step": 6470 }, { "epoch": 0.77, "learning_rate": 2.610829366877409e-06, "loss": 0.6998, "step": 6471 }, { "epoch": 0.77, "learning_rate": 2.608227196233142e-06, "loss": 0.736, "step": 6472 }, { "epoch": 0.77, "learning_rate": 2.6056261285159667e-06, "loss": 0.716, "step": 6473 }, { "epoch": 0.77, "learning_rate": 2.603026164113991e-06, "loss": 0.7037, "step": 6474 }, { "epoch": 0.77, "learning_rate": 2.6004273034151518e-06, "loss": 0.6741, "step": 6475 }, { "epoch": 0.77, "learning_rate": 2.597829546807231e-06, "loss": 0.74, "step": 6476 }, { "epoch": 0.77, "learning_rate": 2.595232894677835e-06, "loss": 0.8075, "step": 6477 }, { "epoch": 0.77, "learning_rate": 2.5926373474144185e-06, "loss": 0.7746, "step": 6478 }, { "epoch": 0.77, "learning_rate": 2.590042905404252e-06, "loss": 0.7584, "step": 6479 }, { "epoch": 0.77, "learning_rate": 2.5874495690344612e-06, "loss": 0.7706, "step": 6480 }, { "epoch": 0.77, "learning_rate": 2.5848573386919963e-06, "loss": 0.716, "step": 6481 }, { "epoch": 0.77, "learning_rate": 2.5822662147636378e-06, "loss": 0.6574, "step": 6482 }, { "epoch": 0.77, "learning_rate": 2.5796761976360205e-06, "loss": 0.7305, "step": 6483 }, { "epoch": 0.77, "learning_rate": 2.5770872876955877e-06, "loss": 0.6931, "step": 6484 }, { "epoch": 0.77, "learning_rate": 2.574499485328639e-06, "loss": 0.7383, "step": 6485 }, { "epoch": 0.77, "learning_rate": 2.571912790921297e-06, "loss": 0.6819, "step": 6486 }, { "epoch": 0.77, "learning_rate": 2.5693272048595217e-06, "loss": 0.7388, "step": 6487 }, { "epoch": 0.77, "learning_rate": 2.566742727529117e-06, "loss": 0.6842, "step": 6488 }, { "epoch": 0.77, "learning_rate": 2.564159359315701e-06, "loss": 0.784, "step": 6489 }, { "epoch": 0.77, "learning_rate": 2.5615771006047465e-06, "loss": 0.7506, "step": 6490 }, { "epoch": 0.77, "learning_rate": 2.5589959517815478e-06, "loss": 0.755, "step": 6491 }, { "epoch": 0.77, "learning_rate": 2.5564159132312428e-06, "loss": 0.7483, "step": 6492 }, { "epoch": 0.77, "learning_rate": 2.5538369853388003e-06, "loss": 0.6786, "step": 6493 }, { "epoch": 0.77, "learning_rate": 2.551259168489013e-06, "loss": 0.822, "step": 6494 }, { "epoch": 0.77, "learning_rate": 2.5486824630665262e-06, "loss": 0.6992, "step": 6495 }, { "epoch": 0.77, "learning_rate": 2.5461068694558057e-06, "loss": 0.7215, "step": 6496 }, { "epoch": 0.77, "learning_rate": 2.54353238804116e-06, "loss": 0.6825, "step": 6497 }, { "epoch": 0.77, "learning_rate": 2.5409590192067256e-06, "loss": 0.7333, "step": 6498 }, { "epoch": 0.78, "learning_rate": 2.5383867633364754e-06, "loss": 0.736, "step": 6499 }, { "epoch": 0.78, "learning_rate": 2.5358156208142158e-06, "loss": 0.76, "step": 6500 }, { "epoch": 0.78, "learning_rate": 2.5332455920235843e-06, "loss": 0.736, "step": 6501 }, { "epoch": 0.78, "learning_rate": 2.530676677348061e-06, "loss": 0.7232, "step": 6502 }, { "epoch": 0.78, "learning_rate": 2.5281088771709494e-06, "loss": 0.7327, "step": 6503 }, { "epoch": 0.78, "learning_rate": 2.525542191875393e-06, "loss": 0.7271, "step": 6504 }, { "epoch": 0.78, "learning_rate": 2.5229766218443674e-06, "loss": 0.7517, "step": 6505 }, { "epoch": 0.78, "learning_rate": 2.5204121674606773e-06, "loss": 0.8198, "step": 6506 }, { "epoch": 0.78, "learning_rate": 2.5178488291069725e-06, "loss": 0.6819, "step": 6507 }, { "epoch": 0.78, "learning_rate": 2.5152866071657246e-06, "loss": 0.7377, "step": 6508 }, { "epoch": 0.78, "learning_rate": 2.512725502019243e-06, "loss": 0.7383, "step": 6509 }, { "epoch": 0.78, "learning_rate": 2.5101655140496685e-06, "loss": 0.6551, "step": 6510 }, { "epoch": 0.78, "learning_rate": 2.507606643638982e-06, "loss": 0.7059, "step": 6511 }, { "epoch": 0.78, "learning_rate": 2.5050488911689917e-06, "loss": 0.7494, "step": 6512 }, { "epoch": 0.78, "learning_rate": 2.5024922570213384e-06, "loss": 0.7171, "step": 6513 }, { "epoch": 0.78, "learning_rate": 2.499936741577498e-06, "loss": 0.7751, "step": 6514 }, { "epoch": 0.78, "learning_rate": 2.497382345218776e-06, "loss": 0.7478, "step": 6515 }, { "epoch": 0.78, "learning_rate": 2.49482906832632e-06, "loss": 0.7009, "step": 6516 }, { "epoch": 0.78, "learning_rate": 2.4922769112811028e-06, "loss": 0.7266, "step": 6517 }, { "epoch": 0.78, "learning_rate": 2.4897258744639306e-06, "loss": 0.7282, "step": 6518 }, { "epoch": 0.78, "learning_rate": 2.4871759582554456e-06, "loss": 0.7199, "step": 6519 }, { "epoch": 0.78, "learning_rate": 2.4846271630361165e-06, "loss": 0.7472, "step": 6520 }, { "epoch": 0.78, "learning_rate": 2.4820794891862544e-06, "loss": 0.7561, "step": 6521 }, { "epoch": 0.78, "learning_rate": 2.4795329370859943e-06, "loss": 0.7115, "step": 6522 }, { "epoch": 0.78, "learning_rate": 2.476987507115316e-06, "loss": 0.7511, "step": 6523 }, { "epoch": 0.78, "learning_rate": 2.474443199654013e-06, "loss": 0.7651, "step": 6524 }, { "epoch": 0.78, "learning_rate": 2.471900015081722e-06, "loss": 0.7467, "step": 6525 }, { "epoch": 0.78, "learning_rate": 2.4693579537779187e-06, "loss": 0.7232, "step": 6526 }, { "epoch": 0.78, "learning_rate": 2.4668170161218983e-06, "loss": 0.7299, "step": 6527 }, { "epoch": 0.78, "learning_rate": 2.464277202492802e-06, "loss": 0.7305, "step": 6528 }, { "epoch": 0.78, "learning_rate": 2.4617385132695847e-06, "loss": 0.6646, "step": 6529 }, { "epoch": 0.78, "learning_rate": 2.459200948831053e-06, "loss": 0.7383, "step": 6530 }, { "epoch": 0.78, "learning_rate": 2.456664509555835e-06, "loss": 0.7433, "step": 6531 }, { "epoch": 0.78, "learning_rate": 2.454129195822389e-06, "loss": 0.668, "step": 6532 }, { "epoch": 0.78, "learning_rate": 2.451595008009019e-06, "loss": 0.7333, "step": 6533 }, { "epoch": 0.78, "learning_rate": 2.449061946493839e-06, "loss": 0.7104, "step": 6534 }, { "epoch": 0.78, "learning_rate": 2.446530011654816e-06, "loss": 0.6942, "step": 6535 }, { "epoch": 0.78, "learning_rate": 2.443999203869738e-06, "loss": 0.7349, "step": 6536 }, { "epoch": 0.78, "learning_rate": 2.4414695235162246e-06, "loss": 0.7405, "step": 6537 }, { "epoch": 0.78, "learning_rate": 2.438940970971736e-06, "loss": 0.7065, "step": 6538 }, { "epoch": 0.78, "learning_rate": 2.4364135466135495e-06, "loss": 0.721, "step": 6539 }, { "epoch": 0.78, "learning_rate": 2.4338872508187884e-06, "loss": 0.7294, "step": 6540 }, { "epoch": 0.78, "learning_rate": 2.431362083964397e-06, "loss": 0.745, "step": 6541 }, { "epoch": 0.78, "learning_rate": 2.42883804642716e-06, "loss": 0.8521, "step": 6542 }, { "epoch": 0.78, "learning_rate": 2.426315138583689e-06, "loss": 0.7132, "step": 6543 }, { "epoch": 0.78, "learning_rate": 2.4237933608104246e-06, "loss": 0.7098, "step": 6544 }, { "epoch": 0.78, "learning_rate": 2.4212727134836436e-06, "loss": 0.7416, "step": 6545 }, { "epoch": 0.78, "learning_rate": 2.4187531969794476e-06, "loss": 0.7232, "step": 6546 }, { "epoch": 0.78, "learning_rate": 2.41623481167378e-06, "loss": 0.697, "step": 6547 }, { "epoch": 0.78, "learning_rate": 2.4137175579424067e-06, "loss": 0.7277, "step": 6548 }, { "epoch": 0.78, "learning_rate": 2.4112014361609282e-06, "loss": 0.7366, "step": 6549 }, { "epoch": 0.78, "learning_rate": 2.4086864467047734e-06, "loss": 0.7165, "step": 6550 }, { "epoch": 0.78, "learning_rate": 2.406172589949203e-06, "loss": 0.793, "step": 6551 }, { "epoch": 0.78, "learning_rate": 2.4036598662693144e-06, "loss": 0.7277, "step": 6552 }, { "epoch": 0.78, "learning_rate": 2.4011482760400286e-06, "loss": 0.7768, "step": 6553 }, { "epoch": 0.78, "learning_rate": 2.3986378196361004e-06, "loss": 0.6959, "step": 6554 }, { "epoch": 0.78, "learning_rate": 2.3961284974321153e-06, "loss": 0.7294, "step": 6555 }, { "epoch": 0.78, "learning_rate": 2.3936203098024868e-06, "loss": 0.7483, "step": 6556 }, { "epoch": 0.78, "learning_rate": 2.391113257121468e-06, "loss": 0.774, "step": 6557 }, { "epoch": 0.78, "learning_rate": 2.3886073397631317e-06, "loss": 0.6593, "step": 6558 }, { "epoch": 0.78, "learning_rate": 2.3861025581013874e-06, "loss": 0.7249, "step": 6559 }, { "epoch": 0.78, "learning_rate": 2.3835989125099712e-06, "loss": 0.7952, "step": 6560 }, { "epoch": 0.78, "learning_rate": 2.3810964033624582e-06, "loss": 0.7478, "step": 6561 }, { "epoch": 0.78, "learning_rate": 2.378595031032244e-06, "loss": 0.7394, "step": 6562 }, { "epoch": 0.78, "learning_rate": 2.3760947958925583e-06, "loss": 0.6981, "step": 6563 }, { "epoch": 0.78, "learning_rate": 2.3735956983164632e-06, "loss": 0.7277, "step": 6564 }, { "epoch": 0.78, "learning_rate": 2.371097738676845e-06, "loss": 0.7511, "step": 6565 }, { "epoch": 0.78, "learning_rate": 2.368600917346432e-06, "loss": 0.7316, "step": 6566 }, { "epoch": 0.78, "learning_rate": 2.36610523469777e-06, "loss": 0.726, "step": 6567 }, { "epoch": 0.78, "learning_rate": 2.3636106911032407e-06, "loss": 0.6669, "step": 6568 }, { "epoch": 0.78, "learning_rate": 2.361117286935056e-06, "loss": 0.7506, "step": 6569 }, { "epoch": 0.78, "learning_rate": 2.358625022565253e-06, "loss": 0.7589, "step": 6570 }, { "epoch": 0.78, "learning_rate": 2.35613389836571e-06, "loss": 0.7578, "step": 6571 }, { "epoch": 0.78, "learning_rate": 2.3536439147081205e-06, "loss": 0.7411, "step": 6572 }, { "epoch": 0.78, "learning_rate": 2.351155071964024e-06, "loss": 0.7695, "step": 6573 }, { "epoch": 0.78, "learning_rate": 2.3486673705047703e-06, "loss": 0.7439, "step": 6574 }, { "epoch": 0.78, "learning_rate": 2.346180810701558e-06, "loss": 0.6802, "step": 6575 }, { "epoch": 0.78, "learning_rate": 2.3436953929254037e-06, "loss": 0.7455, "step": 6576 }, { "epoch": 0.78, "learning_rate": 2.341211117547154e-06, "loss": 0.7427, "step": 6577 }, { "epoch": 0.78, "learning_rate": 2.3387279849374965e-06, "loss": 0.76, "step": 6578 }, { "epoch": 0.78, "learning_rate": 2.3362459954669293e-06, "loss": 0.7628, "step": 6579 }, { "epoch": 0.78, "learning_rate": 2.3337651495057965e-06, "loss": 0.784, "step": 6580 }, { "epoch": 0.78, "learning_rate": 2.3312854474242643e-06, "loss": 0.707, "step": 6581 }, { "epoch": 0.78, "learning_rate": 2.3288068895923254e-06, "loss": 0.7355, "step": 6582 }, { "epoch": 0.79, "learning_rate": 2.326329476379815e-06, "loss": 0.7489, "step": 6583 }, { "epoch": 0.79, "learning_rate": 2.323853208156376e-06, "loss": 0.7679, "step": 6584 }, { "epoch": 0.79, "learning_rate": 2.3213780852915025e-06, "loss": 0.692, "step": 6585 }, { "epoch": 0.79, "learning_rate": 2.3189041081545026e-06, "loss": 0.7556, "step": 6586 }, { "epoch": 0.79, "learning_rate": 2.316431277114519e-06, "loss": 0.6975, "step": 6587 }, { "epoch": 0.79, "learning_rate": 2.3139595925405287e-06, "loss": 0.7227, "step": 6588 }, { "epoch": 0.79, "learning_rate": 2.3114890548013225e-06, "loss": 0.7511, "step": 6589 }, { "epoch": 0.79, "learning_rate": 2.309019664265536e-06, "loss": 0.7388, "step": 6590 }, { "epoch": 0.79, "learning_rate": 2.3065514213016237e-06, "loss": 0.7517, "step": 6591 }, { "epoch": 0.79, "learning_rate": 2.304084326277878e-06, "loss": 0.7623, "step": 6592 }, { "epoch": 0.79, "learning_rate": 2.301618379562409e-06, "loss": 0.7176, "step": 6593 }, { "epoch": 0.79, "learning_rate": 2.2991535815231636e-06, "loss": 0.7673, "step": 6594 }, { "epoch": 0.79, "learning_rate": 2.2966899325279136e-06, "loss": 0.6847, "step": 6595 }, { "epoch": 0.79, "learning_rate": 2.294227432944257e-06, "loss": 0.6735, "step": 6596 }, { "epoch": 0.79, "learning_rate": 2.2917660831396293e-06, "loss": 0.7003, "step": 6597 }, { "epoch": 0.79, "learning_rate": 2.2893058834812863e-06, "loss": 0.7394, "step": 6598 }, { "epoch": 0.79, "learning_rate": 2.286846834336315e-06, "loss": 0.7427, "step": 6599 }, { "epoch": 0.79, "learning_rate": 2.28438893607163e-06, "loss": 0.7606, "step": 6600 }, { "epoch": 0.79, "learning_rate": 2.2819321890539703e-06, "loss": 0.6925, "step": 6601 }, { "epoch": 0.79, "learning_rate": 2.2794765936499153e-06, "loss": 0.6981, "step": 6602 }, { "epoch": 0.79, "learning_rate": 2.2770221502258584e-06, "loss": 0.7539, "step": 6603 }, { "epoch": 0.79, "learning_rate": 2.2745688591480343e-06, "loss": 0.7294, "step": 6604 }, { "epoch": 0.79, "learning_rate": 2.272116720782488e-06, "loss": 0.7478, "step": 6605 }, { "epoch": 0.79, "learning_rate": 2.2696657354951136e-06, "loss": 0.6998, "step": 6606 }, { "epoch": 0.79, "learning_rate": 2.2672159036516172e-06, "loss": 0.7143, "step": 6607 }, { "epoch": 0.79, "learning_rate": 2.2647672256175378e-06, "loss": 0.75, "step": 6608 }, { "epoch": 0.79, "learning_rate": 2.262319701758251e-06, "loss": 0.7065, "step": 6609 }, { "epoch": 0.79, "learning_rate": 2.25987333243894e-06, "loss": 0.7405, "step": 6610 }, { "epoch": 0.79, "learning_rate": 2.257428118024637e-06, "loss": 0.7243, "step": 6611 }, { "epoch": 0.79, "learning_rate": 2.2549840588801896e-06, "loss": 0.76, "step": 6612 }, { "epoch": 0.79, "learning_rate": 2.2525411553702723e-06, "loss": 0.7656, "step": 6613 }, { "epoch": 0.79, "learning_rate": 2.250099407859401e-06, "loss": 0.6847, "step": 6614 }, { "epoch": 0.79, "learning_rate": 2.2476588167118962e-06, "loss": 0.7467, "step": 6615 }, { "epoch": 0.79, "learning_rate": 2.245219382291929e-06, "loss": 0.7656, "step": 6616 }, { "epoch": 0.79, "learning_rate": 2.242781104963484e-06, "loss": 0.7148, "step": 6617 }, { "epoch": 0.79, "learning_rate": 2.240343985090373e-06, "loss": 0.6881, "step": 6618 }, { "epoch": 0.79, "learning_rate": 2.237908023036248e-06, "loss": 0.7054, "step": 6619 }, { "epoch": 0.79, "learning_rate": 2.2354732191645687e-06, "loss": 0.7232, "step": 6620 }, { "epoch": 0.79, "learning_rate": 2.23303957383864e-06, "loss": 0.7327, "step": 6621 }, { "epoch": 0.79, "learning_rate": 2.2306070874215813e-06, "loss": 0.7266, "step": 6622 }, { "epoch": 0.79, "learning_rate": 2.2281757602763486e-06, "loss": 0.7137, "step": 6623 }, { "epoch": 0.79, "learning_rate": 2.2257455927657177e-06, "loss": 0.6735, "step": 6624 }, { "epoch": 0.79, "learning_rate": 2.2233165852522963e-06, "loss": 0.7254, "step": 6625 }, { "epoch": 0.79, "learning_rate": 2.2208887380985144e-06, "loss": 0.7204, "step": 6626 }, { "epoch": 0.79, "learning_rate": 2.21846205166663e-06, "loss": 0.7494, "step": 6627 }, { "epoch": 0.79, "learning_rate": 2.216036526318733e-06, "loss": 0.7349, "step": 6628 }, { "epoch": 0.79, "learning_rate": 2.213612162416736e-06, "loss": 0.7372, "step": 6629 }, { "epoch": 0.79, "learning_rate": 2.211188960322377e-06, "loss": 0.7098, "step": 6630 }, { "epoch": 0.79, "learning_rate": 2.208766920397222e-06, "loss": 0.7628, "step": 6631 }, { "epoch": 0.79, "learning_rate": 2.2063460430026607e-06, "loss": 0.7193, "step": 6632 }, { "epoch": 0.79, "learning_rate": 2.20392632849992e-06, "loss": 0.716, "step": 6633 }, { "epoch": 0.79, "learning_rate": 2.2015077772500413e-06, "loss": 0.8047, "step": 6634 }, { "epoch": 0.79, "learning_rate": 2.199090389613897e-06, "loss": 0.7204, "step": 6635 }, { "epoch": 0.79, "learning_rate": 2.196674165952183e-06, "loss": 0.7545, "step": 6636 }, { "epoch": 0.79, "learning_rate": 2.1942591066254305e-06, "loss": 0.7282, "step": 6637 }, { "epoch": 0.79, "learning_rate": 2.191845211993987e-06, "loss": 0.7188, "step": 6638 }, { "epoch": 0.79, "learning_rate": 2.189432482418031e-06, "loss": 0.6914, "step": 6639 }, { "epoch": 0.79, "learning_rate": 2.187020918257565e-06, "loss": 0.7115, "step": 6640 }, { "epoch": 0.79, "learning_rate": 2.1846105198724168e-06, "loss": 0.7299, "step": 6641 }, { "epoch": 0.79, "learning_rate": 2.1822012876222467e-06, "loss": 0.7427, "step": 6642 }, { "epoch": 0.79, "learning_rate": 2.179793221866534e-06, "loss": 0.7109, "step": 6643 }, { "epoch": 0.79, "learning_rate": 2.1773863229645874e-06, "loss": 0.745, "step": 6644 }, { "epoch": 0.79, "learning_rate": 2.1749805912755393e-06, "loss": 0.8175, "step": 6645 }, { "epoch": 0.79, "learning_rate": 2.1725760271583474e-06, "loss": 0.6959, "step": 6646 }, { "epoch": 0.79, "learning_rate": 2.1701726309718018e-06, "loss": 0.7098, "step": 6647 }, { "epoch": 0.79, "learning_rate": 2.1677704030745107e-06, "loss": 0.7461, "step": 6648 }, { "epoch": 0.79, "learning_rate": 2.1653693438249113e-06, "loss": 0.726, "step": 6649 }, { "epoch": 0.79, "learning_rate": 2.1629694535812653e-06, "loss": 0.6802, "step": 6650 }, { "epoch": 0.79, "learning_rate": 2.1605707327016578e-06, "loss": 0.7087, "step": 6651 }, { "epoch": 0.79, "learning_rate": 2.1581731815440077e-06, "loss": 0.74, "step": 6652 }, { "epoch": 0.79, "learning_rate": 2.1557768004660484e-06, "loss": 0.6758, "step": 6653 }, { "epoch": 0.79, "learning_rate": 2.1533815898253527e-06, "loss": 0.7824, "step": 6654 }, { "epoch": 0.79, "learning_rate": 2.1509875499793e-06, "loss": 0.7634, "step": 6655 }, { "epoch": 0.79, "learning_rate": 2.148594681285111e-06, "loss": 0.7305, "step": 6656 }, { "epoch": 0.79, "learning_rate": 2.1462029840998242e-06, "loss": 0.7455, "step": 6657 }, { "epoch": 0.79, "learning_rate": 2.1438124587803035e-06, "loss": 0.7422, "step": 6658 }, { "epoch": 0.79, "learning_rate": 2.141423105683246e-06, "loss": 0.7115, "step": 6659 }, { "epoch": 0.79, "learning_rate": 2.1390349251651567e-06, "loss": 0.7712, "step": 6660 }, { "epoch": 0.79, "learning_rate": 2.136647917582385e-06, "loss": 0.6975, "step": 6661 }, { "epoch": 0.79, "learning_rate": 2.134262083291094e-06, "loss": 0.7199, "step": 6662 }, { "epoch": 0.79, "learning_rate": 2.1318774226472703e-06, "loss": 0.7126, "step": 6663 }, { "epoch": 0.79, "learning_rate": 2.129493936006739e-06, "loss": 0.7628, "step": 6664 }, { "epoch": 0.79, "learning_rate": 2.1271116237251287e-06, "loss": 0.6674, "step": 6665 }, { "epoch": 0.79, "learning_rate": 2.124730486157912e-06, "loss": 0.6959, "step": 6666 }, { "epoch": 0.8, "learning_rate": 2.1223505236603736e-06, "loss": 0.7366, "step": 6667 }, { "epoch": 0.8, "learning_rate": 2.1199717365876338e-06, "loss": 0.7316, "step": 6668 }, { "epoch": 0.8, "learning_rate": 2.117594125294632e-06, "loss": 0.6791, "step": 6669 }, { "epoch": 0.8, "learning_rate": 2.115217690136122e-06, "loss": 0.7282, "step": 6670 }, { "epoch": 0.8, "learning_rate": 2.112842431466702e-06, "loss": 0.7383, "step": 6671 }, { "epoch": 0.8, "learning_rate": 2.1104683496407773e-06, "loss": 0.6825, "step": 6672 }, { "epoch": 0.8, "learning_rate": 2.1080954450125925e-06, "loss": 0.6579, "step": 6673 }, { "epoch": 0.8, "learning_rate": 2.1057237179362035e-06, "loss": 0.7249, "step": 6674 }, { "epoch": 0.8, "learning_rate": 2.1033531687654984e-06, "loss": 0.7472, "step": 6675 }, { "epoch": 0.8, "learning_rate": 2.100983797854186e-06, "loss": 0.7656, "step": 6676 }, { "epoch": 0.8, "learning_rate": 2.098615605555797e-06, "loss": 0.692, "step": 6677 }, { "epoch": 0.8, "learning_rate": 2.096248592223695e-06, "loss": 0.774, "step": 6678 }, { "epoch": 0.8, "learning_rate": 2.0938827582110623e-06, "loss": 0.7645, "step": 6679 }, { "epoch": 0.8, "learning_rate": 2.091518103870901e-06, "loss": 0.6847, "step": 6680 }, { "epoch": 0.8, "learning_rate": 2.089154629556045e-06, "loss": 0.7684, "step": 6681 }, { "epoch": 0.8, "learning_rate": 2.0867923356191433e-06, "loss": 0.7684, "step": 6682 }, { "epoch": 0.8, "learning_rate": 2.0844312224126807e-06, "loss": 0.7584, "step": 6683 }, { "epoch": 0.8, "learning_rate": 2.082071290288956e-06, "loss": 0.6998, "step": 6684 }, { "epoch": 0.8, "learning_rate": 2.079712539600096e-06, "loss": 0.6588, "step": 6685 }, { "epoch": 0.8, "learning_rate": 2.0773549706980455e-06, "loss": 0.7009, "step": 6686 }, { "epoch": 0.8, "learning_rate": 2.0749985839345845e-06, "loss": 0.7081, "step": 6687 }, { "epoch": 0.8, "learning_rate": 2.0726433796613055e-06, "loss": 0.7461, "step": 6688 }, { "epoch": 0.8, "learning_rate": 2.0702893582296303e-06, "loss": 0.7015, "step": 6689 }, { "epoch": 0.8, "learning_rate": 2.067936519990802e-06, "loss": 0.716, "step": 6690 }, { "epoch": 0.8, "learning_rate": 2.0655848652958845e-06, "loss": 0.668, "step": 6691 }, { "epoch": 0.8, "learning_rate": 2.0632343944957744e-06, "loss": 0.702, "step": 6692 }, { "epoch": 0.8, "learning_rate": 2.060885107941184e-06, "loss": 0.7204, "step": 6693 }, { "epoch": 0.8, "learning_rate": 2.058537005982648e-06, "loss": 0.673, "step": 6694 }, { "epoch": 0.8, "learning_rate": 2.05619008897053e-06, "loss": 0.7266, "step": 6695 }, { "epoch": 0.8, "learning_rate": 2.053844357255008e-06, "loss": 0.7366, "step": 6696 }, { "epoch": 0.8, "learning_rate": 2.0514998111860974e-06, "loss": 0.7416, "step": 6697 }, { "epoch": 0.8, "learning_rate": 2.0491564511136196e-06, "loss": 0.7176, "step": 6698 }, { "epoch": 0.8, "learning_rate": 2.046814277387237e-06, "loss": 0.7098, "step": 6699 }, { "epoch": 0.8, "learning_rate": 2.044473290356418e-06, "loss": 0.7757, "step": 6700 }, { "epoch": 0.8, "learning_rate": 2.0421334903704613e-06, "loss": 0.7132, "step": 6701 }, { "epoch": 0.8, "learning_rate": 2.0397948777784926e-06, "loss": 0.6953, "step": 6702 }, { "epoch": 0.8, "learning_rate": 2.0374574529294533e-06, "loss": 0.7489, "step": 6703 }, { "epoch": 0.8, "learning_rate": 2.035121216172118e-06, "loss": 0.7299, "step": 6704 }, { "epoch": 0.8, "learning_rate": 2.0327861678550655e-06, "loss": 0.7533, "step": 6705 }, { "epoch": 0.8, "learning_rate": 2.030452308326717e-06, "loss": 0.7545, "step": 6706 }, { "epoch": 0.8, "learning_rate": 2.0281196379353053e-06, "loss": 0.683, "step": 6707 }, { "epoch": 0.8, "learning_rate": 2.025788157028885e-06, "loss": 0.7182, "step": 6708 }, { "epoch": 0.8, "learning_rate": 2.023457865955346e-06, "loss": 0.7109, "step": 6709 }, { "epoch": 0.8, "learning_rate": 2.021128765062379e-06, "loss": 0.7316, "step": 6710 }, { "epoch": 0.8, "learning_rate": 2.018800854697519e-06, "loss": 0.6959, "step": 6711 }, { "epoch": 0.8, "learning_rate": 2.0164741352081096e-06, "loss": 0.644, "step": 6712 }, { "epoch": 0.8, "learning_rate": 2.0141486069413186e-06, "loss": 0.7405, "step": 6713 }, { "epoch": 0.8, "learning_rate": 2.011824270244147e-06, "loss": 0.6496, "step": 6714 }, { "epoch": 0.8, "learning_rate": 2.009501125463398e-06, "loss": 0.716, "step": 6715 }, { "epoch": 0.8, "learning_rate": 2.0071791729457155e-06, "loss": 0.7427, "step": 6716 }, { "epoch": 0.8, "learning_rate": 2.0048584130375548e-06, "loss": 0.7494, "step": 6717 }, { "epoch": 0.8, "learning_rate": 2.0025388460852e-06, "loss": 0.673, "step": 6718 }, { "epoch": 0.8, "learning_rate": 2.000220472434753e-06, "loss": 0.774, "step": 6719 }, { "epoch": 0.8, "learning_rate": 1.997903292432137e-06, "loss": 0.6786, "step": 6720 }, { "epoch": 0.8, "learning_rate": 1.9955873064230992e-06, "loss": 0.7109, "step": 6721 }, { "epoch": 0.8, "learning_rate": 1.9932725147532063e-06, "loss": 0.7232, "step": 6722 }, { "epoch": 0.8, "learning_rate": 1.9909589177678523e-06, "loss": 0.7684, "step": 6723 }, { "epoch": 0.8, "learning_rate": 1.988646515812248e-06, "loss": 0.779, "step": 6724 }, { "epoch": 0.8, "learning_rate": 1.9863353092314264e-06, "loss": 0.7494, "step": 6725 }, { "epoch": 0.8, "learning_rate": 1.9840252983702437e-06, "loss": 0.7511, "step": 6726 }, { "epoch": 0.8, "learning_rate": 1.9817164835733725e-06, "loss": 0.7171, "step": 6727 }, { "epoch": 0.8, "learning_rate": 1.979408865185317e-06, "loss": 0.7383, "step": 6728 }, { "epoch": 0.8, "learning_rate": 1.9771024435503962e-06, "loss": 0.7294, "step": 6729 }, { "epoch": 0.8, "learning_rate": 1.9747972190127507e-06, "loss": 0.7048, "step": 6730 }, { "epoch": 0.8, "learning_rate": 1.9724931919163416e-06, "loss": 0.6903, "step": 6731 }, { "epoch": 0.8, "learning_rate": 1.9701903626049524e-06, "loss": 0.6814, "step": 6732 }, { "epoch": 0.8, "learning_rate": 1.967888731422192e-06, "loss": 0.697, "step": 6733 }, { "epoch": 0.8, "learning_rate": 1.965588298711486e-06, "loss": 0.7243, "step": 6734 }, { "epoch": 0.8, "learning_rate": 1.963289064816082e-06, "loss": 0.7048, "step": 6735 }, { "epoch": 0.8, "learning_rate": 1.9609910300790445e-06, "loss": 0.7333, "step": 6736 }, { "epoch": 0.8, "learning_rate": 1.9586941948432703e-06, "loss": 0.6903, "step": 6737 }, { "epoch": 0.8, "learning_rate": 1.9563985594514677e-06, "loss": 0.7243, "step": 6738 }, { "epoch": 0.8, "learning_rate": 1.9541041242461687e-06, "loss": 0.7405, "step": 6739 }, { "epoch": 0.8, "learning_rate": 1.9518108895697263e-06, "loss": 0.7729, "step": 6740 }, { "epoch": 0.8, "learning_rate": 1.949518855764311e-06, "loss": 0.7157, "step": 6741 }, { "epoch": 0.8, "learning_rate": 1.947228023171922e-06, "loss": 0.7277, "step": 6742 }, { "epoch": 0.8, "learning_rate": 1.9449383921343735e-06, "loss": 0.7919, "step": 6743 }, { "epoch": 0.8, "learning_rate": 1.9426499629933016e-06, "loss": 0.7026, "step": 6744 }, { "epoch": 0.8, "learning_rate": 1.940362736090161e-06, "loss": 0.7941, "step": 6745 }, { "epoch": 0.8, "learning_rate": 1.938076711766229e-06, "loss": 0.7433, "step": 6746 }, { "epoch": 0.8, "learning_rate": 1.9357918903626074e-06, "loss": 0.6886, "step": 6747 }, { "epoch": 0.8, "learning_rate": 1.933508272220208e-06, "loss": 0.7695, "step": 6748 }, { "epoch": 0.8, "learning_rate": 1.9312258576797803e-06, "loss": 0.7461, "step": 6749 }, { "epoch": 0.81, "learning_rate": 1.928944647081872e-06, "loss": 0.7126, "step": 6750 }, { "epoch": 0.81, "learning_rate": 1.92666464076687e-06, "loss": 0.7271, "step": 6751 }, { "epoch": 0.81, "learning_rate": 1.9243858390749715e-06, "loss": 0.6858, "step": 6752 }, { "epoch": 0.81, "learning_rate": 1.9221082423461957e-06, "loss": 0.7182, "step": 6753 }, { "epoch": 0.81, "learning_rate": 1.9198318509203885e-06, "loss": 0.7366, "step": 6754 }, { "epoch": 0.81, "learning_rate": 1.9175566651372023e-06, "loss": 0.692, "step": 6755 }, { "epoch": 0.81, "learning_rate": 1.915282685336124e-06, "loss": 0.736, "step": 6756 }, { "epoch": 0.81, "learning_rate": 1.9130099118564526e-06, "loss": 0.7171, "step": 6757 }, { "epoch": 0.81, "learning_rate": 1.910738345037306e-06, "loss": 0.7238, "step": 6758 }, { "epoch": 0.81, "learning_rate": 1.9084679852176335e-06, "loss": 0.7282, "step": 6759 }, { "epoch": 0.81, "learning_rate": 1.9061988327361835e-06, "loss": 0.7327, "step": 6760 }, { "epoch": 0.81, "learning_rate": 1.9039308879315455e-06, "loss": 0.7031, "step": 6761 }, { "epoch": 0.81, "learning_rate": 1.9016641511421175e-06, "loss": 0.7199, "step": 6762 }, { "epoch": 0.81, "learning_rate": 1.8993986227061145e-06, "loss": 0.7461, "step": 6763 }, { "epoch": 0.81, "learning_rate": 1.8971343029615873e-06, "loss": 0.7612, "step": 6764 }, { "epoch": 0.81, "learning_rate": 1.8948711922463836e-06, "loss": 0.7154, "step": 6765 }, { "epoch": 0.81, "learning_rate": 1.8926092908981886e-06, "loss": 0.7729, "step": 6766 }, { "epoch": 0.81, "learning_rate": 1.890348599254498e-06, "loss": 0.7662, "step": 6767 }, { "epoch": 0.81, "learning_rate": 1.8880891176526327e-06, "loss": 0.6696, "step": 6768 }, { "epoch": 0.81, "learning_rate": 1.8858308464297304e-06, "loss": 0.7785, "step": 6769 }, { "epoch": 0.81, "learning_rate": 1.8835737859227453e-06, "loss": 0.7243, "step": 6770 }, { "epoch": 0.81, "learning_rate": 1.8813179364684543e-06, "loss": 0.7204, "step": 6771 }, { "epoch": 0.81, "learning_rate": 1.8790632984034507e-06, "loss": 0.7243, "step": 6772 }, { "epoch": 0.81, "learning_rate": 1.8768098720641547e-06, "loss": 0.7154, "step": 6773 }, { "epoch": 0.81, "learning_rate": 1.8745576577867975e-06, "loss": 0.7009, "step": 6774 }, { "epoch": 0.81, "learning_rate": 1.872306655907432e-06, "loss": 0.7533, "step": 6775 }, { "epoch": 0.81, "learning_rate": 1.8700568667619302e-06, "loss": 0.7751, "step": 6776 }, { "epoch": 0.81, "learning_rate": 1.8678082906859808e-06, "loss": 0.7573, "step": 6777 }, { "epoch": 0.81, "learning_rate": 1.8655609280151e-06, "loss": 0.75, "step": 6778 }, { "epoch": 0.81, "learning_rate": 1.8633147790846107e-06, "loss": 0.7757, "step": 6779 }, { "epoch": 0.81, "learning_rate": 1.8610698442296693e-06, "loss": 0.7539, "step": 6780 }, { "epoch": 0.81, "learning_rate": 1.8588261237852323e-06, "loss": 0.7467, "step": 6781 }, { "epoch": 0.81, "learning_rate": 1.856583618086093e-06, "loss": 0.6482, "step": 6782 }, { "epoch": 0.81, "learning_rate": 1.8543423274668548e-06, "loss": 0.7321, "step": 6783 }, { "epoch": 0.81, "learning_rate": 1.8521022522619358e-06, "loss": 0.7556, "step": 6784 }, { "epoch": 0.81, "learning_rate": 1.8498633928055864e-06, "loss": 0.7316, "step": 6785 }, { "epoch": 0.81, "learning_rate": 1.8476257494318583e-06, "loss": 0.7215, "step": 6786 }, { "epoch": 0.81, "learning_rate": 1.8453893224746366e-06, "loss": 0.6735, "step": 6787 }, { "epoch": 0.81, "learning_rate": 1.8431541122676156e-06, "loss": 0.7305, "step": 6788 }, { "epoch": 0.81, "learning_rate": 1.8409201191443105e-06, "loss": 0.7098, "step": 6789 }, { "epoch": 0.81, "learning_rate": 1.8386873434380626e-06, "loss": 0.7455, "step": 6790 }, { "epoch": 0.81, "learning_rate": 1.8364557854820142e-06, "loss": 0.7249, "step": 6791 }, { "epoch": 0.81, "learning_rate": 1.8342254456091436e-06, "loss": 0.6802, "step": 6792 }, { "epoch": 0.81, "learning_rate": 1.8319963241522377e-06, "loss": 0.7333, "step": 6793 }, { "epoch": 0.81, "learning_rate": 1.8297684214439015e-06, "loss": 0.6881, "step": 6794 }, { "epoch": 0.81, "learning_rate": 1.8275417378165683e-06, "loss": 0.7015, "step": 6795 }, { "epoch": 0.81, "learning_rate": 1.825316273602471e-06, "loss": 0.6914, "step": 6796 }, { "epoch": 0.81, "learning_rate": 1.8230920291336795e-06, "loss": 0.6903, "step": 6797 }, { "epoch": 0.81, "learning_rate": 1.8208690047420684e-06, "loss": 0.7595, "step": 6798 }, { "epoch": 0.81, "learning_rate": 1.8186472007593415e-06, "loss": 0.7377, "step": 6799 }, { "epoch": 0.81, "learning_rate": 1.8164266175170086e-06, "loss": 0.697, "step": 6800 }, { "epoch": 0.81, "learning_rate": 1.8142072553464073e-06, "loss": 0.6713, "step": 6801 }, { "epoch": 0.81, "learning_rate": 1.811989114578685e-06, "loss": 0.7199, "step": 6802 }, { "epoch": 0.81, "learning_rate": 1.809772195544811e-06, "loss": 0.7277, "step": 6803 }, { "epoch": 0.81, "learning_rate": 1.8075564985755756e-06, "loss": 0.736, "step": 6804 }, { "epoch": 0.81, "learning_rate": 1.8053420240015806e-06, "loss": 0.7684, "step": 6805 }, { "epoch": 0.81, "learning_rate": 1.8031287721532498e-06, "loss": 0.7718, "step": 6806 }, { "epoch": 0.81, "learning_rate": 1.80091674336082e-06, "loss": 0.7701, "step": 6807 }, { "epoch": 0.81, "learning_rate": 1.798705937954347e-06, "loss": 0.7706, "step": 6808 }, { "epoch": 0.81, "learning_rate": 1.7964963562637106e-06, "loss": 0.707, "step": 6809 }, { "epoch": 0.81, "learning_rate": 1.794287998618599e-06, "loss": 0.7829, "step": 6810 }, { "epoch": 0.81, "learning_rate": 1.7920808653485233e-06, "loss": 0.7411, "step": 6811 }, { "epoch": 0.81, "learning_rate": 1.7898749567828056e-06, "loss": 0.7065, "step": 6812 }, { "epoch": 0.81, "learning_rate": 1.787670273250597e-06, "loss": 0.6473, "step": 6813 }, { "epoch": 0.81, "learning_rate": 1.785466815080853e-06, "loss": 0.7199, "step": 6814 }, { "epoch": 0.81, "learning_rate": 1.7832645826023543e-06, "loss": 0.7154, "step": 6815 }, { "epoch": 0.81, "learning_rate": 1.7810635761436955e-06, "loss": 0.7729, "step": 6816 }, { "epoch": 0.81, "learning_rate": 1.7788637960332867e-06, "loss": 0.6992, "step": 6817 }, { "epoch": 0.81, "learning_rate": 1.7766652425993613e-06, "loss": 0.7684, "step": 6818 }, { "epoch": 0.81, "learning_rate": 1.7744679161699641e-06, "loss": 0.7411, "step": 6819 }, { "epoch": 0.81, "learning_rate": 1.772271817072958e-06, "loss": 0.7684, "step": 6820 }, { "epoch": 0.81, "learning_rate": 1.7700769456360234e-06, "loss": 0.6987, "step": 6821 }, { "epoch": 0.81, "learning_rate": 1.7678833021866537e-06, "loss": 0.7533, "step": 6822 }, { "epoch": 0.81, "learning_rate": 1.7656908870521694e-06, "loss": 0.7254, "step": 6823 }, { "epoch": 0.81, "learning_rate": 1.7634997005596977e-06, "loss": 0.7148, "step": 6824 }, { "epoch": 0.81, "learning_rate": 1.761309743036186e-06, "loss": 0.7751, "step": 6825 }, { "epoch": 0.81, "learning_rate": 1.759121014808396e-06, "loss": 0.7316, "step": 6826 }, { "epoch": 0.81, "learning_rate": 1.756933516202909e-06, "loss": 0.7081, "step": 6827 }, { "epoch": 0.81, "learning_rate": 1.7547472475461235e-06, "loss": 0.6652, "step": 6828 }, { "epoch": 0.81, "learning_rate": 1.7525622091642503e-06, "loss": 0.6869, "step": 6829 }, { "epoch": 0.81, "learning_rate": 1.7503784013833257e-06, "loss": 0.7567, "step": 6830 }, { "epoch": 0.81, "learning_rate": 1.7481958245291863e-06, "loss": 0.7612, "step": 6831 }, { "epoch": 0.81, "learning_rate": 1.7460144789275014e-06, "loss": 0.7182, "step": 6832 }, { "epoch": 0.81, "learning_rate": 1.7438343649037482e-06, "loss": 0.683, "step": 6833 }, { "epoch": 0.82, "learning_rate": 1.7416554827832178e-06, "loss": 0.7573, "step": 6834 }, { "epoch": 0.82, "learning_rate": 1.73947783289103e-06, "loss": 0.7807, "step": 6835 }, { "epoch": 0.82, "learning_rate": 1.7373014155521029e-06, "loss": 0.7673, "step": 6836 }, { "epoch": 0.82, "learning_rate": 1.7351262310911853e-06, "loss": 0.6652, "step": 6837 }, { "epoch": 0.82, "learning_rate": 1.7329522798328358e-06, "loss": 0.692, "step": 6838 }, { "epoch": 0.82, "learning_rate": 1.7307795621014267e-06, "loss": 0.6797, "step": 6839 }, { "epoch": 0.82, "learning_rate": 1.7286080782211566e-06, "loss": 0.7121, "step": 6840 }, { "epoch": 0.82, "learning_rate": 1.7264378285160232e-06, "loss": 0.7288, "step": 6841 }, { "epoch": 0.82, "learning_rate": 1.7242688133098584e-06, "loss": 0.7985, "step": 6842 }, { "epoch": 0.82, "learning_rate": 1.7221010329262944e-06, "loss": 0.7494, "step": 6843 }, { "epoch": 0.82, "learning_rate": 1.7199344876887914e-06, "loss": 0.7701, "step": 6844 }, { "epoch": 0.82, "learning_rate": 1.7177691779206196e-06, "loss": 0.7294, "step": 6845 }, { "epoch": 0.82, "learning_rate": 1.7156051039448584e-06, "loss": 0.6797, "step": 6846 }, { "epoch": 0.82, "learning_rate": 1.7134422660844163e-06, "loss": 0.6992, "step": 6847 }, { "epoch": 0.82, "learning_rate": 1.7112806646620051e-06, "loss": 0.6484, "step": 6848 }, { "epoch": 0.82, "learning_rate": 1.7091203000001633e-06, "loss": 0.7031, "step": 6849 }, { "epoch": 0.82, "learning_rate": 1.7069611724212376e-06, "loss": 0.7115, "step": 6850 }, { "epoch": 0.82, "learning_rate": 1.7048032822473893e-06, "loss": 0.7121, "step": 6851 }, { "epoch": 0.82, "learning_rate": 1.7026466298005985e-06, "loss": 0.76, "step": 6852 }, { "epoch": 0.82, "learning_rate": 1.7004912154026575e-06, "loss": 0.6892, "step": 6853 }, { "epoch": 0.82, "learning_rate": 1.6983370393751809e-06, "loss": 0.755, "step": 6854 }, { "epoch": 0.82, "learning_rate": 1.6961841020395898e-06, "loss": 0.7171, "step": 6855 }, { "epoch": 0.82, "learning_rate": 1.6940324037171251e-06, "loss": 0.7623, "step": 6856 }, { "epoch": 0.82, "learning_rate": 1.6918819447288416e-06, "loss": 0.7098, "step": 6857 }, { "epoch": 0.82, "learning_rate": 1.6897327253956064e-06, "loss": 0.7935, "step": 6858 }, { "epoch": 0.82, "learning_rate": 1.6875847460381113e-06, "loss": 0.7148, "step": 6859 }, { "epoch": 0.82, "learning_rate": 1.6854380069768539e-06, "loss": 0.7355, "step": 6860 }, { "epoch": 0.82, "learning_rate": 1.6832925085321472e-06, "loss": 0.769, "step": 6861 }, { "epoch": 0.82, "learning_rate": 1.6811482510241206e-06, "loss": 0.6741, "step": 6862 }, { "epoch": 0.82, "learning_rate": 1.6790052347727237e-06, "loss": 0.702, "step": 6863 }, { "epoch": 0.82, "learning_rate": 1.6768634600977129e-06, "loss": 0.6869, "step": 6864 }, { "epoch": 0.82, "learning_rate": 1.6747229273186628e-06, "loss": 0.7388, "step": 6865 }, { "epoch": 0.82, "learning_rate": 1.672583636754963e-06, "loss": 0.7327, "step": 6866 }, { "epoch": 0.82, "learning_rate": 1.6704455887258142e-06, "loss": 0.7288, "step": 6867 }, { "epoch": 0.82, "learning_rate": 1.668308783550241e-06, "loss": 0.7522, "step": 6868 }, { "epoch": 0.82, "learning_rate": 1.6661732215470717e-06, "loss": 0.7176, "step": 6869 }, { "epoch": 0.82, "learning_rate": 1.6640389030349558e-06, "loss": 0.7093, "step": 6870 }, { "epoch": 0.82, "learning_rate": 1.661905828332353e-06, "loss": 0.7254, "step": 6871 }, { "epoch": 0.82, "learning_rate": 1.6597739977575388e-06, "loss": 0.7098, "step": 6872 }, { "epoch": 0.82, "learning_rate": 1.6576434116286088e-06, "loss": 0.7154, "step": 6873 }, { "epoch": 0.82, "learning_rate": 1.655514070263462e-06, "loss": 0.7723, "step": 6874 }, { "epoch": 0.82, "learning_rate": 1.6533859739798263e-06, "loss": 0.7266, "step": 6875 }, { "epoch": 0.82, "learning_rate": 1.6512591230952258e-06, "loss": 0.7522, "step": 6876 }, { "epoch": 0.82, "learning_rate": 1.6491335179270095e-06, "loss": 0.6897, "step": 6877 }, { "epoch": 0.82, "learning_rate": 1.6470091587923443e-06, "loss": 0.7416, "step": 6878 }, { "epoch": 0.82, "learning_rate": 1.6448860460082007e-06, "loss": 0.7388, "step": 6879 }, { "epoch": 0.82, "learning_rate": 1.642764179891375e-06, "loss": 0.7148, "step": 6880 }, { "epoch": 0.82, "learning_rate": 1.6406435607584626e-06, "loss": 0.692, "step": 6881 }, { "epoch": 0.82, "learning_rate": 1.6385241889258874e-06, "loss": 0.7188, "step": 6882 }, { "epoch": 0.82, "learning_rate": 1.63640606470988e-06, "loss": 0.7037, "step": 6883 }, { "epoch": 0.82, "learning_rate": 1.6342891884264833e-06, "loss": 0.7589, "step": 6884 }, { "epoch": 0.82, "learning_rate": 1.6321735603915622e-06, "loss": 0.7963, "step": 6885 }, { "epoch": 0.82, "learning_rate": 1.6300591809207822e-06, "loss": 0.7031, "step": 6886 }, { "epoch": 0.82, "learning_rate": 1.6279460503296352e-06, "loss": 0.7416, "step": 6887 }, { "epoch": 0.82, "learning_rate": 1.6258341689334212e-06, "loss": 0.6674, "step": 6888 }, { "epoch": 0.82, "learning_rate": 1.6237235370472504e-06, "loss": 0.6747, "step": 6889 }, { "epoch": 0.82, "learning_rate": 1.6216141549860587e-06, "loss": 0.6942, "step": 6890 }, { "epoch": 0.82, "learning_rate": 1.6195060230645766e-06, "loss": 0.7723, "step": 6891 }, { "epoch": 0.82, "learning_rate": 1.6173991415973667e-06, "loss": 0.7176, "step": 6892 }, { "epoch": 0.82, "learning_rate": 1.615293510898791e-06, "loss": 0.7249, "step": 6893 }, { "epoch": 0.82, "learning_rate": 1.6131891312830373e-06, "loss": 0.7171, "step": 6894 }, { "epoch": 0.82, "learning_rate": 1.6110860030640963e-06, "loss": 0.7154, "step": 6895 }, { "epoch": 0.82, "learning_rate": 1.608984126555776e-06, "loss": 0.7171, "step": 6896 }, { "epoch": 0.82, "learning_rate": 1.606883502071699e-06, "loss": 0.7121, "step": 6897 }, { "epoch": 0.82, "learning_rate": 1.6047841299252965e-06, "loss": 0.707, "step": 6898 }, { "epoch": 0.82, "learning_rate": 1.6026860104298203e-06, "loss": 0.7321, "step": 6899 }, { "epoch": 0.82, "learning_rate": 1.6005891438983302e-06, "loss": 0.716, "step": 6900 }, { "epoch": 0.82, "learning_rate": 1.5984935306436977e-06, "loss": 0.6953, "step": 6901 }, { "epoch": 0.82, "learning_rate": 1.5963991709786109e-06, "loss": 0.8025, "step": 6902 }, { "epoch": 0.82, "learning_rate": 1.5943060652155663e-06, "loss": 0.6607, "step": 6903 }, { "epoch": 0.82, "learning_rate": 1.5922142136668817e-06, "loss": 0.6925, "step": 6904 }, { "epoch": 0.82, "learning_rate": 1.5901236166446799e-06, "loss": 0.731, "step": 6905 }, { "epoch": 0.82, "learning_rate": 1.5880342744608978e-06, "loss": 0.7651, "step": 6906 }, { "epoch": 0.82, "learning_rate": 1.5859461874272886e-06, "loss": 0.7059, "step": 6907 }, { "epoch": 0.82, "learning_rate": 1.5838593558554127e-06, "loss": 0.7422, "step": 6908 }, { "epoch": 0.82, "learning_rate": 1.5817737800566513e-06, "loss": 0.7545, "step": 6909 }, { "epoch": 0.82, "learning_rate": 1.5796894603421896e-06, "loss": 0.7768, "step": 6910 }, { "epoch": 0.82, "learning_rate": 1.5776063970230304e-06, "loss": 0.6763, "step": 6911 }, { "epoch": 0.82, "learning_rate": 1.5755245904099858e-06, "loss": 0.6953, "step": 6912 }, { "epoch": 0.82, "learning_rate": 1.5734440408136865e-06, "loss": 0.7695, "step": 6913 }, { "epoch": 0.82, "learning_rate": 1.5713647485445682e-06, "loss": 0.7444, "step": 6914 }, { "epoch": 0.82, "learning_rate": 1.5692867139128842e-06, "loss": 0.7478, "step": 6915 }, { "epoch": 0.82, "learning_rate": 1.5672099372286965e-06, "loss": 0.7461, "step": 6916 }, { "epoch": 0.82, "learning_rate": 1.5651344188018801e-06, "loss": 0.6624, "step": 6917 }, { "epoch": 0.83, "learning_rate": 1.5630601589421268e-06, "loss": 0.755, "step": 6918 }, { "epoch": 0.83, "learning_rate": 1.5609871579589364e-06, "loss": 0.6987, "step": 6919 }, { "epoch": 0.83, "learning_rate": 1.5589154161616194e-06, "loss": 0.721, "step": 6920 }, { "epoch": 0.83, "learning_rate": 1.5568449338593028e-06, "loss": 0.6406, "step": 6921 }, { "epoch": 0.83, "learning_rate": 1.5547757113609197e-06, "loss": 0.7221, "step": 6922 }, { "epoch": 0.83, "learning_rate": 1.5527077489752228e-06, "loss": 0.6791, "step": 6923 }, { "epoch": 0.83, "learning_rate": 1.5506410470107712e-06, "loss": 0.692, "step": 6924 }, { "epoch": 0.83, "learning_rate": 1.5485756057759427e-06, "loss": 0.7422, "step": 6925 }, { "epoch": 0.83, "learning_rate": 1.5465114255789116e-06, "loss": 0.7584, "step": 6926 }, { "epoch": 0.83, "learning_rate": 1.5444485067276839e-06, "loss": 0.7282, "step": 6927 }, { "epoch": 0.83, "learning_rate": 1.5423868495300642e-06, "loss": 0.7494, "step": 6928 }, { "epoch": 0.83, "learning_rate": 1.5403264542936703e-06, "loss": 0.7294, "step": 6929 }, { "epoch": 0.83, "learning_rate": 1.5382673213259413e-06, "loss": 0.7673, "step": 6930 }, { "epoch": 0.83, "learning_rate": 1.5362094509341109e-06, "loss": 0.7985, "step": 6931 }, { "epoch": 0.83, "learning_rate": 1.5341528434252406e-06, "loss": 0.7522, "step": 6932 }, { "epoch": 0.83, "learning_rate": 1.5320974991061966e-06, "loss": 0.7104, "step": 6933 }, { "epoch": 0.83, "learning_rate": 1.5300434182836532e-06, "loss": 0.7589, "step": 6934 }, { "epoch": 0.83, "learning_rate": 1.5279906012641065e-06, "loss": 0.7037, "step": 6935 }, { "epoch": 0.83, "learning_rate": 1.5259390483538493e-06, "loss": 0.7333, "step": 6936 }, { "epoch": 0.83, "learning_rate": 1.5238887598590012e-06, "loss": 0.6702, "step": 6937 }, { "epoch": 0.83, "learning_rate": 1.521839736085482e-06, "loss": 0.6568, "step": 6938 }, { "epoch": 0.83, "learning_rate": 1.5197919773390256e-06, "loss": 0.7188, "step": 6939 }, { "epoch": 0.83, "learning_rate": 1.517745483925186e-06, "loss": 0.6964, "step": 6940 }, { "epoch": 0.83, "learning_rate": 1.5157002561493095e-06, "loss": 0.7472, "step": 6941 }, { "epoch": 0.83, "learning_rate": 1.5136562943165723e-06, "loss": 0.673, "step": 6942 }, { "epoch": 0.83, "learning_rate": 1.5116135987319502e-06, "loss": 0.7427, "step": 6943 }, { "epoch": 0.83, "learning_rate": 1.5095721697002386e-06, "loss": 0.7288, "step": 6944 }, { "epoch": 0.83, "learning_rate": 1.5075320075260368e-06, "loss": 0.8142, "step": 6945 }, { "epoch": 0.83, "learning_rate": 1.5054931125137573e-06, "loss": 0.7628, "step": 6946 }, { "epoch": 0.83, "learning_rate": 1.503455484967623e-06, "loss": 0.774, "step": 6947 }, { "epoch": 0.83, "learning_rate": 1.5014191251916676e-06, "loss": 0.6585, "step": 6948 }, { "epoch": 0.83, "learning_rate": 1.4993840334897413e-06, "loss": 0.7227, "step": 6949 }, { "epoch": 0.83, "learning_rate": 1.497350210165497e-06, "loss": 0.6752, "step": 6950 }, { "epoch": 0.83, "learning_rate": 1.4953176555224013e-06, "loss": 0.7277, "step": 6951 }, { "epoch": 0.83, "learning_rate": 1.4932863698637334e-06, "loss": 0.7182, "step": 6952 }, { "epoch": 0.83, "learning_rate": 1.4912563534925784e-06, "loss": 0.7059, "step": 6953 }, { "epoch": 0.83, "learning_rate": 1.4892276067118393e-06, "loss": 0.7065, "step": 6954 }, { "epoch": 0.83, "learning_rate": 1.4872001298242245e-06, "loss": 0.7098, "step": 6955 }, { "epoch": 0.83, "learning_rate": 1.4851739231322538e-06, "loss": 0.6953, "step": 6956 }, { "epoch": 0.83, "learning_rate": 1.4831489869382542e-06, "loss": 0.7427, "step": 6957 }, { "epoch": 0.83, "learning_rate": 1.4811253215443721e-06, "loss": 0.7427, "step": 6958 }, { "epoch": 0.83, "learning_rate": 1.479102927252557e-06, "loss": 0.7723, "step": 6959 }, { "epoch": 0.83, "learning_rate": 1.4770818043645696e-06, "loss": 0.7137, "step": 6960 }, { "epoch": 0.83, "learning_rate": 1.4750619531819831e-06, "loss": 0.7355, "step": 6961 }, { "epoch": 0.83, "learning_rate": 1.4730433740061756e-06, "loss": 0.7249, "step": 6962 }, { "epoch": 0.83, "learning_rate": 1.4710260671383448e-06, "loss": 0.7249, "step": 6963 }, { "epoch": 0.83, "learning_rate": 1.469010032879491e-06, "loss": 0.7115, "step": 6964 }, { "epoch": 0.83, "learning_rate": 1.466995271530427e-06, "loss": 0.7137, "step": 6965 }, { "epoch": 0.83, "learning_rate": 1.4649817833917767e-06, "loss": 0.7282, "step": 6966 }, { "epoch": 0.83, "learning_rate": 1.4629695687639678e-06, "loss": 0.7137, "step": 6967 }, { "epoch": 0.83, "learning_rate": 1.4609586279472499e-06, "loss": 0.7606, "step": 6968 }, { "epoch": 0.83, "learning_rate": 1.4589489612416729e-06, "loss": 0.7037, "step": 6969 }, { "epoch": 0.83, "learning_rate": 1.456940568947096e-06, "loss": 0.7388, "step": 6970 }, { "epoch": 0.83, "learning_rate": 1.4549334513631996e-06, "loss": 0.7294, "step": 6971 }, { "epoch": 0.83, "learning_rate": 1.4529276087894562e-06, "loss": 0.7294, "step": 6972 }, { "epoch": 0.83, "learning_rate": 1.450923041525165e-06, "loss": 0.7288, "step": 6973 }, { "epoch": 0.83, "learning_rate": 1.448919749869423e-06, "loss": 0.7829, "step": 6974 }, { "epoch": 0.83, "learning_rate": 1.446917734121146e-06, "loss": 0.7037, "step": 6975 }, { "epoch": 0.83, "learning_rate": 1.444916994579052e-06, "loss": 0.7344, "step": 6976 }, { "epoch": 0.83, "learning_rate": 1.4429175315416733e-06, "loss": 0.6735, "step": 6977 }, { "epoch": 0.83, "learning_rate": 1.4409193453073478e-06, "loss": 0.7137, "step": 6978 }, { "epoch": 0.83, "learning_rate": 1.438922436174225e-06, "loss": 0.7327, "step": 6979 }, { "epoch": 0.83, "learning_rate": 1.4369268044402661e-06, "loss": 0.7706, "step": 6980 }, { "epoch": 0.83, "learning_rate": 1.4349324504032391e-06, "loss": 0.6892, "step": 6981 }, { "epoch": 0.83, "learning_rate": 1.4329393743607212e-06, "loss": 0.7528, "step": 6982 }, { "epoch": 0.83, "learning_rate": 1.430947576610099e-06, "loss": 0.7467, "step": 6983 }, { "epoch": 0.83, "learning_rate": 1.4289570574485655e-06, "loss": 0.7366, "step": 6984 }, { "epoch": 0.83, "learning_rate": 1.4269678171731338e-06, "loss": 0.7254, "step": 6985 }, { "epoch": 0.83, "learning_rate": 1.424979856080615e-06, "loss": 0.6998, "step": 6986 }, { "epoch": 0.83, "learning_rate": 1.4229931744676318e-06, "loss": 0.6964, "step": 6987 }, { "epoch": 0.83, "learning_rate": 1.4210077726306159e-06, "loss": 0.7143, "step": 6988 }, { "epoch": 0.83, "learning_rate": 1.4190236508658128e-06, "loss": 0.7612, "step": 6989 }, { "epoch": 0.83, "learning_rate": 1.4170408094692733e-06, "loss": 0.7478, "step": 6990 }, { "epoch": 0.83, "learning_rate": 1.4150592487368553e-06, "loss": 0.7321, "step": 6991 }, { "epoch": 0.83, "learning_rate": 1.4130789689642289e-06, "loss": 0.7612, "step": 6992 }, { "epoch": 0.83, "learning_rate": 1.4110999704468698e-06, "loss": 0.7679, "step": 6993 }, { "epoch": 0.83, "learning_rate": 1.4091222534800675e-06, "loss": 0.7109, "step": 6994 }, { "epoch": 0.83, "learning_rate": 1.407145818358916e-06, "loss": 0.721, "step": 6995 }, { "epoch": 0.83, "learning_rate": 1.4051706653783193e-06, "loss": 0.7467, "step": 6996 }, { "epoch": 0.83, "learning_rate": 1.4031967948329906e-06, "loss": 0.7344, "step": 6997 }, { "epoch": 0.83, "learning_rate": 1.4012242070174487e-06, "loss": 0.7188, "step": 6998 }, { "epoch": 0.83, "learning_rate": 1.3992529022260281e-06, "loss": 0.7215, "step": 6999 }, { "epoch": 0.83, "learning_rate": 1.3972828807528637e-06, "loss": 0.7288, "step": 7000 }, { "epoch": 0.83, "learning_rate": 1.3953141428919058e-06, "loss": 0.673, "step": 7001 }, { "epoch": 0.84, "learning_rate": 1.3933466889369074e-06, "loss": 0.7595, "step": 7002 }, { "epoch": 0.84, "learning_rate": 1.3913805191814312e-06, "loss": 0.6797, "step": 7003 }, { "epoch": 0.84, "learning_rate": 1.3894156339188525e-06, "loss": 0.7249, "step": 7004 }, { "epoch": 0.84, "learning_rate": 1.3874520334423503e-06, "loss": 0.7528, "step": 7005 }, { "epoch": 0.84, "learning_rate": 1.3854897180449178e-06, "loss": 0.7087, "step": 7006 }, { "epoch": 0.84, "learning_rate": 1.3835286880193454e-06, "loss": 0.6992, "step": 7007 }, { "epoch": 0.84, "learning_rate": 1.3815689436582436e-06, "loss": 0.7193, "step": 7008 }, { "epoch": 0.84, "learning_rate": 1.3796104852540249e-06, "loss": 0.7266, "step": 7009 }, { "epoch": 0.84, "learning_rate": 1.3776533130989077e-06, "loss": 0.745, "step": 7010 }, { "epoch": 0.84, "learning_rate": 1.3756974274849299e-06, "loss": 0.7427, "step": 7011 }, { "epoch": 0.84, "learning_rate": 1.373742828703919e-06, "loss": 0.7288, "step": 7012 }, { "epoch": 0.84, "learning_rate": 1.3717895170475293e-06, "loss": 0.6928, "step": 7013 }, { "epoch": 0.84, "learning_rate": 1.3698374928072112e-06, "loss": 0.692, "step": 7014 }, { "epoch": 0.84, "learning_rate": 1.3678867562742238e-06, "loss": 0.7076, "step": 7015 }, { "epoch": 0.84, "learning_rate": 1.3659373077396432e-06, "loss": 0.7517, "step": 7016 }, { "epoch": 0.84, "learning_rate": 1.3639891474943402e-06, "loss": 0.75, "step": 7017 }, { "epoch": 0.84, "learning_rate": 1.3620422758290043e-06, "loss": 0.7427, "step": 7018 }, { "epoch": 0.84, "learning_rate": 1.360096693034124e-06, "loss": 0.7561, "step": 7019 }, { "epoch": 0.84, "learning_rate": 1.3581523994000069e-06, "loss": 0.7796, "step": 7020 }, { "epoch": 0.84, "learning_rate": 1.3562093952167554e-06, "loss": 0.7254, "step": 7021 }, { "epoch": 0.84, "learning_rate": 1.3542676807742872e-06, "loss": 0.7327, "step": 7022 }, { "epoch": 0.84, "learning_rate": 1.352327256362327e-06, "loss": 0.6959, "step": 7023 }, { "epoch": 0.84, "learning_rate": 1.3503881222704008e-06, "loss": 0.7472, "step": 7024 }, { "epoch": 0.84, "learning_rate": 1.3484502787878528e-06, "loss": 0.7829, "step": 7025 }, { "epoch": 0.84, "learning_rate": 1.3465137262038264e-06, "loss": 0.7282, "step": 7026 }, { "epoch": 0.84, "learning_rate": 1.3445784648072745e-06, "loss": 0.7009, "step": 7027 }, { "epoch": 0.84, "learning_rate": 1.3426444948869588e-06, "loss": 0.7109, "step": 7028 }, { "epoch": 0.84, "learning_rate": 1.3407118167314437e-06, "loss": 0.7109, "step": 7029 }, { "epoch": 0.84, "learning_rate": 1.3387804306291097e-06, "loss": 0.7048, "step": 7030 }, { "epoch": 0.84, "learning_rate": 1.3368503368681352e-06, "loss": 0.7081, "step": 7031 }, { "epoch": 0.84, "learning_rate": 1.3349215357365108e-06, "loss": 0.7779, "step": 7032 }, { "epoch": 0.84, "learning_rate": 1.3329940275220343e-06, "loss": 0.7305, "step": 7033 }, { "epoch": 0.84, "learning_rate": 1.3310678125123043e-06, "loss": 0.6987, "step": 7034 }, { "epoch": 0.84, "learning_rate": 1.329142890994739e-06, "loss": 0.7076, "step": 7035 }, { "epoch": 0.84, "learning_rate": 1.3272192632565517e-06, "loss": 0.7679, "step": 7036 }, { "epoch": 0.84, "learning_rate": 1.3252969295847672e-06, "loss": 0.7221, "step": 7037 }, { "epoch": 0.84, "learning_rate": 1.3233758902662164e-06, "loss": 0.6484, "step": 7038 }, { "epoch": 0.84, "learning_rate": 1.3214561455875408e-06, "loss": 0.7701, "step": 7039 }, { "epoch": 0.84, "learning_rate": 1.3195376958351835e-06, "loss": 0.7439, "step": 7040 }, { "epoch": 0.84, "learning_rate": 1.317620541295398e-06, "loss": 0.7015, "step": 7041 }, { "epoch": 0.84, "learning_rate": 1.3157046822542418e-06, "loss": 0.7031, "step": 7042 }, { "epoch": 0.84, "learning_rate": 1.3137901189975778e-06, "loss": 0.7584, "step": 7043 }, { "epoch": 0.84, "learning_rate": 1.3118768518110837e-06, "loss": 0.7232, "step": 7044 }, { "epoch": 0.84, "learning_rate": 1.3099648809802357e-06, "loss": 0.7288, "step": 7045 }, { "epoch": 0.84, "learning_rate": 1.308054206790319e-06, "loss": 0.74, "step": 7046 }, { "epoch": 0.84, "learning_rate": 1.3061448295264256e-06, "loss": 0.6816, "step": 7047 }, { "epoch": 0.84, "learning_rate": 1.304236749473451e-06, "loss": 0.7087, "step": 7048 }, { "epoch": 0.84, "learning_rate": 1.302329966916106e-06, "loss": 0.7176, "step": 7049 }, { "epoch": 0.84, "learning_rate": 1.3004244821388956e-06, "loss": 0.7455, "step": 7050 }, { "epoch": 0.84, "learning_rate": 1.2985202954261444e-06, "loss": 0.7489, "step": 7051 }, { "epoch": 0.84, "learning_rate": 1.2966174070619687e-06, "loss": 0.6429, "step": 7052 }, { "epoch": 0.84, "learning_rate": 1.2947158173303043e-06, "loss": 0.7227, "step": 7053 }, { "epoch": 0.84, "learning_rate": 1.2928155265148846e-06, "loss": 0.7081, "step": 7054 }, { "epoch": 0.84, "learning_rate": 1.2909165348992513e-06, "loss": 0.7349, "step": 7055 }, { "epoch": 0.84, "learning_rate": 1.2890188427667594e-06, "loss": 0.6526, "step": 7056 }, { "epoch": 0.84, "learning_rate": 1.287122450400554e-06, "loss": 0.7154, "step": 7057 }, { "epoch": 0.84, "learning_rate": 1.285227358083604e-06, "loss": 0.7478, "step": 7058 }, { "epoch": 0.84, "learning_rate": 1.2833335660986735e-06, "loss": 0.7651, "step": 7059 }, { "epoch": 0.84, "learning_rate": 1.2814410747283323e-06, "loss": 0.7227, "step": 7060 }, { "epoch": 0.84, "learning_rate": 1.279549884254968e-06, "loss": 0.7126, "step": 7061 }, { "epoch": 0.84, "learning_rate": 1.2776599949607537e-06, "loss": 0.7282, "step": 7062 }, { "epoch": 0.84, "learning_rate": 1.2757714071276884e-06, "loss": 0.6752, "step": 7063 }, { "epoch": 0.84, "learning_rate": 1.2738841210375652e-06, "loss": 0.7545, "step": 7064 }, { "epoch": 0.84, "learning_rate": 1.2719981369719858e-06, "loss": 0.7561, "step": 7065 }, { "epoch": 0.84, "learning_rate": 1.270113455212363e-06, "loss": 0.7031, "step": 7066 }, { "epoch": 0.84, "learning_rate": 1.2682300760399014e-06, "loss": 0.7796, "step": 7067 }, { "epoch": 0.84, "learning_rate": 1.2663479997356286e-06, "loss": 0.7333, "step": 7068 }, { "epoch": 0.84, "learning_rate": 1.2644672265803627e-06, "loss": 0.7533, "step": 7069 }, { "epoch": 0.84, "learning_rate": 1.2625877568547395e-06, "loss": 0.7254, "step": 7070 }, { "epoch": 0.84, "learning_rate": 1.2607095908391931e-06, "loss": 0.76, "step": 7071 }, { "epoch": 0.84, "learning_rate": 1.2588327288139646e-06, "loss": 0.7277, "step": 7072 }, { "epoch": 0.84, "learning_rate": 1.2569571710591e-06, "loss": 0.6981, "step": 7073 }, { "epoch": 0.84, "learning_rate": 1.2550829178544498e-06, "loss": 0.7427, "step": 7074 }, { "epoch": 0.84, "learning_rate": 1.2532099694796762e-06, "loss": 0.7835, "step": 7075 }, { "epoch": 0.84, "learning_rate": 1.2513383262142397e-06, "loss": 0.721, "step": 7076 }, { "epoch": 0.84, "learning_rate": 1.2494679883374084e-06, "loss": 0.6992, "step": 7077 }, { "epoch": 0.84, "learning_rate": 1.2475989561282543e-06, "loss": 0.7517, "step": 7078 }, { "epoch": 0.84, "learning_rate": 1.2457312298656555e-06, "loss": 0.6886, "step": 7079 }, { "epoch": 0.84, "learning_rate": 1.2438648098282978e-06, "loss": 0.7461, "step": 7080 }, { "epoch": 0.84, "learning_rate": 1.2419996962946701e-06, "loss": 0.7132, "step": 7081 }, { "epoch": 0.84, "learning_rate": 1.240135889543066e-06, "loss": 0.75, "step": 7082 }, { "epoch": 0.84, "learning_rate": 1.2382733898515798e-06, "loss": 0.6669, "step": 7083 }, { "epoch": 0.84, "learning_rate": 1.2364121974981215e-06, "loss": 0.6769, "step": 7084 }, { "epoch": 0.84, "learning_rate": 1.2345523127603976e-06, "loss": 0.7321, "step": 7085 }, { "epoch": 0.85, "learning_rate": 1.2326937359159208e-06, "loss": 0.726, "step": 7086 }, { "epoch": 0.85, "learning_rate": 1.2308364672420104e-06, "loss": 0.7333, "step": 7087 }, { "epoch": 0.85, "learning_rate": 1.2289805070157856e-06, "loss": 0.7115, "step": 7088 }, { "epoch": 0.85, "learning_rate": 1.2271258555141818e-06, "loss": 0.716, "step": 7089 }, { "epoch": 0.85, "learning_rate": 1.2252725130139266e-06, "loss": 0.7439, "step": 7090 }, { "epoch": 0.85, "learning_rate": 1.2234204797915594e-06, "loss": 0.7165, "step": 7091 }, { "epoch": 0.85, "learning_rate": 1.2215697561234219e-06, "loss": 0.7584, "step": 7092 }, { "epoch": 0.85, "learning_rate": 1.2197203422856575e-06, "loss": 0.721, "step": 7093 }, { "epoch": 0.85, "learning_rate": 1.217872238554223e-06, "loss": 0.6992, "step": 7094 }, { "epoch": 0.85, "learning_rate": 1.2160254452048703e-06, "loss": 0.7483, "step": 7095 }, { "epoch": 0.85, "learning_rate": 1.2141799625131623e-06, "loss": 0.6914, "step": 7096 }, { "epoch": 0.85, "learning_rate": 1.2123357907544608e-06, "loss": 0.7433, "step": 7097 }, { "epoch": 0.85, "learning_rate": 1.2104929302039347e-06, "loss": 0.7467, "step": 7098 }, { "epoch": 0.85, "learning_rate": 1.2086513811365609e-06, "loss": 0.7333, "step": 7099 }, { "epoch": 0.85, "learning_rate": 1.2068111438271123e-06, "loss": 0.7584, "step": 7100 }, { "epoch": 0.85, "learning_rate": 1.2049722185501777e-06, "loss": 0.7388, "step": 7101 }, { "epoch": 0.85, "learning_rate": 1.2031346055801363e-06, "loss": 0.7355, "step": 7102 }, { "epoch": 0.85, "learning_rate": 1.201298305191182e-06, "loss": 0.7165, "step": 7103 }, { "epoch": 0.85, "learning_rate": 1.199463317657309e-06, "loss": 0.7366, "step": 7104 }, { "epoch": 0.85, "learning_rate": 1.1976296432523138e-06, "loss": 0.7232, "step": 7105 }, { "epoch": 0.85, "learning_rate": 1.1957972822498054e-06, "loss": 0.7165, "step": 7106 }, { "epoch": 0.85, "learning_rate": 1.1939662349231817e-06, "loss": 0.716, "step": 7107 }, { "epoch": 0.85, "learning_rate": 1.1921365015456609e-06, "loss": 0.7266, "step": 7108 }, { "epoch": 0.85, "learning_rate": 1.1903080823902534e-06, "loss": 0.7143, "step": 7109 }, { "epoch": 0.85, "learning_rate": 1.1884809777297778e-06, "loss": 0.7098, "step": 7110 }, { "epoch": 0.85, "learning_rate": 1.1866551878368615e-06, "loss": 0.707, "step": 7111 }, { "epoch": 0.85, "learning_rate": 1.184830712983923e-06, "loss": 0.716, "step": 7112 }, { "epoch": 0.85, "learning_rate": 1.1830075534431985e-06, "loss": 0.7349, "step": 7113 }, { "epoch": 0.85, "learning_rate": 1.1811857094867174e-06, "loss": 0.7204, "step": 7114 }, { "epoch": 0.85, "learning_rate": 1.1793651813863227e-06, "loss": 0.6847, "step": 7115 }, { "epoch": 0.85, "learning_rate": 1.1775459694136538e-06, "loss": 0.7254, "step": 7116 }, { "epoch": 0.85, "learning_rate": 1.17572807384015e-06, "loss": 0.7048, "step": 7117 }, { "epoch": 0.85, "learning_rate": 1.1739114949370656e-06, "loss": 0.7165, "step": 7118 }, { "epoch": 0.85, "learning_rate": 1.172096232975448e-06, "loss": 0.7612, "step": 7119 }, { "epoch": 0.85, "learning_rate": 1.1702822882261588e-06, "loss": 0.7338, "step": 7120 }, { "epoch": 0.85, "learning_rate": 1.1684696609598522e-06, "loss": 0.7115, "step": 7121 }, { "epoch": 0.85, "learning_rate": 1.166658351446992e-06, "loss": 0.7076, "step": 7122 }, { "epoch": 0.85, "learning_rate": 1.1648483599578442e-06, "loss": 0.7533, "step": 7123 }, { "epoch": 0.85, "learning_rate": 1.1630396867624737e-06, "loss": 0.7243, "step": 7124 }, { "epoch": 0.85, "learning_rate": 1.1612323321307594e-06, "loss": 0.7266, "step": 7125 }, { "epoch": 0.85, "learning_rate": 1.1594262963323731e-06, "loss": 0.7109, "step": 7126 }, { "epoch": 0.85, "learning_rate": 1.157621579636794e-06, "loss": 0.7517, "step": 7127 }, { "epoch": 0.85, "learning_rate": 1.155818182313304e-06, "loss": 0.7238, "step": 7128 }, { "epoch": 0.85, "learning_rate": 1.154016104630986e-06, "loss": 0.6931, "step": 7129 }, { "epoch": 0.85, "learning_rate": 1.1522153468587338e-06, "loss": 0.6802, "step": 7130 }, { "epoch": 0.85, "learning_rate": 1.1504159092652334e-06, "loss": 0.6747, "step": 7131 }, { "epoch": 0.85, "learning_rate": 1.1486177921189824e-06, "loss": 0.6936, "step": 7132 }, { "epoch": 0.85, "learning_rate": 1.1468209956882736e-06, "loss": 0.7355, "step": 7133 }, { "epoch": 0.85, "learning_rate": 1.145025520241213e-06, "loss": 0.7188, "step": 7134 }, { "epoch": 0.85, "learning_rate": 1.1432313660457006e-06, "loss": 0.7288, "step": 7135 }, { "epoch": 0.85, "learning_rate": 1.1414385333694422e-06, "loss": 0.7556, "step": 7136 }, { "epoch": 0.85, "learning_rate": 1.1396470224799473e-06, "loss": 0.6496, "step": 7137 }, { "epoch": 0.85, "learning_rate": 1.137856833644525e-06, "loss": 0.7383, "step": 7138 }, { "epoch": 0.85, "learning_rate": 1.136067967130292e-06, "loss": 0.733, "step": 7139 }, { "epoch": 0.85, "learning_rate": 1.134280423204166e-06, "loss": 0.6713, "step": 7140 }, { "epoch": 0.85, "learning_rate": 1.1324942021328655e-06, "loss": 0.7288, "step": 7141 }, { "epoch": 0.85, "learning_rate": 1.130709304182912e-06, "loss": 0.6914, "step": 7142 }, { "epoch": 0.85, "learning_rate": 1.128925729620629e-06, "loss": 0.7366, "step": 7143 }, { "epoch": 0.85, "learning_rate": 1.1271434787121471e-06, "loss": 0.7439, "step": 7144 }, { "epoch": 0.85, "learning_rate": 1.1253625517233935e-06, "loss": 0.7706, "step": 7145 }, { "epoch": 0.85, "learning_rate": 1.1235829489201045e-06, "loss": 0.6908, "step": 7146 }, { "epoch": 0.85, "learning_rate": 1.1218046705678109e-06, "loss": 0.6903, "step": 7147 }, { "epoch": 0.85, "learning_rate": 1.1200277169318485e-06, "loss": 0.6557, "step": 7148 }, { "epoch": 0.85, "learning_rate": 1.1182520882773607e-06, "loss": 0.7003, "step": 7149 }, { "epoch": 0.85, "learning_rate": 1.1164777848692855e-06, "loss": 0.683, "step": 7150 }, { "epoch": 0.85, "learning_rate": 1.1147048069723732e-06, "loss": 0.75, "step": 7151 }, { "epoch": 0.85, "learning_rate": 1.1129331548511613e-06, "loss": 0.7394, "step": 7152 }, { "epoch": 0.85, "learning_rate": 1.111162828770005e-06, "loss": 0.7874, "step": 7153 }, { "epoch": 0.85, "learning_rate": 1.1093938289930517e-06, "loss": 0.7054, "step": 7154 }, { "epoch": 0.85, "learning_rate": 1.1076261557842537e-06, "loss": 0.702, "step": 7155 }, { "epoch": 0.85, "learning_rate": 1.105859809407368e-06, "loss": 0.7271, "step": 7156 }, { "epoch": 0.85, "learning_rate": 1.1040947901259503e-06, "loss": 0.7344, "step": 7157 }, { "epoch": 0.85, "learning_rate": 1.1023310982033586e-06, "loss": 0.7154, "step": 7158 }, { "epoch": 0.85, "learning_rate": 1.1005687339027538e-06, "loss": 0.6585, "step": 7159 }, { "epoch": 0.85, "learning_rate": 1.0988076974870965e-06, "loss": 0.6847, "step": 7160 }, { "epoch": 0.85, "learning_rate": 1.0970479892191555e-06, "loss": 0.7701, "step": 7161 }, { "epoch": 0.85, "learning_rate": 1.095289609361495e-06, "loss": 0.6741, "step": 7162 }, { "epoch": 0.85, "learning_rate": 1.0935325581764822e-06, "loss": 0.803, "step": 7163 }, { "epoch": 0.85, "learning_rate": 1.0917768359262847e-06, "loss": 0.7188, "step": 7164 }, { "epoch": 0.85, "learning_rate": 1.090022442872879e-06, "loss": 0.7422, "step": 7165 }, { "epoch": 0.85, "learning_rate": 1.0882693792780362e-06, "loss": 0.6747, "step": 7166 }, { "epoch": 0.85, "learning_rate": 1.086517645403331e-06, "loss": 0.7545, "step": 7167 }, { "epoch": 0.85, "learning_rate": 1.0847672415101396e-06, "loss": 0.7232, "step": 7168 }, { "epoch": 0.85, "learning_rate": 1.0830181678596374e-06, "loss": 0.7143, "step": 7169 }, { "epoch": 0.86, "learning_rate": 1.081270424712808e-06, "loss": 0.7679, "step": 7170 }, { "epoch": 0.86, "learning_rate": 1.0795240123304308e-06, "loss": 0.7232, "step": 7171 }, { "epoch": 0.86, "learning_rate": 1.0777789309730879e-06, "loss": 0.7494, "step": 7172 }, { "epoch": 0.86, "learning_rate": 1.0760351809011637e-06, "loss": 0.7718, "step": 7173 }, { "epoch": 0.86, "learning_rate": 1.07429276237484e-06, "loss": 0.7215, "step": 7174 }, { "epoch": 0.86, "learning_rate": 1.0725516756541077e-06, "loss": 0.644, "step": 7175 }, { "epoch": 0.86, "learning_rate": 1.0708119209987512e-06, "loss": 0.7271, "step": 7176 }, { "epoch": 0.86, "learning_rate": 1.0690734986683648e-06, "loss": 0.7115, "step": 7177 }, { "epoch": 0.86, "learning_rate": 1.0673364089223336e-06, "loss": 0.7176, "step": 7178 }, { "epoch": 0.86, "learning_rate": 1.0656006520198469e-06, "loss": 0.7383, "step": 7179 }, { "epoch": 0.86, "learning_rate": 1.0638662282199041e-06, "loss": 0.7506, "step": 7180 }, { "epoch": 0.86, "learning_rate": 1.0621331377812915e-06, "loss": 0.7037, "step": 7181 }, { "epoch": 0.86, "learning_rate": 1.0604013809626123e-06, "loss": 0.7243, "step": 7182 }, { "epoch": 0.86, "learning_rate": 1.058670958022252e-06, "loss": 0.6769, "step": 7183 }, { "epoch": 0.86, "learning_rate": 1.0569418692184142e-06, "loss": 0.6981, "step": 7184 }, { "epoch": 0.86, "learning_rate": 1.0552141148090954e-06, "loss": 0.7148, "step": 7185 }, { "epoch": 0.86, "learning_rate": 1.05348769505209e-06, "loss": 0.7054, "step": 7186 }, { "epoch": 0.86, "learning_rate": 1.051762610205005e-06, "loss": 0.6797, "step": 7187 }, { "epoch": 0.86, "learning_rate": 1.050038860525231e-06, "loss": 0.7215, "step": 7188 }, { "epoch": 0.86, "learning_rate": 1.0483164462699758e-06, "loss": 0.745, "step": 7189 }, { "epoch": 0.86, "learning_rate": 1.0465953676962392e-06, "loss": 0.7405, "step": 7190 }, { "epoch": 0.86, "learning_rate": 1.0448756250608205e-06, "loss": 0.7606, "step": 7191 }, { "epoch": 0.86, "learning_rate": 1.0431572186203287e-06, "loss": 0.7494, "step": 7192 }, { "epoch": 0.86, "learning_rate": 1.0414401486311599e-06, "loss": 0.6507, "step": 7193 }, { "epoch": 0.86, "learning_rate": 1.0397244153495255e-06, "loss": 0.7718, "step": 7194 }, { "epoch": 0.86, "learning_rate": 1.0380100190314235e-06, "loss": 0.7355, "step": 7195 }, { "epoch": 0.86, "learning_rate": 1.0362969599326655e-06, "loss": 0.7271, "step": 7196 }, { "epoch": 0.86, "learning_rate": 1.0345852383088539e-06, "loss": 0.7416, "step": 7197 }, { "epoch": 0.86, "learning_rate": 1.0328748544153955e-06, "loss": 0.6161, "step": 7198 }, { "epoch": 0.86, "learning_rate": 1.031165808507496e-06, "loss": 0.7087, "step": 7199 }, { "epoch": 0.86, "learning_rate": 1.0294581008401604e-06, "loss": 0.6936, "step": 7200 }, { "epoch": 0.86, "learning_rate": 1.0277517316682017e-06, "loss": 0.7327, "step": 7201 }, { "epoch": 0.86, "learning_rate": 1.026046701246224e-06, "loss": 0.6398, "step": 7202 }, { "epoch": 0.86, "learning_rate": 1.0243430098286345e-06, "loss": 0.779, "step": 7203 }, { "epoch": 0.86, "learning_rate": 1.0226406576696413e-06, "loss": 0.7254, "step": 7204 }, { "epoch": 0.86, "learning_rate": 1.0209396450232512e-06, "loss": 0.7148, "step": 7205 }, { "epoch": 0.86, "learning_rate": 1.0192399721432765e-06, "loss": 0.6825, "step": 7206 }, { "epoch": 0.86, "learning_rate": 1.0175416392833238e-06, "loss": 0.7048, "step": 7207 }, { "epoch": 0.86, "learning_rate": 1.0158446466967996e-06, "loss": 0.745, "step": 7208 }, { "epoch": 0.86, "learning_rate": 1.0141489946369154e-06, "loss": 0.707, "step": 7209 }, { "epoch": 0.86, "learning_rate": 1.012454683356674e-06, "loss": 0.7729, "step": 7210 }, { "epoch": 0.86, "learning_rate": 1.010761713108891e-06, "loss": 0.7695, "step": 7211 }, { "epoch": 0.86, "learning_rate": 1.009070084146171e-06, "loss": 0.74, "step": 7212 }, { "epoch": 0.86, "learning_rate": 1.007379796720922e-06, "loss": 0.7539, "step": 7213 }, { "epoch": 0.86, "learning_rate": 1.0056908510853514e-06, "loss": 0.7215, "step": 7214 }, { "epoch": 0.86, "learning_rate": 1.0040032474914685e-06, "loss": 0.678, "step": 7215 }, { "epoch": 0.86, "learning_rate": 1.0023169861910808e-06, "loss": 0.7656, "step": 7216 }, { "epoch": 0.86, "learning_rate": 1.000632067435795e-06, "loss": 0.6881, "step": 7217 }, { "epoch": 0.86, "learning_rate": 9.989484914770175e-07, "loss": 0.7444, "step": 7218 }, { "epoch": 0.86, "learning_rate": 9.97266258565953e-07, "loss": 0.6629, "step": 7219 }, { "epoch": 0.86, "learning_rate": 9.95585368953612e-07, "loss": 0.736, "step": 7220 }, { "epoch": 0.86, "learning_rate": 9.939058228907984e-07, "loss": 0.726, "step": 7221 }, { "epoch": 0.86, "learning_rate": 9.922276206281156e-07, "loss": 0.6724, "step": 7222 }, { "epoch": 0.86, "learning_rate": 9.905507624159715e-07, "loss": 0.7617, "step": 7223 }, { "epoch": 0.86, "learning_rate": 9.88875248504565e-07, "loss": 0.7171, "step": 7224 }, { "epoch": 0.86, "learning_rate": 9.872010791439057e-07, "loss": 0.7455, "step": 7225 }, { "epoch": 0.86, "learning_rate": 9.85528254583793e-07, "loss": 0.75, "step": 7226 }, { "epoch": 0.86, "learning_rate": 9.838567750738325e-07, "loss": 0.7059, "step": 7227 }, { "epoch": 0.86, "learning_rate": 9.821866408634206e-07, "loss": 0.7249, "step": 7228 }, { "epoch": 0.86, "learning_rate": 9.805178522017621e-07, "loss": 0.731, "step": 7229 }, { "epoch": 0.86, "learning_rate": 9.78850409337857e-07, "loss": 0.7411, "step": 7230 }, { "epoch": 0.86, "learning_rate": 9.771843125205015e-07, "loss": 0.7427, "step": 7231 }, { "epoch": 0.86, "learning_rate": 9.755195619983005e-07, "loss": 0.7271, "step": 7232 }, { "epoch": 0.86, "learning_rate": 9.738561580196436e-07, "loss": 0.7327, "step": 7233 }, { "epoch": 0.86, "learning_rate": 9.721941008327329e-07, "loss": 0.6518, "step": 7234 }, { "epoch": 0.86, "learning_rate": 9.705333906855619e-07, "loss": 0.7338, "step": 7235 }, { "epoch": 0.86, "learning_rate": 9.688740278259245e-07, "loss": 0.6669, "step": 7236 }, { "epoch": 0.86, "learning_rate": 9.672160125014197e-07, "loss": 0.7026, "step": 7237 }, { "epoch": 0.86, "learning_rate": 9.655593449594313e-07, "loss": 0.7461, "step": 7238 }, { "epoch": 0.86, "learning_rate": 9.639040254471587e-07, "loss": 0.7439, "step": 7239 }, { "epoch": 0.86, "learning_rate": 9.622500542115886e-07, "loss": 0.6836, "step": 7240 }, { "epoch": 0.86, "learning_rate": 9.605974314995092e-07, "loss": 0.7427, "step": 7241 }, { "epoch": 0.86, "learning_rate": 9.589461575575131e-07, "loss": 0.697, "step": 7242 }, { "epoch": 0.86, "learning_rate": 9.572962326319813e-07, "loss": 0.7422, "step": 7243 }, { "epoch": 0.86, "learning_rate": 9.556476569691032e-07, "loss": 0.7171, "step": 7244 }, { "epoch": 0.86, "learning_rate": 9.540004308148598e-07, "loss": 0.7377, "step": 7245 }, { "epoch": 0.86, "learning_rate": 9.523545544150381e-07, "loss": 0.7612, "step": 7246 }, { "epoch": 0.86, "learning_rate": 9.507100280152171e-07, "loss": 0.7634, "step": 7247 }, { "epoch": 0.86, "learning_rate": 9.490668518607759e-07, "loss": 0.7271, "step": 7248 }, { "epoch": 0.86, "learning_rate": 9.474250261968953e-07, "loss": 0.6719, "step": 7249 }, { "epoch": 0.86, "learning_rate": 9.457845512685482e-07, "loss": 0.7366, "step": 7250 }, { "epoch": 0.86, "learning_rate": 9.441454273205142e-07, "loss": 0.7913, "step": 7251 }, { "epoch": 0.86, "learning_rate": 9.425076545973654e-07, "loss": 0.7623, "step": 7252 }, { "epoch": 0.86, "learning_rate": 9.408712333434744e-07, "loss": 0.7288, "step": 7253 }, { "epoch": 0.87, "learning_rate": 9.392361638030123e-07, "loss": 0.6908, "step": 7254 }, { "epoch": 0.87, "learning_rate": 9.37602446219944e-07, "loss": 0.721, "step": 7255 }, { "epoch": 0.87, "learning_rate": 9.359700808380423e-07, "loss": 0.7081, "step": 7256 }, { "epoch": 0.87, "learning_rate": 9.343390679008702e-07, "loss": 0.7388, "step": 7257 }, { "epoch": 0.87, "learning_rate": 9.327094076517918e-07, "loss": 0.6886, "step": 7258 }, { "epoch": 0.87, "learning_rate": 9.310811003339659e-07, "loss": 0.6791, "step": 7259 }, { "epoch": 0.87, "learning_rate": 9.294541461903561e-07, "loss": 0.6797, "step": 7260 }, { "epoch": 0.87, "learning_rate": 9.278285454637204e-07, "loss": 0.6948, "step": 7261 }, { "epoch": 0.87, "learning_rate": 9.262042983966124e-07, "loss": 0.7762, "step": 7262 }, { "epoch": 0.87, "learning_rate": 9.245814052313873e-07, "loss": 0.736, "step": 7263 }, { "epoch": 0.87, "learning_rate": 9.229598662101946e-07, "loss": 0.7294, "step": 7264 }, { "epoch": 0.87, "learning_rate": 9.213396815749898e-07, "loss": 0.745, "step": 7265 }, { "epoch": 0.87, "learning_rate": 9.197208515675172e-07, "loss": 0.6724, "step": 7266 }, { "epoch": 0.87, "learning_rate": 9.181033764293234e-07, "loss": 0.7852, "step": 7267 }, { "epoch": 0.87, "learning_rate": 9.164872564017513e-07, "loss": 0.6306, "step": 7268 }, { "epoch": 0.87, "learning_rate": 9.148724917259411e-07, "loss": 0.6652, "step": 7269 }, { "epoch": 0.87, "learning_rate": 9.132590826428356e-07, "loss": 0.7846, "step": 7270 }, { "epoch": 0.87, "learning_rate": 9.11647029393169e-07, "loss": 0.7199, "step": 7271 }, { "epoch": 0.87, "learning_rate": 9.100363322174777e-07, "loss": 0.7121, "step": 7272 }, { "epoch": 0.87, "learning_rate": 9.084269913560928e-07, "loss": 0.7388, "step": 7273 }, { "epoch": 0.87, "learning_rate": 9.068190070491423e-07, "loss": 0.7561, "step": 7274 }, { "epoch": 0.87, "learning_rate": 9.052123795365563e-07, "loss": 0.7243, "step": 7275 }, { "epoch": 0.87, "learning_rate": 9.036071090580589e-07, "loss": 0.6931, "step": 7276 }, { "epoch": 0.87, "learning_rate": 9.020031958531761e-07, "loss": 0.7405, "step": 7277 }, { "epoch": 0.87, "learning_rate": 9.00400640161222e-07, "loss": 0.7188, "step": 7278 }, { "epoch": 0.87, "learning_rate": 8.987994422213175e-07, "loss": 0.707, "step": 7279 }, { "epoch": 0.87, "learning_rate": 8.971996022723784e-07, "loss": 0.7556, "step": 7280 }, { "epoch": 0.87, "learning_rate": 8.956011205531123e-07, "loss": 0.755, "step": 7281 }, { "epoch": 0.87, "learning_rate": 8.940039973020364e-07, "loss": 0.7249, "step": 7282 }, { "epoch": 0.87, "learning_rate": 8.924082327574491e-07, "loss": 0.7706, "step": 7283 }, { "epoch": 0.87, "learning_rate": 8.908138271574607e-07, "loss": 0.7154, "step": 7284 }, { "epoch": 0.87, "learning_rate": 8.8922078073997e-07, "loss": 0.731, "step": 7285 }, { "epoch": 0.87, "learning_rate": 8.876290937426746e-07, "loss": 0.7556, "step": 7286 }, { "epoch": 0.87, "learning_rate": 8.860387664030756e-07, "loss": 0.7718, "step": 7287 }, { "epoch": 0.87, "learning_rate": 8.844497989584588e-07, "loss": 0.7321, "step": 7288 }, { "epoch": 0.87, "learning_rate": 8.828621916459191e-07, "loss": 0.7143, "step": 7289 }, { "epoch": 0.87, "learning_rate": 8.8127594470234e-07, "loss": 0.6825, "step": 7290 }, { "epoch": 0.87, "learning_rate": 8.796910583644091e-07, "loss": 0.7249, "step": 7291 }, { "epoch": 0.87, "learning_rate": 8.781075328686084e-07, "loss": 0.716, "step": 7292 }, { "epoch": 0.87, "learning_rate": 8.765253684512087e-07, "loss": 0.7623, "step": 7293 }, { "epoch": 0.87, "learning_rate": 8.749445653482913e-07, "loss": 0.7366, "step": 7294 }, { "epoch": 0.87, "learning_rate": 8.733651237957253e-07, "loss": 0.6758, "step": 7295 }, { "epoch": 0.87, "learning_rate": 8.717870440291809e-07, "loss": 0.7015, "step": 7296 }, { "epoch": 0.87, "learning_rate": 8.702103262841233e-07, "loss": 0.7606, "step": 7297 }, { "epoch": 0.87, "learning_rate": 8.686349707958142e-07, "loss": 0.7121, "step": 7298 }, { "epoch": 0.87, "learning_rate": 8.670609777993122e-07, "loss": 0.7807, "step": 7299 }, { "epoch": 0.87, "learning_rate": 8.654883475294717e-07, "loss": 0.7506, "step": 7300 }, { "epoch": 0.87, "learning_rate": 8.639170802209485e-07, "loss": 0.7472, "step": 7301 }, { "epoch": 0.87, "learning_rate": 8.623471761081903e-07, "loss": 0.7394, "step": 7302 }, { "epoch": 0.87, "learning_rate": 8.60778635425441e-07, "loss": 0.7143, "step": 7303 }, { "epoch": 0.87, "learning_rate": 8.592114584067434e-07, "loss": 0.7254, "step": 7304 }, { "epoch": 0.87, "learning_rate": 8.57645645285935e-07, "loss": 0.7277, "step": 7305 }, { "epoch": 0.87, "learning_rate": 8.560811962966543e-07, "loss": 0.6936, "step": 7306 }, { "epoch": 0.87, "learning_rate": 8.545181116723311e-07, "loss": 0.7048, "step": 7307 }, { "epoch": 0.87, "learning_rate": 8.529563916461925e-07, "loss": 0.7009, "step": 7308 }, { "epoch": 0.87, "learning_rate": 8.513960364512619e-07, "loss": 0.7506, "step": 7309 }, { "epoch": 0.87, "learning_rate": 8.498370463203642e-07, "loss": 0.7539, "step": 7310 }, { "epoch": 0.87, "learning_rate": 8.482794214861135e-07, "loss": 0.7015, "step": 7311 }, { "epoch": 0.87, "learning_rate": 8.467231621809235e-07, "loss": 0.7188, "step": 7312 }, { "epoch": 0.87, "learning_rate": 8.451682686370032e-07, "loss": 0.7076, "step": 7313 }, { "epoch": 0.87, "learning_rate": 8.436147410863583e-07, "loss": 0.6959, "step": 7314 }, { "epoch": 0.87, "learning_rate": 8.420625797607929e-07, "loss": 0.7444, "step": 7315 }, { "epoch": 0.87, "learning_rate": 8.405117848919042e-07, "loss": 0.7227, "step": 7316 }, { "epoch": 0.87, "learning_rate": 8.38962356711086e-07, "loss": 0.7338, "step": 7317 }, { "epoch": 0.87, "learning_rate": 8.374142954495291e-07, "loss": 0.7171, "step": 7318 }, { "epoch": 0.87, "learning_rate": 8.358676013382161e-07, "loss": 0.6585, "step": 7319 }, { "epoch": 0.87, "learning_rate": 8.34322274607936e-07, "loss": 0.6897, "step": 7320 }, { "epoch": 0.87, "learning_rate": 8.32778315489261e-07, "loss": 0.7405, "step": 7321 }, { "epoch": 0.87, "learning_rate": 8.312357242125724e-07, "loss": 0.7946, "step": 7322 }, { "epoch": 0.87, "learning_rate": 8.296945010080349e-07, "loss": 0.7612, "step": 7323 }, { "epoch": 0.87, "learning_rate": 8.281546461056133e-07, "loss": 0.7656, "step": 7324 }, { "epoch": 0.87, "learning_rate": 8.266161597350742e-07, "loss": 0.6724, "step": 7325 }, { "epoch": 0.87, "learning_rate": 8.250790421259713e-07, "loss": 0.7081, "step": 7326 }, { "epoch": 0.87, "learning_rate": 8.235432935076638e-07, "loss": 0.7246, "step": 7327 }, { "epoch": 0.87, "learning_rate": 8.220089141092935e-07, "loss": 0.7171, "step": 7328 }, { "epoch": 0.87, "learning_rate": 8.204759041598098e-07, "loss": 0.7254, "step": 7329 }, { "epoch": 0.87, "learning_rate": 8.18944263887953e-07, "loss": 0.6769, "step": 7330 }, { "epoch": 0.87, "learning_rate": 8.174139935222558e-07, "loss": 0.6931, "step": 7331 }, { "epoch": 0.87, "learning_rate": 8.158850932910578e-07, "loss": 0.7517, "step": 7332 }, { "epoch": 0.87, "learning_rate": 8.143575634224765e-07, "loss": 0.7042, "step": 7333 }, { "epoch": 0.87, "learning_rate": 8.128314041444418e-07, "loss": 0.7595, "step": 7334 }, { "epoch": 0.87, "learning_rate": 8.113066156846694e-07, "loss": 0.7266, "step": 7335 }, { "epoch": 0.87, "learning_rate": 8.097831982706716e-07, "loss": 0.7109, "step": 7336 }, { "epoch": 0.88, "learning_rate": 8.082611521297634e-07, "loss": 0.7427, "step": 7337 }, { "epoch": 0.88, "learning_rate": 8.067404774890431e-07, "loss": 0.692, "step": 7338 }, { "epoch": 0.88, "learning_rate": 8.052211745754135e-07, "loss": 0.7612, "step": 7339 }, { "epoch": 0.88, "learning_rate": 8.03703243615569e-07, "loss": 0.7182, "step": 7340 }, { "epoch": 0.88, "learning_rate": 8.021866848360016e-07, "loss": 0.716, "step": 7341 }, { "epoch": 0.88, "learning_rate": 8.006714984629971e-07, "loss": 0.7422, "step": 7342 }, { "epoch": 0.88, "learning_rate": 7.991576847226357e-07, "loss": 0.7282, "step": 7343 }, { "epoch": 0.88, "learning_rate": 7.976452438407934e-07, "loss": 0.6892, "step": 7344 }, { "epoch": 0.88, "learning_rate": 7.961341760431418e-07, "loss": 0.7081, "step": 7345 }, { "epoch": 0.88, "learning_rate": 7.946244815551485e-07, "loss": 0.7494, "step": 7346 }, { "epoch": 0.88, "learning_rate": 7.931161606020743e-07, "loss": 0.7522, "step": 7347 }, { "epoch": 0.88, "learning_rate": 7.91609213408977e-07, "loss": 0.7517, "step": 7348 }, { "epoch": 0.88, "learning_rate": 7.901036402007067e-07, "loss": 0.7377, "step": 7349 }, { "epoch": 0.88, "learning_rate": 7.885994412019093e-07, "loss": 0.6914, "step": 7350 }, { "epoch": 0.88, "learning_rate": 7.870966166370297e-07, "loss": 0.6936, "step": 7351 }, { "epoch": 0.88, "learning_rate": 7.855951667303008e-07, "loss": 0.7065, "step": 7352 }, { "epoch": 0.88, "learning_rate": 7.840950917057599e-07, "loss": 0.6975, "step": 7353 }, { "epoch": 0.88, "learning_rate": 7.82596391787227e-07, "loss": 0.6892, "step": 7354 }, { "epoch": 0.88, "learning_rate": 7.810990671983254e-07, "loss": 0.7589, "step": 7355 }, { "epoch": 0.88, "learning_rate": 7.796031181624719e-07, "loss": 0.7461, "step": 7356 }, { "epoch": 0.88, "learning_rate": 7.781085449028758e-07, "loss": 0.673, "step": 7357 }, { "epoch": 0.88, "learning_rate": 7.766153476425465e-07, "loss": 0.7288, "step": 7358 }, { "epoch": 0.88, "learning_rate": 7.751235266042767e-07, "loss": 0.7009, "step": 7359 }, { "epoch": 0.88, "learning_rate": 7.736330820106685e-07, "loss": 0.7017, "step": 7360 }, { "epoch": 0.88, "learning_rate": 7.721440140841075e-07, "loss": 0.7243, "step": 7361 }, { "epoch": 0.88, "learning_rate": 7.706563230467767e-07, "loss": 0.6786, "step": 7362 }, { "epoch": 0.88, "learning_rate": 7.6917000912066e-07, "loss": 0.7333, "step": 7363 }, { "epoch": 0.88, "learning_rate": 7.676850725275232e-07, "loss": 0.6836, "step": 7364 }, { "epoch": 0.88, "learning_rate": 7.662015134889389e-07, "loss": 0.6897, "step": 7365 }, { "epoch": 0.88, "learning_rate": 7.64719332226267e-07, "loss": 0.7489, "step": 7366 }, { "epoch": 0.88, "learning_rate": 7.632385289606636e-07, "loss": 0.7768, "step": 7367 }, { "epoch": 0.88, "learning_rate": 7.617591039130833e-07, "loss": 0.7383, "step": 7368 }, { "epoch": 0.88, "learning_rate": 7.602810573042652e-07, "loss": 0.784, "step": 7369 }, { "epoch": 0.88, "learning_rate": 7.588043893547525e-07, "loss": 0.6987, "step": 7370 }, { "epoch": 0.88, "learning_rate": 7.573291002848782e-07, "loss": 0.7388, "step": 7371 }, { "epoch": 0.88, "learning_rate": 7.558551903147704e-07, "loss": 0.7829, "step": 7372 }, { "epoch": 0.88, "learning_rate": 7.543826596643522e-07, "loss": 0.7148, "step": 7373 }, { "epoch": 0.88, "learning_rate": 7.529115085533401e-07, "loss": 0.772, "step": 7374 }, { "epoch": 0.88, "learning_rate": 7.514417372012428e-07, "loss": 0.7506, "step": 7375 }, { "epoch": 0.88, "learning_rate": 7.499733458273639e-07, "loss": 0.7511, "step": 7376 }, { "epoch": 0.88, "learning_rate": 7.48506334650807e-07, "loss": 0.7042, "step": 7377 }, { "epoch": 0.88, "learning_rate": 7.470407038904614e-07, "loss": 0.7277, "step": 7378 }, { "epoch": 0.88, "learning_rate": 7.455764537650156e-07, "loss": 0.7048, "step": 7379 }, { "epoch": 0.88, "learning_rate": 7.441135844929493e-07, "loss": 0.7447, "step": 7380 }, { "epoch": 0.88, "learning_rate": 7.426520962925354e-07, "loss": 0.7148, "step": 7381 }, { "epoch": 0.88, "learning_rate": 7.411919893818486e-07, "loss": 0.7651, "step": 7382 }, { "epoch": 0.88, "learning_rate": 7.397332639787469e-07, "loss": 0.7026, "step": 7383 }, { "epoch": 0.88, "learning_rate": 7.382759203008882e-07, "loss": 0.6864, "step": 7384 }, { "epoch": 0.88, "learning_rate": 7.368199585657232e-07, "loss": 0.6744, "step": 7385 }, { "epoch": 0.88, "learning_rate": 7.353653789904924e-07, "loss": 0.7913, "step": 7386 }, { "epoch": 0.88, "learning_rate": 7.339121817922401e-07, "loss": 0.6981, "step": 7387 }, { "epoch": 0.88, "learning_rate": 7.32460367187795e-07, "loss": 0.7785, "step": 7388 }, { "epoch": 0.88, "learning_rate": 7.310099353937816e-07, "loss": 0.6953, "step": 7389 }, { "epoch": 0.88, "learning_rate": 7.29560886626618e-07, "loss": 0.7327, "step": 7390 }, { "epoch": 0.88, "learning_rate": 7.28113221102521e-07, "loss": 0.7377, "step": 7391 }, { "epoch": 0.88, "learning_rate": 7.266669390374936e-07, "loss": 0.7522, "step": 7392 }, { "epoch": 0.88, "learning_rate": 7.252220406473376e-07, "loss": 0.6791, "step": 7393 }, { "epoch": 0.88, "learning_rate": 7.237785261476449e-07, "loss": 0.6641, "step": 7394 }, { "epoch": 0.88, "learning_rate": 7.22336395753801e-07, "loss": 0.7282, "step": 7395 }, { "epoch": 0.88, "learning_rate": 7.208956496809893e-07, "loss": 0.7461, "step": 7396 }, { "epoch": 0.88, "learning_rate": 7.194562881441835e-07, "loss": 0.7383, "step": 7397 }, { "epoch": 0.88, "learning_rate": 7.180183113581507e-07, "loss": 0.6691, "step": 7398 }, { "epoch": 0.88, "learning_rate": 7.165817195374492e-07, "loss": 0.7472, "step": 7399 }, { "epoch": 0.88, "learning_rate": 7.151465128964341e-07, "loss": 0.7333, "step": 7400 }, { "epoch": 0.88, "learning_rate": 7.137126916492543e-07, "loss": 0.6808, "step": 7401 }, { "epoch": 0.88, "learning_rate": 7.122802560098474e-07, "loss": 0.7277, "step": 7402 }, { "epoch": 0.88, "learning_rate": 7.108492061919537e-07, "loss": 0.6875, "step": 7403 }, { "epoch": 0.88, "learning_rate": 7.094195424090911e-07, "loss": 0.7349, "step": 7404 }, { "epoch": 0.88, "learning_rate": 7.079912648745868e-07, "loss": 0.678, "step": 7405 }, { "epoch": 0.88, "learning_rate": 7.065643738015515e-07, "loss": 0.736, "step": 7406 }, { "epoch": 0.88, "learning_rate": 7.051388694028905e-07, "loss": 0.7115, "step": 7407 }, { "epoch": 0.88, "learning_rate": 7.03714751891309e-07, "loss": 0.6903, "step": 7408 }, { "epoch": 0.88, "learning_rate": 7.022920214792927e-07, "loss": 0.7037, "step": 7409 }, { "epoch": 0.88, "learning_rate": 7.008706783791309e-07, "loss": 0.7355, "step": 7410 }, { "epoch": 0.88, "learning_rate": 6.994507228029024e-07, "loss": 0.6987, "step": 7411 }, { "epoch": 0.88, "learning_rate": 6.98032154962478e-07, "loss": 0.7288, "step": 7412 }, { "epoch": 0.88, "learning_rate": 6.966149750695239e-07, "loss": 0.7266, "step": 7413 }, { "epoch": 0.88, "learning_rate": 6.951991833354943e-07, "loss": 0.6473, "step": 7414 }, { "epoch": 0.88, "learning_rate": 6.937847799716435e-07, "loss": 0.6501, "step": 7415 }, { "epoch": 0.88, "learning_rate": 6.923717651890128e-07, "loss": 0.7048, "step": 7416 }, { "epoch": 0.88, "learning_rate": 6.909601391984366e-07, "loss": 0.702, "step": 7417 }, { "epoch": 0.88, "learning_rate": 6.8954990221055e-07, "loss": 0.7076, "step": 7418 }, { "epoch": 0.88, "learning_rate": 6.881410544357658e-07, "loss": 0.6674, "step": 7419 }, { "epoch": 0.88, "learning_rate": 6.867335960843047e-07, "loss": 0.6836, "step": 7420 }, { "epoch": 0.89, "learning_rate": 6.853275273661708e-07, "loss": 0.7355, "step": 7421 }, { "epoch": 0.89, "learning_rate": 6.839228484911653e-07, "loss": 0.7271, "step": 7422 }, { "epoch": 0.89, "learning_rate": 6.825195596688794e-07, "loss": 0.7009, "step": 7423 }, { "epoch": 0.89, "learning_rate": 6.811176611087e-07, "loss": 0.6814, "step": 7424 }, { "epoch": 0.89, "learning_rate": 6.79717153019801e-07, "loss": 0.7338, "step": 7425 }, { "epoch": 0.89, "learning_rate": 6.783180356111541e-07, "loss": 0.7148, "step": 7426 }, { "epoch": 0.89, "learning_rate": 6.769203090915233e-07, "loss": 0.7271, "step": 7427 }, { "epoch": 0.89, "learning_rate": 6.755239736694619e-07, "loss": 0.7405, "step": 7428 }, { "epoch": 0.89, "learning_rate": 6.741290295533165e-07, "loss": 0.7539, "step": 7429 }, { "epoch": 0.89, "learning_rate": 6.727354769512285e-07, "loss": 0.7299, "step": 7430 }, { "epoch": 0.89, "learning_rate": 6.71343316071128e-07, "loss": 0.6981, "step": 7431 }, { "epoch": 0.89, "learning_rate": 6.699525471207413e-07, "loss": 0.6735, "step": 7432 }, { "epoch": 0.89, "learning_rate": 6.685631703075857e-07, "loss": 0.692, "step": 7433 }, { "epoch": 0.89, "learning_rate": 6.671751858389686e-07, "loss": 0.7333, "step": 7434 }, { "epoch": 0.89, "learning_rate": 6.657885939219899e-07, "loss": 0.6551, "step": 7435 }, { "epoch": 0.89, "learning_rate": 6.644033947635476e-07, "loss": 0.7059, "step": 7436 }, { "epoch": 0.89, "learning_rate": 6.630195885703239e-07, "loss": 0.7104, "step": 7437 }, { "epoch": 0.89, "learning_rate": 6.616371755487971e-07, "loss": 0.7517, "step": 7438 }, { "epoch": 0.89, "learning_rate": 6.602561559052378e-07, "loss": 0.6685, "step": 7439 }, { "epoch": 0.89, "learning_rate": 6.588765298457067e-07, "loss": 0.6908, "step": 7440 }, { "epoch": 0.89, "learning_rate": 6.574982975760613e-07, "loss": 0.7377, "step": 7441 }, { "epoch": 0.89, "learning_rate": 6.561214593019449e-07, "loss": 0.6956, "step": 7442 }, { "epoch": 0.89, "learning_rate": 6.547460152287965e-07, "loss": 0.7227, "step": 7443 }, { "epoch": 0.89, "learning_rate": 6.533719655618453e-07, "loss": 0.7402, "step": 7444 }, { "epoch": 0.89, "learning_rate": 6.519993105061139e-07, "loss": 0.7098, "step": 7445 }, { "epoch": 0.89, "learning_rate": 6.506280502664176e-07, "loss": 0.7483, "step": 7446 }, { "epoch": 0.89, "learning_rate": 6.492581850473611e-07, "loss": 0.7015, "step": 7447 }, { "epoch": 0.89, "learning_rate": 6.478897150533414e-07, "loss": 0.7818, "step": 7448 }, { "epoch": 0.89, "learning_rate": 6.465226404885494e-07, "loss": 0.7327, "step": 7449 }, { "epoch": 0.89, "learning_rate": 6.451569615569653e-07, "loss": 0.7277, "step": 7450 }, { "epoch": 0.89, "learning_rate": 6.437926784623627e-07, "loss": 0.7333, "step": 7451 }, { "epoch": 0.89, "learning_rate": 6.424297914083055e-07, "loss": 0.7494, "step": 7452 }, { "epoch": 0.89, "learning_rate": 6.410683005981544e-07, "loss": 0.7232, "step": 7453 }, { "epoch": 0.89, "learning_rate": 6.397082062350512e-07, "loss": 0.6702, "step": 7454 }, { "epoch": 0.89, "learning_rate": 6.383495085219404e-07, "loss": 0.6529, "step": 7455 }, { "epoch": 0.89, "learning_rate": 6.36992207661552e-07, "loss": 0.6847, "step": 7456 }, { "epoch": 0.89, "learning_rate": 6.356363038564072e-07, "loss": 0.7238, "step": 7457 }, { "epoch": 0.89, "learning_rate": 6.342817973088255e-07, "loss": 0.6931, "step": 7458 }, { "epoch": 0.89, "learning_rate": 6.329286882209063e-07, "loss": 0.6886, "step": 7459 }, { "epoch": 0.89, "learning_rate": 6.315769767945512e-07, "loss": 0.7439, "step": 7460 }, { "epoch": 0.89, "learning_rate": 6.302266632314491e-07, "loss": 0.7612, "step": 7461 }, { "epoch": 0.89, "learning_rate": 6.288777477330787e-07, "loss": 0.7405, "step": 7462 }, { "epoch": 0.89, "learning_rate": 6.275302305007147e-07, "loss": 0.7204, "step": 7463 }, { "epoch": 0.89, "learning_rate": 6.261841117354161e-07, "loss": 0.697, "step": 7464 }, { "epoch": 0.89, "learning_rate": 6.248393916380413e-07, "loss": 0.7695, "step": 7465 }, { "epoch": 0.89, "learning_rate": 6.234960704092319e-07, "loss": 0.7489, "step": 7466 }, { "epoch": 0.89, "learning_rate": 6.221541482494298e-07, "loss": 0.74, "step": 7467 }, { "epoch": 0.89, "learning_rate": 6.208136253588626e-07, "loss": 0.7294, "step": 7468 }, { "epoch": 0.89, "learning_rate": 6.194745019375459e-07, "loss": 0.6903, "step": 7469 }, { "epoch": 0.89, "learning_rate": 6.181367781852942e-07, "loss": 0.7333, "step": 7470 }, { "epoch": 0.89, "learning_rate": 6.168004543017059e-07, "loss": 0.7148, "step": 7471 }, { "epoch": 0.89, "learning_rate": 6.154655304861778e-07, "loss": 0.7065, "step": 7472 }, { "epoch": 0.89, "learning_rate": 6.141320069378931e-07, "loss": 0.7048, "step": 7473 }, { "epoch": 0.89, "learning_rate": 6.127998838558258e-07, "loss": 0.7383, "step": 7474 }, { "epoch": 0.89, "learning_rate": 6.114691614387425e-07, "loss": 0.7645, "step": 7475 }, { "epoch": 0.89, "learning_rate": 6.101398398851988e-07, "loss": 0.6959, "step": 7476 }, { "epoch": 0.89, "learning_rate": 6.08811919393546e-07, "loss": 0.7126, "step": 7477 }, { "epoch": 0.89, "learning_rate": 6.074854001619224e-07, "loss": 0.7539, "step": 7478 }, { "epoch": 0.89, "learning_rate": 6.061602823882573e-07, "loss": 0.7461, "step": 7479 }, { "epoch": 0.89, "learning_rate": 6.048365662702716e-07, "loss": 0.7165, "step": 7480 }, { "epoch": 0.89, "learning_rate": 6.035142520054749e-07, "loss": 0.7188, "step": 7481 }, { "epoch": 0.89, "learning_rate": 6.02193339791175e-07, "loss": 0.6758, "step": 7482 }, { "epoch": 0.89, "learning_rate": 6.00873829824462e-07, "loss": 0.7042, "step": 7483 }, { "epoch": 0.89, "learning_rate": 5.995557223022208e-07, "loss": 0.7199, "step": 7484 }, { "epoch": 0.89, "learning_rate": 5.98239017421125e-07, "loss": 0.7065, "step": 7485 }, { "epoch": 0.89, "learning_rate": 5.969237153776419e-07, "loss": 0.7115, "step": 7486 }, { "epoch": 0.89, "learning_rate": 5.95609816368029e-07, "loss": 0.7121, "step": 7487 }, { "epoch": 0.89, "learning_rate": 5.942973205883306e-07, "loss": 0.6853, "step": 7488 }, { "epoch": 0.89, "learning_rate": 5.929862282343857e-07, "loss": 0.7355, "step": 7489 }, { "epoch": 0.89, "learning_rate": 5.916765395018198e-07, "loss": 0.7221, "step": 7490 }, { "epoch": 0.89, "learning_rate": 5.903682545860567e-07, "loss": 0.7327, "step": 7491 }, { "epoch": 0.89, "learning_rate": 5.890613736823026e-07, "loss": 0.7321, "step": 7492 }, { "epoch": 0.89, "learning_rate": 5.87755896985559e-07, "loss": 0.7059, "step": 7493 }, { "epoch": 0.89, "learning_rate": 5.864518246906137e-07, "loss": 0.716, "step": 7494 }, { "epoch": 0.89, "learning_rate": 5.851491569920476e-07, "loss": 0.7299, "step": 7495 }, { "epoch": 0.89, "learning_rate": 5.83847894084234e-07, "loss": 0.7433, "step": 7496 }, { "epoch": 0.89, "learning_rate": 5.825480361613334e-07, "loss": 0.683, "step": 7497 }, { "epoch": 0.89, "learning_rate": 5.812495834172993e-07, "loss": 0.745, "step": 7498 }, { "epoch": 0.89, "learning_rate": 5.799525360458713e-07, "loss": 0.6981, "step": 7499 }, { "epoch": 0.89, "learning_rate": 5.786568942405823e-07, "loss": 0.7494, "step": 7500 }, { "epoch": 0.89, "learning_rate": 5.773626581947566e-07, "loss": 0.7578, "step": 7501 }, { "epoch": 0.89, "learning_rate": 5.760698281015054e-07, "loss": 0.7154, "step": 7502 }, { "epoch": 0.89, "learning_rate": 5.747784041537363e-07, "loss": 0.6671, "step": 7503 }, { "epoch": 0.89, "learning_rate": 5.734883865441377e-07, "loss": 0.7338, "step": 7504 }, { "epoch": 0.9, "learning_rate": 5.721997754651953e-07, "loss": 0.7746, "step": 7505 }, { "epoch": 0.9, "learning_rate": 5.709125711091834e-07, "loss": 0.7081, "step": 7506 }, { "epoch": 0.9, "learning_rate": 5.696267736681638e-07, "loss": 0.7204, "step": 7507 }, { "epoch": 0.9, "learning_rate": 5.68342383333994e-07, "loss": 0.7121, "step": 7508 }, { "epoch": 0.9, "learning_rate": 5.670594002983142e-07, "loss": 0.7254, "step": 7509 }, { "epoch": 0.9, "learning_rate": 5.657778247525614e-07, "loss": 0.7037, "step": 7510 }, { "epoch": 0.9, "learning_rate": 5.644976568879579e-07, "loss": 0.7768, "step": 7511 }, { "epoch": 0.9, "learning_rate": 5.632188968955176e-07, "loss": 0.7031, "step": 7512 }, { "epoch": 0.9, "learning_rate": 5.61941544966047e-07, "loss": 0.7746, "step": 7513 }, { "epoch": 0.9, "learning_rate": 5.606656012901357e-07, "loss": 0.7489, "step": 7514 }, { "epoch": 0.9, "learning_rate": 5.593910660581703e-07, "loss": 0.7545, "step": 7515 }, { "epoch": 0.9, "learning_rate": 5.58117939460322e-07, "loss": 0.6934, "step": 7516 }, { "epoch": 0.9, "learning_rate": 5.568462216865567e-07, "loss": 0.7584, "step": 7517 }, { "epoch": 0.9, "learning_rate": 5.555759129266269e-07, "loss": 0.7651, "step": 7518 }, { "epoch": 0.9, "learning_rate": 5.543070133700756e-07, "loss": 0.736, "step": 7519 }, { "epoch": 0.9, "learning_rate": 5.530395232062347e-07, "loss": 0.6853, "step": 7520 }, { "epoch": 0.9, "learning_rate": 5.517734426242249e-07, "loss": 0.7511, "step": 7521 }, { "epoch": 0.9, "learning_rate": 5.50508771812962e-07, "loss": 0.6914, "step": 7522 }, { "epoch": 0.9, "learning_rate": 5.49245510961145e-07, "loss": 0.7662, "step": 7523 }, { "epoch": 0.9, "learning_rate": 5.479836602572664e-07, "loss": 0.6842, "step": 7524 }, { "epoch": 0.9, "learning_rate": 5.467232198896055e-07, "loss": 0.707, "step": 7525 }, { "epoch": 0.9, "learning_rate": 5.454641900462332e-07, "loss": 0.7093, "step": 7526 }, { "epoch": 0.9, "learning_rate": 5.442065709150113e-07, "loss": 0.7394, "step": 7527 }, { "epoch": 0.9, "learning_rate": 5.429503626835874e-07, "loss": 0.707, "step": 7528 }, { "epoch": 0.9, "learning_rate": 5.416955655394018e-07, "loss": 0.736, "step": 7529 }, { "epoch": 0.9, "learning_rate": 5.404421796696812e-07, "loss": 0.7087, "step": 7530 }, { "epoch": 0.9, "learning_rate": 5.391902052614429e-07, "loss": 0.7478, "step": 7531 }, { "epoch": 0.9, "learning_rate": 5.379396425014971e-07, "loss": 0.6981, "step": 7532 }, { "epoch": 0.9, "learning_rate": 5.366904915764393e-07, "loss": 0.7433, "step": 7533 }, { "epoch": 0.9, "learning_rate": 5.354427526726547e-07, "loss": 0.7076, "step": 7534 }, { "epoch": 0.9, "learning_rate": 5.341964259763166e-07, "loss": 0.7065, "step": 7535 }, { "epoch": 0.9, "learning_rate": 5.32951511673394e-07, "loss": 0.74, "step": 7536 }, { "epoch": 0.9, "learning_rate": 5.317080099496374e-07, "loss": 0.7422, "step": 7537 }, { "epoch": 0.9, "learning_rate": 5.304659209905905e-07, "loss": 0.7121, "step": 7538 }, { "epoch": 0.9, "learning_rate": 5.292252449815882e-07, "loss": 0.7249, "step": 7539 }, { "epoch": 0.9, "learning_rate": 5.27985982107746e-07, "loss": 0.6925, "step": 7540 }, { "epoch": 0.9, "learning_rate": 5.267481325539791e-07, "loss": 0.6825, "step": 7541 }, { "epoch": 0.9, "learning_rate": 5.255116965049867e-07, "loss": 0.7277, "step": 7542 }, { "epoch": 0.9, "learning_rate": 5.242766741452554e-07, "loss": 0.731, "step": 7543 }, { "epoch": 0.9, "learning_rate": 5.230430656590669e-07, "loss": 0.7623, "step": 7544 }, { "epoch": 0.9, "learning_rate": 5.218108712304826e-07, "loss": 0.7104, "step": 7545 }, { "epoch": 0.9, "learning_rate": 5.205800910433623e-07, "loss": 0.7628, "step": 7546 }, { "epoch": 0.9, "learning_rate": 5.19350725281349e-07, "loss": 0.7165, "step": 7547 }, { "epoch": 0.9, "learning_rate": 5.181227741278772e-07, "loss": 0.6931, "step": 7548 }, { "epoch": 0.9, "learning_rate": 5.168962377661712e-07, "loss": 0.6696, "step": 7549 }, { "epoch": 0.9, "learning_rate": 5.156711163792405e-07, "loss": 0.7316, "step": 7550 }, { "epoch": 0.9, "learning_rate": 5.144474101498853e-07, "loss": 0.736, "step": 7551 }, { "epoch": 0.9, "learning_rate": 5.132251192606952e-07, "loss": 0.7266, "step": 7552 }, { "epoch": 0.9, "learning_rate": 5.120042438940498e-07, "loss": 0.7366, "step": 7553 }, { "epoch": 0.9, "learning_rate": 5.107847842321156e-07, "loss": 0.6908, "step": 7554 }, { "epoch": 0.9, "learning_rate": 5.095667404568471e-07, "loss": 0.6853, "step": 7555 }, { "epoch": 0.9, "learning_rate": 5.083501127499901e-07, "loss": 0.7573, "step": 7556 }, { "epoch": 0.9, "learning_rate": 5.07134901293076e-07, "loss": 0.7467, "step": 7557 }, { "epoch": 0.9, "learning_rate": 5.059211062674274e-07, "loss": 0.7215, "step": 7558 }, { "epoch": 0.9, "learning_rate": 5.047087278541563e-07, "loss": 0.7411, "step": 7559 }, { "epoch": 0.9, "learning_rate": 5.0349776623416e-07, "loss": 0.7561, "step": 7560 }, { "epoch": 0.9, "learning_rate": 5.022882215881264e-07, "loss": 0.7188, "step": 7561 }, { "epoch": 0.9, "learning_rate": 5.01080094096531e-07, "loss": 0.7316, "step": 7562 }, { "epoch": 0.9, "learning_rate": 4.998733839396408e-07, "loss": 0.7366, "step": 7563 }, { "epoch": 0.9, "learning_rate": 4.986680912975083e-07, "loss": 0.6842, "step": 7564 }, { "epoch": 0.9, "learning_rate": 4.974642163499755e-07, "loss": 0.7081, "step": 7565 }, { "epoch": 0.9, "learning_rate": 4.962617592766694e-07, "loss": 0.7366, "step": 7566 }, { "epoch": 0.9, "learning_rate": 4.950607202570145e-07, "loss": 0.7031, "step": 7567 }, { "epoch": 0.9, "learning_rate": 4.938610994702142e-07, "loss": 0.7199, "step": 7568 }, { "epoch": 0.9, "learning_rate": 4.92662897095264e-07, "loss": 0.7467, "step": 7569 }, { "epoch": 0.9, "learning_rate": 4.9146611331095e-07, "loss": 0.7344, "step": 7570 }, { "epoch": 0.9, "learning_rate": 4.902707482958414e-07, "loss": 0.7327, "step": 7571 }, { "epoch": 0.9, "learning_rate": 4.89076802228301e-07, "loss": 0.7383, "step": 7572 }, { "epoch": 0.9, "learning_rate": 4.878842752864776e-07, "loss": 0.7439, "step": 7573 }, { "epoch": 0.9, "learning_rate": 4.866931676483067e-07, "loss": 0.6959, "step": 7574 }, { "epoch": 0.9, "learning_rate": 4.855034794915148e-07, "loss": 0.7238, "step": 7575 }, { "epoch": 0.9, "learning_rate": 4.843152109936144e-07, "loss": 0.76, "step": 7576 }, { "epoch": 0.9, "learning_rate": 4.831283623319083e-07, "loss": 0.6708, "step": 7577 }, { "epoch": 0.9, "learning_rate": 4.819429336834846e-07, "loss": 0.7316, "step": 7578 }, { "epoch": 0.9, "learning_rate": 4.807589252252254e-07, "loss": 0.7662, "step": 7579 }, { "epoch": 0.9, "learning_rate": 4.795763371337903e-07, "loss": 0.7946, "step": 7580 }, { "epoch": 0.9, "learning_rate": 4.783951695856392e-07, "loss": 0.7026, "step": 7581 }, { "epoch": 0.9, "learning_rate": 4.772154227570113e-07, "loss": 0.7266, "step": 7582 }, { "epoch": 0.9, "learning_rate": 4.7603709682393586e-07, "loss": 0.7266, "step": 7583 }, { "epoch": 0.9, "learning_rate": 4.748601919622353e-07, "loss": 0.7076, "step": 7584 }, { "epoch": 0.9, "learning_rate": 4.7368470834750937e-07, "loss": 0.6992, "step": 7585 }, { "epoch": 0.9, "learning_rate": 4.7251064615515764e-07, "loss": 0.7294, "step": 7586 }, { "epoch": 0.9, "learning_rate": 4.7133800556035893e-07, "loss": 0.6964, "step": 7587 }, { "epoch": 0.9, "learning_rate": 4.7016678673808325e-07, "loss": 0.7081, "step": 7588 }, { "epoch": 0.91, "learning_rate": 4.6899698986309196e-07, "loss": 0.7003, "step": 7589 }, { "epoch": 0.91, "learning_rate": 4.678286151099254e-07, "loss": 0.7483, "step": 7590 }, { "epoch": 0.91, "learning_rate": 4.666616626529197e-07, "loss": 0.6702, "step": 7591 }, { "epoch": 0.91, "learning_rate": 4.654961326661955e-07, "loss": 0.7522, "step": 7592 }, { "epoch": 0.91, "learning_rate": 4.643320253236594e-07, "loss": 0.7522, "step": 7593 }, { "epoch": 0.91, "learning_rate": 4.6316934079901346e-07, "loss": 0.7087, "step": 7594 }, { "epoch": 0.91, "learning_rate": 4.6200807926573664e-07, "loss": 0.7126, "step": 7595 }, { "epoch": 0.91, "learning_rate": 4.608482408971027e-07, "loss": 0.7366, "step": 7596 }, { "epoch": 0.91, "learning_rate": 4.596898258661708e-07, "loss": 0.7009, "step": 7597 }, { "epoch": 0.91, "learning_rate": 4.5853283434578953e-07, "loss": 0.6641, "step": 7598 }, { "epoch": 0.91, "learning_rate": 4.5737726650859296e-07, "loss": 0.7645, "step": 7599 }, { "epoch": 0.91, "learning_rate": 4.562231225270031e-07, "loss": 0.74, "step": 7600 }, { "epoch": 0.91, "learning_rate": 4.550704025732311e-07, "loss": 0.7377, "step": 7601 }, { "epoch": 0.91, "learning_rate": 4.5391910681927056e-07, "loss": 0.7338, "step": 7602 }, { "epoch": 0.91, "learning_rate": 4.5276923543691175e-07, "loss": 0.6858, "step": 7603 }, { "epoch": 0.91, "learning_rate": 4.5162078859772417e-07, "loss": 0.6814, "step": 7604 }, { "epoch": 0.91, "learning_rate": 4.504737664730685e-07, "loss": 0.7383, "step": 7605 }, { "epoch": 0.91, "learning_rate": 4.4932816923409115e-07, "loss": 0.7221, "step": 7606 }, { "epoch": 0.91, "learning_rate": 4.481839970517254e-07, "loss": 0.7282, "step": 7607 }, { "epoch": 0.91, "learning_rate": 4.4704125009669807e-07, "loss": 0.7835, "step": 7608 }, { "epoch": 0.91, "learning_rate": 4.4589992853951493e-07, "loss": 0.7444, "step": 7609 }, { "epoch": 0.91, "learning_rate": 4.447600325504731e-07, "loss": 0.6897, "step": 7610 }, { "epoch": 0.91, "learning_rate": 4.436215622996554e-07, "loss": 0.7533, "step": 7611 }, { "epoch": 0.91, "learning_rate": 4.424845179569359e-07, "loss": 0.7254, "step": 7612 }, { "epoch": 0.91, "learning_rate": 4.413488996919713e-07, "loss": 0.7545, "step": 7613 }, { "epoch": 0.91, "learning_rate": 4.4021470767420913e-07, "loss": 0.736, "step": 7614 }, { "epoch": 0.91, "learning_rate": 4.390819420728798e-07, "loss": 0.731, "step": 7615 }, { "epoch": 0.91, "learning_rate": 4.3795060305700356e-07, "loss": 0.7266, "step": 7616 }, { "epoch": 0.91, "learning_rate": 4.368206907953887e-07, "loss": 0.7243, "step": 7617 }, { "epoch": 0.91, "learning_rate": 4.356922054566304e-07, "loss": 0.7254, "step": 7618 }, { "epoch": 0.91, "learning_rate": 4.345651472091084e-07, "loss": 0.683, "step": 7619 }, { "epoch": 0.91, "learning_rate": 4.334395162209926e-07, "loss": 0.7081, "step": 7620 }, { "epoch": 0.91, "learning_rate": 4.3231531266023527e-07, "loss": 0.7277, "step": 7621 }, { "epoch": 0.91, "learning_rate": 4.311925366945835e-07, "loss": 0.6641, "step": 7622 }, { "epoch": 0.91, "learning_rate": 4.3007118849156425e-07, "loss": 0.6897, "step": 7623 }, { "epoch": 0.91, "learning_rate": 4.2895126821849377e-07, "loss": 0.7288, "step": 7624 }, { "epoch": 0.91, "learning_rate": 4.278327760424772e-07, "loss": 0.7701, "step": 7625 }, { "epoch": 0.91, "learning_rate": 4.267157121304011e-07, "loss": 0.7461, "step": 7626 }, { "epoch": 0.91, "learning_rate": 4.2560007664894763e-07, "loss": 0.7333, "step": 7627 }, { "epoch": 0.91, "learning_rate": 4.2448586976457705e-07, "loss": 0.7372, "step": 7628 }, { "epoch": 0.91, "learning_rate": 4.2337309164354414e-07, "loss": 0.6948, "step": 7629 }, { "epoch": 0.91, "learning_rate": 4.222617424518805e-07, "loss": 0.731, "step": 7630 }, { "epoch": 0.91, "learning_rate": 4.2115182235541675e-07, "loss": 0.7109, "step": 7631 }, { "epoch": 0.91, "learning_rate": 4.200433315197616e-07, "loss": 0.7561, "step": 7632 }, { "epoch": 0.91, "learning_rate": 4.189362701103117e-07, "loss": 0.649, "step": 7633 }, { "epoch": 0.91, "learning_rate": 4.17830638292257e-07, "loss": 0.6936, "step": 7634 }, { "epoch": 0.91, "learning_rate": 4.167264362305612e-07, "loss": 0.7154, "step": 7635 }, { "epoch": 0.91, "learning_rate": 4.15623664089988e-07, "loss": 0.6602, "step": 7636 }, { "epoch": 0.91, "learning_rate": 4.1452232203508134e-07, "loss": 0.7054, "step": 7637 }, { "epoch": 0.91, "learning_rate": 4.1342241023016983e-07, "loss": 0.7405, "step": 7638 }, { "epoch": 0.91, "learning_rate": 4.1232392883937655e-07, "loss": 0.7517, "step": 7639 }, { "epoch": 0.91, "learning_rate": 4.1122687802659934e-07, "loss": 0.6819, "step": 7640 }, { "epoch": 0.91, "learning_rate": 4.10131257955535e-07, "loss": 0.7031, "step": 7641 }, { "epoch": 0.91, "learning_rate": 4.090370687896561e-07, "loss": 0.7006, "step": 7642 }, { "epoch": 0.91, "learning_rate": 4.0794431069223207e-07, "loss": 0.7115, "step": 7643 }, { "epoch": 0.91, "learning_rate": 4.0685298382631133e-07, "loss": 0.7383, "step": 7644 }, { "epoch": 0.91, "learning_rate": 4.057630883547281e-07, "loss": 0.6875, "step": 7645 }, { "epoch": 0.91, "learning_rate": 4.046746244401101e-07, "loss": 0.7081, "step": 7646 }, { "epoch": 0.91, "learning_rate": 4.0358759224486285e-07, "loss": 0.7416, "step": 7647 }, { "epoch": 0.91, "learning_rate": 4.0250199193118565e-07, "loss": 0.697, "step": 7648 }, { "epoch": 0.91, "learning_rate": 4.014178236610611e-07, "loss": 0.6836, "step": 7649 }, { "epoch": 0.91, "learning_rate": 4.0033508759625637e-07, "loss": 0.7533, "step": 7650 }, { "epoch": 0.91, "learning_rate": 3.9925378389832793e-07, "loss": 0.6869, "step": 7651 }, { "epoch": 0.91, "learning_rate": 3.981739127286144e-07, "loss": 0.6925, "step": 7652 }, { "epoch": 0.91, "learning_rate": 3.970954742482469e-07, "loss": 0.7489, "step": 7653 }, { "epoch": 0.91, "learning_rate": 3.96018468618139e-07, "loss": 0.6844, "step": 7654 }, { "epoch": 0.91, "learning_rate": 3.9494289599898873e-07, "loss": 0.7617, "step": 7655 }, { "epoch": 0.91, "learning_rate": 3.938687565512844e-07, "loss": 0.7679, "step": 7656 }, { "epoch": 0.91, "learning_rate": 3.9279605043529567e-07, "loss": 0.7467, "step": 7657 }, { "epoch": 0.91, "learning_rate": 3.9172477781108554e-07, "loss": 0.7154, "step": 7658 }, { "epoch": 0.91, "learning_rate": 3.9065493883849505e-07, "loss": 0.6735, "step": 7659 }, { "epoch": 0.91, "learning_rate": 3.8958653367715536e-07, "loss": 0.7115, "step": 7660 }, { "epoch": 0.91, "learning_rate": 3.8851956248648457e-07, "loss": 0.7277, "step": 7661 }, { "epoch": 0.91, "learning_rate": 3.8745402542568534e-07, "loss": 0.7483, "step": 7662 }, { "epoch": 0.91, "learning_rate": 3.86389922653746e-07, "loss": 0.7059, "step": 7663 }, { "epoch": 0.91, "learning_rate": 3.8532725432944173e-07, "loss": 0.6842, "step": 7664 }, { "epoch": 0.91, "learning_rate": 3.8426602061133354e-07, "loss": 0.7506, "step": 7665 }, { "epoch": 0.91, "learning_rate": 3.83206221657767e-07, "loss": 0.7157, "step": 7666 }, { "epoch": 0.91, "learning_rate": 3.8214785762687556e-07, "loss": 0.6786, "step": 7667 }, { "epoch": 0.91, "learning_rate": 3.810909286765796e-07, "loss": 0.6808, "step": 7668 }, { "epoch": 0.91, "learning_rate": 3.8003543496458075e-07, "loss": 0.7098, "step": 7669 }, { "epoch": 0.91, "learning_rate": 3.789813766483719e-07, "loss": 0.7249, "step": 7670 }, { "epoch": 0.91, "learning_rate": 3.779287538852261e-07, "loss": 0.6998, "step": 7671 }, { "epoch": 0.91, "learning_rate": 3.768775668322078e-07, "loss": 0.7143, "step": 7672 }, { "epoch": 0.92, "learning_rate": 3.7582781564616254e-07, "loss": 0.7455, "step": 7673 }, { "epoch": 0.92, "learning_rate": 3.7477950048372846e-07, "loss": 0.7472, "step": 7674 }, { "epoch": 0.92, "learning_rate": 3.737326215013204e-07, "loss": 0.6328, "step": 7675 }, { "epoch": 0.92, "learning_rate": 3.726871788551423e-07, "loss": 0.8058, "step": 7676 }, { "epoch": 0.92, "learning_rate": 3.716431727011882e-07, "loss": 0.6724, "step": 7677 }, { "epoch": 0.92, "learning_rate": 3.706006031952325e-07, "loss": 0.7645, "step": 7678 }, { "epoch": 0.92, "learning_rate": 3.695594704928396e-07, "loss": 0.6998, "step": 7679 }, { "epoch": 0.92, "learning_rate": 3.6851977474935183e-07, "loss": 0.6819, "step": 7680 }, { "epoch": 0.92, "learning_rate": 3.6748151611990747e-07, "loss": 0.7478, "step": 7681 }, { "epoch": 0.92, "learning_rate": 3.6644469475942356e-07, "loss": 0.7427, "step": 7682 }, { "epoch": 0.92, "learning_rate": 3.65409310822602e-07, "loss": 0.7321, "step": 7683 }, { "epoch": 0.92, "learning_rate": 3.6437536446393694e-07, "loss": 0.7015, "step": 7684 }, { "epoch": 0.92, "learning_rate": 3.6334285583769833e-07, "loss": 0.7015, "step": 7685 }, { "epoch": 0.92, "learning_rate": 3.623117850979507e-07, "loss": 0.6864, "step": 7686 }, { "epoch": 0.92, "learning_rate": 3.612821523985399e-07, "loss": 0.7355, "step": 7687 }, { "epoch": 0.92, "learning_rate": 3.6025395789309525e-07, "loss": 0.7539, "step": 7688 }, { "epoch": 0.92, "learning_rate": 3.5922720173503844e-07, "loss": 0.7277, "step": 7689 }, { "epoch": 0.92, "learning_rate": 3.5820188407756474e-07, "loss": 0.7768, "step": 7690 }, { "epoch": 0.92, "learning_rate": 3.571780050736684e-07, "loss": 0.7388, "step": 7691 }, { "epoch": 0.92, "learning_rate": 3.5615556487611835e-07, "loss": 0.7517, "step": 7692 }, { "epoch": 0.92, "learning_rate": 3.551345636374748e-07, "loss": 0.726, "step": 7693 }, { "epoch": 0.92, "learning_rate": 3.5411500151008247e-07, "loss": 0.7031, "step": 7694 }, { "epoch": 0.92, "learning_rate": 3.5309687864606756e-07, "loss": 0.6814, "step": 7695 }, { "epoch": 0.92, "learning_rate": 3.520801951973474e-07, "loss": 0.6925, "step": 7696 }, { "epoch": 0.92, "learning_rate": 3.510649513156172e-07, "loss": 0.7026, "step": 7697 }, { "epoch": 0.92, "learning_rate": 3.50051147152366e-07, "loss": 0.6892, "step": 7698 }, { "epoch": 0.92, "learning_rate": 3.490387828588626e-07, "loss": 0.7282, "step": 7699 }, { "epoch": 0.92, "learning_rate": 3.480278585861596e-07, "loss": 0.7294, "step": 7700 }, { "epoch": 0.92, "learning_rate": 3.4701837448509966e-07, "loss": 0.7009, "step": 7701 }, { "epoch": 0.92, "learning_rate": 3.460103307063056e-07, "loss": 0.716, "step": 7702 }, { "epoch": 0.92, "learning_rate": 3.450037274001905e-07, "loss": 0.7132, "step": 7703 }, { "epoch": 0.92, "learning_rate": 3.4399856471694747e-07, "loss": 0.6908, "step": 7704 }, { "epoch": 0.92, "learning_rate": 3.429948428065588e-07, "loss": 0.6842, "step": 7705 }, { "epoch": 0.92, "learning_rate": 3.4199256181878803e-07, "loss": 0.7132, "step": 7706 }, { "epoch": 0.92, "learning_rate": 3.4099172190318666e-07, "loss": 0.7176, "step": 7707 }, { "epoch": 0.92, "learning_rate": 3.399923232090896e-07, "loss": 0.7182, "step": 7708 }, { "epoch": 0.92, "learning_rate": 3.3899436588561874e-07, "loss": 0.6936, "step": 7709 }, { "epoch": 0.92, "learning_rate": 3.379978500816772e-07, "loss": 0.7076, "step": 7710 }, { "epoch": 0.92, "learning_rate": 3.370027759459549e-07, "loss": 0.7045, "step": 7711 }, { "epoch": 0.92, "learning_rate": 3.360091436269308e-07, "loss": 0.7132, "step": 7712 }, { "epoch": 0.92, "learning_rate": 3.3501695327286087e-07, "loss": 0.6875, "step": 7713 }, { "epoch": 0.92, "learning_rate": 3.340262050317922e-07, "loss": 0.7377, "step": 7714 }, { "epoch": 0.92, "learning_rate": 3.330368990515531e-07, "loss": 0.7042, "step": 7715 }, { "epoch": 0.92, "learning_rate": 3.320490354797579e-07, "loss": 0.7349, "step": 7716 }, { "epoch": 0.92, "learning_rate": 3.310626144638074e-07, "loss": 0.7422, "step": 7717 }, { "epoch": 0.92, "learning_rate": 3.3007763615088394e-07, "loss": 0.6998, "step": 7718 }, { "epoch": 0.92, "learning_rate": 3.2909410068795777e-07, "loss": 0.7009, "step": 7719 }, { "epoch": 0.92, "learning_rate": 3.2811200822178035e-07, "loss": 0.6925, "step": 7720 }, { "epoch": 0.92, "learning_rate": 3.2713135889889005e-07, "loss": 0.7589, "step": 7721 }, { "epoch": 0.92, "learning_rate": 3.26152152865612e-07, "loss": 0.7271, "step": 7722 }, { "epoch": 0.92, "learning_rate": 3.2517439026805044e-07, "loss": 0.6858, "step": 7723 }, { "epoch": 0.92, "learning_rate": 3.241980712521009e-07, "loss": 0.7433, "step": 7724 }, { "epoch": 0.92, "learning_rate": 3.23223195963438e-07, "loss": 0.6669, "step": 7725 }, { "epoch": 0.92, "learning_rate": 3.22249764547522e-07, "loss": 0.7042, "step": 7726 }, { "epoch": 0.92, "learning_rate": 3.2127777714960117e-07, "loss": 0.6724, "step": 7727 }, { "epoch": 0.92, "learning_rate": 3.2030723391470284e-07, "loss": 0.7589, "step": 7728 }, { "epoch": 0.92, "learning_rate": 3.1933813498764455e-07, "loss": 0.6624, "step": 7729 }, { "epoch": 0.92, "learning_rate": 3.183704805130239e-07, "loss": 0.6825, "step": 7730 }, { "epoch": 0.92, "learning_rate": 3.174042706352265e-07, "loss": 0.7785, "step": 7731 }, { "epoch": 0.92, "learning_rate": 3.1643950549841817e-07, "loss": 0.7645, "step": 7732 }, { "epoch": 0.92, "learning_rate": 3.1547618524655265e-07, "loss": 0.7377, "step": 7733 }, { "epoch": 0.92, "learning_rate": 3.145143100233694e-07, "loss": 0.7009, "step": 7734 }, { "epoch": 0.92, "learning_rate": 3.1355387997238587e-07, "loss": 0.7651, "step": 7735 }, { "epoch": 0.92, "learning_rate": 3.1259489523691177e-07, "loss": 0.7266, "step": 7736 }, { "epoch": 0.92, "learning_rate": 3.1163735596003386e-07, "loss": 0.7344, "step": 7737 }, { "epoch": 0.92, "learning_rate": 3.106812622846278e-07, "loss": 0.7561, "step": 7738 }, { "epoch": 0.92, "learning_rate": 3.0972661435335394e-07, "loss": 0.692, "step": 7739 }, { "epoch": 0.92, "learning_rate": 3.0877341230865385e-07, "loss": 0.7461, "step": 7740 }, { "epoch": 0.92, "learning_rate": 3.0782165629275606e-07, "loss": 0.6847, "step": 7741 }, { "epoch": 0.92, "learning_rate": 3.0687134644767026e-07, "loss": 0.7718, "step": 7742 }, { "epoch": 0.92, "learning_rate": 3.059224829151941e-07, "loss": 0.7467, "step": 7743 }, { "epoch": 0.92, "learning_rate": 3.0497506583690663e-07, "loss": 0.7065, "step": 7744 }, { "epoch": 0.92, "learning_rate": 3.040290953541736e-07, "loss": 0.7494, "step": 7745 }, { "epoch": 0.92, "learning_rate": 3.0308457160814096e-07, "loss": 0.6886, "step": 7746 }, { "epoch": 0.92, "learning_rate": 3.021414947397416e-07, "loss": 0.7193, "step": 7747 }, { "epoch": 0.92, "learning_rate": 3.01199864889693e-07, "loss": 0.7199, "step": 7748 }, { "epoch": 0.92, "learning_rate": 3.002596821984971e-07, "loss": 0.7824, "step": 7749 }, { "epoch": 0.92, "learning_rate": 2.993209468064362e-07, "loss": 0.7137, "step": 7750 }, { "epoch": 0.92, "learning_rate": 2.9838365885358044e-07, "loss": 0.6964, "step": 7751 }, { "epoch": 0.92, "learning_rate": 2.974478184797813e-07, "loss": 0.6858, "step": 7752 }, { "epoch": 0.92, "learning_rate": 2.9651342582467714e-07, "loss": 0.7662, "step": 7753 }, { "epoch": 0.92, "learning_rate": 2.9558048102768856e-07, "loss": 0.7422, "step": 7754 }, { "epoch": 0.92, "learning_rate": 2.9464898422802093e-07, "loss": 0.6847, "step": 7755 }, { "epoch": 0.92, "learning_rate": 2.937189355646597e-07, "loss": 0.7612, "step": 7756 }, { "epoch": 0.93, "learning_rate": 2.9279033517638166e-07, "loss": 0.7517, "step": 7757 }, { "epoch": 0.93, "learning_rate": 2.9186318320174157e-07, "loss": 0.7081, "step": 7758 }, { "epoch": 0.93, "learning_rate": 2.909374797790787e-07, "loss": 0.755, "step": 7759 }, { "epoch": 0.93, "learning_rate": 2.900132250465204e-07, "loss": 0.6814, "step": 7760 }, { "epoch": 0.93, "learning_rate": 2.8909041914197076e-07, "loss": 0.7411, "step": 7761 }, { "epoch": 0.93, "learning_rate": 2.8816906220312523e-07, "loss": 0.7528, "step": 7762 }, { "epoch": 0.93, "learning_rate": 2.8724915436745717e-07, "loss": 0.7238, "step": 7763 }, { "epoch": 0.93, "learning_rate": 2.8633069577222673e-07, "loss": 0.7087, "step": 7764 }, { "epoch": 0.93, "learning_rate": 2.854136865544799e-07, "loss": 0.7355, "step": 7765 }, { "epoch": 0.93, "learning_rate": 2.844981268510394e-07, "loss": 0.774, "step": 7766 }, { "epoch": 0.93, "learning_rate": 2.835840167985193e-07, "loss": 0.7277, "step": 7767 }, { "epoch": 0.93, "learning_rate": 2.8267135653331277e-07, "loss": 0.7003, "step": 7768 }, { "epoch": 0.93, "learning_rate": 2.817601461915964e-07, "loss": 0.7059, "step": 7769 }, { "epoch": 0.93, "learning_rate": 2.8085038590933587e-07, "loss": 0.7171, "step": 7770 }, { "epoch": 0.93, "learning_rate": 2.799420758222715e-07, "loss": 0.683, "step": 7771 }, { "epoch": 0.93, "learning_rate": 2.7903521606593707e-07, "loss": 0.7333, "step": 7772 }, { "epoch": 0.93, "learning_rate": 2.7812980677564104e-07, "loss": 0.7188, "step": 7773 }, { "epoch": 0.93, "learning_rate": 2.772258480864831e-07, "loss": 0.7439, "step": 7774 }, { "epoch": 0.93, "learning_rate": 2.7632334013334207e-07, "loss": 0.7221, "step": 7775 }, { "epoch": 0.93, "learning_rate": 2.7542228305088125e-07, "loss": 0.7545, "step": 7776 }, { "epoch": 0.93, "learning_rate": 2.745226769735465e-07, "loss": 0.7188, "step": 7777 }, { "epoch": 0.93, "learning_rate": 2.736245220355671e-07, "loss": 0.7305, "step": 7778 }, { "epoch": 0.93, "learning_rate": 2.727278183709592e-07, "loss": 0.7109, "step": 7779 }, { "epoch": 0.93, "learning_rate": 2.7183256611352016e-07, "loss": 0.7104, "step": 7780 }, { "epoch": 0.93, "learning_rate": 2.7093876539682984e-07, "loss": 0.7232, "step": 7781 }, { "epoch": 0.93, "learning_rate": 2.7004641635425155e-07, "loss": 0.7277, "step": 7782 }, { "epoch": 0.93, "learning_rate": 2.691555191189321e-07, "loss": 0.7589, "step": 7783 }, { "epoch": 0.93, "learning_rate": 2.682660738238052e-07, "loss": 0.7467, "step": 7784 }, { "epoch": 0.93, "learning_rate": 2.673780806015835e-07, "loss": 0.7204, "step": 7785 }, { "epoch": 0.93, "learning_rate": 2.6649153958476447e-07, "loss": 0.6914, "step": 7786 }, { "epoch": 0.93, "learning_rate": 2.6560645090562777e-07, "loss": 0.6708, "step": 7787 }, { "epoch": 0.93, "learning_rate": 2.6472281469623995e-07, "loss": 0.7494, "step": 7788 }, { "epoch": 0.93, "learning_rate": 2.6384063108844784e-07, "loss": 0.7059, "step": 7789 }, { "epoch": 0.93, "learning_rate": 2.629599002138816e-07, "loss": 0.7533, "step": 7790 }, { "epoch": 0.93, "learning_rate": 2.620806222039551e-07, "loss": 0.7349, "step": 7791 }, { "epoch": 0.93, "learning_rate": 2.612027971898645e-07, "loss": 0.7109, "step": 7792 }, { "epoch": 0.93, "learning_rate": 2.6032642530259167e-07, "loss": 0.7243, "step": 7793 }, { "epoch": 0.93, "learning_rate": 2.594515066729009e-07, "loss": 0.7109, "step": 7794 }, { "epoch": 0.93, "learning_rate": 2.5857804143133656e-07, "loss": 0.7294, "step": 7795 }, { "epoch": 0.93, "learning_rate": 2.577060297082301e-07, "loss": 0.6987, "step": 7796 }, { "epoch": 0.93, "learning_rate": 2.5683547163369293e-07, "loss": 0.6925, "step": 7797 }, { "epoch": 0.93, "learning_rate": 2.5596636733762335e-07, "loss": 0.7506, "step": 7798 }, { "epoch": 0.93, "learning_rate": 2.550987169496999e-07, "loss": 0.7433, "step": 7799 }, { "epoch": 0.93, "learning_rate": 2.5423252059938344e-07, "loss": 0.7467, "step": 7800 }, { "epoch": 0.93, "learning_rate": 2.5336777841592053e-07, "loss": 0.6936, "step": 7801 }, { "epoch": 0.93, "learning_rate": 2.525044905283369e-07, "loss": 0.707, "step": 7802 }, { "epoch": 0.93, "learning_rate": 2.516426570654473e-07, "loss": 0.7232, "step": 7803 }, { "epoch": 0.93, "learning_rate": 2.5078227815584335e-07, "loss": 0.6735, "step": 7804 }, { "epoch": 0.93, "learning_rate": 2.499233539279056e-07, "loss": 0.7433, "step": 7805 }, { "epoch": 0.93, "learning_rate": 2.490658845097904e-07, "loss": 0.6585, "step": 7806 }, { "epoch": 0.93, "learning_rate": 2.482098700294422e-07, "loss": 0.7333, "step": 7807 }, { "epoch": 0.93, "learning_rate": 2.473553106145876e-07, "loss": 0.7299, "step": 7808 }, { "epoch": 0.93, "learning_rate": 2.465022063927347e-07, "loss": 0.6858, "step": 7809 }, { "epoch": 0.93, "learning_rate": 2.456505574911772e-07, "loss": 0.7494, "step": 7810 }, { "epoch": 0.93, "learning_rate": 2.448003640369867e-07, "loss": 0.7154, "step": 7811 }, { "epoch": 0.93, "learning_rate": 2.4395162615702295e-07, "loss": 0.7427, "step": 7812 }, { "epoch": 0.93, "learning_rate": 2.431043439779246e-07, "loss": 0.7171, "step": 7813 }, { "epoch": 0.93, "learning_rate": 2.4225851762611497e-07, "loss": 0.7176, "step": 7814 }, { "epoch": 0.93, "learning_rate": 2.41414147227802e-07, "loss": 0.7645, "step": 7815 }, { "epoch": 0.93, "learning_rate": 2.4057123290897156e-07, "loss": 0.7015, "step": 7816 }, { "epoch": 0.93, "learning_rate": 2.397297747953964e-07, "loss": 0.6763, "step": 7817 }, { "epoch": 0.93, "learning_rate": 2.388897730126294e-07, "loss": 0.6987, "step": 7818 }, { "epoch": 0.93, "learning_rate": 2.380512276860092e-07, "loss": 0.7422, "step": 7819 }, { "epoch": 0.93, "learning_rate": 2.372141389406546e-07, "loss": 0.7193, "step": 7820 }, { "epoch": 0.93, "learning_rate": 2.3637850690146568e-07, "loss": 0.7143, "step": 7821 }, { "epoch": 0.93, "learning_rate": 2.3554433169313052e-07, "loss": 0.74, "step": 7822 }, { "epoch": 0.93, "learning_rate": 2.3471161344011283e-07, "loss": 0.7176, "step": 7823 }, { "epoch": 0.93, "learning_rate": 2.3388035226666551e-07, "loss": 0.7472, "step": 7824 }, { "epoch": 0.93, "learning_rate": 2.330505482968204e-07, "loss": 0.731, "step": 7825 }, { "epoch": 0.93, "learning_rate": 2.322222016543918e-07, "loss": 0.6853, "step": 7826 }, { "epoch": 0.93, "learning_rate": 2.3139531246297752e-07, "loss": 0.76, "step": 7827 }, { "epoch": 0.93, "learning_rate": 2.3056988084595777e-07, "loss": 0.7182, "step": 7828 }, { "epoch": 0.93, "learning_rate": 2.2974590692649623e-07, "loss": 0.62, "step": 7829 }, { "epoch": 0.93, "learning_rate": 2.289233908275379e-07, "loss": 0.7723, "step": 7830 }, { "epoch": 0.93, "learning_rate": 2.2810233267181015e-07, "loss": 0.7338, "step": 7831 }, { "epoch": 0.93, "learning_rate": 2.2728273258182277e-07, "loss": 0.7439, "step": 7832 }, { "epoch": 0.93, "learning_rate": 2.2646459067986793e-07, "loss": 0.6724, "step": 7833 }, { "epoch": 0.93, "learning_rate": 2.256479070880224e-07, "loss": 0.6825, "step": 7834 }, { "epoch": 0.93, "learning_rate": 2.2483268192814323e-07, "loss": 0.6814, "step": 7835 }, { "epoch": 0.93, "learning_rate": 2.240189153218686e-07, "loss": 0.7723, "step": 7836 }, { "epoch": 0.93, "learning_rate": 2.232066073906214e-07, "loss": 0.6936, "step": 7837 }, { "epoch": 0.93, "learning_rate": 2.2239575825560688e-07, "loss": 0.745, "step": 7838 }, { "epoch": 0.93, "learning_rate": 2.2158636803781165e-07, "loss": 0.721, "step": 7839 }, { "epoch": 0.94, "learning_rate": 2.207784368580046e-07, "loss": 0.7087, "step": 7840 }, { "epoch": 0.94, "learning_rate": 2.1997196483673822e-07, "loss": 0.6964, "step": 7841 }, { "epoch": 0.94, "learning_rate": 2.1916695209434402e-07, "loss": 0.6763, "step": 7842 }, { "epoch": 0.94, "learning_rate": 2.1836339875094036e-07, "loss": 0.7427, "step": 7843 }, { "epoch": 0.94, "learning_rate": 2.175613049264247e-07, "loss": 0.7533, "step": 7844 }, { "epoch": 0.94, "learning_rate": 2.167606707404779e-07, "loss": 0.7751, "step": 7845 }, { "epoch": 0.94, "learning_rate": 2.1596149631256112e-07, "loss": 0.7327, "step": 7846 }, { "epoch": 0.94, "learning_rate": 2.151637817619201e-07, "loss": 0.7238, "step": 7847 }, { "epoch": 0.94, "learning_rate": 2.143675272075829e-07, "loss": 0.7506, "step": 7848 }, { "epoch": 0.94, "learning_rate": 2.135727327683579e-07, "loss": 0.7578, "step": 7849 }, { "epoch": 0.94, "learning_rate": 2.1277939856283681e-07, "loss": 0.6869, "step": 7850 }, { "epoch": 0.94, "learning_rate": 2.1198752470939277e-07, "loss": 0.7746, "step": 7851 }, { "epoch": 0.94, "learning_rate": 2.1119711132618015e-07, "loss": 0.7472, "step": 7852 }, { "epoch": 0.94, "learning_rate": 2.1040815853113906e-07, "loss": 0.6942, "step": 7853 }, { "epoch": 0.94, "learning_rate": 2.0962066644198754e-07, "loss": 0.7494, "step": 7854 }, { "epoch": 0.94, "learning_rate": 2.0883463517622825e-07, "loss": 0.6652, "step": 7855 }, { "epoch": 0.94, "learning_rate": 2.080500648511441e-07, "loss": 0.7254, "step": 7856 }, { "epoch": 0.94, "learning_rate": 2.0726695558380139e-07, "loss": 0.6903, "step": 7857 }, { "epoch": 0.94, "learning_rate": 2.0648530749104778e-07, "loss": 0.6853, "step": 7858 }, { "epoch": 0.94, "learning_rate": 2.0570512068951331e-07, "loss": 0.7388, "step": 7859 }, { "epoch": 0.94, "learning_rate": 2.0492639529561042e-07, "loss": 0.784, "step": 7860 }, { "epoch": 0.94, "learning_rate": 2.0414913142553062e-07, "loss": 0.7366, "step": 7861 }, { "epoch": 0.94, "learning_rate": 2.033733291952511e-07, "loss": 0.7316, "step": 7862 }, { "epoch": 0.94, "learning_rate": 2.025989887205304e-07, "loss": 0.7623, "step": 7863 }, { "epoch": 0.94, "learning_rate": 2.01826110116905e-07, "loss": 0.6847, "step": 7864 }, { "epoch": 0.94, "learning_rate": 2.010546934996993e-07, "loss": 0.6942, "step": 7865 }, { "epoch": 0.94, "learning_rate": 2.0028473898401347e-07, "loss": 0.7723, "step": 7866 }, { "epoch": 0.94, "learning_rate": 1.9951624668473446e-07, "loss": 0.7695, "step": 7867 }, { "epoch": 0.94, "learning_rate": 1.9874921671652835e-07, "loss": 0.7366, "step": 7868 }, { "epoch": 0.94, "learning_rate": 1.979836491938447e-07, "loss": 0.7182, "step": 7869 }, { "epoch": 0.94, "learning_rate": 1.9721954423091328e-07, "loss": 0.7087, "step": 7870 }, { "epoch": 0.94, "learning_rate": 1.9645690194174728e-07, "loss": 0.6948, "step": 7871 }, { "epoch": 0.94, "learning_rate": 1.956957224401379e-07, "loss": 0.6914, "step": 7872 }, { "epoch": 0.94, "learning_rate": 1.949360058396621e-07, "loss": 0.7182, "step": 7873 }, { "epoch": 0.94, "learning_rate": 1.9417775225367917e-07, "loss": 0.7617, "step": 7874 }, { "epoch": 0.94, "learning_rate": 1.9342096179532644e-07, "loss": 0.7662, "step": 7875 }, { "epoch": 0.94, "learning_rate": 1.9266563457752462e-07, "loss": 0.7171, "step": 7876 }, { "epoch": 0.94, "learning_rate": 1.9191177071297584e-07, "loss": 0.7232, "step": 7877 }, { "epoch": 0.94, "learning_rate": 1.9115937031416454e-07, "loss": 0.7188, "step": 7878 }, { "epoch": 0.94, "learning_rate": 1.9040843349335757e-07, "loss": 0.7282, "step": 7879 }, { "epoch": 0.94, "learning_rate": 1.89658960362602e-07, "loss": 0.7165, "step": 7880 }, { "epoch": 0.94, "learning_rate": 1.8891095103372504e-07, "loss": 0.8025, "step": 7881 }, { "epoch": 0.94, "learning_rate": 1.881644056183396e-07, "loss": 0.7176, "step": 7882 }, { "epoch": 0.94, "learning_rate": 1.8741932422783548e-07, "loss": 0.7081, "step": 7883 }, { "epoch": 0.94, "learning_rate": 1.8667570697338712e-07, "loss": 0.7065, "step": 7884 }, { "epoch": 0.94, "learning_rate": 1.8593355396595126e-07, "loss": 0.7349, "step": 7885 }, { "epoch": 0.94, "learning_rate": 1.8519286531626267e-07, "loss": 0.678, "step": 7886 }, { "epoch": 0.94, "learning_rate": 1.8445364113483966e-07, "loss": 0.707, "step": 7887 }, { "epoch": 0.94, "learning_rate": 1.8371588153198393e-07, "loss": 0.7277, "step": 7888 }, { "epoch": 0.94, "learning_rate": 1.8297958661777527e-07, "loss": 0.7472, "step": 7889 }, { "epoch": 0.94, "learning_rate": 1.8224475650207573e-07, "loss": 0.7254, "step": 7890 }, { "epoch": 0.94, "learning_rate": 1.8151139129452988e-07, "loss": 0.6942, "step": 7891 }, { "epoch": 0.94, "learning_rate": 1.807794911045635e-07, "loss": 0.7126, "step": 7892 }, { "epoch": 0.94, "learning_rate": 1.8004905604138367e-07, "loss": 0.7266, "step": 7893 }, { "epoch": 0.94, "learning_rate": 1.7932008621397766e-07, "loss": 0.7148, "step": 7894 }, { "epoch": 0.94, "learning_rate": 1.7859258173111626e-07, "loss": 0.7003, "step": 7895 }, { "epoch": 0.94, "learning_rate": 1.778665427013504e-07, "loss": 0.6903, "step": 7896 }, { "epoch": 0.94, "learning_rate": 1.771419692330112e-07, "loss": 0.7109, "step": 7897 }, { "epoch": 0.94, "learning_rate": 1.7641886143421327e-07, "loss": 0.7188, "step": 7898 }, { "epoch": 0.94, "learning_rate": 1.7569721941285033e-07, "loss": 0.7701, "step": 7899 }, { "epoch": 0.94, "learning_rate": 1.749770432766029e-07, "loss": 0.6802, "step": 7900 }, { "epoch": 0.94, "learning_rate": 1.7425833313292283e-07, "loss": 0.6987, "step": 7901 }, { "epoch": 0.94, "learning_rate": 1.735410890890521e-07, "loss": 0.7042, "step": 7902 }, { "epoch": 0.94, "learning_rate": 1.7282531125201062e-07, "loss": 0.731, "step": 7903 }, { "epoch": 0.94, "learning_rate": 1.7211099972859857e-07, "loss": 0.7009, "step": 7904 }, { "epoch": 0.94, "learning_rate": 1.7139815462540065e-07, "loss": 0.7193, "step": 7905 }, { "epoch": 0.94, "learning_rate": 1.7068677604877738e-07, "loss": 0.7701, "step": 7906 }, { "epoch": 0.94, "learning_rate": 1.6997686410487602e-07, "loss": 0.7729, "step": 7907 }, { "epoch": 0.94, "learning_rate": 1.6926841889962187e-07, "loss": 0.7383, "step": 7908 }, { "epoch": 0.94, "learning_rate": 1.6856144053872037e-07, "loss": 0.7455, "step": 7909 }, { "epoch": 0.94, "learning_rate": 1.678559291276638e-07, "loss": 0.678, "step": 7910 }, { "epoch": 0.94, "learning_rate": 1.6715188477171794e-07, "loss": 0.7662, "step": 7911 }, { "epoch": 0.94, "learning_rate": 1.6644930757593546e-07, "loss": 0.7232, "step": 7912 }, { "epoch": 0.94, "learning_rate": 1.6574819764514694e-07, "loss": 0.7305, "step": 7913 }, { "epoch": 0.94, "learning_rate": 1.6504855508396422e-07, "loss": 0.6908, "step": 7914 }, { "epoch": 0.94, "learning_rate": 1.6435037999678272e-07, "loss": 0.7232, "step": 7915 }, { "epoch": 0.94, "learning_rate": 1.6365367248777686e-07, "loss": 0.7662, "step": 7916 }, { "epoch": 0.94, "learning_rate": 1.6295843266090238e-07, "loss": 0.7416, "step": 7917 }, { "epoch": 0.94, "learning_rate": 1.622646606198952e-07, "loss": 0.7087, "step": 7918 }, { "epoch": 0.94, "learning_rate": 1.6157235646827362e-07, "loss": 0.6892, "step": 7919 }, { "epoch": 0.94, "learning_rate": 1.6088152030933723e-07, "loss": 0.7294, "step": 7920 }, { "epoch": 0.94, "learning_rate": 1.601921522461658e-07, "loss": 0.7243, "step": 7921 }, { "epoch": 0.94, "learning_rate": 1.5950425238161816e-07, "loss": 0.6853, "step": 7922 }, { "epoch": 0.94, "learning_rate": 1.5881782081833663e-07, "loss": 0.7182, "step": 7923 }, { "epoch": 0.95, "learning_rate": 1.5813285765874487e-07, "loss": 0.6256, "step": 7924 }, { "epoch": 0.95, "learning_rate": 1.5744936300504555e-07, "loss": 0.7818, "step": 7925 }, { "epoch": 0.95, "learning_rate": 1.5676733695922264e-07, "loss": 0.7249, "step": 7926 }, { "epoch": 0.95, "learning_rate": 1.5608677962304142e-07, "loss": 0.7344, "step": 7927 }, { "epoch": 0.95, "learning_rate": 1.5540769109804843e-07, "loss": 0.6869, "step": 7928 }, { "epoch": 0.95, "learning_rate": 1.547300714855693e-07, "loss": 0.75, "step": 7929 }, { "epoch": 0.95, "learning_rate": 1.5405392088671312e-07, "loss": 0.7266, "step": 7930 }, { "epoch": 0.95, "learning_rate": 1.5337923940236922e-07, "loss": 0.7282, "step": 7931 }, { "epoch": 0.95, "learning_rate": 1.527060271332048e-07, "loss": 0.7081, "step": 7932 }, { "epoch": 0.95, "learning_rate": 1.520342841796707e-07, "loss": 0.7048, "step": 7933 }, { "epoch": 0.95, "learning_rate": 1.5136401064199667e-07, "loss": 0.7467, "step": 7934 }, { "epoch": 0.95, "learning_rate": 1.506952066201961e-07, "loss": 0.7238, "step": 7935 }, { "epoch": 0.95, "learning_rate": 1.5002787221406133e-07, "loss": 0.6948, "step": 7936 }, { "epoch": 0.95, "learning_rate": 1.4936200752316387e-07, "loss": 0.6903, "step": 7937 }, { "epoch": 0.95, "learning_rate": 1.4869761264685756e-07, "loss": 0.7595, "step": 7938 }, { "epoch": 0.95, "learning_rate": 1.4803468768427865e-07, "loss": 0.7294, "step": 7939 }, { "epoch": 0.95, "learning_rate": 1.4737323273434024e-07, "loss": 0.7773, "step": 7940 }, { "epoch": 0.95, "learning_rate": 1.4671324789574004e-07, "loss": 0.7193, "step": 7941 }, { "epoch": 0.95, "learning_rate": 1.4605473326695152e-07, "loss": 0.6975, "step": 7942 }, { "epoch": 0.95, "learning_rate": 1.4539768894623495e-07, "loss": 0.7316, "step": 7943 }, { "epoch": 0.95, "learning_rate": 1.4474211503162528e-07, "loss": 0.697, "step": 7944 }, { "epoch": 0.95, "learning_rate": 1.4408801162094199e-07, "loss": 0.7031, "step": 7945 }, { "epoch": 0.95, "learning_rate": 1.4343537881178593e-07, "loss": 0.5968, "step": 7946 }, { "epoch": 0.95, "learning_rate": 1.4278421670153252e-07, "loss": 0.7104, "step": 7947 }, { "epoch": 0.95, "learning_rate": 1.4213452538734406e-07, "loss": 0.6724, "step": 7948 }, { "epoch": 0.95, "learning_rate": 1.4148630496615968e-07, "loss": 0.7729, "step": 7949 }, { "epoch": 0.95, "learning_rate": 1.4083955553470308e-07, "loss": 0.7093, "step": 7950 }, { "epoch": 0.95, "learning_rate": 1.4019427718947377e-07, "loss": 0.6869, "step": 7951 }, { "epoch": 0.95, "learning_rate": 1.395504700267536e-07, "loss": 0.7188, "step": 7952 }, { "epoch": 0.95, "learning_rate": 1.3890813414260572e-07, "loss": 0.7271, "step": 7953 }, { "epoch": 0.95, "learning_rate": 1.382672696328724e-07, "loss": 0.7154, "step": 7954 }, { "epoch": 0.95, "learning_rate": 1.3762787659317823e-07, "loss": 0.7522, "step": 7955 }, { "epoch": 0.95, "learning_rate": 1.3698995511892687e-07, "loss": 0.7115, "step": 7956 }, { "epoch": 0.95, "learning_rate": 1.3635350530530224e-07, "loss": 0.678, "step": 7957 }, { "epoch": 0.95, "learning_rate": 1.357185272472694e-07, "loss": 0.7003, "step": 7958 }, { "epoch": 0.95, "learning_rate": 1.3508502103957266e-07, "loss": 0.6975, "step": 7959 }, { "epoch": 0.95, "learning_rate": 1.3445298677673858e-07, "loss": 0.668, "step": 7960 }, { "epoch": 0.95, "learning_rate": 1.338224245530728e-07, "loss": 0.7266, "step": 7961 }, { "epoch": 0.95, "learning_rate": 1.3319333446266124e-07, "loss": 0.7249, "step": 7962 }, { "epoch": 0.95, "learning_rate": 1.325657165993699e-07, "loss": 0.7305, "step": 7963 }, { "epoch": 0.95, "learning_rate": 1.319395710568472e-07, "loss": 0.6964, "step": 7964 }, { "epoch": 0.95, "learning_rate": 1.3131489792851948e-07, "loss": 0.6814, "step": 7965 }, { "epoch": 0.95, "learning_rate": 1.3069169730759446e-07, "loss": 0.716, "step": 7966 }, { "epoch": 0.95, "learning_rate": 1.3006996928705996e-07, "loss": 0.6814, "step": 7967 }, { "epoch": 0.95, "learning_rate": 1.2944971395968288e-07, "loss": 0.745, "step": 7968 }, { "epoch": 0.95, "learning_rate": 1.2883093141801472e-07, "loss": 0.6959, "step": 7969 }, { "epoch": 0.95, "learning_rate": 1.2821362175438058e-07, "loss": 0.7506, "step": 7970 }, { "epoch": 0.95, "learning_rate": 1.2759778506089115e-07, "loss": 0.7383, "step": 7971 }, { "epoch": 0.95, "learning_rate": 1.2698342142943632e-07, "loss": 0.731, "step": 7972 }, { "epoch": 0.95, "learning_rate": 1.2637053095168162e-07, "loss": 0.7734, "step": 7973 }, { "epoch": 0.95, "learning_rate": 1.2575911371908057e-07, "loss": 0.7054, "step": 7974 }, { "epoch": 0.95, "learning_rate": 1.2514916982286128e-07, "loss": 0.7243, "step": 7975 }, { "epoch": 0.95, "learning_rate": 1.2454069935403325e-07, "loss": 0.6948, "step": 7976 }, { "epoch": 0.95, "learning_rate": 1.239337024033871e-07, "loss": 0.7723, "step": 7977 }, { "epoch": 0.95, "learning_rate": 1.2332817906149151e-07, "loss": 0.7561, "step": 7978 }, { "epoch": 0.95, "learning_rate": 1.227241294186987e-07, "loss": 0.7277, "step": 7979 }, { "epoch": 0.95, "learning_rate": 1.2212155356513655e-07, "loss": 0.7327, "step": 7980 }, { "epoch": 0.95, "learning_rate": 1.2152045159071756e-07, "loss": 0.6875, "step": 7981 }, { "epoch": 0.95, "learning_rate": 1.2092082358513112e-07, "loss": 0.736, "step": 7982 }, { "epoch": 0.95, "learning_rate": 1.20322669637849e-07, "loss": 0.7277, "step": 7983 }, { "epoch": 0.95, "learning_rate": 1.197259898381198e-07, "loss": 0.6881, "step": 7984 }, { "epoch": 0.95, "learning_rate": 1.191307842749756e-07, "loss": 0.6747, "step": 7985 }, { "epoch": 0.95, "learning_rate": 1.1853705303722762e-07, "loss": 0.7215, "step": 7986 }, { "epoch": 0.95, "learning_rate": 1.17944796213465e-07, "loss": 0.7416, "step": 7987 }, { "epoch": 0.95, "learning_rate": 1.1735401389205925e-07, "loss": 0.6858, "step": 7988 }, { "epoch": 0.95, "learning_rate": 1.1676470616116098e-07, "loss": 0.736, "step": 7989 }, { "epoch": 0.95, "learning_rate": 1.1617687310869986e-07, "loss": 0.7377, "step": 7990 }, { "epoch": 0.95, "learning_rate": 1.1559051482238903e-07, "loss": 0.7528, "step": 7991 }, { "epoch": 0.95, "learning_rate": 1.1500563138971522e-07, "loss": 0.6752, "step": 7992 }, { "epoch": 0.95, "learning_rate": 1.1442222289795302e-07, "loss": 0.7076, "step": 7993 }, { "epoch": 0.95, "learning_rate": 1.138402894341506e-07, "loss": 0.7288, "step": 7994 }, { "epoch": 0.95, "learning_rate": 1.1325983108513849e-07, "loss": 0.7076, "step": 7995 }, { "epoch": 0.95, "learning_rate": 1.1268084793752742e-07, "loss": 0.745, "step": 7996 }, { "epoch": 0.95, "learning_rate": 1.1210334007770718e-07, "loss": 0.75, "step": 7997 }, { "epoch": 0.95, "learning_rate": 1.1152730759184882e-07, "loss": 0.7054, "step": 7998 }, { "epoch": 0.95, "learning_rate": 1.1095275056589916e-07, "loss": 0.7193, "step": 7999 }, { "epoch": 0.95, "learning_rate": 1.1037966908559184e-07, "loss": 0.7573, "step": 8000 }, { "epoch": 0.95, "learning_rate": 1.09808063236434e-07, "loss": 0.7606, "step": 8001 }, { "epoch": 0.95, "learning_rate": 1.0923793310371634e-07, "loss": 0.7511, "step": 8002 }, { "epoch": 0.95, "learning_rate": 1.0866927877250632e-07, "loss": 0.7645, "step": 8003 }, { "epoch": 0.95, "learning_rate": 1.0810210032765389e-07, "loss": 0.7054, "step": 8004 }, { "epoch": 0.95, "learning_rate": 1.0753639785378689e-07, "loss": 0.7065, "step": 8005 }, { "epoch": 0.95, "learning_rate": 1.0697217143531669e-07, "loss": 0.6607, "step": 8006 }, { "epoch": 0.95, "learning_rate": 1.0640942115642817e-07, "loss": 0.7204, "step": 8007 }, { "epoch": 0.96, "learning_rate": 1.0584814710109193e-07, "loss": 0.7444, "step": 8008 }, { "epoch": 0.96, "learning_rate": 1.052883493530521e-07, "loss": 0.6786, "step": 8009 }, { "epoch": 0.96, "learning_rate": 1.0473002799584076e-07, "loss": 0.7427, "step": 8010 }, { "epoch": 0.96, "learning_rate": 1.0417318311276236e-07, "loss": 0.7037, "step": 8011 }, { "epoch": 0.96, "learning_rate": 1.0361781478690492e-07, "loss": 0.7545, "step": 8012 }, { "epoch": 0.96, "learning_rate": 1.0306392310113322e-07, "loss": 0.7439, "step": 8013 }, { "epoch": 0.96, "learning_rate": 1.0251150813809563e-07, "loss": 0.7416, "step": 8014 }, { "epoch": 0.96, "learning_rate": 1.0196056998021619e-07, "loss": 0.7121, "step": 8015 }, { "epoch": 0.96, "learning_rate": 1.014111087097025e-07, "loss": 0.7221, "step": 8016 }, { "epoch": 0.96, "learning_rate": 1.0086312440853786e-07, "loss": 0.7333, "step": 8017 }, { "epoch": 0.96, "learning_rate": 1.0031661715848795e-07, "loss": 0.7333, "step": 8018 }, { "epoch": 0.96, "learning_rate": 9.977158704109646e-08, "loss": 0.7227, "step": 8019 }, { "epoch": 0.96, "learning_rate": 9.922803413768834e-08, "loss": 0.7165, "step": 8020 }, { "epoch": 0.96, "learning_rate": 9.868595852936758e-08, "loss": 0.745, "step": 8021 }, { "epoch": 0.96, "learning_rate": 9.814536029701616e-08, "loss": 0.6602, "step": 8022 }, { "epoch": 0.96, "step": 8022, "total_flos": 2840201517072384.0, "train_loss": 0.7857581807309272, "train_runtime": 111494.8304, "train_samples_per_second": 8.423, "train_steps_per_second": 0.075 } ], "max_steps": 8385, "num_train_epochs": 1, "total_flos": 2840201517072384.0, "trial_name": null, "trial_params": null }