{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 9186, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 7.246376811594204e-08, "loss": 1.6201, "step": 1 }, { "epoch": 0.0, "learning_rate": 1.4492753623188408e-07, "loss": 1.5254, "step": 2 }, { "epoch": 0.0, "learning_rate": 2.173913043478261e-07, "loss": 1.4692, "step": 3 }, { "epoch": 0.0, "learning_rate": 2.8985507246376816e-07, "loss": 1.1284, "step": 4 }, { "epoch": 0.0, "learning_rate": 3.623188405797102e-07, "loss": 1.2202, "step": 5 }, { "epoch": 0.0, "learning_rate": 4.347826086956522e-07, "loss": 1.0637, "step": 6 }, { "epoch": 0.0, "learning_rate": 5.072463768115942e-07, "loss": 1.1514, "step": 7 }, { "epoch": 0.0, "learning_rate": 5.797101449275363e-07, "loss": 1.3628, "step": 8 }, { "epoch": 0.0, "learning_rate": 6.521739130434783e-07, "loss": 1.4985, "step": 9 }, { "epoch": 0.0, "learning_rate": 7.246376811594204e-07, "loss": 1.333, "step": 10 }, { "epoch": 0.0, "learning_rate": 7.971014492753623e-07, "loss": 1.4092, "step": 11 }, { "epoch": 0.0, "learning_rate": 8.695652173913044e-07, "loss": 1.4258, "step": 12 }, { "epoch": 0.0, "learning_rate": 9.420289855072465e-07, "loss": 0.8296, "step": 13 }, { "epoch": 0.0, "learning_rate": 1.0144927536231885e-06, "loss": 1.1089, "step": 14 }, { "epoch": 0.0, "learning_rate": 1.0869565217391306e-06, "loss": 0.9351, "step": 15 }, { "epoch": 0.0, "learning_rate": 1.1594202898550726e-06, "loss": 1.2119, "step": 16 }, { "epoch": 0.0, "learning_rate": 1.2318840579710147e-06, "loss": 1.0312, "step": 17 }, { "epoch": 0.0, "learning_rate": 1.3043478260869566e-06, "loss": 1.1577, "step": 18 }, { "epoch": 0.0, "learning_rate": 1.3768115942028987e-06, "loss": 1.2446, "step": 19 }, { "epoch": 0.0, "learning_rate": 1.4492753623188408e-06, "loss": 1.0796, "step": 20 }, { "epoch": 0.0, "learning_rate": 1.521739130434783e-06, "loss": 1.04, "step": 21 }, { "epoch": 0.0, "learning_rate": 1.5942028985507246e-06, "loss": 0.9966, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.6666666666666667e-06, "loss": 0.9473, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.7391304347826088e-06, "loss": 1.0503, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.8115942028985508e-06, "loss": 1.0654, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.884057971014493e-06, "loss": 1.0059, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.956521739130435e-06, "loss": 0.97, "step": 27 }, { "epoch": 0.0, "learning_rate": 2.028985507246377e-06, "loss": 0.9495, "step": 28 }, { "epoch": 0.0, "learning_rate": 2.101449275362319e-06, "loss": 0.9268, "step": 29 }, { "epoch": 0.0, "learning_rate": 2.173913043478261e-06, "loss": 0.856, "step": 30 }, { "epoch": 0.0, "learning_rate": 2.246376811594203e-06, "loss": 0.9858, "step": 31 }, { "epoch": 0.0, "learning_rate": 2.3188405797101453e-06, "loss": 1.103, "step": 32 }, { "epoch": 0.0, "learning_rate": 2.391304347826087e-06, "loss": 0.998, "step": 33 }, { "epoch": 0.0, "learning_rate": 2.4637681159420295e-06, "loss": 0.9033, "step": 34 }, { "epoch": 0.0, "learning_rate": 2.5362318840579714e-06, "loss": 0.8668, "step": 35 }, { "epoch": 0.0, "learning_rate": 2.6086956521739132e-06, "loss": 1.064, "step": 36 }, { "epoch": 0.0, "learning_rate": 2.6811594202898555e-06, "loss": 0.9932, "step": 37 }, { "epoch": 0.0, "learning_rate": 2.7536231884057974e-06, "loss": 0.9062, "step": 38 }, { "epoch": 0.0, "learning_rate": 2.8260869565217393e-06, "loss": 0.9722, "step": 39 }, { "epoch": 0.0, "learning_rate": 2.8985507246376816e-06, "loss": 0.8701, "step": 40 }, { "epoch": 0.0, "learning_rate": 2.9710144927536235e-06, "loss": 1.1641, "step": 41 }, { "epoch": 0.0, "learning_rate": 3.043478260869566e-06, "loss": 0.9292, "step": 42 }, { "epoch": 0.0, "learning_rate": 3.1159420289855073e-06, "loss": 0.8762, "step": 43 }, { "epoch": 0.0, "learning_rate": 3.188405797101449e-06, "loss": 0.9395, "step": 44 }, { "epoch": 0.0, "learning_rate": 3.2608695652173914e-06, "loss": 0.9224, "step": 45 }, { "epoch": 0.01, "learning_rate": 3.3333333333333333e-06, "loss": 0.7432, "step": 46 }, { "epoch": 0.01, "learning_rate": 3.4057971014492756e-06, "loss": 0.7942, "step": 47 }, { "epoch": 0.01, "learning_rate": 3.4782608695652175e-06, "loss": 0.8472, "step": 48 }, { "epoch": 0.01, "learning_rate": 3.55072463768116e-06, "loss": 0.8242, "step": 49 }, { "epoch": 0.01, "learning_rate": 3.6231884057971017e-06, "loss": 0.9824, "step": 50 }, { "epoch": 0.01, "learning_rate": 3.6956521739130436e-06, "loss": 0.7917, "step": 51 }, { "epoch": 0.01, "learning_rate": 3.768115942028986e-06, "loss": 0.8086, "step": 52 }, { "epoch": 0.01, "learning_rate": 3.840579710144928e-06, "loss": 0.8315, "step": 53 }, { "epoch": 0.01, "learning_rate": 3.91304347826087e-06, "loss": 1.0889, "step": 54 }, { "epoch": 0.01, "learning_rate": 3.9855072463768115e-06, "loss": 1.0933, "step": 55 }, { "epoch": 0.01, "learning_rate": 4.057971014492754e-06, "loss": 0.8918, "step": 56 }, { "epoch": 0.01, "learning_rate": 4.130434782608696e-06, "loss": 0.7971, "step": 57 }, { "epoch": 0.01, "learning_rate": 4.202898550724638e-06, "loss": 0.9346, "step": 58 }, { "epoch": 0.01, "learning_rate": 4.27536231884058e-06, "loss": 0.9639, "step": 59 }, { "epoch": 0.01, "learning_rate": 4.347826086956522e-06, "loss": 0.854, "step": 60 }, { "epoch": 0.01, "learning_rate": 4.4202898550724645e-06, "loss": 0.7671, "step": 61 }, { "epoch": 0.01, "learning_rate": 4.492753623188406e-06, "loss": 0.8625, "step": 62 }, { "epoch": 0.01, "learning_rate": 4.565217391304348e-06, "loss": 0.7461, "step": 63 }, { "epoch": 0.01, "learning_rate": 4.637681159420291e-06, "loss": 0.8457, "step": 64 }, { "epoch": 0.01, "learning_rate": 4.710144927536232e-06, "loss": 0.7734, "step": 65 }, { "epoch": 0.01, "learning_rate": 4.782608695652174e-06, "loss": 0.9785, "step": 66 }, { "epoch": 0.01, "learning_rate": 4.855072463768117e-06, "loss": 1.0093, "step": 67 }, { "epoch": 0.01, "learning_rate": 4.927536231884059e-06, "loss": 0.9368, "step": 68 }, { "epoch": 0.01, "learning_rate": 5e-06, "loss": 1.0151, "step": 69 }, { "epoch": 0.01, "learning_rate": 5.072463768115943e-06, "loss": 0.7881, "step": 70 }, { "epoch": 0.01, "learning_rate": 5.144927536231884e-06, "loss": 0.9116, "step": 71 }, { "epoch": 0.01, "learning_rate": 5.2173913043478265e-06, "loss": 0.9812, "step": 72 }, { "epoch": 0.01, "learning_rate": 5.289855072463769e-06, "loss": 0.8457, "step": 73 }, { "epoch": 0.01, "learning_rate": 5.362318840579711e-06, "loss": 0.8276, "step": 74 }, { "epoch": 0.01, "learning_rate": 5.4347826086956525e-06, "loss": 0.7373, "step": 75 }, { "epoch": 0.01, "learning_rate": 5.507246376811595e-06, "loss": 0.7637, "step": 76 }, { "epoch": 0.01, "learning_rate": 5.579710144927537e-06, "loss": 0.8115, "step": 77 }, { "epoch": 0.01, "learning_rate": 5.652173913043479e-06, "loss": 0.8105, "step": 78 }, { "epoch": 0.01, "learning_rate": 5.724637681159421e-06, "loss": 0.8633, "step": 79 }, { "epoch": 0.01, "learning_rate": 5.797101449275363e-06, "loss": 0.905, "step": 80 }, { "epoch": 0.01, "learning_rate": 5.8695652173913055e-06, "loss": 0.9592, "step": 81 }, { "epoch": 0.01, "learning_rate": 5.942028985507247e-06, "loss": 0.7703, "step": 82 }, { "epoch": 0.01, "learning_rate": 6.014492753623189e-06, "loss": 0.6851, "step": 83 }, { "epoch": 0.01, "learning_rate": 6.086956521739132e-06, "loss": 0.8843, "step": 84 }, { "epoch": 0.01, "learning_rate": 6.159420289855072e-06, "loss": 0.7788, "step": 85 }, { "epoch": 0.01, "learning_rate": 6.2318840579710145e-06, "loss": 0.8718, "step": 86 }, { "epoch": 0.01, "learning_rate": 6.304347826086958e-06, "loss": 0.9507, "step": 87 }, { "epoch": 0.01, "learning_rate": 6.376811594202898e-06, "loss": 0.8779, "step": 88 }, { "epoch": 0.01, "learning_rate": 6.449275362318841e-06, "loss": 0.7993, "step": 89 }, { "epoch": 0.01, "learning_rate": 6.521739130434783e-06, "loss": 0.8965, "step": 90 }, { "epoch": 0.01, "learning_rate": 6.594202898550725e-06, "loss": 0.9883, "step": 91 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-06, "loss": 0.6929, "step": 92 }, { "epoch": 0.01, "learning_rate": 6.739130434782609e-06, "loss": 0.8115, "step": 93 }, { "epoch": 0.01, "learning_rate": 6.811594202898551e-06, "loss": 0.8496, "step": 94 }, { "epoch": 0.01, "learning_rate": 6.884057971014493e-06, "loss": 0.8127, "step": 95 }, { "epoch": 0.01, "learning_rate": 6.956521739130435e-06, "loss": 0.7905, "step": 96 }, { "epoch": 0.01, "learning_rate": 7.028985507246377e-06, "loss": 0.8706, "step": 97 }, { "epoch": 0.01, "learning_rate": 7.10144927536232e-06, "loss": 0.8164, "step": 98 }, { "epoch": 0.01, "learning_rate": 7.173913043478261e-06, "loss": 0.7659, "step": 99 }, { "epoch": 0.01, "learning_rate": 7.246376811594203e-06, "loss": 0.8301, "step": 100 }, { "epoch": 0.01, "learning_rate": 7.318840579710146e-06, "loss": 0.7166, "step": 101 }, { "epoch": 0.01, "learning_rate": 7.391304347826087e-06, "loss": 0.8467, "step": 102 }, { "epoch": 0.01, "learning_rate": 7.4637681159420295e-06, "loss": 0.8818, "step": 103 }, { "epoch": 0.01, "learning_rate": 7.536231884057972e-06, "loss": 0.802, "step": 104 }, { "epoch": 0.01, "learning_rate": 7.608695652173914e-06, "loss": 0.9077, "step": 105 }, { "epoch": 0.01, "learning_rate": 7.681159420289856e-06, "loss": 0.8701, "step": 106 }, { "epoch": 0.01, "learning_rate": 7.753623188405797e-06, "loss": 0.6914, "step": 107 }, { "epoch": 0.01, "learning_rate": 7.82608695652174e-06, "loss": 0.8489, "step": 108 }, { "epoch": 0.01, "learning_rate": 7.898550724637682e-06, "loss": 1.0479, "step": 109 }, { "epoch": 0.01, "learning_rate": 7.971014492753623e-06, "loss": 0.7786, "step": 110 }, { "epoch": 0.01, "learning_rate": 8.043478260869566e-06, "loss": 0.8335, "step": 111 }, { "epoch": 0.01, "learning_rate": 8.115942028985508e-06, "loss": 0.7278, "step": 112 }, { "epoch": 0.01, "learning_rate": 8.188405797101449e-06, "loss": 0.7615, "step": 113 }, { "epoch": 0.01, "learning_rate": 8.260869565217392e-06, "loss": 0.8862, "step": 114 }, { "epoch": 0.01, "learning_rate": 8.333333333333334e-06, "loss": 0.8499, "step": 115 }, { "epoch": 0.01, "learning_rate": 8.405797101449275e-06, "loss": 0.9197, "step": 116 }, { "epoch": 0.01, "learning_rate": 8.478260869565218e-06, "loss": 0.7915, "step": 117 }, { "epoch": 0.01, "learning_rate": 8.55072463768116e-06, "loss": 0.7266, "step": 118 }, { "epoch": 0.01, "learning_rate": 8.623188405797103e-06, "loss": 0.7205, "step": 119 }, { "epoch": 0.01, "learning_rate": 8.695652173913044e-06, "loss": 0.8267, "step": 120 }, { "epoch": 0.01, "learning_rate": 8.768115942028986e-06, "loss": 0.9368, "step": 121 }, { "epoch": 0.01, "learning_rate": 8.840579710144929e-06, "loss": 0.9153, "step": 122 }, { "epoch": 0.01, "learning_rate": 8.91304347826087e-06, "loss": 0.8132, "step": 123 }, { "epoch": 0.01, "learning_rate": 8.985507246376812e-06, "loss": 0.8794, "step": 124 }, { "epoch": 0.01, "learning_rate": 9.057971014492755e-06, "loss": 0.9395, "step": 125 }, { "epoch": 0.01, "learning_rate": 9.130434782608697e-06, "loss": 0.8298, "step": 126 }, { "epoch": 0.01, "learning_rate": 9.202898550724638e-06, "loss": 0.9292, "step": 127 }, { "epoch": 0.01, "learning_rate": 9.275362318840581e-06, "loss": 0.9678, "step": 128 }, { "epoch": 0.01, "learning_rate": 9.347826086956523e-06, "loss": 0.729, "step": 129 }, { "epoch": 0.01, "learning_rate": 9.420289855072464e-06, "loss": 0.8628, "step": 130 }, { "epoch": 0.01, "learning_rate": 9.492753623188407e-06, "loss": 0.7214, "step": 131 }, { "epoch": 0.01, "learning_rate": 9.565217391304349e-06, "loss": 0.7515, "step": 132 }, { "epoch": 0.01, "learning_rate": 9.63768115942029e-06, "loss": 0.8938, "step": 133 }, { "epoch": 0.01, "learning_rate": 9.710144927536233e-06, "loss": 0.7532, "step": 134 }, { "epoch": 0.01, "learning_rate": 9.782608695652175e-06, "loss": 0.8188, "step": 135 }, { "epoch": 0.01, "learning_rate": 9.855072463768118e-06, "loss": 0.7847, "step": 136 }, { "epoch": 0.01, "learning_rate": 9.927536231884058e-06, "loss": 0.8315, "step": 137 }, { "epoch": 0.02, "learning_rate": 1e-05, "loss": 0.7534, "step": 138 }, { "epoch": 0.02, "learning_rate": 1.0072463768115944e-05, "loss": 1.0107, "step": 139 }, { "epoch": 0.02, "learning_rate": 1.0144927536231885e-05, "loss": 0.6855, "step": 140 }, { "epoch": 0.02, "learning_rate": 1.0217391304347829e-05, "loss": 0.8608, "step": 141 }, { "epoch": 0.02, "learning_rate": 1.0289855072463768e-05, "loss": 0.8237, "step": 142 }, { "epoch": 0.02, "learning_rate": 1.036231884057971e-05, "loss": 0.9321, "step": 143 }, { "epoch": 0.02, "learning_rate": 1.0434782608695653e-05, "loss": 0.7959, "step": 144 }, { "epoch": 0.02, "learning_rate": 1.0507246376811594e-05, "loss": 0.7668, "step": 145 }, { "epoch": 0.02, "learning_rate": 1.0579710144927538e-05, "loss": 0.8438, "step": 146 }, { "epoch": 0.02, "learning_rate": 1.0652173913043479e-05, "loss": 0.845, "step": 147 }, { "epoch": 0.02, "learning_rate": 1.0724637681159422e-05, "loss": 0.7578, "step": 148 }, { "epoch": 0.02, "learning_rate": 1.0797101449275362e-05, "loss": 0.689, "step": 149 }, { "epoch": 0.02, "learning_rate": 1.0869565217391305e-05, "loss": 0.7043, "step": 150 }, { "epoch": 0.02, "learning_rate": 1.0942028985507247e-05, "loss": 0.8618, "step": 151 }, { "epoch": 0.02, "learning_rate": 1.101449275362319e-05, "loss": 0.8682, "step": 152 }, { "epoch": 0.02, "learning_rate": 1.1086956521739131e-05, "loss": 0.7075, "step": 153 }, { "epoch": 0.02, "learning_rate": 1.1159420289855074e-05, "loss": 0.8062, "step": 154 }, { "epoch": 0.02, "learning_rate": 1.1231884057971016e-05, "loss": 0.8843, "step": 155 }, { "epoch": 0.02, "learning_rate": 1.1304347826086957e-05, "loss": 0.8301, "step": 156 }, { "epoch": 0.02, "learning_rate": 1.1376811594202899e-05, "loss": 0.8218, "step": 157 }, { "epoch": 0.02, "learning_rate": 1.1449275362318842e-05, "loss": 0.7791, "step": 158 }, { "epoch": 0.02, "learning_rate": 1.1521739130434783e-05, "loss": 0.8325, "step": 159 }, { "epoch": 0.02, "learning_rate": 1.1594202898550726e-05, "loss": 0.7637, "step": 160 }, { "epoch": 0.02, "learning_rate": 1.1666666666666668e-05, "loss": 0.7339, "step": 161 }, { "epoch": 0.02, "learning_rate": 1.1739130434782611e-05, "loss": 0.6667, "step": 162 }, { "epoch": 0.02, "learning_rate": 1.181159420289855e-05, "loss": 0.9146, "step": 163 }, { "epoch": 0.02, "learning_rate": 1.1884057971014494e-05, "loss": 0.853, "step": 164 }, { "epoch": 0.02, "learning_rate": 1.1956521739130435e-05, "loss": 0.8569, "step": 165 }, { "epoch": 0.02, "learning_rate": 1.2028985507246379e-05, "loss": 0.7698, "step": 166 }, { "epoch": 0.02, "learning_rate": 1.210144927536232e-05, "loss": 0.7109, "step": 167 }, { "epoch": 0.02, "learning_rate": 1.2173913043478263e-05, "loss": 0.8789, "step": 168 }, { "epoch": 0.02, "learning_rate": 1.2246376811594205e-05, "loss": 0.9209, "step": 169 }, { "epoch": 0.02, "learning_rate": 1.2318840579710144e-05, "loss": 0.6963, "step": 170 }, { "epoch": 0.02, "learning_rate": 1.2391304347826088e-05, "loss": 0.8198, "step": 171 }, { "epoch": 0.02, "learning_rate": 1.2463768115942029e-05, "loss": 0.8745, "step": 172 }, { "epoch": 0.02, "learning_rate": 1.2536231884057972e-05, "loss": 0.7642, "step": 173 }, { "epoch": 0.02, "learning_rate": 1.2608695652173915e-05, "loss": 0.8618, "step": 174 }, { "epoch": 0.02, "learning_rate": 1.2681159420289857e-05, "loss": 0.7563, "step": 175 }, { "epoch": 0.02, "learning_rate": 1.2753623188405797e-05, "loss": 0.8486, "step": 176 }, { "epoch": 0.02, "learning_rate": 1.282608695652174e-05, "loss": 0.8115, "step": 177 }, { "epoch": 0.02, "learning_rate": 1.2898550724637681e-05, "loss": 0.8589, "step": 178 }, { "epoch": 0.02, "learning_rate": 1.2971014492753624e-05, "loss": 0.8293, "step": 179 }, { "epoch": 0.02, "learning_rate": 1.3043478260869566e-05, "loss": 0.7578, "step": 180 }, { "epoch": 0.02, "learning_rate": 1.3115942028985509e-05, "loss": 0.814, "step": 181 }, { "epoch": 0.02, "learning_rate": 1.318840579710145e-05, "loss": 0.73, "step": 182 }, { "epoch": 0.02, "learning_rate": 1.3260869565217392e-05, "loss": 0.9165, "step": 183 }, { "epoch": 0.02, "learning_rate": 1.3333333333333333e-05, "loss": 0.792, "step": 184 }, { "epoch": 0.02, "learning_rate": 1.3405797101449276e-05, "loss": 0.8201, "step": 185 }, { "epoch": 0.02, "learning_rate": 1.3478260869565218e-05, "loss": 0.9004, "step": 186 }, { "epoch": 0.02, "learning_rate": 1.3550724637681161e-05, "loss": 0.824, "step": 187 }, { "epoch": 0.02, "learning_rate": 1.3623188405797103e-05, "loss": 0.8828, "step": 188 }, { "epoch": 0.02, "learning_rate": 1.3695652173913046e-05, "loss": 0.6858, "step": 189 }, { "epoch": 0.02, "learning_rate": 1.3768115942028985e-05, "loss": 0.845, "step": 190 }, { "epoch": 0.02, "learning_rate": 1.3840579710144929e-05, "loss": 0.9058, "step": 191 }, { "epoch": 0.02, "learning_rate": 1.391304347826087e-05, "loss": 0.8281, "step": 192 }, { "epoch": 0.02, "learning_rate": 1.3985507246376813e-05, "loss": 0.854, "step": 193 }, { "epoch": 0.02, "learning_rate": 1.4057971014492755e-05, "loss": 0.8774, "step": 194 }, { "epoch": 0.02, "learning_rate": 1.4130434782608698e-05, "loss": 0.8894, "step": 195 }, { "epoch": 0.02, "learning_rate": 1.420289855072464e-05, "loss": 0.7769, "step": 196 }, { "epoch": 0.02, "learning_rate": 1.427536231884058e-05, "loss": 0.8445, "step": 197 }, { "epoch": 0.02, "learning_rate": 1.4347826086956522e-05, "loss": 0.7761, "step": 198 }, { "epoch": 0.02, "learning_rate": 1.4420289855072465e-05, "loss": 0.7239, "step": 199 }, { "epoch": 0.02, "learning_rate": 1.4492753623188407e-05, "loss": 0.9365, "step": 200 }, { "epoch": 0.02, "learning_rate": 1.456521739130435e-05, "loss": 0.8435, "step": 201 }, { "epoch": 0.02, "learning_rate": 1.4637681159420291e-05, "loss": 0.7932, "step": 202 }, { "epoch": 0.02, "learning_rate": 1.4710144927536235e-05, "loss": 0.7544, "step": 203 }, { "epoch": 0.02, "learning_rate": 1.4782608695652174e-05, "loss": 0.7107, "step": 204 }, { "epoch": 0.02, "learning_rate": 1.4855072463768116e-05, "loss": 0.7629, "step": 205 }, { "epoch": 0.02, "learning_rate": 1.4927536231884059e-05, "loss": 0.8564, "step": 206 }, { "epoch": 0.02, "learning_rate": 1.5000000000000002e-05, "loss": 0.7388, "step": 207 }, { "epoch": 0.02, "learning_rate": 1.5072463768115944e-05, "loss": 0.9766, "step": 208 }, { "epoch": 0.02, "learning_rate": 1.5144927536231887e-05, "loss": 0.875, "step": 209 }, { "epoch": 0.02, "learning_rate": 1.5217391304347828e-05, "loss": 0.6892, "step": 210 }, { "epoch": 0.02, "learning_rate": 1.5289855072463768e-05, "loss": 0.7104, "step": 211 }, { "epoch": 0.02, "learning_rate": 1.536231884057971e-05, "loss": 0.6956, "step": 212 }, { "epoch": 0.02, "learning_rate": 1.5434782608695654e-05, "loss": 0.9146, "step": 213 }, { "epoch": 0.02, "learning_rate": 1.5507246376811594e-05, "loss": 0.9814, "step": 214 }, { "epoch": 0.02, "learning_rate": 1.5579710144927537e-05, "loss": 0.7295, "step": 215 }, { "epoch": 0.02, "learning_rate": 1.565217391304348e-05, "loss": 0.7893, "step": 216 }, { "epoch": 0.02, "learning_rate": 1.5724637681159423e-05, "loss": 0.7778, "step": 217 }, { "epoch": 0.02, "learning_rate": 1.5797101449275363e-05, "loss": 0.9043, "step": 218 }, { "epoch": 0.02, "learning_rate": 1.5869565217391306e-05, "loss": 0.7507, "step": 219 }, { "epoch": 0.02, "learning_rate": 1.5942028985507246e-05, "loss": 0.793, "step": 220 }, { "epoch": 0.02, "learning_rate": 1.601449275362319e-05, "loss": 0.9004, "step": 221 }, { "epoch": 0.02, "learning_rate": 1.6086956521739132e-05, "loss": 0.7091, "step": 222 }, { "epoch": 0.02, "learning_rate": 1.6159420289855076e-05, "loss": 0.8201, "step": 223 }, { "epoch": 0.02, "learning_rate": 1.6231884057971015e-05, "loss": 0.7832, "step": 224 }, { "epoch": 0.02, "learning_rate": 1.630434782608696e-05, "loss": 0.884, "step": 225 }, { "epoch": 0.02, "learning_rate": 1.6376811594202898e-05, "loss": 0.7214, "step": 226 }, { "epoch": 0.02, "learning_rate": 1.644927536231884e-05, "loss": 0.8237, "step": 227 }, { "epoch": 0.02, "learning_rate": 1.6521739130434785e-05, "loss": 0.7856, "step": 228 }, { "epoch": 0.02, "learning_rate": 1.6594202898550728e-05, "loss": 0.7241, "step": 229 }, { "epoch": 0.03, "learning_rate": 1.6666666666666667e-05, "loss": 0.8293, "step": 230 }, { "epoch": 0.03, "learning_rate": 1.673913043478261e-05, "loss": 0.8701, "step": 231 }, { "epoch": 0.03, "learning_rate": 1.681159420289855e-05, "loss": 0.8911, "step": 232 }, { "epoch": 0.03, "learning_rate": 1.6884057971014494e-05, "loss": 0.7935, "step": 233 }, { "epoch": 0.03, "learning_rate": 1.6956521739130437e-05, "loss": 0.7671, "step": 234 }, { "epoch": 0.03, "learning_rate": 1.702898550724638e-05, "loss": 0.8977, "step": 235 }, { "epoch": 0.03, "learning_rate": 1.710144927536232e-05, "loss": 0.6592, "step": 236 }, { "epoch": 0.03, "learning_rate": 1.7173913043478263e-05, "loss": 0.686, "step": 237 }, { "epoch": 0.03, "learning_rate": 1.7246376811594206e-05, "loss": 0.7583, "step": 238 }, { "epoch": 0.03, "learning_rate": 1.7318840579710146e-05, "loss": 0.7515, "step": 239 }, { "epoch": 0.03, "learning_rate": 1.739130434782609e-05, "loss": 0.8291, "step": 240 }, { "epoch": 0.03, "learning_rate": 1.746376811594203e-05, "loss": 0.7014, "step": 241 }, { "epoch": 0.03, "learning_rate": 1.7536231884057972e-05, "loss": 0.8108, "step": 242 }, { "epoch": 0.03, "learning_rate": 1.7608695652173915e-05, "loss": 0.73, "step": 243 }, { "epoch": 0.03, "learning_rate": 1.7681159420289858e-05, "loss": 0.7981, "step": 244 }, { "epoch": 0.03, "learning_rate": 1.7753623188405798e-05, "loss": 0.9341, "step": 245 }, { "epoch": 0.03, "learning_rate": 1.782608695652174e-05, "loss": 0.8623, "step": 246 }, { "epoch": 0.03, "learning_rate": 1.789855072463768e-05, "loss": 0.8491, "step": 247 }, { "epoch": 0.03, "learning_rate": 1.7971014492753624e-05, "loss": 0.8506, "step": 248 }, { "epoch": 0.03, "learning_rate": 1.8043478260869567e-05, "loss": 0.8774, "step": 249 }, { "epoch": 0.03, "learning_rate": 1.811594202898551e-05, "loss": 0.5945, "step": 250 }, { "epoch": 0.03, "learning_rate": 1.818840579710145e-05, "loss": 0.7953, "step": 251 }, { "epoch": 0.03, "learning_rate": 1.8260869565217393e-05, "loss": 0.8208, "step": 252 }, { "epoch": 0.03, "learning_rate": 1.8333333333333333e-05, "loss": 0.6819, "step": 253 }, { "epoch": 0.03, "learning_rate": 1.8405797101449276e-05, "loss": 0.7324, "step": 254 }, { "epoch": 0.03, "learning_rate": 1.847826086956522e-05, "loss": 0.7642, "step": 255 }, { "epoch": 0.03, "learning_rate": 1.8550724637681162e-05, "loss": 0.915, "step": 256 }, { "epoch": 0.03, "learning_rate": 1.8623188405797102e-05, "loss": 0.7271, "step": 257 }, { "epoch": 0.03, "learning_rate": 1.8695652173913045e-05, "loss": 0.7803, "step": 258 }, { "epoch": 0.03, "learning_rate": 1.8768115942028985e-05, "loss": 0.7424, "step": 259 }, { "epoch": 0.03, "learning_rate": 1.8840579710144928e-05, "loss": 0.7759, "step": 260 }, { "epoch": 0.03, "learning_rate": 1.891304347826087e-05, "loss": 0.8098, "step": 261 }, { "epoch": 0.03, "learning_rate": 1.8985507246376814e-05, "loss": 0.8462, "step": 262 }, { "epoch": 0.03, "learning_rate": 1.9057971014492754e-05, "loss": 0.7598, "step": 263 }, { "epoch": 0.03, "learning_rate": 1.9130434782608697e-05, "loss": 0.7874, "step": 264 }, { "epoch": 0.03, "learning_rate": 1.920289855072464e-05, "loss": 0.6667, "step": 265 }, { "epoch": 0.03, "learning_rate": 1.927536231884058e-05, "loss": 0.7654, "step": 266 }, { "epoch": 0.03, "learning_rate": 1.9347826086956523e-05, "loss": 0.8596, "step": 267 }, { "epoch": 0.03, "learning_rate": 1.9420289855072467e-05, "loss": 0.8086, "step": 268 }, { "epoch": 0.03, "learning_rate": 1.9492753623188406e-05, "loss": 0.814, "step": 269 }, { "epoch": 0.03, "learning_rate": 1.956521739130435e-05, "loss": 0.8127, "step": 270 }, { "epoch": 0.03, "learning_rate": 1.9637681159420293e-05, "loss": 0.7368, "step": 271 }, { "epoch": 0.03, "learning_rate": 1.9710144927536236e-05, "loss": 0.7556, "step": 272 }, { "epoch": 0.03, "learning_rate": 1.9782608695652176e-05, "loss": 0.7571, "step": 273 }, { "epoch": 0.03, "learning_rate": 1.9855072463768115e-05, "loss": 0.6216, "step": 274 }, { "epoch": 0.03, "learning_rate": 1.992753623188406e-05, "loss": 0.7393, "step": 275 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 0.7009, "step": 276 }, { "epoch": 0.03, "learning_rate": 1.9999999378395234e-05, "loss": 0.7905, "step": 277 }, { "epoch": 0.03, "learning_rate": 1.9999997513581006e-05, "loss": 0.8564, "step": 278 }, { "epoch": 0.03, "learning_rate": 1.999999440555755e-05, "loss": 0.8579, "step": 279 }, { "epoch": 0.03, "learning_rate": 1.9999990054325255e-05, "loss": 0.7251, "step": 280 }, { "epoch": 0.03, "learning_rate": 1.999998445988466e-05, "loss": 0.6663, "step": 281 }, { "epoch": 0.03, "learning_rate": 1.9999977622236463e-05, "loss": 0.814, "step": 282 }, { "epoch": 0.03, "learning_rate": 1.9999969541381508e-05, "loss": 0.759, "step": 283 }, { "epoch": 0.03, "learning_rate": 1.9999960217320806e-05, "loss": 0.7495, "step": 284 }, { "epoch": 0.03, "learning_rate": 1.9999949650055512e-05, "loss": 0.8193, "step": 285 }, { "epoch": 0.03, "learning_rate": 1.999993783958694e-05, "loss": 0.8926, "step": 286 }, { "epoch": 0.03, "learning_rate": 1.9999924785916563e-05, "loss": 0.8101, "step": 287 }, { "epoch": 0.03, "learning_rate": 1.9999910489045997e-05, "loss": 0.8862, "step": 288 }, { "epoch": 0.03, "learning_rate": 1.9999894948977027e-05, "loss": 0.6477, "step": 289 }, { "epoch": 0.03, "learning_rate": 1.9999878165711575e-05, "loss": 0.7568, "step": 290 }, { "epoch": 0.03, "learning_rate": 1.9999860139251737e-05, "loss": 0.7527, "step": 291 }, { "epoch": 0.03, "learning_rate": 1.999984086959975e-05, "loss": 0.8247, "step": 292 }, { "epoch": 0.03, "learning_rate": 1.9999820356758008e-05, "loss": 0.7876, "step": 293 }, { "epoch": 0.03, "learning_rate": 1.9999798600729067e-05, "loss": 0.8647, "step": 294 }, { "epoch": 0.03, "learning_rate": 1.9999775601515626e-05, "loss": 0.7734, "step": 295 }, { "epoch": 0.03, "learning_rate": 1.9999751359120544e-05, "loss": 0.8274, "step": 296 }, { "epoch": 0.03, "learning_rate": 1.999972587354684e-05, "loss": 0.8501, "step": 297 }, { "epoch": 0.03, "learning_rate": 1.999969914479768e-05, "loss": 0.8506, "step": 298 }, { "epoch": 0.03, "learning_rate": 1.9999671172876384e-05, "loss": 0.751, "step": 299 }, { "epoch": 0.03, "learning_rate": 1.999964195778643e-05, "loss": 0.8179, "step": 300 }, { "epoch": 0.03, "learning_rate": 1.9999611499531454e-05, "loss": 0.8755, "step": 301 }, { "epoch": 0.03, "learning_rate": 1.999957979811524e-05, "loss": 0.7671, "step": 302 }, { "epoch": 0.03, "learning_rate": 1.9999546853541728e-05, "loss": 0.8535, "step": 303 }, { "epoch": 0.03, "learning_rate": 1.999951266581502e-05, "loss": 0.7539, "step": 304 }, { "epoch": 0.03, "learning_rate": 1.9999477234939358e-05, "loss": 0.8447, "step": 305 }, { "epoch": 0.03, "learning_rate": 1.9999440560919153e-05, "loss": 0.8147, "step": 306 }, { "epoch": 0.03, "learning_rate": 1.9999402643758957e-05, "loss": 0.751, "step": 307 }, { "epoch": 0.03, "learning_rate": 1.999936348346349e-05, "loss": 0.7061, "step": 308 }, { "epoch": 0.03, "learning_rate": 1.9999323080037623e-05, "loss": 0.8672, "step": 309 }, { "epoch": 0.03, "learning_rate": 1.999928143348637e-05, "loss": 0.8213, "step": 310 }, { "epoch": 0.03, "learning_rate": 1.999923854381492e-05, "loss": 0.7698, "step": 311 }, { "epoch": 0.03, "learning_rate": 1.9999194411028596e-05, "loss": 0.8005, "step": 312 }, { "epoch": 0.03, "learning_rate": 1.9999149035132884e-05, "loss": 0.6045, "step": 313 }, { "epoch": 0.03, "learning_rate": 1.999910241613343e-05, "loss": 0.9482, "step": 314 }, { "epoch": 0.03, "learning_rate": 1.9999054554036032e-05, "loss": 0.7783, "step": 315 }, { "epoch": 0.03, "learning_rate": 1.999900544884663e-05, "loss": 0.7334, "step": 316 }, { "epoch": 0.03, "learning_rate": 1.999895510057134e-05, "loss": 0.8354, "step": 317 }, { "epoch": 0.03, "learning_rate": 1.9998903509216415e-05, "loss": 0.7954, "step": 318 }, { "epoch": 0.03, "learning_rate": 1.999885067478827e-05, "loss": 0.7346, "step": 319 }, { "epoch": 0.03, "learning_rate": 1.9998796597293477e-05, "loss": 0.7954, "step": 320 }, { "epoch": 0.03, "learning_rate": 1.9998741276738753e-05, "loss": 0.7612, "step": 321 }, { "epoch": 0.04, "learning_rate": 1.999868471313098e-05, "loss": 0.8076, "step": 322 }, { "epoch": 0.04, "learning_rate": 1.9998626906477184e-05, "loss": 0.9087, "step": 323 }, { "epoch": 0.04, "learning_rate": 1.999856785678456e-05, "loss": 0.7925, "step": 324 }, { "epoch": 0.04, "learning_rate": 1.9998507564060447e-05, "loss": 0.8442, "step": 325 }, { "epoch": 0.04, "learning_rate": 1.9998446028312334e-05, "loss": 0.7778, "step": 326 }, { "epoch": 0.04, "learning_rate": 1.9998383249547878e-05, "loss": 0.7402, "step": 327 }, { "epoch": 0.04, "learning_rate": 1.9998319227774884e-05, "loss": 0.8193, "step": 328 }, { "epoch": 0.04, "learning_rate": 1.9998253963001305e-05, "loss": 0.8455, "step": 329 }, { "epoch": 0.04, "learning_rate": 1.999818745523526e-05, "loss": 0.7251, "step": 330 }, { "epoch": 0.04, "learning_rate": 1.9998119704485016e-05, "loss": 0.8599, "step": 331 }, { "epoch": 0.04, "learning_rate": 1.9998050710758998e-05, "loss": 0.7024, "step": 332 }, { "epoch": 0.04, "learning_rate": 1.9997980474065776e-05, "loss": 0.7444, "step": 333 }, { "epoch": 0.04, "learning_rate": 1.999790899441409e-05, "loss": 0.7871, "step": 334 }, { "epoch": 0.04, "learning_rate": 1.9997836271812824e-05, "loss": 0.7356, "step": 335 }, { "epoch": 0.04, "learning_rate": 1.999776230627102e-05, "loss": 0.751, "step": 336 }, { "epoch": 0.04, "learning_rate": 1.999768709779787e-05, "loss": 0.8584, "step": 337 }, { "epoch": 0.04, "learning_rate": 1.9997610646402728e-05, "loss": 0.6842, "step": 338 }, { "epoch": 0.04, "learning_rate": 1.9997532952095093e-05, "loss": 0.7168, "step": 339 }, { "epoch": 0.04, "learning_rate": 1.999745401488463e-05, "loss": 0.825, "step": 340 }, { "epoch": 0.04, "learning_rate": 1.999737383478115e-05, "loss": 0.7974, "step": 341 }, { "epoch": 0.04, "learning_rate": 1.999729241179462e-05, "loss": 0.6487, "step": 342 }, { "epoch": 0.04, "learning_rate": 1.999720974593516e-05, "loss": 0.6724, "step": 343 }, { "epoch": 0.04, "learning_rate": 1.9997125837213058e-05, "loss": 0.7656, "step": 344 }, { "epoch": 0.04, "learning_rate": 1.999704068563873e-05, "loss": 0.6682, "step": 345 }, { "epoch": 0.04, "learning_rate": 1.9996954291222778e-05, "loss": 0.8501, "step": 346 }, { "epoch": 0.04, "learning_rate": 1.9996866653975933e-05, "loss": 0.6877, "step": 347 }, { "epoch": 0.04, "learning_rate": 1.9996777773909093e-05, "loss": 0.7673, "step": 348 }, { "epoch": 0.04, "learning_rate": 1.9996687651033303e-05, "loss": 0.7168, "step": 349 }, { "epoch": 0.04, "learning_rate": 1.9996596285359776e-05, "loss": 0.6709, "step": 350 }, { "epoch": 0.04, "learning_rate": 1.9996503676899863e-05, "loss": 0.6836, "step": 351 }, { "epoch": 0.04, "learning_rate": 1.9996409825665083e-05, "loss": 0.7241, "step": 352 }, { "epoch": 0.04, "learning_rate": 1.9996314731667096e-05, "loss": 0.7515, "step": 353 }, { "epoch": 0.04, "learning_rate": 1.999621839491773e-05, "loss": 0.8364, "step": 354 }, { "epoch": 0.04, "learning_rate": 1.9996120815428963e-05, "loss": 0.9292, "step": 355 }, { "epoch": 0.04, "learning_rate": 1.999602199321292e-05, "loss": 0.6812, "step": 356 }, { "epoch": 0.04, "learning_rate": 1.9995921928281893e-05, "loss": 0.7986, "step": 357 }, { "epoch": 0.04, "learning_rate": 1.999582062064832e-05, "loss": 0.7, "step": 358 }, { "epoch": 0.04, "learning_rate": 1.9995718070324793e-05, "loss": 0.8438, "step": 359 }, { "epoch": 0.04, "learning_rate": 1.9995614277324066e-05, "loss": 0.8586, "step": 360 }, { "epoch": 0.04, "learning_rate": 1.999550924165904e-05, "loss": 0.7295, "step": 361 }, { "epoch": 0.04, "learning_rate": 1.999540296334277e-05, "loss": 0.6302, "step": 362 }, { "epoch": 0.04, "learning_rate": 1.999529544238847e-05, "loss": 0.739, "step": 363 }, { "epoch": 0.04, "learning_rate": 1.9995186678809513e-05, "loss": 0.8804, "step": 364 }, { "epoch": 0.04, "learning_rate": 1.9995076672619413e-05, "loss": 0.9055, "step": 365 }, { "epoch": 0.04, "learning_rate": 1.9994965423831853e-05, "loss": 0.7773, "step": 366 }, { "epoch": 0.04, "learning_rate": 1.9994852932460658e-05, "loss": 0.9116, "step": 367 }, { "epoch": 0.04, "learning_rate": 1.9994739198519813e-05, "loss": 0.7747, "step": 368 }, { "epoch": 0.04, "learning_rate": 1.9994624222023465e-05, "loss": 0.5842, "step": 369 }, { "epoch": 0.04, "learning_rate": 1.99945080029859e-05, "loss": 0.8115, "step": 370 }, { "epoch": 0.04, "learning_rate": 1.9994390541421568e-05, "loss": 0.8145, "step": 371 }, { "epoch": 0.04, "learning_rate": 1.9994271837345072e-05, "loss": 0.6934, "step": 372 }, { "epoch": 0.04, "learning_rate": 1.9994151890771172e-05, "loss": 0.8047, "step": 373 }, { "epoch": 0.04, "learning_rate": 1.9994030701714783e-05, "loss": 0.8887, "step": 374 }, { "epoch": 0.04, "learning_rate": 1.999390827019096e-05, "loss": 0.7437, "step": 375 }, { "epoch": 0.04, "learning_rate": 1.9993784596214932e-05, "loss": 0.813, "step": 376 }, { "epoch": 0.04, "learning_rate": 1.9993659679802073e-05, "loss": 0.8137, "step": 377 }, { "epoch": 0.04, "learning_rate": 1.999353352096791e-05, "loss": 0.7692, "step": 378 }, { "epoch": 0.04, "learning_rate": 1.999340611972813e-05, "loss": 0.8054, "step": 379 }, { "epoch": 0.04, "learning_rate": 1.9993277476098572e-05, "loss": 0.8096, "step": 380 }, { "epoch": 0.04, "learning_rate": 1.9993147590095232e-05, "loss": 0.8462, "step": 381 }, { "epoch": 0.04, "learning_rate": 1.999301646173425e-05, "loss": 0.8115, "step": 382 }, { "epoch": 0.04, "learning_rate": 1.9992884091031934e-05, "loss": 0.7556, "step": 383 }, { "epoch": 0.04, "learning_rate": 1.999275047800474e-05, "loss": 0.8479, "step": 384 }, { "epoch": 0.04, "learning_rate": 1.999261562266927e-05, "loss": 0.9358, "step": 385 }, { "epoch": 0.04, "learning_rate": 1.9992479525042305e-05, "loss": 0.7263, "step": 386 }, { "epoch": 0.04, "learning_rate": 1.9992342185140748e-05, "loss": 0.7383, "step": 387 }, { "epoch": 0.04, "learning_rate": 1.9992203602981687e-05, "loss": 0.7246, "step": 388 }, { "epoch": 0.04, "learning_rate": 1.9992063778582345e-05, "loss": 0.8374, "step": 389 }, { "epoch": 0.04, "learning_rate": 1.9991922711960104e-05, "loss": 0.7358, "step": 390 }, { "epoch": 0.04, "learning_rate": 1.9991780403132503e-05, "loss": 0.874, "step": 391 }, { "epoch": 0.04, "learning_rate": 1.9991636852117234e-05, "loss": 0.7476, "step": 392 }, { "epoch": 0.04, "learning_rate": 1.9991492058932143e-05, "loss": 0.7695, "step": 393 }, { "epoch": 0.04, "learning_rate": 1.999134602359523e-05, "loss": 0.7947, "step": 394 }, { "epoch": 0.04, "learning_rate": 1.9991198746124652e-05, "loss": 0.6174, "step": 395 }, { "epoch": 0.04, "learning_rate": 1.999105022653872e-05, "loss": 0.9526, "step": 396 }, { "epoch": 0.04, "learning_rate": 1.9990900464855895e-05, "loss": 0.9282, "step": 397 }, { "epoch": 0.04, "learning_rate": 1.9990749461094794e-05, "loss": 0.7917, "step": 398 }, { "epoch": 0.04, "learning_rate": 1.9990597215274196e-05, "loss": 0.6816, "step": 399 }, { "epoch": 0.04, "learning_rate": 1.9990443727413025e-05, "loss": 0.6807, "step": 400 }, { "epoch": 0.04, "learning_rate": 1.9990288997530357e-05, "loss": 0.8438, "step": 401 }, { "epoch": 0.04, "learning_rate": 1.999013302564544e-05, "loss": 0.8652, "step": 402 }, { "epoch": 0.04, "learning_rate": 1.998997581177766e-05, "loss": 0.7209, "step": 403 }, { "epoch": 0.04, "learning_rate": 1.998981735594655e-05, "loss": 0.8016, "step": 404 }, { "epoch": 0.04, "learning_rate": 1.998965765817183e-05, "loss": 0.7751, "step": 405 }, { "epoch": 0.04, "learning_rate": 1.998949671847334e-05, "loss": 0.6525, "step": 406 }, { "epoch": 0.04, "learning_rate": 1.998933453687109e-05, "loss": 0.8125, "step": 407 }, { "epoch": 0.04, "learning_rate": 1.998917111338525e-05, "loss": 0.7749, "step": 408 }, { "epoch": 0.04, "learning_rate": 1.9989006448036123e-05, "loss": 0.9229, "step": 409 }, { "epoch": 0.04, "learning_rate": 1.998884054084419e-05, "loss": 0.7659, "step": 410 }, { "epoch": 0.04, "learning_rate": 1.9988673391830082e-05, "loss": 0.9224, "step": 411 }, { "epoch": 0.04, "learning_rate": 1.998850500101457e-05, "loss": 0.7625, "step": 412 }, { "epoch": 0.04, "learning_rate": 1.9988335368418585e-05, "loss": 0.6022, "step": 413 }, { "epoch": 0.05, "learning_rate": 1.9988164494063226e-05, "loss": 0.7891, "step": 414 }, { "epoch": 0.05, "learning_rate": 1.9987992377969734e-05, "loss": 0.8521, "step": 415 }, { "epoch": 0.05, "learning_rate": 1.9987819020159503e-05, "loss": 0.7231, "step": 416 }, { "epoch": 0.05, "learning_rate": 1.9987644420654087e-05, "loss": 0.7771, "step": 417 }, { "epoch": 0.05, "learning_rate": 1.9987468579475192e-05, "loss": 0.7744, "step": 418 }, { "epoch": 0.05, "learning_rate": 1.998729149664468e-05, "loss": 0.8232, "step": 419 }, { "epoch": 0.05, "learning_rate": 1.9987113172184562e-05, "loss": 0.8145, "step": 420 }, { "epoch": 0.05, "learning_rate": 1.998693360611701e-05, "loss": 0.699, "step": 421 }, { "epoch": 0.05, "learning_rate": 1.998675279846435e-05, "loss": 0.8838, "step": 422 }, { "epoch": 0.05, "learning_rate": 1.9986570749249062e-05, "loss": 0.7393, "step": 423 }, { "epoch": 0.05, "learning_rate": 1.998638745849377e-05, "loss": 0.7344, "step": 424 }, { "epoch": 0.05, "learning_rate": 1.998620292622127e-05, "loss": 0.8438, "step": 425 }, { "epoch": 0.05, "learning_rate": 1.9986017152454497e-05, "loss": 0.7993, "step": 426 }, { "epoch": 0.05, "learning_rate": 1.9985830137216545e-05, "loss": 0.8301, "step": 427 }, { "epoch": 0.05, "learning_rate": 1.998564188053067e-05, "loss": 0.9331, "step": 428 }, { "epoch": 0.05, "learning_rate": 1.9985452382420277e-05, "loss": 0.73, "step": 429 }, { "epoch": 0.05, "learning_rate": 1.9985261642908917e-05, "loss": 0.939, "step": 430 }, { "epoch": 0.05, "learning_rate": 1.998506966202031e-05, "loss": 0.6113, "step": 431 }, { "epoch": 0.05, "learning_rate": 1.998487643977832e-05, "loss": 0.8281, "step": 432 }, { "epoch": 0.05, "learning_rate": 1.998468197620697e-05, "loss": 0.6758, "step": 433 }, { "epoch": 0.05, "learning_rate": 1.9984486271330433e-05, "loss": 0.6802, "step": 434 }, { "epoch": 0.05, "learning_rate": 1.9984289325173042e-05, "loss": 0.741, "step": 435 }, { "epoch": 0.05, "learning_rate": 1.998409113775928e-05, "loss": 0.7791, "step": 436 }, { "epoch": 0.05, "learning_rate": 1.998389170911379e-05, "loss": 0.7495, "step": 437 }, { "epoch": 0.05, "learning_rate": 1.9983691039261358e-05, "loss": 0.761, "step": 438 }, { "epoch": 0.05, "learning_rate": 1.9983489128226937e-05, "loss": 0.9243, "step": 439 }, { "epoch": 0.05, "learning_rate": 1.9983285976035626e-05, "loss": 0.7566, "step": 440 }, { "epoch": 0.05, "learning_rate": 1.9983081582712684e-05, "loss": 0.7651, "step": 441 }, { "epoch": 0.05, "learning_rate": 1.9982875948283518e-05, "loss": 0.8008, "step": 442 }, { "epoch": 0.05, "learning_rate": 1.9982669072773696e-05, "loss": 0.7161, "step": 443 }, { "epoch": 0.05, "learning_rate": 1.9982460956208932e-05, "loss": 0.7734, "step": 444 }, { "epoch": 0.05, "learning_rate": 1.9982251598615107e-05, "loss": 0.7883, "step": 445 }, { "epoch": 0.05, "learning_rate": 1.9982041000018237e-05, "loss": 0.8398, "step": 446 }, { "epoch": 0.05, "learning_rate": 1.9981829160444515e-05, "loss": 0.9006, "step": 447 }, { "epoch": 0.05, "learning_rate": 1.998161607992027e-05, "loss": 0.7402, "step": 448 }, { "epoch": 0.05, "learning_rate": 1.9981401758471998e-05, "loss": 0.8843, "step": 449 }, { "epoch": 0.05, "learning_rate": 1.998118619612634e-05, "loss": 0.6699, "step": 450 }, { "epoch": 0.05, "learning_rate": 1.99809693929101e-05, "loss": 0.7048, "step": 451 }, { "epoch": 0.05, "learning_rate": 1.998075134885022e-05, "loss": 0.792, "step": 452 }, { "epoch": 0.05, "learning_rate": 1.9980532063973817e-05, "loss": 0.7755, "step": 453 }, { "epoch": 0.05, "learning_rate": 1.9980311538308153e-05, "loss": 0.728, "step": 454 }, { "epoch": 0.05, "learning_rate": 1.998008977188064e-05, "loss": 0.8569, "step": 455 }, { "epoch": 0.05, "learning_rate": 1.9979866764718846e-05, "loss": 0.9233, "step": 456 }, { "epoch": 0.05, "learning_rate": 1.9979642516850498e-05, "loss": 0.6948, "step": 457 }, { "epoch": 0.05, "learning_rate": 1.9979417028303478e-05, "loss": 0.7725, "step": 458 }, { "epoch": 0.05, "learning_rate": 1.997919029910582e-05, "loss": 0.5383, "step": 459 }, { "epoch": 0.05, "learning_rate": 1.9978962329285704e-05, "loss": 0.8406, "step": 460 }, { "epoch": 0.05, "learning_rate": 1.997873311887147e-05, "loss": 0.825, "step": 461 }, { "epoch": 0.05, "learning_rate": 1.9978502667891626e-05, "loss": 0.7837, "step": 462 }, { "epoch": 0.05, "learning_rate": 1.9978270976374813e-05, "loss": 0.7734, "step": 463 }, { "epoch": 0.05, "learning_rate": 1.9978038044349833e-05, "loss": 0.7673, "step": 464 }, { "epoch": 0.05, "learning_rate": 1.997780387184565e-05, "loss": 0.8208, "step": 465 }, { "epoch": 0.05, "learning_rate": 1.9977568458891377e-05, "loss": 0.8325, "step": 466 }, { "epoch": 0.05, "learning_rate": 1.997733180551628e-05, "loss": 0.7175, "step": 467 }, { "epoch": 0.05, "learning_rate": 1.997709391174977e-05, "loss": 0.7937, "step": 468 }, { "epoch": 0.05, "learning_rate": 1.9976854777621436e-05, "loss": 0.7212, "step": 469 }, { "epoch": 0.05, "learning_rate": 1.9976614403161e-05, "loss": 0.7722, "step": 470 }, { "epoch": 0.05, "learning_rate": 1.997637278839835e-05, "loss": 0.8877, "step": 471 }, { "epoch": 0.05, "learning_rate": 1.997612993336352e-05, "loss": 0.7996, "step": 472 }, { "epoch": 0.05, "learning_rate": 1.9975885838086702e-05, "loss": 0.7795, "step": 473 }, { "epoch": 0.05, "learning_rate": 1.9975640502598243e-05, "loss": 0.8721, "step": 474 }, { "epoch": 0.05, "learning_rate": 1.9975393926928645e-05, "loss": 0.7363, "step": 475 }, { "epoch": 0.05, "learning_rate": 1.997514611110856e-05, "loss": 0.709, "step": 476 }, { "epoch": 0.05, "learning_rate": 1.99748970551688e-05, "loss": 0.8433, "step": 477 }, { "epoch": 0.05, "learning_rate": 1.9974646759140322e-05, "loss": 0.8279, "step": 478 }, { "epoch": 0.05, "learning_rate": 1.9974395223054254e-05, "loss": 0.6201, "step": 479 }, { "epoch": 0.05, "learning_rate": 1.9974142446941855e-05, "loss": 0.7622, "step": 480 }, { "epoch": 0.05, "learning_rate": 1.9973888430834553e-05, "loss": 0.8018, "step": 481 }, { "epoch": 0.05, "learning_rate": 1.9973633174763932e-05, "loss": 0.8096, "step": 482 }, { "epoch": 0.05, "learning_rate": 1.9973376678761726e-05, "loss": 0.7649, "step": 483 }, { "epoch": 0.05, "learning_rate": 1.9973118942859817e-05, "loss": 0.7695, "step": 484 }, { "epoch": 0.05, "learning_rate": 1.9972859967090253e-05, "loss": 0.8027, "step": 485 }, { "epoch": 0.05, "learning_rate": 1.9972599751485225e-05, "loss": 1.0513, "step": 486 }, { "epoch": 0.05, "learning_rate": 1.9972338296077086e-05, "loss": 0.8462, "step": 487 }, { "epoch": 0.05, "learning_rate": 1.9972075600898342e-05, "loss": 0.8003, "step": 488 }, { "epoch": 0.05, "learning_rate": 1.997181166598165e-05, "loss": 0.8049, "step": 489 }, { "epoch": 0.05, "learning_rate": 1.997154649135982e-05, "loss": 0.7388, "step": 490 }, { "epoch": 0.05, "learning_rate": 1.997128007706582e-05, "loss": 0.6924, "step": 491 }, { "epoch": 0.05, "learning_rate": 1.9971012423132776e-05, "loss": 0.8262, "step": 492 }, { "epoch": 0.05, "learning_rate": 1.9970743529593956e-05, "loss": 0.8599, "step": 493 }, { "epoch": 0.05, "learning_rate": 1.997047339648279e-05, "loss": 0.6179, "step": 494 }, { "epoch": 0.05, "learning_rate": 1.997020202383287e-05, "loss": 0.8687, "step": 495 }, { "epoch": 0.05, "learning_rate": 1.996992941167792e-05, "loss": 0.7524, "step": 496 }, { "epoch": 0.05, "learning_rate": 1.9969655560051842e-05, "loss": 0.8682, "step": 497 }, { "epoch": 0.05, "learning_rate": 1.9969380468988676e-05, "loss": 0.9185, "step": 498 }, { "epoch": 0.05, "learning_rate": 1.9969104138522622e-05, "loss": 0.8552, "step": 499 }, { "epoch": 0.05, "learning_rate": 1.9968826568688036e-05, "loss": 0.8245, "step": 500 }, { "epoch": 0.05, "learning_rate": 1.9968547759519426e-05, "loss": 0.7422, "step": 501 }, { "epoch": 0.05, "learning_rate": 1.9968267711051446e-05, "loss": 0.7983, "step": 502 }, { "epoch": 0.05, "learning_rate": 1.9967986423318926e-05, "loss": 0.7356, "step": 503 }, { "epoch": 0.05, "learning_rate": 1.996770389635682e-05, "loss": 0.7498, "step": 504 }, { "epoch": 0.05, "learning_rate": 1.996742013020027e-05, "loss": 0.8569, "step": 505 }, { "epoch": 0.06, "learning_rate": 1.996713512488454e-05, "loss": 0.7666, "step": 506 }, { "epoch": 0.06, "learning_rate": 1.996684888044506e-05, "loss": 0.667, "step": 507 }, { "epoch": 0.06, "learning_rate": 1.996656139691743e-05, "loss": 0.8152, "step": 508 }, { "epoch": 0.06, "learning_rate": 1.9966272674337382e-05, "loss": 0.7852, "step": 509 }, { "epoch": 0.06, "learning_rate": 1.996598271274081e-05, "loss": 0.8457, "step": 510 }, { "epoch": 0.06, "learning_rate": 1.996569151216376e-05, "loss": 0.8921, "step": 511 }, { "epoch": 0.06, "learning_rate": 1.996539907264244e-05, "loss": 0.8789, "step": 512 }, { "epoch": 0.06, "learning_rate": 1.9965105394213203e-05, "loss": 0.8916, "step": 513 }, { "epoch": 0.06, "learning_rate": 1.9964810476912563e-05, "loss": 0.6951, "step": 514 }, { "epoch": 0.06, "learning_rate": 1.996451432077718e-05, "loss": 0.8252, "step": 515 }, { "epoch": 0.06, "learning_rate": 1.9964216925843876e-05, "loss": 0.8296, "step": 516 }, { "epoch": 0.06, "learning_rate": 1.996391829214962e-05, "loss": 0.8701, "step": 517 }, { "epoch": 0.06, "learning_rate": 1.996361841973154e-05, "loss": 0.8154, "step": 518 }, { "epoch": 0.06, "learning_rate": 1.9963317308626916e-05, "loss": 0.6643, "step": 519 }, { "epoch": 0.06, "learning_rate": 1.9963014958873182e-05, "loss": 0.7292, "step": 520 }, { "epoch": 0.06, "learning_rate": 1.996271137050793e-05, "loss": 0.8286, "step": 521 }, { "epoch": 0.06, "learning_rate": 1.99624065435689e-05, "loss": 0.876, "step": 522 }, { "epoch": 0.06, "learning_rate": 1.9962100478093984e-05, "loss": 0.7273, "step": 523 }, { "epoch": 0.06, "learning_rate": 1.996179317412124e-05, "loss": 0.7217, "step": 524 }, { "epoch": 0.06, "learning_rate": 1.996148463168887e-05, "loss": 0.8384, "step": 525 }, { "epoch": 0.06, "learning_rate": 1.9961174850835224e-05, "loss": 0.8232, "step": 526 }, { "epoch": 0.06, "learning_rate": 1.9960863831598827e-05, "loss": 0.8892, "step": 527 }, { "epoch": 0.06, "learning_rate": 1.996055157401834e-05, "loss": 0.6963, "step": 528 }, { "epoch": 0.06, "learning_rate": 1.996023807813258e-05, "loss": 0.832, "step": 529 }, { "epoch": 0.06, "learning_rate": 1.9959923343980525e-05, "loss": 0.7129, "step": 530 }, { "epoch": 0.06, "learning_rate": 1.9959607371601303e-05, "loss": 0.8638, "step": 531 }, { "epoch": 0.06, "learning_rate": 1.9959290161034194e-05, "loss": 0.8975, "step": 532 }, { "epoch": 0.06, "learning_rate": 1.9958971712318632e-05, "loss": 0.8096, "step": 533 }, { "epoch": 0.06, "learning_rate": 1.9958652025494212e-05, "loss": 0.812, "step": 534 }, { "epoch": 0.06, "learning_rate": 1.9958331100600677e-05, "loss": 0.7307, "step": 535 }, { "epoch": 0.06, "learning_rate": 1.995800893767792e-05, "loss": 0.7417, "step": 536 }, { "epoch": 0.06, "learning_rate": 1.9957685536765998e-05, "loss": 0.7969, "step": 537 }, { "epoch": 0.06, "learning_rate": 1.9957360897905113e-05, "loss": 0.6433, "step": 538 }, { "epoch": 0.06, "learning_rate": 1.995703502113562e-05, "loss": 0.7942, "step": 539 }, { "epoch": 0.06, "learning_rate": 1.9956707906498046e-05, "loss": 0.7593, "step": 540 }, { "epoch": 0.06, "learning_rate": 1.9956379554033046e-05, "loss": 0.9419, "step": 541 }, { "epoch": 0.06, "learning_rate": 1.9956049963781447e-05, "loss": 0.7324, "step": 542 }, { "epoch": 0.06, "learning_rate": 1.995571913578422e-05, "loss": 0.8511, "step": 543 }, { "epoch": 0.06, "learning_rate": 1.99553870700825e-05, "loss": 0.8477, "step": 544 }, { "epoch": 0.06, "learning_rate": 1.9955053766717564e-05, "loss": 0.7627, "step": 545 }, { "epoch": 0.06, "learning_rate": 1.9954719225730847e-05, "loss": 0.6914, "step": 546 }, { "epoch": 0.06, "learning_rate": 1.9954383447163946e-05, "loss": 0.6987, "step": 547 }, { "epoch": 0.06, "learning_rate": 1.99540464310586e-05, "loss": 0.6848, "step": 548 }, { "epoch": 0.06, "learning_rate": 1.9953708177456713e-05, "loss": 0.8052, "step": 549 }, { "epoch": 0.06, "learning_rate": 1.995336868640033e-05, "loss": 0.8857, "step": 550 }, { "epoch": 0.06, "learning_rate": 1.9953027957931658e-05, "loss": 0.804, "step": 551 }, { "epoch": 0.06, "learning_rate": 1.9952685992093064e-05, "loss": 0.7695, "step": 552 }, { "epoch": 0.06, "learning_rate": 1.9952342788927053e-05, "loss": 0.6836, "step": 553 }, { "epoch": 0.06, "learning_rate": 1.99519983484763e-05, "loss": 0.835, "step": 554 }, { "epoch": 0.06, "learning_rate": 1.9951652670783615e-05, "loss": 0.8359, "step": 555 }, { "epoch": 0.06, "learning_rate": 1.9951305755891982e-05, "loss": 0.8521, "step": 556 }, { "epoch": 0.06, "learning_rate": 1.9950957603844528e-05, "loss": 0.72, "step": 557 }, { "epoch": 0.06, "learning_rate": 1.9950608214684536e-05, "loss": 0.8438, "step": 558 }, { "epoch": 0.06, "learning_rate": 1.9950257588455445e-05, "loss": 0.6897, "step": 559 }, { "epoch": 0.06, "learning_rate": 1.9949905725200835e-05, "loss": 0.7078, "step": 560 }, { "epoch": 0.06, "learning_rate": 1.994955262496446e-05, "loss": 0.6465, "step": 561 }, { "epoch": 0.06, "learning_rate": 1.9949198287790215e-05, "loss": 0.8037, "step": 562 }, { "epoch": 0.06, "learning_rate": 1.994884271372215e-05, "loss": 0.792, "step": 563 }, { "epoch": 0.06, "learning_rate": 1.9948485902804472e-05, "loss": 0.7712, "step": 564 }, { "epoch": 0.06, "learning_rate": 1.994812785508154e-05, "loss": 0.7209, "step": 565 }, { "epoch": 0.06, "learning_rate": 1.9947768570597865e-05, "loss": 0.8164, "step": 566 }, { "epoch": 0.06, "learning_rate": 1.994740804939811e-05, "loss": 0.7195, "step": 567 }, { "epoch": 0.06, "learning_rate": 1.9947046291527107e-05, "loss": 0.8213, "step": 568 }, { "epoch": 0.06, "learning_rate": 1.9946683297029823e-05, "loss": 0.771, "step": 569 }, { "epoch": 0.06, "learning_rate": 1.9946319065951382e-05, "loss": 0.7316, "step": 570 }, { "epoch": 0.06, "learning_rate": 1.9945953598337074e-05, "loss": 0.708, "step": 571 }, { "epoch": 0.06, "learning_rate": 1.994558689423233e-05, "loss": 0.6287, "step": 572 }, { "epoch": 0.06, "learning_rate": 1.9945218953682736e-05, "loss": 0.667, "step": 573 }, { "epoch": 0.06, "learning_rate": 1.9944849776734037e-05, "loss": 0.7964, "step": 574 }, { "epoch": 0.06, "learning_rate": 1.994447936343213e-05, "loss": 0.79, "step": 575 }, { "epoch": 0.06, "learning_rate": 1.9944107713823068e-05, "loss": 0.7839, "step": 576 }, { "epoch": 0.06, "learning_rate": 1.9943734827953052e-05, "loss": 0.7834, "step": 577 }, { "epoch": 0.06, "learning_rate": 1.994336070586844e-05, "loss": 0.8701, "step": 578 }, { "epoch": 0.06, "learning_rate": 1.994298534761574e-05, "loss": 0.7307, "step": 579 }, { "epoch": 0.06, "learning_rate": 1.994260875324162e-05, "loss": 0.7607, "step": 580 }, { "epoch": 0.06, "learning_rate": 1.99422309227929e-05, "loss": 0.7224, "step": 581 }, { "epoch": 0.06, "learning_rate": 1.994185185631655e-05, "loss": 0.7063, "step": 582 }, { "epoch": 0.06, "learning_rate": 1.9941471553859695e-05, "loss": 0.8125, "step": 583 }, { "epoch": 0.06, "learning_rate": 1.9941090015469614e-05, "loss": 0.8247, "step": 584 }, { "epoch": 0.06, "learning_rate": 1.9940707241193746e-05, "loss": 0.7942, "step": 585 }, { "epoch": 0.06, "learning_rate": 1.9940323231079674e-05, "loss": 0.8337, "step": 586 }, { "epoch": 0.06, "learning_rate": 1.9939937985175137e-05, "loss": 0.8193, "step": 587 }, { "epoch": 0.06, "learning_rate": 1.993955150352803e-05, "loss": 0.8389, "step": 588 }, { "epoch": 0.06, "learning_rate": 1.9939163786186402e-05, "loss": 0.8196, "step": 589 }, { "epoch": 0.06, "learning_rate": 1.9938774833198455e-05, "loss": 0.6453, "step": 590 }, { "epoch": 0.06, "learning_rate": 1.9938384644612542e-05, "loss": 0.6526, "step": 591 }, { "epoch": 0.06, "learning_rate": 1.9937993220477173e-05, "loss": 0.7312, "step": 592 }, { "epoch": 0.06, "learning_rate": 1.993760056084101e-05, "loss": 0.7739, "step": 593 }, { "epoch": 0.06, "learning_rate": 1.993720666575287e-05, "loss": 0.8931, "step": 594 }, { "epoch": 0.06, "learning_rate": 1.9936811535261714e-05, "loss": 0.7048, "step": 595 }, { "epoch": 0.06, "learning_rate": 1.993641516941668e-05, "loss": 0.7422, "step": 596 }, { "epoch": 0.06, "learning_rate": 1.9936017568267032e-05, "loss": 0.9478, "step": 597 }, { "epoch": 0.07, "learning_rate": 1.9935618731862205e-05, "loss": 0.7637, "step": 598 }, { "epoch": 0.07, "learning_rate": 1.9935218660251782e-05, "loss": 0.9038, "step": 599 }, { "epoch": 0.07, "learning_rate": 1.99348173534855e-05, "loss": 0.894, "step": 600 }, { "epoch": 0.07, "learning_rate": 1.9934414811613257e-05, "loss": 0.6948, "step": 601 }, { "epoch": 0.07, "learning_rate": 1.9934011034685087e-05, "loss": 0.7336, "step": 602 }, { "epoch": 0.07, "learning_rate": 1.9933606022751188e-05, "loss": 0.7688, "step": 603 }, { "epoch": 0.07, "learning_rate": 1.9933199775861917e-05, "loss": 0.9297, "step": 604 }, { "epoch": 0.07, "learning_rate": 1.993279229406778e-05, "loss": 0.7988, "step": 605 }, { "epoch": 0.07, "learning_rate": 1.9932383577419432e-05, "loss": 0.8911, "step": 606 }, { "epoch": 0.07, "learning_rate": 1.9931973625967683e-05, "loss": 0.8035, "step": 607 }, { "epoch": 0.07, "learning_rate": 1.9931562439763504e-05, "loss": 0.8835, "step": 608 }, { "epoch": 0.07, "learning_rate": 1.9931150018858013e-05, "loss": 0.783, "step": 609 }, { "epoch": 0.07, "learning_rate": 1.9930736363302477e-05, "loss": 0.8191, "step": 610 }, { "epoch": 0.07, "learning_rate": 1.9930321473148327e-05, "loss": 0.7871, "step": 611 }, { "epoch": 0.07, "learning_rate": 1.9929905348447143e-05, "loss": 0.7588, "step": 612 }, { "epoch": 0.07, "learning_rate": 1.9929487989250657e-05, "loss": 0.8118, "step": 613 }, { "epoch": 0.07, "learning_rate": 1.9929069395610753e-05, "loss": 0.7993, "step": 614 }, { "epoch": 0.07, "learning_rate": 1.9928649567579476e-05, "loss": 0.8486, "step": 615 }, { "epoch": 0.07, "learning_rate": 1.9928228505209017e-05, "loss": 0.7793, "step": 616 }, { "epoch": 0.07, "learning_rate": 1.9927806208551718e-05, "loss": 0.8804, "step": 617 }, { "epoch": 0.07, "learning_rate": 1.992738267766009e-05, "loss": 0.7297, "step": 618 }, { "epoch": 0.07, "learning_rate": 1.992695791258677e-05, "loss": 0.9211, "step": 619 }, { "epoch": 0.07, "learning_rate": 1.9926531913384583e-05, "loss": 0.634, "step": 620 }, { "epoch": 0.07, "learning_rate": 1.9926104680106484e-05, "loss": 0.8057, "step": 621 }, { "epoch": 0.07, "learning_rate": 1.9925676212805582e-05, "loss": 0.7664, "step": 622 }, { "epoch": 0.07, "learning_rate": 1.9925246511535146e-05, "loss": 0.7412, "step": 623 }, { "epoch": 0.07, "learning_rate": 1.9924815576348604e-05, "loss": 0.7993, "step": 624 }, { "epoch": 0.07, "learning_rate": 1.9924383407299525e-05, "loss": 0.7261, "step": 625 }, { "epoch": 0.07, "learning_rate": 1.992395000444163e-05, "loss": 0.7988, "step": 626 }, { "epoch": 0.07, "learning_rate": 1.9923515367828812e-05, "loss": 0.7195, "step": 627 }, { "epoch": 0.07, "learning_rate": 1.99230794975151e-05, "loss": 0.9307, "step": 628 }, { "epoch": 0.07, "learning_rate": 1.9922642393554678e-05, "loss": 0.835, "step": 629 }, { "epoch": 0.07, "learning_rate": 1.9922204056001896e-05, "loss": 0.8494, "step": 630 }, { "epoch": 0.07, "learning_rate": 1.9921764484911242e-05, "loss": 0.8062, "step": 631 }, { "epoch": 0.07, "learning_rate": 1.9921323680337363e-05, "loss": 0.8716, "step": 632 }, { "epoch": 0.07, "learning_rate": 1.9920881642335064e-05, "loss": 0.7412, "step": 633 }, { "epoch": 0.07, "learning_rate": 1.99204383709593e-05, "loss": 0.6487, "step": 634 }, { "epoch": 0.07, "learning_rate": 1.9919993866265176e-05, "loss": 0.7759, "step": 635 }, { "epoch": 0.07, "learning_rate": 1.9919548128307954e-05, "loss": 0.7979, "step": 636 }, { "epoch": 0.07, "learning_rate": 1.991910115714305e-05, "loss": 0.6714, "step": 637 }, { "epoch": 0.07, "learning_rate": 1.9918652952826032e-05, "loss": 0.7612, "step": 638 }, { "epoch": 0.07, "learning_rate": 1.9918203515412616e-05, "loss": 0.8267, "step": 639 }, { "epoch": 0.07, "learning_rate": 1.9917752844958685e-05, "loss": 0.7383, "step": 640 }, { "epoch": 0.07, "learning_rate": 1.9917300941520262e-05, "loss": 0.8198, "step": 641 }, { "epoch": 0.07, "learning_rate": 1.9916847805153528e-05, "loss": 0.7576, "step": 642 }, { "epoch": 0.07, "learning_rate": 1.991639343591482e-05, "loss": 0.844, "step": 643 }, { "epoch": 0.07, "learning_rate": 1.991593783386062e-05, "loss": 0.7935, "step": 644 }, { "epoch": 0.07, "learning_rate": 1.9915480999047573e-05, "loss": 0.7466, "step": 645 }, { "epoch": 0.07, "learning_rate": 1.991502293153247e-05, "loss": 0.6753, "step": 646 }, { "epoch": 0.07, "learning_rate": 1.9914563631372267e-05, "loss": 0.7339, "step": 647 }, { "epoch": 0.07, "learning_rate": 1.9914103098624055e-05, "loss": 0.7017, "step": 648 }, { "epoch": 0.07, "learning_rate": 1.9913641333345094e-05, "loss": 0.7979, "step": 649 }, { "epoch": 0.07, "learning_rate": 1.9913178335592784e-05, "loss": 0.813, "step": 650 }, { "epoch": 0.07, "learning_rate": 1.9912714105424694e-05, "loss": 0.6677, "step": 651 }, { "epoch": 0.07, "learning_rate": 1.9912248642898532e-05, "loss": 0.5476, "step": 652 }, { "epoch": 0.07, "learning_rate": 1.9911781948072163e-05, "loss": 0.6646, "step": 653 }, { "epoch": 0.07, "learning_rate": 1.9911314021003614e-05, "loss": 0.855, "step": 654 }, { "epoch": 0.07, "learning_rate": 1.9910844861751052e-05, "loss": 0.8472, "step": 655 }, { "epoch": 0.07, "learning_rate": 1.9910374470372805e-05, "loss": 0.7688, "step": 656 }, { "epoch": 0.07, "learning_rate": 1.9909902846927355e-05, "loss": 0.8188, "step": 657 }, { "epoch": 0.07, "learning_rate": 1.9909429991473334e-05, "loss": 0.7629, "step": 658 }, { "epoch": 0.07, "learning_rate": 1.9908955904069526e-05, "loss": 0.7471, "step": 659 }, { "epoch": 0.07, "learning_rate": 1.9908480584774867e-05, "loss": 0.6426, "step": 660 }, { "epoch": 0.07, "learning_rate": 1.9908004033648452e-05, "loss": 0.8096, "step": 661 }, { "epoch": 0.07, "learning_rate": 1.9907526250749535e-05, "loss": 0.8718, "step": 662 }, { "epoch": 0.07, "learning_rate": 1.99070472361375e-05, "loss": 0.7905, "step": 663 }, { "epoch": 0.07, "learning_rate": 1.9906566989871905e-05, "loss": 0.8857, "step": 664 }, { "epoch": 0.07, "learning_rate": 1.9906085512012458e-05, "loss": 0.7573, "step": 665 }, { "epoch": 0.07, "learning_rate": 1.990560280261901e-05, "loss": 0.7979, "step": 666 }, { "epoch": 0.07, "learning_rate": 1.9905118861751574e-05, "loss": 0.7603, "step": 667 }, { "epoch": 0.07, "learning_rate": 1.9904633689470317e-05, "loss": 0.8169, "step": 668 }, { "epoch": 0.07, "learning_rate": 1.9904147285835557e-05, "loss": 0.6892, "step": 669 }, { "epoch": 0.07, "learning_rate": 1.9903659650907762e-05, "loss": 0.7312, "step": 670 }, { "epoch": 0.07, "learning_rate": 1.990317078474755e-05, "loss": 0.8125, "step": 671 }, { "epoch": 0.07, "learning_rate": 1.9902680687415704e-05, "loss": 0.7881, "step": 672 }, { "epoch": 0.07, "learning_rate": 1.9902189358973153e-05, "loss": 0.75, "step": 673 }, { "epoch": 0.07, "learning_rate": 1.9901696799480977e-05, "loss": 0.7998, "step": 674 }, { "epoch": 0.07, "learning_rate": 1.9901203009000413e-05, "loss": 0.9492, "step": 675 }, { "epoch": 0.07, "learning_rate": 1.9900707987592847e-05, "loss": 0.7202, "step": 676 }, { "epoch": 0.07, "learning_rate": 1.9900211735319825e-05, "loss": 0.8848, "step": 677 }, { "epoch": 0.07, "learning_rate": 1.9899714252243037e-05, "loss": 0.7729, "step": 678 }, { "epoch": 0.07, "learning_rate": 1.989921553842433e-05, "loss": 0.7849, "step": 679 }, { "epoch": 0.07, "learning_rate": 1.989871559392571e-05, "loss": 0.7668, "step": 680 }, { "epoch": 0.07, "learning_rate": 1.989821441880933e-05, "loss": 0.6731, "step": 681 }, { "epoch": 0.07, "learning_rate": 1.989771201313749e-05, "loss": 0.7603, "step": 682 }, { "epoch": 0.07, "learning_rate": 1.9897208376972655e-05, "loss": 0.6531, "step": 683 }, { "epoch": 0.07, "learning_rate": 1.9896703510377436e-05, "loss": 0.6902, "step": 684 }, { "epoch": 0.07, "learning_rate": 1.9896197413414602e-05, "loss": 0.8386, "step": 685 }, { "epoch": 0.07, "learning_rate": 1.9895690086147065e-05, "loss": 0.8027, "step": 686 }, { "epoch": 0.07, "learning_rate": 1.98951815286379e-05, "loss": 0.7319, "step": 687 }, { "epoch": 0.07, "learning_rate": 1.9894671740950333e-05, "loss": 0.7715, "step": 688 }, { "epoch": 0.08, "learning_rate": 1.989416072314774e-05, "loss": 0.6687, "step": 689 }, { "epoch": 0.08, "learning_rate": 1.9893648475293646e-05, "loss": 0.6755, "step": 690 }, { "epoch": 0.08, "learning_rate": 1.9893134997451742e-05, "loss": 0.8154, "step": 691 }, { "epoch": 0.08, "learning_rate": 1.989262028968586e-05, "loss": 0.6995, "step": 692 }, { "epoch": 0.08, "learning_rate": 1.9892104352059988e-05, "loss": 0.6531, "step": 693 }, { "epoch": 0.08, "learning_rate": 1.9891587184638274e-05, "loss": 0.8311, "step": 694 }, { "epoch": 0.08, "learning_rate": 1.9891068787485006e-05, "loss": 0.8701, "step": 695 }, { "epoch": 0.08, "learning_rate": 1.9890549160664633e-05, "loss": 0.7789, "step": 696 }, { "epoch": 0.08, "learning_rate": 1.9890028304241754e-05, "loss": 0.6589, "step": 697 }, { "epoch": 0.08, "learning_rate": 1.988950621828113e-05, "loss": 0.7454, "step": 698 }, { "epoch": 0.08, "learning_rate": 1.9888982902847658e-05, "loss": 0.6772, "step": 699 }, { "epoch": 0.08, "learning_rate": 1.9888458358006403e-05, "loss": 0.7432, "step": 700 }, { "epoch": 0.08, "learning_rate": 1.9887932583822572e-05, "loss": 0.7668, "step": 701 }, { "epoch": 0.08, "learning_rate": 1.988740558036154e-05, "loss": 0.7725, "step": 702 }, { "epoch": 0.08, "learning_rate": 1.988687734768881e-05, "loss": 0.8726, "step": 703 }, { "epoch": 0.08, "learning_rate": 1.9886347885870063e-05, "loss": 0.8135, "step": 704 }, { "epoch": 0.08, "learning_rate": 1.9885817194971116e-05, "loss": 0.7131, "step": 705 }, { "epoch": 0.08, "learning_rate": 1.9885285275057954e-05, "loss": 0.7534, "step": 706 }, { "epoch": 0.08, "learning_rate": 1.9884752126196693e-05, "loss": 0.769, "step": 707 }, { "epoch": 0.08, "learning_rate": 1.9884217748453625e-05, "loss": 0.6892, "step": 708 }, { "epoch": 0.08, "learning_rate": 1.988368214189518e-05, "loss": 0.78, "step": 709 }, { "epoch": 0.08, "learning_rate": 1.988314530658795e-05, "loss": 0.6562, "step": 710 }, { "epoch": 0.08, "learning_rate": 1.9882607242598663e-05, "loss": 0.7068, "step": 711 }, { "epoch": 0.08, "learning_rate": 1.9882067949994224e-05, "loss": 0.783, "step": 712 }, { "epoch": 0.08, "learning_rate": 1.988152742884167e-05, "loss": 0.8242, "step": 713 }, { "epoch": 0.08, "learning_rate": 1.9880985679208206e-05, "loss": 0.7271, "step": 714 }, { "epoch": 0.08, "learning_rate": 1.9880442701161177e-05, "loss": 0.6938, "step": 715 }, { "epoch": 0.08, "learning_rate": 1.9879898494768093e-05, "loss": 0.8079, "step": 716 }, { "epoch": 0.08, "learning_rate": 1.98793530600966e-05, "loss": 0.6987, "step": 717 }, { "epoch": 0.08, "learning_rate": 1.987880639721452e-05, "loss": 0.6799, "step": 718 }, { "epoch": 0.08, "learning_rate": 1.9878258506189804e-05, "loss": 0.7471, "step": 719 }, { "epoch": 0.08, "learning_rate": 1.9877709387090573e-05, "loss": 0.7429, "step": 720 }, { "epoch": 0.08, "learning_rate": 1.987715903998509e-05, "loss": 0.7698, "step": 721 }, { "epoch": 0.08, "learning_rate": 1.9876607464941777e-05, "loss": 0.709, "step": 722 }, { "epoch": 0.08, "learning_rate": 1.9876054662029203e-05, "loss": 0.7432, "step": 723 }, { "epoch": 0.08, "learning_rate": 1.9875500631316095e-05, "loss": 0.7917, "step": 724 }, { "epoch": 0.08, "learning_rate": 1.9874945372871335e-05, "loss": 0.9043, "step": 725 }, { "epoch": 0.08, "learning_rate": 1.9874388886763944e-05, "loss": 0.8687, "step": 726 }, { "epoch": 0.08, "learning_rate": 1.9873831173063113e-05, "loss": 0.7961, "step": 727 }, { "epoch": 0.08, "learning_rate": 1.9873272231838174e-05, "loss": 0.7791, "step": 728 }, { "epoch": 0.08, "learning_rate": 1.9872712063158615e-05, "loss": 0.8276, "step": 729 }, { "epoch": 0.08, "learning_rate": 1.987215066709408e-05, "loss": 0.8286, "step": 730 }, { "epoch": 0.08, "learning_rate": 1.987158804371436e-05, "loss": 0.8813, "step": 731 }, { "epoch": 0.08, "learning_rate": 1.98710241930894e-05, "loss": 0.6575, "step": 732 }, { "epoch": 0.08, "learning_rate": 1.9870459115289295e-05, "loss": 0.6797, "step": 733 }, { "epoch": 0.08, "learning_rate": 1.9869892810384304e-05, "loss": 0.7773, "step": 734 }, { "epoch": 0.08, "learning_rate": 1.9869325278444824e-05, "loss": 0.8269, "step": 735 }, { "epoch": 0.08, "learning_rate": 1.9868756519541416e-05, "loss": 0.7729, "step": 736 }, { "epoch": 0.08, "learning_rate": 1.9868186533744783e-05, "loss": 0.916, "step": 737 }, { "epoch": 0.08, "learning_rate": 1.9867615321125796e-05, "loss": 0.8521, "step": 738 }, { "epoch": 0.08, "learning_rate": 1.9867042881755457e-05, "loss": 0.9043, "step": 739 }, { "epoch": 0.08, "learning_rate": 1.9866469215704938e-05, "loss": 0.7969, "step": 740 }, { "epoch": 0.08, "learning_rate": 1.9865894323045558e-05, "loss": 0.7617, "step": 741 }, { "epoch": 0.08, "learning_rate": 1.9865318203848786e-05, "loss": 0.875, "step": 742 }, { "epoch": 0.08, "learning_rate": 1.9864740858186246e-05, "loss": 0.7236, "step": 743 }, { "epoch": 0.08, "learning_rate": 1.986416228612972e-05, "loss": 0.74, "step": 744 }, { "epoch": 0.08, "learning_rate": 1.9863582487751127e-05, "loss": 0.8232, "step": 745 }, { "epoch": 0.08, "learning_rate": 1.9863001463122557e-05, "loss": 0.8738, "step": 746 }, { "epoch": 0.08, "learning_rate": 1.986241921231624e-05, "loss": 0.8013, "step": 747 }, { "epoch": 0.08, "learning_rate": 1.9861835735404558e-05, "loss": 0.7793, "step": 748 }, { "epoch": 0.08, "learning_rate": 1.9861251032460053e-05, "loss": 0.668, "step": 749 }, { "epoch": 0.08, "learning_rate": 1.9860665103555418e-05, "loss": 0.8169, "step": 750 }, { "epoch": 0.08, "learning_rate": 1.9860077948763488e-05, "loss": 0.8018, "step": 751 }, { "epoch": 0.08, "learning_rate": 1.985948956815727e-05, "loss": 0.8062, "step": 752 }, { "epoch": 0.08, "learning_rate": 1.9858899961809904e-05, "loss": 0.7554, "step": 753 }, { "epoch": 0.08, "learning_rate": 1.9858309129794694e-05, "loss": 0.7935, "step": 754 }, { "epoch": 0.08, "learning_rate": 1.9857717072185094e-05, "loss": 0.7075, "step": 755 }, { "epoch": 0.08, "learning_rate": 1.9857123789054707e-05, "loss": 0.7488, "step": 756 }, { "epoch": 0.08, "learning_rate": 1.985652928047729e-05, "loss": 0.77, "step": 757 }, { "epoch": 0.08, "learning_rate": 1.985593354652675e-05, "loss": 0.7554, "step": 758 }, { "epoch": 0.08, "learning_rate": 1.9855336587277153e-05, "loss": 0.8623, "step": 759 }, { "epoch": 0.08, "learning_rate": 1.9854738402802715e-05, "loss": 0.7087, "step": 760 }, { "epoch": 0.08, "learning_rate": 1.9854138993177804e-05, "loss": 0.7297, "step": 761 }, { "epoch": 0.08, "learning_rate": 1.9853538358476933e-05, "loss": 0.7544, "step": 762 }, { "epoch": 0.08, "learning_rate": 1.9852936498774774e-05, "loss": 0.9019, "step": 763 }, { "epoch": 0.08, "learning_rate": 1.9852333414146158e-05, "loss": 0.7905, "step": 764 }, { "epoch": 0.08, "learning_rate": 1.9851729104666053e-05, "loss": 0.7183, "step": 765 }, { "epoch": 0.08, "learning_rate": 1.9851123570409595e-05, "loss": 0.8174, "step": 766 }, { "epoch": 0.08, "learning_rate": 1.9850516811452057e-05, "loss": 0.7844, "step": 767 }, { "epoch": 0.08, "learning_rate": 1.9849908827868874e-05, "loss": 0.6118, "step": 768 }, { "epoch": 0.08, "learning_rate": 1.9849299619735637e-05, "loss": 0.8071, "step": 769 }, { "epoch": 0.08, "learning_rate": 1.9848689187128076e-05, "loss": 0.7107, "step": 770 }, { "epoch": 0.08, "learning_rate": 1.9848077530122083e-05, "loss": 0.7278, "step": 771 }, { "epoch": 0.08, "learning_rate": 1.98474646487937e-05, "loss": 0.7065, "step": 772 }, { "epoch": 0.08, "learning_rate": 1.984685054321912e-05, "loss": 0.738, "step": 773 }, { "epoch": 0.08, "learning_rate": 1.9846235213474694e-05, "loss": 0.7236, "step": 774 }, { "epoch": 0.08, "learning_rate": 1.9845618659636914e-05, "loss": 0.7827, "step": 775 }, { "epoch": 0.08, "learning_rate": 1.9845000881782434e-05, "loss": 0.8916, "step": 776 }, { "epoch": 0.08, "learning_rate": 1.9844381879988056e-05, "loss": 0.8408, "step": 777 }, { "epoch": 0.08, "learning_rate": 1.9843761654330734e-05, "loss": 0.675, "step": 778 }, { "epoch": 0.08, "learning_rate": 1.9843140204887576e-05, "loss": 0.698, "step": 779 }, { "epoch": 0.08, "learning_rate": 1.9842517531735837e-05, "loss": 0.7874, "step": 780 }, { "epoch": 0.09, "learning_rate": 1.9841893634952938e-05, "loss": 0.6577, "step": 781 }, { "epoch": 0.09, "learning_rate": 1.9841268514616434e-05, "loss": 0.8369, "step": 782 }, { "epoch": 0.09, "learning_rate": 1.9840642170804044e-05, "loss": 0.7385, "step": 783 }, { "epoch": 0.09, "learning_rate": 1.9840014603593637e-05, "loss": 0.6787, "step": 784 }, { "epoch": 0.09, "learning_rate": 1.983938581306323e-05, "loss": 0.9185, "step": 785 }, { "epoch": 0.09, "learning_rate": 1.9838755799290993e-05, "loss": 0.7139, "step": 786 }, { "epoch": 0.09, "learning_rate": 1.9838124562355255e-05, "loss": 0.7869, "step": 787 }, { "epoch": 0.09, "learning_rate": 1.9837492102334488e-05, "loss": 0.8213, "step": 788 }, { "epoch": 0.09, "learning_rate": 1.9836858419307325e-05, "loss": 0.8206, "step": 789 }, { "epoch": 0.09, "learning_rate": 1.983622351335254e-05, "loss": 0.8076, "step": 790 }, { "epoch": 0.09, "learning_rate": 1.9835587384549067e-05, "loss": 0.8071, "step": 791 }, { "epoch": 0.09, "learning_rate": 1.9834950032975988e-05, "loss": 0.8667, "step": 792 }, { "epoch": 0.09, "learning_rate": 1.9834311458712547e-05, "loss": 0.6807, "step": 793 }, { "epoch": 0.09, "learning_rate": 1.9833671661838125e-05, "loss": 0.6792, "step": 794 }, { "epoch": 0.09, "learning_rate": 1.9833030642432264e-05, "loss": 0.7231, "step": 795 }, { "epoch": 0.09, "learning_rate": 1.9832388400574658e-05, "loss": 0.7124, "step": 796 }, { "epoch": 0.09, "learning_rate": 1.983174493634515e-05, "loss": 0.8696, "step": 797 }, { "epoch": 0.09, "learning_rate": 1.9831100249823732e-05, "loss": 0.7651, "step": 798 }, { "epoch": 0.09, "learning_rate": 1.9830454341090563e-05, "loss": 0.7947, "step": 799 }, { "epoch": 0.09, "learning_rate": 1.9829807210225927e-05, "loss": 0.7607, "step": 800 }, { "epoch": 0.09, "learning_rate": 1.9829158857310288e-05, "loss": 0.7158, "step": 801 }, { "epoch": 0.09, "learning_rate": 1.9828509282424247e-05, "loss": 0.8284, "step": 802 }, { "epoch": 0.09, "learning_rate": 1.982785848564856e-05, "loss": 0.8691, "step": 803 }, { "epoch": 0.09, "learning_rate": 1.9827206467064133e-05, "loss": 0.821, "step": 804 }, { "epoch": 0.09, "learning_rate": 1.982655322675203e-05, "loss": 0.5441, "step": 805 }, { "epoch": 0.09, "learning_rate": 1.9825898764793455e-05, "loss": 0.8472, "step": 806 }, { "epoch": 0.09, "learning_rate": 1.9825243081269778e-05, "loss": 0.658, "step": 807 }, { "epoch": 0.09, "learning_rate": 1.9824586176262506e-05, "loss": 0.7817, "step": 808 }, { "epoch": 0.09, "learning_rate": 1.9823928049853315e-05, "loss": 0.7002, "step": 809 }, { "epoch": 0.09, "learning_rate": 1.982326870212402e-05, "loss": 0.7117, "step": 810 }, { "epoch": 0.09, "learning_rate": 1.9822608133156596e-05, "loss": 0.6836, "step": 811 }, { "epoch": 0.09, "learning_rate": 1.9821946343033155e-05, "loss": 0.8042, "step": 812 }, { "epoch": 0.09, "learning_rate": 1.9821283331835982e-05, "loss": 0.7705, "step": 813 }, { "epoch": 0.09, "learning_rate": 1.98206190996475e-05, "loss": 0.9021, "step": 814 }, { "epoch": 0.09, "learning_rate": 1.9819953646550286e-05, "loss": 0.7871, "step": 815 }, { "epoch": 0.09, "learning_rate": 1.9819286972627066e-05, "loss": 0.7224, "step": 816 }, { "epoch": 0.09, "learning_rate": 1.9818619077960732e-05, "loss": 0.6926, "step": 817 }, { "epoch": 0.09, "learning_rate": 1.981794996263431e-05, "loss": 0.8213, "step": 818 }, { "epoch": 0.09, "learning_rate": 1.981727962673098e-05, "loss": 0.7463, "step": 819 }, { "epoch": 0.09, "learning_rate": 1.981660807033409e-05, "loss": 0.7373, "step": 820 }, { "epoch": 0.09, "learning_rate": 1.981593529352712e-05, "loss": 0.8608, "step": 821 }, { "epoch": 0.09, "learning_rate": 1.9815261296393715e-05, "loss": 0.7949, "step": 822 }, { "epoch": 0.09, "learning_rate": 1.9814586079017667e-05, "loss": 0.8154, "step": 823 }, { "epoch": 0.09, "learning_rate": 1.9813909641482918e-05, "loss": 0.8081, "step": 824 }, { "epoch": 0.09, "learning_rate": 1.9813231983873563e-05, "loss": 0.6785, "step": 825 }, { "epoch": 0.09, "learning_rate": 1.9812553106273848e-05, "loss": 0.7822, "step": 826 }, { "epoch": 0.09, "learning_rate": 1.9811873008768175e-05, "loss": 0.738, "step": 827 }, { "epoch": 0.09, "learning_rate": 1.9811191691441092e-05, "loss": 0.7969, "step": 828 }, { "epoch": 0.09, "learning_rate": 1.9810509154377302e-05, "loss": 0.7983, "step": 829 }, { "epoch": 0.09, "learning_rate": 1.9809825397661657e-05, "loss": 0.8833, "step": 830 }, { "epoch": 0.09, "learning_rate": 1.9809140421379168e-05, "loss": 0.7896, "step": 831 }, { "epoch": 0.09, "learning_rate": 1.980845422561498e-05, "loss": 0.9058, "step": 832 }, { "epoch": 0.09, "learning_rate": 1.9807766810454416e-05, "loss": 0.7556, "step": 833 }, { "epoch": 0.09, "learning_rate": 1.9807078175982925e-05, "loss": 0.5894, "step": 834 }, { "epoch": 0.09, "learning_rate": 1.9806388322286124e-05, "loss": 0.9023, "step": 835 }, { "epoch": 0.09, "learning_rate": 1.9805697249449774e-05, "loss": 0.8037, "step": 836 }, { "epoch": 0.09, "learning_rate": 1.9805004957559795e-05, "loss": 0.8193, "step": 837 }, { "epoch": 0.09, "learning_rate": 1.980431144670225e-05, "loss": 0.8838, "step": 838 }, { "epoch": 0.09, "learning_rate": 1.980361671696335e-05, "loss": 0.803, "step": 839 }, { "epoch": 0.09, "learning_rate": 1.9802920768429473e-05, "loss": 0.7979, "step": 840 }, { "epoch": 0.09, "learning_rate": 1.9802223601187138e-05, "loss": 0.728, "step": 841 }, { "epoch": 0.09, "learning_rate": 1.9801525215323017e-05, "loss": 0.7998, "step": 842 }, { "epoch": 0.09, "learning_rate": 1.9800825610923937e-05, "loss": 0.8833, "step": 843 }, { "epoch": 0.09, "learning_rate": 1.980012478807687e-05, "loss": 0.7759, "step": 844 }, { "epoch": 0.09, "learning_rate": 1.979942274686894e-05, "loss": 0.8647, "step": 845 }, { "epoch": 0.09, "learning_rate": 1.979871948738743e-05, "loss": 0.7319, "step": 846 }, { "epoch": 0.09, "learning_rate": 1.979801500971977e-05, "loss": 0.7161, "step": 847 }, { "epoch": 0.09, "learning_rate": 1.979730931395354e-05, "loss": 0.7993, "step": 848 }, { "epoch": 0.09, "learning_rate": 1.9796602400176476e-05, "loss": 0.7817, "step": 849 }, { "epoch": 0.09, "learning_rate": 1.9795894268476456e-05, "loss": 0.7937, "step": 850 }, { "epoch": 0.09, "learning_rate": 1.979518491894152e-05, "loss": 0.8147, "step": 851 }, { "epoch": 0.09, "learning_rate": 1.9794474351659854e-05, "loss": 0.8008, "step": 852 }, { "epoch": 0.09, "learning_rate": 1.9793762566719797e-05, "loss": 0.791, "step": 853 }, { "epoch": 0.09, "learning_rate": 1.9793049564209834e-05, "loss": 0.8555, "step": 854 }, { "epoch": 0.09, "learning_rate": 1.9792335344218614e-05, "loss": 0.791, "step": 855 }, { "epoch": 0.09, "learning_rate": 1.9791619906834928e-05, "loss": 0.7874, "step": 856 }, { "epoch": 0.09, "learning_rate": 1.9790903252147714e-05, "loss": 0.7207, "step": 857 }, { "epoch": 0.09, "learning_rate": 1.979018538024607e-05, "loss": 0.7026, "step": 858 }, { "epoch": 0.09, "learning_rate": 1.9789466291219246e-05, "loss": 0.7866, "step": 859 }, { "epoch": 0.09, "learning_rate": 1.9788745985156634e-05, "loss": 0.8076, "step": 860 }, { "epoch": 0.09, "learning_rate": 1.978802446214779e-05, "loss": 0.8396, "step": 861 }, { "epoch": 0.09, "learning_rate": 1.9787301722282408e-05, "loss": 0.7505, "step": 862 }, { "epoch": 0.09, "learning_rate": 1.9786577765650342e-05, "loss": 0.7312, "step": 863 }, { "epoch": 0.09, "learning_rate": 1.97858525923416e-05, "loss": 0.7571, "step": 864 }, { "epoch": 0.09, "learning_rate": 1.9785126202446325e-05, "loss": 0.6804, "step": 865 }, { "epoch": 0.09, "learning_rate": 1.9784398596054833e-05, "loss": 0.8071, "step": 866 }, { "epoch": 0.09, "learning_rate": 1.9783669773257577e-05, "loss": 0.6841, "step": 867 }, { "epoch": 0.09, "learning_rate": 1.9782939734145166e-05, "loss": 0.7288, "step": 868 }, { "epoch": 0.09, "learning_rate": 1.9782208478808352e-05, "loss": 0.7241, "step": 869 }, { "epoch": 0.09, "learning_rate": 1.9781476007338058e-05, "loss": 0.8367, "step": 870 }, { "epoch": 0.09, "learning_rate": 1.9780742319825336e-05, "loss": 0.7639, "step": 871 }, { "epoch": 0.09, "learning_rate": 1.9780007416361403e-05, "loss": 0.7544, "step": 872 }, { "epoch": 0.1, "learning_rate": 1.977927129703762e-05, "loss": 0.6448, "step": 873 }, { "epoch": 0.1, "learning_rate": 1.9778533961945503e-05, "loss": 0.759, "step": 874 }, { "epoch": 0.1, "learning_rate": 1.977779541117672e-05, "loss": 0.793, "step": 875 }, { "epoch": 0.1, "learning_rate": 1.9777055644823087e-05, "loss": 0.7893, "step": 876 }, { "epoch": 0.1, "learning_rate": 1.977631466297657e-05, "loss": 0.802, "step": 877 }, { "epoch": 0.1, "learning_rate": 1.9775572465729297e-05, "loss": 0.7024, "step": 878 }, { "epoch": 0.1, "learning_rate": 1.977482905317353e-05, "loss": 0.782, "step": 879 }, { "epoch": 0.1, "learning_rate": 1.977408442540169e-05, "loss": 0.7883, "step": 880 }, { "epoch": 0.1, "learning_rate": 1.9773338582506357e-05, "loss": 0.7075, "step": 881 }, { "epoch": 0.1, "learning_rate": 1.977259152458025e-05, "loss": 0.8486, "step": 882 }, { "epoch": 0.1, "learning_rate": 1.9771843251716247e-05, "loss": 0.8525, "step": 883 }, { "epoch": 0.1, "learning_rate": 1.977109376400737e-05, "loss": 0.8711, "step": 884 }, { "epoch": 0.1, "learning_rate": 1.9770343061546797e-05, "loss": 0.7246, "step": 885 }, { "epoch": 0.1, "learning_rate": 1.976959114442786e-05, "loss": 0.6855, "step": 886 }, { "epoch": 0.1, "learning_rate": 1.9768838012744034e-05, "loss": 0.7144, "step": 887 }, { "epoch": 0.1, "learning_rate": 1.9768083666588954e-05, "loss": 0.8354, "step": 888 }, { "epoch": 0.1, "learning_rate": 1.9767328106056395e-05, "loss": 0.8193, "step": 889 }, { "epoch": 0.1, "learning_rate": 1.976657133124029e-05, "loss": 0.8735, "step": 890 }, { "epoch": 0.1, "learning_rate": 1.9765813342234726e-05, "loss": 0.7383, "step": 891 }, { "epoch": 0.1, "learning_rate": 1.976505413913393e-05, "loss": 0.9199, "step": 892 }, { "epoch": 0.1, "learning_rate": 1.9764293722032295e-05, "loss": 0.8491, "step": 893 }, { "epoch": 0.1, "learning_rate": 1.976353209102435e-05, "loss": 0.7637, "step": 894 }, { "epoch": 0.1, "learning_rate": 1.976276924620479e-05, "loss": 0.7683, "step": 895 }, { "epoch": 0.1, "learning_rate": 1.9762005187668442e-05, "loss": 0.835, "step": 896 }, { "epoch": 0.1, "learning_rate": 1.9761239915510302e-05, "loss": 0.7786, "step": 897 }, { "epoch": 0.1, "learning_rate": 1.9760473429825508e-05, "loss": 0.782, "step": 898 }, { "epoch": 0.1, "learning_rate": 1.9759705730709347e-05, "loss": 0.7256, "step": 899 }, { "epoch": 0.1, "learning_rate": 1.9758936818257263e-05, "loss": 0.8218, "step": 900 }, { "epoch": 0.1, "learning_rate": 1.9758166692564848e-05, "loss": 0.8062, "step": 901 }, { "epoch": 0.1, "learning_rate": 1.9757395353727845e-05, "loss": 0.7961, "step": 902 }, { "epoch": 0.1, "learning_rate": 1.9756622801842144e-05, "loss": 0.6921, "step": 903 }, { "epoch": 0.1, "learning_rate": 1.9755849037003795e-05, "loss": 0.8088, "step": 904 }, { "epoch": 0.1, "learning_rate": 1.9755074059308988e-05, "loss": 0.7349, "step": 905 }, { "epoch": 0.1, "learning_rate": 1.9754297868854075e-05, "loss": 0.6515, "step": 906 }, { "epoch": 0.1, "learning_rate": 1.975352046573554e-05, "loss": 0.7217, "step": 907 }, { "epoch": 0.1, "learning_rate": 1.975274185005005e-05, "loss": 0.7361, "step": 908 }, { "epoch": 0.1, "learning_rate": 1.9751962021894385e-05, "loss": 0.7424, "step": 909 }, { "epoch": 0.1, "learning_rate": 1.975118098136551e-05, "loss": 0.7817, "step": 910 }, { "epoch": 0.1, "learning_rate": 1.975039872856051e-05, "loss": 0.7944, "step": 911 }, { "epoch": 0.1, "learning_rate": 1.9749615263576642e-05, "loss": 0.7085, "step": 912 }, { "epoch": 0.1, "learning_rate": 1.9748830586511307e-05, "loss": 0.6277, "step": 913 }, { "epoch": 0.1, "learning_rate": 1.974804469746206e-05, "loss": 0.793, "step": 914 }, { "epoch": 0.1, "learning_rate": 1.9747257596526594e-05, "loss": 0.7009, "step": 915 }, { "epoch": 0.1, "learning_rate": 1.9746469283802773e-05, "loss": 0.9146, "step": 916 }, { "epoch": 0.1, "learning_rate": 1.9745679759388597e-05, "loss": 0.7754, "step": 917 }, { "epoch": 0.1, "learning_rate": 1.9744889023382217e-05, "loss": 0.8398, "step": 918 }, { "epoch": 0.1, "learning_rate": 1.974409707588194e-05, "loss": 0.8101, "step": 919 }, { "epoch": 0.1, "learning_rate": 1.9743303916986226e-05, "loss": 0.7271, "step": 920 }, { "epoch": 0.1, "learning_rate": 1.9742509546793673e-05, "loss": 0.781, "step": 921 }, { "epoch": 0.1, "learning_rate": 1.9741713965403044e-05, "loss": 0.832, "step": 922 }, { "epoch": 0.1, "learning_rate": 1.9740917172913247e-05, "loss": 0.7861, "step": 923 }, { "epoch": 0.1, "learning_rate": 1.9740119169423337e-05, "loss": 0.8445, "step": 924 }, { "epoch": 0.1, "learning_rate": 1.9739319955032522e-05, "loss": 0.7822, "step": 925 }, { "epoch": 0.1, "learning_rate": 1.9738519529840162e-05, "loss": 0.7292, "step": 926 }, { "epoch": 0.1, "learning_rate": 1.973771789394577e-05, "loss": 0.8296, "step": 927 }, { "epoch": 0.1, "learning_rate": 1.9736915047449002e-05, "loss": 0.7583, "step": 928 }, { "epoch": 0.1, "learning_rate": 1.9736110990449672e-05, "loss": 0.8818, "step": 929 }, { "epoch": 0.1, "learning_rate": 1.973530572304773e-05, "loss": 0.8137, "step": 930 }, { "epoch": 0.1, "learning_rate": 1.9734499245343306e-05, "loss": 0.8384, "step": 931 }, { "epoch": 0.1, "learning_rate": 1.973369155743665e-05, "loss": 0.7251, "step": 932 }, { "epoch": 0.1, "learning_rate": 1.973288265942818e-05, "loss": 0.7244, "step": 933 }, { "epoch": 0.1, "learning_rate": 1.9732072551418452e-05, "loss": 0.8047, "step": 934 }, { "epoch": 0.1, "learning_rate": 1.9731261233508185e-05, "loss": 0.749, "step": 935 }, { "epoch": 0.1, "learning_rate": 1.973044870579824e-05, "loss": 0.7263, "step": 936 }, { "epoch": 0.1, "learning_rate": 1.9729634968389636e-05, "loss": 0.8423, "step": 937 }, { "epoch": 0.1, "learning_rate": 1.972882002138353e-05, "loss": 0.8044, "step": 938 }, { "epoch": 0.1, "learning_rate": 1.9728003864881242e-05, "loss": 0.6931, "step": 939 }, { "epoch": 0.1, "learning_rate": 1.972718649898424e-05, "loss": 0.884, "step": 940 }, { "epoch": 0.1, "learning_rate": 1.9726367923794134e-05, "loss": 0.7744, "step": 941 }, { "epoch": 0.1, "learning_rate": 1.9725548139412693e-05, "loss": 0.6665, "step": 942 }, { "epoch": 0.1, "learning_rate": 1.9724727145941834e-05, "loss": 0.6982, "step": 943 }, { "epoch": 0.1, "learning_rate": 1.9723904943483617e-05, "loss": 0.7417, "step": 944 }, { "epoch": 0.1, "learning_rate": 1.9723081532140272e-05, "loss": 0.8572, "step": 945 }, { "epoch": 0.1, "learning_rate": 1.9722256912014153e-05, "loss": 0.8301, "step": 946 }, { "epoch": 0.1, "learning_rate": 1.9721431083207786e-05, "loss": 0.6091, "step": 947 }, { "epoch": 0.1, "learning_rate": 1.9720604045823835e-05, "loss": 0.8604, "step": 948 }, { "epoch": 0.1, "learning_rate": 1.971977579996512e-05, "loss": 0.7507, "step": 949 }, { "epoch": 0.1, "learning_rate": 1.9718946345734608e-05, "loss": 0.8591, "step": 950 }, { "epoch": 0.1, "learning_rate": 1.9718115683235418e-05, "loss": 0.863, "step": 951 }, { "epoch": 0.1, "learning_rate": 1.9717283812570817e-05, "loss": 0.8545, "step": 952 }, { "epoch": 0.1, "learning_rate": 1.971645073384423e-05, "loss": 0.7803, "step": 953 }, { "epoch": 0.1, "learning_rate": 1.971561644715922e-05, "loss": 0.8623, "step": 954 }, { "epoch": 0.1, "learning_rate": 1.971478095261951e-05, "loss": 0.7576, "step": 955 }, { "epoch": 0.1, "learning_rate": 1.971394425032896e-05, "loss": 0.5522, "step": 956 }, { "epoch": 0.1, "learning_rate": 1.9713106340391607e-05, "loss": 0.9182, "step": 957 }, { "epoch": 0.1, "learning_rate": 1.9712267222911605e-05, "loss": 0.7783, "step": 958 }, { "epoch": 0.1, "learning_rate": 1.971142689799328e-05, "loss": 0.6868, "step": 959 }, { "epoch": 0.1, "learning_rate": 1.9710585365741105e-05, "loss": 0.9111, "step": 960 }, { "epoch": 0.1, "learning_rate": 1.9709742626259695e-05, "loss": 0.9351, "step": 961 }, { "epoch": 0.1, "learning_rate": 1.9708898679653824e-05, "loss": 0.6182, "step": 962 }, { "epoch": 0.1, "learning_rate": 1.970805352602841e-05, "loss": 0.8677, "step": 963 }, { "epoch": 0.1, "learning_rate": 1.9707207165488522e-05, "loss": 0.9004, "step": 964 }, { "epoch": 0.11, "learning_rate": 1.9706359598139383e-05, "loss": 0.8779, "step": 965 }, { "epoch": 0.11, "learning_rate": 1.970551082408636e-05, "loss": 0.7158, "step": 966 }, { "epoch": 0.11, "learning_rate": 1.970466084343498e-05, "loss": 0.8047, "step": 967 }, { "epoch": 0.11, "learning_rate": 1.970380965629091e-05, "loss": 0.8936, "step": 968 }, { "epoch": 0.11, "learning_rate": 1.9702957262759964e-05, "loss": 0.7285, "step": 969 }, { "epoch": 0.11, "learning_rate": 1.9702103662948124e-05, "loss": 0.8042, "step": 970 }, { "epoch": 0.11, "learning_rate": 1.97012488569615e-05, "loss": 0.8259, "step": 971 }, { "epoch": 0.11, "learning_rate": 1.970039284490637e-05, "loss": 0.7361, "step": 972 }, { "epoch": 0.11, "learning_rate": 1.969953562688915e-05, "loss": 0.7827, "step": 973 }, { "epoch": 0.11, "learning_rate": 1.9698677203016408e-05, "loss": 0.8628, "step": 974 }, { "epoch": 0.11, "learning_rate": 1.9697817573394874e-05, "loss": 0.8018, "step": 975 }, { "epoch": 0.11, "learning_rate": 1.9696956738131406e-05, "loss": 0.8403, "step": 976 }, { "epoch": 0.11, "learning_rate": 1.969609469733303e-05, "loss": 0.7769, "step": 977 }, { "epoch": 0.11, "learning_rate": 1.9695231451106914e-05, "loss": 0.6765, "step": 978 }, { "epoch": 0.11, "learning_rate": 1.9694366999560382e-05, "loss": 0.8213, "step": 979 }, { "epoch": 0.11, "learning_rate": 1.9693501342800895e-05, "loss": 0.7725, "step": 980 }, { "epoch": 0.11, "learning_rate": 1.969263448093608e-05, "loss": 0.5605, "step": 981 }, { "epoch": 0.11, "learning_rate": 1.96917664140737e-05, "loss": 0.8804, "step": 982 }, { "epoch": 0.11, "learning_rate": 1.969089714232168e-05, "loss": 0.8359, "step": 983 }, { "epoch": 0.11, "learning_rate": 1.9690026665788084e-05, "loss": 0.855, "step": 984 }, { "epoch": 0.11, "learning_rate": 1.9689154984581132e-05, "loss": 0.7307, "step": 985 }, { "epoch": 0.11, "learning_rate": 1.9688282098809195e-05, "loss": 0.7593, "step": 986 }, { "epoch": 0.11, "learning_rate": 1.9687408008580785e-05, "loss": 0.7905, "step": 987 }, { "epoch": 0.11, "learning_rate": 1.968653271400458e-05, "loss": 0.6416, "step": 988 }, { "epoch": 0.11, "learning_rate": 1.9685656215189384e-05, "loss": 0.772, "step": 989 }, { "epoch": 0.11, "learning_rate": 1.9684778512244172e-05, "loss": 0.6882, "step": 990 }, { "epoch": 0.11, "learning_rate": 1.9683899605278062e-05, "loss": 0.739, "step": 991 }, { "epoch": 0.11, "learning_rate": 1.9683019494400314e-05, "loss": 0.6506, "step": 992 }, { "epoch": 0.11, "learning_rate": 1.968213817972035e-05, "loss": 0.8867, "step": 993 }, { "epoch": 0.11, "learning_rate": 1.9681255661347734e-05, "loss": 0.6907, "step": 994 }, { "epoch": 0.11, "learning_rate": 1.9680371939392186e-05, "loss": 0.7842, "step": 995 }, { "epoch": 0.11, "learning_rate": 1.9679487013963566e-05, "loss": 0.8501, "step": 996 }, { "epoch": 0.11, "learning_rate": 1.9678600885171888e-05, "loss": 0.7146, "step": 997 }, { "epoch": 0.11, "learning_rate": 1.967771355312732e-05, "loss": 0.7979, "step": 998 }, { "epoch": 0.11, "learning_rate": 1.9676825017940167e-05, "loss": 0.7598, "step": 999 }, { "epoch": 0.11, "learning_rate": 1.9675935279720906e-05, "loss": 0.8057, "step": 1000 }, { "epoch": 0.11, "learning_rate": 1.9675044338580144e-05, "loss": 0.8623, "step": 1001 }, { "epoch": 0.11, "learning_rate": 1.967415219462864e-05, "loss": 0.709, "step": 1002 }, { "epoch": 0.11, "learning_rate": 1.9673258847977313e-05, "loss": 0.7104, "step": 1003 }, { "epoch": 0.11, "learning_rate": 1.9672364298737217e-05, "loss": 0.6475, "step": 1004 }, { "epoch": 0.11, "learning_rate": 1.9671468547019575e-05, "loss": 0.8401, "step": 1005 }, { "epoch": 0.11, "learning_rate": 1.9670571592935733e-05, "loss": 0.7468, "step": 1006 }, { "epoch": 0.11, "learning_rate": 1.9669673436597212e-05, "loss": 0.6919, "step": 1007 }, { "epoch": 0.11, "learning_rate": 1.9668774078115668e-05, "loss": 0.7754, "step": 1008 }, { "epoch": 0.11, "learning_rate": 1.966787351760291e-05, "loss": 0.7729, "step": 1009 }, { "epoch": 0.11, "learning_rate": 1.9666971755170893e-05, "loss": 0.8164, "step": 1010 }, { "epoch": 0.11, "learning_rate": 1.9666068790931733e-05, "loss": 0.6978, "step": 1011 }, { "epoch": 0.11, "learning_rate": 1.9665164624997684e-05, "loss": 0.7366, "step": 1012 }, { "epoch": 0.11, "learning_rate": 1.966425925748115e-05, "loss": 0.7998, "step": 1013 }, { "epoch": 0.11, "learning_rate": 1.9663352688494686e-05, "loss": 0.6492, "step": 1014 }, { "epoch": 0.11, "learning_rate": 1.9662444918151006e-05, "loss": 0.8892, "step": 1015 }, { "epoch": 0.11, "learning_rate": 1.9661535946562954e-05, "loss": 0.793, "step": 1016 }, { "epoch": 0.11, "learning_rate": 1.9660625773843542e-05, "loss": 0.7563, "step": 1017 }, { "epoch": 0.11, "learning_rate": 1.9659714400105922e-05, "loss": 0.7256, "step": 1018 }, { "epoch": 0.11, "learning_rate": 1.9658801825463394e-05, "loss": 0.7261, "step": 1019 }, { "epoch": 0.11, "learning_rate": 1.9657888050029416e-05, "loss": 0.7268, "step": 1020 }, { "epoch": 0.11, "learning_rate": 1.965697307391758e-05, "loss": 0.752, "step": 1021 }, { "epoch": 0.11, "learning_rate": 1.9656056897241648e-05, "loss": 0.8374, "step": 1022 }, { "epoch": 0.11, "learning_rate": 1.965513952011551e-05, "loss": 0.8206, "step": 1023 }, { "epoch": 0.11, "learning_rate": 1.9654220942653223e-05, "loss": 0.692, "step": 1024 }, { "epoch": 0.11, "learning_rate": 1.965330116496898e-05, "loss": 0.7214, "step": 1025 }, { "epoch": 0.11, "learning_rate": 1.9652380187177128e-05, "loss": 0.7903, "step": 1026 }, { "epoch": 0.11, "learning_rate": 1.965145800939217e-05, "loss": 0.8096, "step": 1027 }, { "epoch": 0.11, "learning_rate": 1.9650534631728747e-05, "loss": 0.8071, "step": 1028 }, { "epoch": 0.11, "learning_rate": 1.9649610054301656e-05, "loss": 0.645, "step": 1029 }, { "epoch": 0.11, "learning_rate": 1.9648684277225837e-05, "loss": 0.8652, "step": 1030 }, { "epoch": 0.11, "learning_rate": 1.964775730061639e-05, "loss": 0.7319, "step": 1031 }, { "epoch": 0.11, "learning_rate": 1.964682912458856e-05, "loss": 0.7988, "step": 1032 }, { "epoch": 0.11, "learning_rate": 1.964589974925773e-05, "loss": 0.769, "step": 1033 }, { "epoch": 0.11, "learning_rate": 1.9644969174739442e-05, "loss": 0.7334, "step": 1034 }, { "epoch": 0.11, "learning_rate": 1.964403740114939e-05, "loss": 0.8381, "step": 1035 }, { "epoch": 0.11, "learning_rate": 1.964310442860341e-05, "loss": 0.772, "step": 1036 }, { "epoch": 0.11, "learning_rate": 1.9642170257217497e-05, "loss": 0.8188, "step": 1037 }, { "epoch": 0.11, "learning_rate": 1.9641234887107777e-05, "loss": 0.7676, "step": 1038 }, { "epoch": 0.11, "learning_rate": 1.9640298318390544e-05, "loss": 0.8667, "step": 1039 }, { "epoch": 0.11, "learning_rate": 1.9639360551182232e-05, "loss": 0.7578, "step": 1040 }, { "epoch": 0.11, "learning_rate": 1.9638421585599422e-05, "loss": 0.7654, "step": 1041 }, { "epoch": 0.11, "learning_rate": 1.9637481421758847e-05, "loss": 0.6824, "step": 1042 }, { "epoch": 0.11, "learning_rate": 1.9636540059777396e-05, "loss": 0.7437, "step": 1043 }, { "epoch": 0.11, "learning_rate": 1.9635597499772096e-05, "loss": 0.7332, "step": 1044 }, { "epoch": 0.11, "learning_rate": 1.963465374186012e-05, "loss": 0.8174, "step": 1045 }, { "epoch": 0.11, "learning_rate": 1.9633708786158803e-05, "loss": 0.6721, "step": 1046 }, { "epoch": 0.11, "learning_rate": 1.963276263278563e-05, "loss": 0.8237, "step": 1047 }, { "epoch": 0.11, "learning_rate": 1.9631815281858214e-05, "loss": 0.7988, "step": 1048 }, { "epoch": 0.11, "learning_rate": 1.963086673349434e-05, "loss": 0.6553, "step": 1049 }, { "epoch": 0.11, "learning_rate": 1.9629916987811924e-05, "loss": 0.7859, "step": 1050 }, { "epoch": 0.11, "learning_rate": 1.9628966044929048e-05, "loss": 0.877, "step": 1051 }, { "epoch": 0.11, "learning_rate": 1.9628013904963934e-05, "loss": 0.7581, "step": 1052 }, { "epoch": 0.11, "learning_rate": 1.962706056803495e-05, "loss": 0.78, "step": 1053 }, { "epoch": 0.11, "learning_rate": 1.962610603426061e-05, "loss": 0.8511, "step": 1054 }, { "epoch": 0.11, "learning_rate": 1.962515030375959e-05, "loss": 0.7402, "step": 1055 }, { "epoch": 0.11, "learning_rate": 1.9624193376650708e-05, "loss": 0.7307, "step": 1056 }, { "epoch": 0.12, "learning_rate": 1.9623235253052924e-05, "loss": 0.8406, "step": 1057 }, { "epoch": 0.12, "learning_rate": 1.962227593308536e-05, "loss": 0.8062, "step": 1058 }, { "epoch": 0.12, "learning_rate": 1.9621315416867274e-05, "loss": 0.8979, "step": 1059 }, { "epoch": 0.12, "learning_rate": 1.962035370451808e-05, "loss": 0.8486, "step": 1060 }, { "epoch": 0.12, "learning_rate": 1.961939079615734e-05, "loss": 0.8296, "step": 1061 }, { "epoch": 0.12, "learning_rate": 1.961842669190476e-05, "loss": 0.835, "step": 1062 }, { "epoch": 0.12, "learning_rate": 1.9617461391880206e-05, "loss": 0.681, "step": 1063 }, { "epoch": 0.12, "learning_rate": 1.961649489620368e-05, "loss": 0.8008, "step": 1064 }, { "epoch": 0.12, "learning_rate": 1.9615527204995332e-05, "loss": 0.6606, "step": 1065 }, { "epoch": 0.12, "learning_rate": 1.961455831837548e-05, "loss": 0.8931, "step": 1066 }, { "epoch": 0.12, "learning_rate": 1.9613588236464564e-05, "loss": 0.7456, "step": 1067 }, { "epoch": 0.12, "learning_rate": 1.961261695938319e-05, "loss": 0.7791, "step": 1068 }, { "epoch": 0.12, "learning_rate": 1.961164448725211e-05, "loss": 0.7852, "step": 1069 }, { "epoch": 0.12, "learning_rate": 1.961067082019222e-05, "loss": 0.5964, "step": 1070 }, { "epoch": 0.12, "learning_rate": 1.960969595832457e-05, "loss": 0.6873, "step": 1071 }, { "epoch": 0.12, "learning_rate": 1.960871990177036e-05, "loss": 0.7056, "step": 1072 }, { "epoch": 0.12, "learning_rate": 1.960774265065092e-05, "loss": 0.8457, "step": 1073 }, { "epoch": 0.12, "learning_rate": 1.960676420508776e-05, "loss": 0.6899, "step": 1074 }, { "epoch": 0.12, "learning_rate": 1.9605784565202505e-05, "loss": 0.7515, "step": 1075 }, { "epoch": 0.12, "learning_rate": 1.9604803731116953e-05, "loss": 0.7288, "step": 1076 }, { "epoch": 0.12, "learning_rate": 1.9603821702953047e-05, "loss": 0.7874, "step": 1077 }, { "epoch": 0.12, "learning_rate": 1.9602838480832864e-05, "loss": 0.8179, "step": 1078 }, { "epoch": 0.12, "learning_rate": 1.9601854064878645e-05, "loss": 0.8535, "step": 1079 }, { "epoch": 0.12, "learning_rate": 1.960086845521277e-05, "loss": 0.7583, "step": 1080 }, { "epoch": 0.12, "learning_rate": 1.9599881651957776e-05, "loss": 0.7097, "step": 1081 }, { "epoch": 0.12, "learning_rate": 1.9598893655236343e-05, "loss": 0.6785, "step": 1082 }, { "epoch": 0.12, "learning_rate": 1.9597904465171293e-05, "loss": 0.7493, "step": 1083 }, { "epoch": 0.12, "learning_rate": 1.9596914081885606e-05, "loss": 0.7915, "step": 1084 }, { "epoch": 0.12, "learning_rate": 1.959592250550241e-05, "loss": 0.8188, "step": 1085 }, { "epoch": 0.12, "learning_rate": 1.9594929736144978e-05, "loss": 0.7837, "step": 1086 }, { "epoch": 0.12, "learning_rate": 1.9593935773936726e-05, "loss": 0.8403, "step": 1087 }, { "epoch": 0.12, "learning_rate": 1.9592940619001235e-05, "loss": 0.7446, "step": 1088 }, { "epoch": 0.12, "learning_rate": 1.9591944271462216e-05, "loss": 0.7737, "step": 1089 }, { "epoch": 0.12, "learning_rate": 1.959094673144354e-05, "loss": 0.6671, "step": 1090 }, { "epoch": 0.12, "learning_rate": 1.9589947999069217e-05, "loss": 0.7446, "step": 1091 }, { "epoch": 0.12, "learning_rate": 1.9588948074463418e-05, "loss": 0.7554, "step": 1092 }, { "epoch": 0.12, "learning_rate": 1.9587946957750445e-05, "loss": 0.709, "step": 1093 }, { "epoch": 0.12, "learning_rate": 1.9586944649054765e-05, "loss": 0.791, "step": 1094 }, { "epoch": 0.12, "learning_rate": 1.9585941148500987e-05, "loss": 0.688, "step": 1095 }, { "epoch": 0.12, "learning_rate": 1.958493645621386e-05, "loss": 0.7244, "step": 1096 }, { "epoch": 0.12, "learning_rate": 1.958393057231829e-05, "loss": 0.7104, "step": 1097 }, { "epoch": 0.12, "learning_rate": 1.9582923496939337e-05, "loss": 0.7373, "step": 1098 }, { "epoch": 0.12, "learning_rate": 1.9581915230202197e-05, "loss": 0.7119, "step": 1099 }, { "epoch": 0.12, "learning_rate": 1.9580905772232214e-05, "loss": 0.6514, "step": 1100 }, { "epoch": 0.12, "learning_rate": 1.957989512315489e-05, "loss": 0.6997, "step": 1101 }, { "epoch": 0.12, "learning_rate": 1.957888328309587e-05, "loss": 0.7878, "step": 1102 }, { "epoch": 0.12, "learning_rate": 1.9577870252180945e-05, "loss": 0.6831, "step": 1103 }, { "epoch": 0.12, "learning_rate": 1.9576856030536055e-05, "loss": 0.8799, "step": 1104 }, { "epoch": 0.12, "learning_rate": 1.957584061828729e-05, "loss": 0.7888, "step": 1105 }, { "epoch": 0.12, "learning_rate": 1.957482401556089e-05, "loss": 0.7988, "step": 1106 }, { "epoch": 0.12, "learning_rate": 1.9573806222483234e-05, "loss": 0.6895, "step": 1107 }, { "epoch": 0.12, "learning_rate": 1.9572787239180862e-05, "loss": 0.7739, "step": 1108 }, { "epoch": 0.12, "learning_rate": 1.957176706578045e-05, "loss": 0.6846, "step": 1109 }, { "epoch": 0.12, "learning_rate": 1.957074570240883e-05, "loss": 0.7412, "step": 1110 }, { "epoch": 0.12, "learning_rate": 1.9569723149192978e-05, "loss": 0.8213, "step": 1111 }, { "epoch": 0.12, "learning_rate": 1.9568699406260016e-05, "loss": 0.7422, "step": 1112 }, { "epoch": 0.12, "learning_rate": 1.956767447373722e-05, "loss": 0.8452, "step": 1113 }, { "epoch": 0.12, "learning_rate": 1.9566648351752008e-05, "loss": 0.7847, "step": 1114 }, { "epoch": 0.12, "learning_rate": 1.956562104043195e-05, "loss": 0.7256, "step": 1115 }, { "epoch": 0.12, "learning_rate": 1.956459253990476e-05, "loss": 0.6096, "step": 1116 }, { "epoch": 0.12, "learning_rate": 1.956356285029831e-05, "loss": 0.791, "step": 1117 }, { "epoch": 0.12, "learning_rate": 1.95625319717406e-05, "loss": 0.8284, "step": 1118 }, { "epoch": 0.12, "learning_rate": 1.9561499904359805e-05, "loss": 0.7153, "step": 1119 }, { "epoch": 0.12, "learning_rate": 1.9560466648284215e-05, "loss": 0.8457, "step": 1120 }, { "epoch": 0.12, "learning_rate": 1.9559432203642298e-05, "loss": 0.842, "step": 1121 }, { "epoch": 0.12, "learning_rate": 1.955839657056265e-05, "loss": 0.6704, "step": 1122 }, { "epoch": 0.12, "learning_rate": 1.9557359749174033e-05, "loss": 0.832, "step": 1123 }, { "epoch": 0.12, "learning_rate": 1.955632173960533e-05, "loss": 0.7139, "step": 1124 }, { "epoch": 0.12, "learning_rate": 1.9555282541985598e-05, "loss": 0.8032, "step": 1125 }, { "epoch": 0.12, "learning_rate": 1.955424215644403e-05, "loss": 0.7852, "step": 1126 }, { "epoch": 0.12, "learning_rate": 1.9553200583109964e-05, "loss": 0.7793, "step": 1127 }, { "epoch": 0.12, "learning_rate": 1.955215782211289e-05, "loss": 0.7024, "step": 1128 }, { "epoch": 0.12, "learning_rate": 1.955111387358245e-05, "loss": 0.8059, "step": 1129 }, { "epoch": 0.12, "learning_rate": 1.955006873764842e-05, "loss": 0.8237, "step": 1130 }, { "epoch": 0.12, "learning_rate": 1.9549022414440738e-05, "loss": 0.74, "step": 1131 }, { "epoch": 0.12, "learning_rate": 1.954797490408949e-05, "loss": 0.7844, "step": 1132 }, { "epoch": 0.12, "learning_rate": 1.954692620672489e-05, "loss": 0.7974, "step": 1133 }, { "epoch": 0.12, "learning_rate": 1.954587632247732e-05, "loss": 0.7607, "step": 1134 }, { "epoch": 0.12, "learning_rate": 1.9544825251477304e-05, "loss": 0.7532, "step": 1135 }, { "epoch": 0.12, "learning_rate": 1.954377299385551e-05, "loss": 0.8408, "step": 1136 }, { "epoch": 0.12, "learning_rate": 1.9542719549742757e-05, "loss": 0.6445, "step": 1137 }, { "epoch": 0.12, "learning_rate": 1.954166491927001e-05, "loss": 0.7515, "step": 1138 }, { "epoch": 0.12, "learning_rate": 1.954060910256838e-05, "loss": 0.7017, "step": 1139 }, { "epoch": 0.12, "learning_rate": 1.9539552099769128e-05, "loss": 0.7649, "step": 1140 }, { "epoch": 0.12, "learning_rate": 1.953849391100366e-05, "loss": 0.7136, "step": 1141 }, { "epoch": 0.12, "learning_rate": 1.9537434536403536e-05, "loss": 0.834, "step": 1142 }, { "epoch": 0.12, "learning_rate": 1.9536373976100454e-05, "loss": 0.7878, "step": 1143 }, { "epoch": 0.12, "learning_rate": 1.9535312230226268e-05, "loss": 0.7847, "step": 1144 }, { "epoch": 0.12, "learning_rate": 1.9534249298912968e-05, "loss": 0.7886, "step": 1145 }, { "epoch": 0.12, "learning_rate": 1.9533185182292705e-05, "loss": 0.7153, "step": 1146 }, { "epoch": 0.12, "learning_rate": 1.953211988049777e-05, "loss": 0.7639, "step": 1147 }, { "epoch": 0.12, "learning_rate": 1.9531053393660597e-05, "loss": 0.6877, "step": 1148 }, { "epoch": 0.13, "learning_rate": 1.952998572191378e-05, "loss": 0.7366, "step": 1149 }, { "epoch": 0.13, "learning_rate": 1.952891686539005e-05, "loss": 0.7476, "step": 1150 }, { "epoch": 0.13, "learning_rate": 1.952784682422229e-05, "loss": 0.771, "step": 1151 }, { "epoch": 0.13, "learning_rate": 1.9526775598543522e-05, "loss": 0.7756, "step": 1152 }, { "epoch": 0.13, "learning_rate": 1.952570318848693e-05, "loss": 0.7109, "step": 1153 }, { "epoch": 0.13, "learning_rate": 1.9524629594185832e-05, "loss": 0.6367, "step": 1154 }, { "epoch": 0.13, "learning_rate": 1.9523554815773703e-05, "loss": 0.7104, "step": 1155 }, { "epoch": 0.13, "learning_rate": 1.9522478853384154e-05, "loss": 0.8306, "step": 1156 }, { "epoch": 0.13, "learning_rate": 1.9521401707150957e-05, "loss": 0.8213, "step": 1157 }, { "epoch": 0.13, "learning_rate": 1.9520323377208017e-05, "loss": 0.7974, "step": 1158 }, { "epoch": 0.13, "learning_rate": 1.9519243863689395e-05, "loss": 0.8237, "step": 1159 }, { "epoch": 0.13, "learning_rate": 1.95181631667293e-05, "loss": 0.7913, "step": 1160 }, { "epoch": 0.13, "learning_rate": 1.9517081286462082e-05, "loss": 0.6018, "step": 1161 }, { "epoch": 0.13, "learning_rate": 1.9515998223022242e-05, "loss": 0.7393, "step": 1162 }, { "epoch": 0.13, "learning_rate": 1.9514913976544428e-05, "loss": 0.7676, "step": 1163 }, { "epoch": 0.13, "learning_rate": 1.951382854716344e-05, "loss": 0.7002, "step": 1164 }, { "epoch": 0.13, "learning_rate": 1.9512741935014208e-05, "loss": 0.7319, "step": 1165 }, { "epoch": 0.13, "learning_rate": 1.951165414023183e-05, "loss": 0.8496, "step": 1166 }, { "epoch": 0.13, "learning_rate": 1.9510565162951538e-05, "loss": 0.7432, "step": 1167 }, { "epoch": 0.13, "learning_rate": 1.9509475003308712e-05, "loss": 0.6707, "step": 1168 }, { "epoch": 0.13, "learning_rate": 1.9508383661438892e-05, "loss": 0.8003, "step": 1169 }, { "epoch": 0.13, "learning_rate": 1.9507291137477744e-05, "loss": 0.7842, "step": 1170 }, { "epoch": 0.13, "learning_rate": 1.9506197431561093e-05, "loss": 0.7759, "step": 1171 }, { "epoch": 0.13, "learning_rate": 1.9505102543824916e-05, "loss": 0.7456, "step": 1172 }, { "epoch": 0.13, "learning_rate": 1.9504006474405327e-05, "loss": 0.8132, "step": 1173 }, { "epoch": 0.13, "learning_rate": 1.9502909223438588e-05, "loss": 0.7104, "step": 1174 }, { "epoch": 0.13, "learning_rate": 1.950181079106111e-05, "loss": 0.8135, "step": 1175 }, { "epoch": 0.13, "learning_rate": 1.9500711177409456e-05, "loss": 0.7373, "step": 1176 }, { "epoch": 0.13, "learning_rate": 1.9499610382620326e-05, "loss": 0.791, "step": 1177 }, { "epoch": 0.13, "learning_rate": 1.9498508406830577e-05, "loss": 0.6802, "step": 1178 }, { "epoch": 0.13, "learning_rate": 1.9497405250177203e-05, "loss": 0.7212, "step": 1179 }, { "epoch": 0.13, "learning_rate": 1.949630091279735e-05, "loss": 0.8228, "step": 1180 }, { "epoch": 0.13, "learning_rate": 1.9495195394828314e-05, "loss": 0.7439, "step": 1181 }, { "epoch": 0.13, "learning_rate": 1.9494088696407532e-05, "loss": 0.7314, "step": 1182 }, { "epoch": 0.13, "learning_rate": 1.9492980817672586e-05, "loss": 0.7192, "step": 1183 }, { "epoch": 0.13, "learning_rate": 1.9491871758761217e-05, "loss": 0.824, "step": 1184 }, { "epoch": 0.13, "learning_rate": 1.9490761519811295e-05, "loss": 0.8374, "step": 1185 }, { "epoch": 0.13, "learning_rate": 1.948965010096085e-05, "loss": 0.7637, "step": 1186 }, { "epoch": 0.13, "learning_rate": 1.9488537502348057e-05, "loss": 0.8423, "step": 1187 }, { "epoch": 0.13, "learning_rate": 1.9487423724111233e-05, "loss": 0.7715, "step": 1188 }, { "epoch": 0.13, "learning_rate": 1.9486308766388843e-05, "loss": 0.6433, "step": 1189 }, { "epoch": 0.13, "learning_rate": 1.9485192629319502e-05, "loss": 0.7549, "step": 1190 }, { "epoch": 0.13, "learning_rate": 1.9484075313041968e-05, "loss": 0.8027, "step": 1191 }, { "epoch": 0.13, "learning_rate": 1.9482956817695147e-05, "loss": 0.7515, "step": 1192 }, { "epoch": 0.13, "learning_rate": 1.948183714341809e-05, "loss": 0.8711, "step": 1193 }, { "epoch": 0.13, "learning_rate": 1.9480716290349998e-05, "loss": 0.8054, "step": 1194 }, { "epoch": 0.13, "learning_rate": 1.9479594258630214e-05, "loss": 0.8086, "step": 1195 }, { "epoch": 0.13, "learning_rate": 1.9478471048398233e-05, "loss": 0.8333, "step": 1196 }, { "epoch": 0.13, "learning_rate": 1.9477346659793692e-05, "loss": 0.6028, "step": 1197 }, { "epoch": 0.13, "learning_rate": 1.9476221092956376e-05, "loss": 0.657, "step": 1198 }, { "epoch": 0.13, "learning_rate": 1.9475094348026217e-05, "loss": 0.7402, "step": 1199 }, { "epoch": 0.13, "learning_rate": 1.9473966425143292e-05, "loss": 0.7705, "step": 1200 }, { "epoch": 0.13, "learning_rate": 1.947283732444783e-05, "loss": 0.7939, "step": 1201 }, { "epoch": 0.13, "learning_rate": 1.9471707046080196e-05, "loss": 0.6721, "step": 1202 }, { "epoch": 0.13, "learning_rate": 1.947057559018091e-05, "loss": 0.678, "step": 1203 }, { "epoch": 0.13, "learning_rate": 1.9469442956890636e-05, "loss": 0.8184, "step": 1204 }, { "epoch": 0.13, "learning_rate": 1.9468309146350182e-05, "loss": 0.8108, "step": 1205 }, { "epoch": 0.13, "learning_rate": 1.9467174158700507e-05, "loss": 0.7847, "step": 1206 }, { "epoch": 0.13, "learning_rate": 1.946603799408271e-05, "loss": 0.8218, "step": 1207 }, { "epoch": 0.13, "learning_rate": 1.9464900652638043e-05, "loss": 0.7104, "step": 1208 }, { "epoch": 0.13, "learning_rate": 1.94637621345079e-05, "loss": 0.6775, "step": 1209 }, { "epoch": 0.13, "learning_rate": 1.9462622439833824e-05, "loss": 0.7261, "step": 1210 }, { "epoch": 0.13, "learning_rate": 1.946148156875751e-05, "loss": 0.7214, "step": 1211 }, { "epoch": 0.13, "learning_rate": 1.946033952142077e-05, "loss": 0.8921, "step": 1212 }, { "epoch": 0.13, "learning_rate": 1.9459196297965612e-05, "loss": 0.8438, "step": 1213 }, { "epoch": 0.13, "learning_rate": 1.9458051898534145e-05, "loss": 0.8311, "step": 1214 }, { "epoch": 0.13, "learning_rate": 1.9456906323268643e-05, "loss": 0.6277, "step": 1215 }, { "epoch": 0.13, "learning_rate": 1.9455759572311535e-05, "loss": 0.7729, "step": 1216 }, { "epoch": 0.13, "learning_rate": 1.9454611645805378e-05, "loss": 0.7776, "step": 1217 }, { "epoch": 0.13, "learning_rate": 1.945346254389288e-05, "loss": 0.8643, "step": 1218 }, { "epoch": 0.13, "learning_rate": 1.945231226671691e-05, "loss": 0.7771, "step": 1219 }, { "epoch": 0.13, "learning_rate": 1.945116081442046e-05, "loss": 0.6997, "step": 1220 }, { "epoch": 0.13, "learning_rate": 1.9450008187146685e-05, "loss": 0.7554, "step": 1221 }, { "epoch": 0.13, "learning_rate": 1.944885438503888e-05, "loss": 0.6733, "step": 1222 }, { "epoch": 0.13, "learning_rate": 1.9447699408240493e-05, "loss": 0.7239, "step": 1223 }, { "epoch": 0.13, "learning_rate": 1.94465432568951e-05, "loss": 0.7224, "step": 1224 }, { "epoch": 0.13, "learning_rate": 1.9445385931146444e-05, "loss": 0.7661, "step": 1225 }, { "epoch": 0.13, "learning_rate": 1.94442274311384e-05, "loss": 0.8569, "step": 1226 }, { "epoch": 0.13, "learning_rate": 1.9443067757015e-05, "loss": 0.6714, "step": 1227 }, { "epoch": 0.13, "learning_rate": 1.9441906908920404e-05, "loss": 0.7655, "step": 1228 }, { "epoch": 0.13, "learning_rate": 1.9440744886998942e-05, "loss": 0.8096, "step": 1229 }, { "epoch": 0.13, "learning_rate": 1.943958169139507e-05, "loss": 0.8315, "step": 1230 }, { "epoch": 0.13, "learning_rate": 1.94384173222534e-05, "loss": 0.677, "step": 1231 }, { "epoch": 0.13, "learning_rate": 1.943725177971869e-05, "loss": 0.6331, "step": 1232 }, { "epoch": 0.13, "learning_rate": 1.9436085063935837e-05, "loss": 0.79, "step": 1233 }, { "epoch": 0.13, "learning_rate": 1.943491717504989e-05, "loss": 0.7031, "step": 1234 }, { "epoch": 0.13, "learning_rate": 1.9433748113206046e-05, "loss": 0.7981, "step": 1235 }, { "epoch": 0.13, "learning_rate": 1.9432577878549635e-05, "loss": 0.8247, "step": 1236 }, { "epoch": 0.13, "learning_rate": 1.943140647122615e-05, "loss": 0.7378, "step": 1237 }, { "epoch": 0.13, "learning_rate": 1.943023389138122e-05, "loss": 0.7708, "step": 1238 }, { "epoch": 0.13, "learning_rate": 1.942906013916062e-05, "loss": 0.7561, "step": 1239 }, { "epoch": 0.13, "learning_rate": 1.942788521471027e-05, "loss": 0.7644, "step": 1240 }, { "epoch": 0.14, "learning_rate": 1.9426709118176237e-05, "loss": 0.7588, "step": 1241 }, { "epoch": 0.14, "learning_rate": 1.942553184970474e-05, "loss": 0.7236, "step": 1242 }, { "epoch": 0.14, "learning_rate": 1.942435340944213e-05, "loss": 0.8203, "step": 1243 }, { "epoch": 0.14, "learning_rate": 1.9423173797534924e-05, "loss": 0.6897, "step": 1244 }, { "epoch": 0.14, "learning_rate": 1.9421993014129762e-05, "loss": 0.7546, "step": 1245 }, { "epoch": 0.14, "learning_rate": 1.9420811059373444e-05, "loss": 0.7239, "step": 1246 }, { "epoch": 0.14, "learning_rate": 1.9419627933412906e-05, "loss": 0.6816, "step": 1247 }, { "epoch": 0.14, "learning_rate": 1.941844363639525e-05, "loss": 0.7417, "step": 1248 }, { "epoch": 0.14, "learning_rate": 1.9417258168467694e-05, "loss": 0.7671, "step": 1249 }, { "epoch": 0.14, "learning_rate": 1.941607152977762e-05, "loss": 0.6731, "step": 1250 }, { "epoch": 0.14, "learning_rate": 1.9414883720472557e-05, "loss": 0.6584, "step": 1251 }, { "epoch": 0.14, "learning_rate": 1.9413694740700172e-05, "loss": 0.7388, "step": 1252 }, { "epoch": 0.14, "learning_rate": 1.941250459060828e-05, "loss": 0.7969, "step": 1253 }, { "epoch": 0.14, "learning_rate": 1.9411313270344836e-05, "loss": 0.7817, "step": 1254 }, { "epoch": 0.14, "learning_rate": 1.9410120780057958e-05, "loss": 0.8193, "step": 1255 }, { "epoch": 0.14, "learning_rate": 1.9408927119895888e-05, "loss": 0.7434, "step": 1256 }, { "epoch": 0.14, "learning_rate": 1.9407732290007023e-05, "loss": 0.8066, "step": 1257 }, { "epoch": 0.14, "learning_rate": 1.9406536290539914e-05, "loss": 0.71, "step": 1258 }, { "epoch": 0.14, "learning_rate": 1.9405339121643237e-05, "loss": 0.78, "step": 1259 }, { "epoch": 0.14, "learning_rate": 1.9404140783465837e-05, "loss": 0.7324, "step": 1260 }, { "epoch": 0.14, "learning_rate": 1.940294127615668e-05, "loss": 0.7039, "step": 1261 }, { "epoch": 0.14, "learning_rate": 1.9401740599864905e-05, "loss": 0.804, "step": 1262 }, { "epoch": 0.14, "learning_rate": 1.9400538754739765e-05, "loss": 0.7734, "step": 1263 }, { "epoch": 0.14, "learning_rate": 1.9399335740930688e-05, "loss": 0.761, "step": 1264 }, { "epoch": 0.14, "learning_rate": 1.9398131558587225e-05, "loss": 0.7012, "step": 1265 }, { "epoch": 0.14, "learning_rate": 1.9396926207859085e-05, "loss": 0.7419, "step": 1266 }, { "epoch": 0.14, "learning_rate": 1.9395719688896118e-05, "loss": 0.7227, "step": 1267 }, { "epoch": 0.14, "learning_rate": 1.939451200184832e-05, "loss": 0.7642, "step": 1268 }, { "epoch": 0.14, "learning_rate": 1.939330314686583e-05, "loss": 0.6836, "step": 1269 }, { "epoch": 0.14, "learning_rate": 1.9392093124098937e-05, "loss": 0.7417, "step": 1270 }, { "epoch": 0.14, "learning_rate": 1.9390881933698068e-05, "loss": 0.7146, "step": 1271 }, { "epoch": 0.14, "learning_rate": 1.93896695758138e-05, "loss": 0.8555, "step": 1272 }, { "epoch": 0.14, "learning_rate": 1.9388456050596858e-05, "loss": 0.7231, "step": 1273 }, { "epoch": 0.14, "learning_rate": 1.938724135819811e-05, "loss": 0.8652, "step": 1274 }, { "epoch": 0.14, "learning_rate": 1.938602549876856e-05, "loss": 0.8359, "step": 1275 }, { "epoch": 0.14, "learning_rate": 1.938480847245937e-05, "loss": 0.7629, "step": 1276 }, { "epoch": 0.14, "learning_rate": 1.938359027942184e-05, "loss": 0.7654, "step": 1277 }, { "epoch": 0.14, "learning_rate": 1.938237091980742e-05, "loss": 0.7278, "step": 1278 }, { "epoch": 0.14, "learning_rate": 1.9381150393767697e-05, "loss": 0.6875, "step": 1279 }, { "epoch": 0.14, "learning_rate": 1.9379928701454415e-05, "loss": 0.6965, "step": 1280 }, { "epoch": 0.14, "learning_rate": 1.937870584301945e-05, "loss": 0.6992, "step": 1281 }, { "epoch": 0.14, "learning_rate": 1.9377481818614833e-05, "loss": 0.7764, "step": 1282 }, { "epoch": 0.14, "learning_rate": 1.937625662839273e-05, "loss": 0.8225, "step": 1283 }, { "epoch": 0.14, "learning_rate": 1.9375030272505463e-05, "loss": 0.8262, "step": 1284 }, { "epoch": 0.14, "learning_rate": 1.9373802751105493e-05, "loss": 0.7305, "step": 1285 }, { "epoch": 0.14, "learning_rate": 1.9372574064345424e-05, "loss": 0.8486, "step": 1286 }, { "epoch": 0.14, "learning_rate": 1.9371344212378013e-05, "loss": 0.7964, "step": 1287 }, { "epoch": 0.14, "learning_rate": 1.937011319535615e-05, "loss": 0.8076, "step": 1288 }, { "epoch": 0.14, "learning_rate": 1.936888101343288e-05, "loss": 0.7485, "step": 1289 }, { "epoch": 0.14, "learning_rate": 1.9367647666761384e-05, "loss": 0.6499, "step": 1290 }, { "epoch": 0.14, "learning_rate": 1.9366413155495002e-05, "loss": 0.7097, "step": 1291 }, { "epoch": 0.14, "learning_rate": 1.9365177479787203e-05, "loss": 0.7747, "step": 1292 }, { "epoch": 0.14, "learning_rate": 1.9363940639791607e-05, "loss": 0.6541, "step": 1293 }, { "epoch": 0.14, "learning_rate": 1.9362702635661983e-05, "loss": 0.7241, "step": 1294 }, { "epoch": 0.14, "learning_rate": 1.9361463467552236e-05, "loss": 0.7974, "step": 1295 }, { "epoch": 0.14, "learning_rate": 1.9360223135616423e-05, "loss": 0.7197, "step": 1296 }, { "epoch": 0.14, "learning_rate": 1.935898164000875e-05, "loss": 0.7317, "step": 1297 }, { "epoch": 0.14, "learning_rate": 1.935773898088355e-05, "loss": 0.8779, "step": 1298 }, { "epoch": 0.14, "learning_rate": 1.9356495158395317e-05, "loss": 0.7141, "step": 1299 }, { "epoch": 0.14, "learning_rate": 1.9355250172698682e-05, "loss": 0.7004, "step": 1300 }, { "epoch": 0.14, "learning_rate": 1.9354004023948426e-05, "loss": 0.7517, "step": 1301 }, { "epoch": 0.14, "learning_rate": 1.9352756712299467e-05, "loss": 0.8633, "step": 1302 }, { "epoch": 0.14, "learning_rate": 1.9351508237906877e-05, "loss": 0.8037, "step": 1303 }, { "epoch": 0.14, "learning_rate": 1.9350258600925863e-05, "loss": 0.7422, "step": 1304 }, { "epoch": 0.14, "learning_rate": 1.9349007801511784e-05, "loss": 0.7502, "step": 1305 }, { "epoch": 0.14, "learning_rate": 1.9347755839820138e-05, "loss": 0.7261, "step": 1306 }, { "epoch": 0.14, "learning_rate": 1.9346502716006573e-05, "loss": 0.7612, "step": 1307 }, { "epoch": 0.14, "learning_rate": 1.934524843022688e-05, "loss": 0.7161, "step": 1308 }, { "epoch": 0.14, "learning_rate": 1.9343992982636984e-05, "loss": 0.7451, "step": 1309 }, { "epoch": 0.14, "learning_rate": 1.9342736373392976e-05, "loss": 0.6443, "step": 1310 }, { "epoch": 0.14, "learning_rate": 1.9341478602651068e-05, "loss": 0.8076, "step": 1311 }, { "epoch": 0.14, "learning_rate": 1.9340219670567636e-05, "loss": 0.739, "step": 1312 }, { "epoch": 0.14, "learning_rate": 1.9338959577299185e-05, "loss": 0.8125, "step": 1313 }, { "epoch": 0.14, "learning_rate": 1.933769832300237e-05, "loss": 0.7759, "step": 1314 }, { "epoch": 0.14, "learning_rate": 1.9336435907834e-05, "loss": 0.7373, "step": 1315 }, { "epoch": 0.14, "learning_rate": 1.9335172331951014e-05, "loss": 0.6694, "step": 1316 }, { "epoch": 0.14, "learning_rate": 1.93339075955105e-05, "loss": 0.8125, "step": 1317 }, { "epoch": 0.14, "learning_rate": 1.9332641698669693e-05, "loss": 0.853, "step": 1318 }, { "epoch": 0.14, "learning_rate": 1.9331374641585968e-05, "loss": 0.8867, "step": 1319 }, { "epoch": 0.14, "learning_rate": 1.9330106424416852e-05, "loss": 0.7629, "step": 1320 }, { "epoch": 0.14, "learning_rate": 1.932883704732001e-05, "loss": 0.7578, "step": 1321 }, { "epoch": 0.14, "learning_rate": 1.9327566510453243e-05, "loss": 0.8228, "step": 1322 }, { "epoch": 0.14, "learning_rate": 1.9326294813974517e-05, "loss": 0.7566, "step": 1323 }, { "epoch": 0.14, "learning_rate": 1.9325021958041924e-05, "loss": 0.696, "step": 1324 }, { "epoch": 0.14, "learning_rate": 1.932374794281371e-05, "loss": 0.7832, "step": 1325 }, { "epoch": 0.14, "learning_rate": 1.932247276844826e-05, "loss": 0.9224, "step": 1326 }, { "epoch": 0.14, "learning_rate": 1.9321196435104104e-05, "loss": 0.781, "step": 1327 }, { "epoch": 0.14, "learning_rate": 1.931991894293992e-05, "loss": 0.6985, "step": 1328 }, { "epoch": 0.14, "learning_rate": 1.9318640292114526e-05, "loss": 0.6475, "step": 1329 }, { "epoch": 0.14, "learning_rate": 1.9317360482786882e-05, "loss": 0.8403, "step": 1330 }, { "epoch": 0.14, "learning_rate": 1.9316079515116096e-05, "loss": 0.7568, "step": 1331 }, { "epoch": 0.15, "learning_rate": 1.9314797389261426e-05, "loss": 0.8037, "step": 1332 }, { "epoch": 0.15, "learning_rate": 1.9313514105382258e-05, "loss": 0.7141, "step": 1333 }, { "epoch": 0.15, "learning_rate": 1.9312229663638134e-05, "loss": 0.7603, "step": 1334 }, { "epoch": 0.15, "learning_rate": 1.931094406418874e-05, "loss": 0.8171, "step": 1335 }, { "epoch": 0.15, "learning_rate": 1.93096573071939e-05, "loss": 0.8, "step": 1336 }, { "epoch": 0.15, "learning_rate": 1.9308369392813587e-05, "loss": 0.7891, "step": 1337 }, { "epoch": 0.15, "learning_rate": 1.9307080321207913e-05, "loss": 0.6421, "step": 1338 }, { "epoch": 0.15, "learning_rate": 1.9305790092537137e-05, "loss": 0.7266, "step": 1339 }, { "epoch": 0.15, "learning_rate": 1.9304498706961663e-05, "loss": 0.8398, "step": 1340 }, { "epoch": 0.15, "learning_rate": 1.9303206164642037e-05, "loss": 0.6553, "step": 1341 }, { "epoch": 0.15, "learning_rate": 1.930191246573895e-05, "loss": 0.7673, "step": 1342 }, { "epoch": 0.15, "learning_rate": 1.9300617610413232e-05, "loss": 0.7737, "step": 1343 }, { "epoch": 0.15, "learning_rate": 1.9299321598825867e-05, "loss": 0.7383, "step": 1344 }, { "epoch": 0.15, "learning_rate": 1.929802443113797e-05, "loss": 0.8135, "step": 1345 }, { "epoch": 0.15, "learning_rate": 1.929672610751081e-05, "loss": 0.7397, "step": 1346 }, { "epoch": 0.15, "learning_rate": 1.9295426628105792e-05, "loss": 0.8203, "step": 1347 }, { "epoch": 0.15, "learning_rate": 1.9294125993084477e-05, "loss": 0.7078, "step": 1348 }, { "epoch": 0.15, "learning_rate": 1.9292824202608548e-05, "loss": 0.8081, "step": 1349 }, { "epoch": 0.15, "learning_rate": 1.929152125683986e-05, "loss": 0.8599, "step": 1350 }, { "epoch": 0.15, "learning_rate": 1.9290217155940382e-05, "loss": 0.7827, "step": 1351 }, { "epoch": 0.15, "learning_rate": 1.928891190007225e-05, "loss": 0.6118, "step": 1352 }, { "epoch": 0.15, "learning_rate": 1.9287605489397732e-05, "loss": 0.7473, "step": 1353 }, { "epoch": 0.15, "learning_rate": 1.9286297924079244e-05, "loss": 0.8728, "step": 1354 }, { "epoch": 0.15, "learning_rate": 1.928498920427934e-05, "loss": 0.5486, "step": 1355 }, { "epoch": 0.15, "learning_rate": 1.9283679330160726e-05, "loss": 0.6382, "step": 1356 }, { "epoch": 0.15, "learning_rate": 1.928236830188625e-05, "loss": 0.752, "step": 1357 }, { "epoch": 0.15, "learning_rate": 1.9281056119618884e-05, "loss": 0.7083, "step": 1358 }, { "epoch": 0.15, "learning_rate": 1.9279742783521776e-05, "loss": 0.686, "step": 1359 }, { "epoch": 0.15, "learning_rate": 1.9278428293758194e-05, "loss": 0.7703, "step": 1360 }, { "epoch": 0.15, "learning_rate": 1.927711265049156e-05, "loss": 0.7168, "step": 1361 }, { "epoch": 0.15, "learning_rate": 1.9275795853885433e-05, "loss": 0.875, "step": 1362 }, { "epoch": 0.15, "learning_rate": 1.927447790410352e-05, "loss": 0.698, "step": 1363 }, { "epoch": 0.15, "learning_rate": 1.927315880130967e-05, "loss": 0.8413, "step": 1364 }, { "epoch": 0.15, "learning_rate": 1.9271838545667876e-05, "loss": 0.7744, "step": 1365 }, { "epoch": 0.15, "learning_rate": 1.927051713734227e-05, "loss": 0.7815, "step": 1366 }, { "epoch": 0.15, "learning_rate": 1.9269194576497135e-05, "loss": 0.7603, "step": 1367 }, { "epoch": 0.15, "learning_rate": 1.9267870863296888e-05, "loss": 0.7366, "step": 1368 }, { "epoch": 0.15, "learning_rate": 1.92665459979061e-05, "loss": 0.7656, "step": 1369 }, { "epoch": 0.15, "learning_rate": 1.9265219980489475e-05, "loss": 0.8398, "step": 1370 }, { "epoch": 0.15, "learning_rate": 1.9263892811211865e-05, "loss": 0.7598, "step": 1371 }, { "epoch": 0.15, "learning_rate": 1.9262564490238268e-05, "loss": 0.7639, "step": 1372 }, { "epoch": 0.15, "learning_rate": 1.926123501773382e-05, "loss": 0.7451, "step": 1373 }, { "epoch": 0.15, "learning_rate": 1.9259904393863804e-05, "loss": 0.7688, "step": 1374 }, { "epoch": 0.15, "learning_rate": 1.9258572618793644e-05, "loss": 0.7092, "step": 1375 }, { "epoch": 0.15, "learning_rate": 1.9257239692688907e-05, "loss": 0.8291, "step": 1376 }, { "epoch": 0.15, "learning_rate": 1.92559056157153e-05, "loss": 0.7812, "step": 1377 }, { "epoch": 0.15, "learning_rate": 1.9254570388038683e-05, "loss": 0.7739, "step": 1378 }, { "epoch": 0.15, "learning_rate": 1.9253234009825047e-05, "loss": 0.6572, "step": 1379 }, { "epoch": 0.15, "learning_rate": 1.9251896481240536e-05, "loss": 0.7871, "step": 1380 }, { "epoch": 0.15, "learning_rate": 1.9250557802451432e-05, "loss": 0.7649, "step": 1381 }, { "epoch": 0.15, "learning_rate": 1.9249217973624164e-05, "loss": 0.6785, "step": 1382 }, { "epoch": 0.15, "learning_rate": 1.9247876994925293e-05, "loss": 0.7766, "step": 1383 }, { "epoch": 0.15, "learning_rate": 1.9246534866521535e-05, "loss": 0.8342, "step": 1384 }, { "epoch": 0.15, "learning_rate": 1.9245191588579744e-05, "loss": 0.7651, "step": 1385 }, { "epoch": 0.15, "learning_rate": 1.9243847161266924e-05, "loss": 0.7119, "step": 1386 }, { "epoch": 0.15, "learning_rate": 1.92425015847502e-05, "loss": 0.9282, "step": 1387 }, { "epoch": 0.15, "learning_rate": 1.9241154859196875e-05, "loss": 0.7549, "step": 1388 }, { "epoch": 0.15, "learning_rate": 1.923980698477436e-05, "loss": 0.8491, "step": 1389 }, { "epoch": 0.15, "learning_rate": 1.9238457961650228e-05, "loss": 0.6924, "step": 1390 }, { "epoch": 0.15, "learning_rate": 1.9237107789992195e-05, "loss": 0.749, "step": 1391 }, { "epoch": 0.15, "learning_rate": 1.9235756469968112e-05, "loss": 0.7819, "step": 1392 }, { "epoch": 0.15, "learning_rate": 1.923440400174598e-05, "loss": 0.7075, "step": 1393 }, { "epoch": 0.15, "learning_rate": 1.923305038549393e-05, "loss": 0.8479, "step": 1394 }, { "epoch": 0.15, "learning_rate": 1.9231695621380257e-05, "loss": 0.7275, "step": 1395 }, { "epoch": 0.15, "learning_rate": 1.9230339709573376e-05, "loss": 0.7329, "step": 1396 }, { "epoch": 0.15, "learning_rate": 1.9228982650241863e-05, "loss": 0.6165, "step": 1397 }, { "epoch": 0.15, "learning_rate": 1.9227624443554425e-05, "loss": 0.604, "step": 1398 }, { "epoch": 0.15, "learning_rate": 1.9226265089679915e-05, "loss": 0.8418, "step": 1399 }, { "epoch": 0.15, "learning_rate": 1.9224904588787334e-05, "loss": 0.7988, "step": 1400 }, { "epoch": 0.15, "learning_rate": 1.9223542941045817e-05, "loss": 0.6958, "step": 1401 }, { "epoch": 0.15, "learning_rate": 1.922218014662464e-05, "loss": 0.7161, "step": 1402 }, { "epoch": 0.15, "learning_rate": 1.922081620569324e-05, "loss": 0.8074, "step": 1403 }, { "epoch": 0.15, "learning_rate": 1.9219451118421173e-05, "loss": 0.6394, "step": 1404 }, { "epoch": 0.15, "learning_rate": 1.921808488497815e-05, "loss": 0.7935, "step": 1405 }, { "epoch": 0.15, "learning_rate": 1.9216717505534025e-05, "loss": 0.7607, "step": 1406 }, { "epoch": 0.15, "learning_rate": 1.921534898025879e-05, "loss": 0.783, "step": 1407 }, { "epoch": 0.15, "learning_rate": 1.921397930932258e-05, "loss": 0.7961, "step": 1408 }, { "epoch": 0.15, "learning_rate": 1.921260849289568e-05, "loss": 0.7534, "step": 1409 }, { "epoch": 0.15, "learning_rate": 1.92112365311485e-05, "loss": 0.8413, "step": 1410 }, { "epoch": 0.15, "learning_rate": 1.920986342425162e-05, "loss": 0.8083, "step": 1411 }, { "epoch": 0.15, "learning_rate": 1.9208489172375725e-05, "loss": 0.7463, "step": 1412 }, { "epoch": 0.15, "learning_rate": 1.9207113775691682e-05, "loss": 0.6609, "step": 1413 }, { "epoch": 0.15, "learning_rate": 1.9205737234370475e-05, "loss": 0.6643, "step": 1414 }, { "epoch": 0.15, "learning_rate": 1.9204359548583233e-05, "loss": 0.7346, "step": 1415 }, { "epoch": 0.15, "learning_rate": 1.920298071850123e-05, "loss": 0.7014, "step": 1416 }, { "epoch": 0.15, "learning_rate": 1.9201600744295897e-05, "loss": 0.7964, "step": 1417 }, { "epoch": 0.15, "learning_rate": 1.9200219626138777e-05, "loss": 0.8149, "step": 1418 }, { "epoch": 0.15, "learning_rate": 1.9198837364201587e-05, "loss": 0.7876, "step": 1419 }, { "epoch": 0.15, "learning_rate": 1.9197453958656157e-05, "loss": 0.8359, "step": 1420 }, { "epoch": 0.15, "learning_rate": 1.9196069409674484e-05, "loss": 0.8359, "step": 1421 }, { "epoch": 0.15, "learning_rate": 1.9194683717428688e-05, "loss": 0.7944, "step": 1422 }, { "epoch": 0.15, "learning_rate": 1.919329688209105e-05, "loss": 0.7595, "step": 1423 }, { "epoch": 0.16, "learning_rate": 1.919190890383397e-05, "loss": 0.7241, "step": 1424 }, { "epoch": 0.16, "learning_rate": 1.9190519782830016e-05, "loss": 0.8252, "step": 1425 }, { "epoch": 0.16, "learning_rate": 1.9189129519251873e-05, "loss": 0.7617, "step": 1426 }, { "epoch": 0.16, "learning_rate": 1.9187738113272388e-05, "loss": 0.8496, "step": 1427 }, { "epoch": 0.16, "learning_rate": 1.918634556506454e-05, "loss": 0.7439, "step": 1428 }, { "epoch": 0.16, "learning_rate": 1.9184951874801445e-05, "loss": 0.9512, "step": 1429 }, { "epoch": 0.16, "learning_rate": 1.918355704265638e-05, "loss": 0.7048, "step": 1430 }, { "epoch": 0.16, "learning_rate": 1.9182161068802742e-05, "loss": 0.6907, "step": 1431 }, { "epoch": 0.16, "learning_rate": 1.918076395341408e-05, "loss": 0.8047, "step": 1432 }, { "epoch": 0.16, "learning_rate": 1.91793656966641e-05, "loss": 0.7947, "step": 1433 }, { "epoch": 0.16, "learning_rate": 1.9177966298726615e-05, "loss": 0.8845, "step": 1434 }, { "epoch": 0.16, "learning_rate": 1.917656575977561e-05, "loss": 0.7598, "step": 1435 }, { "epoch": 0.16, "learning_rate": 1.9175164079985196e-05, "loss": 0.6802, "step": 1436 }, { "epoch": 0.16, "learning_rate": 1.9173761259529634e-05, "loss": 0.7563, "step": 1437 }, { "epoch": 0.16, "learning_rate": 1.9172357298583327e-05, "loss": 0.7793, "step": 1438 }, { "epoch": 0.16, "learning_rate": 1.917095219732081e-05, "loss": 0.7832, "step": 1439 }, { "epoch": 0.16, "learning_rate": 1.9169545955916773e-05, "loss": 0.6931, "step": 1440 }, { "epoch": 0.16, "learning_rate": 1.9168138574546037e-05, "loss": 0.8154, "step": 1441 }, { "epoch": 0.16, "learning_rate": 1.916673005338357e-05, "loss": 0.769, "step": 1442 }, { "epoch": 0.16, "learning_rate": 1.916532039260448e-05, "loss": 0.8457, "step": 1443 }, { "epoch": 0.16, "learning_rate": 1.916390959238402e-05, "loss": 0.7915, "step": 1444 }, { "epoch": 0.16, "learning_rate": 1.9162497652897583e-05, "loss": 0.8142, "step": 1445 }, { "epoch": 0.16, "learning_rate": 1.9161084574320696e-05, "loss": 0.8093, "step": 1446 }, { "epoch": 0.16, "learning_rate": 1.915967035682904e-05, "loss": 0.6675, "step": 1447 }, { "epoch": 0.16, "learning_rate": 1.9158255000598435e-05, "loss": 0.8364, "step": 1448 }, { "epoch": 0.16, "learning_rate": 1.9156838505804826e-05, "loss": 0.7588, "step": 1449 }, { "epoch": 0.16, "learning_rate": 1.9155420872624328e-05, "loss": 0.7913, "step": 1450 }, { "epoch": 0.16, "learning_rate": 1.9154002101233175e-05, "loss": 0.7603, "step": 1451 }, { "epoch": 0.16, "learning_rate": 1.915258219180775e-05, "loss": 0.7915, "step": 1452 }, { "epoch": 0.16, "learning_rate": 1.915116114452458e-05, "loss": 0.7881, "step": 1453 }, { "epoch": 0.16, "learning_rate": 1.914973895956033e-05, "loss": 0.7656, "step": 1454 }, { "epoch": 0.16, "learning_rate": 1.9148315637091805e-05, "loss": 0.853, "step": 1455 }, { "epoch": 0.16, "learning_rate": 1.9146891177295956e-05, "loss": 0.7759, "step": 1456 }, { "epoch": 0.16, "learning_rate": 1.9145465580349875e-05, "loss": 0.7141, "step": 1457 }, { "epoch": 0.16, "learning_rate": 1.914403884643079e-05, "loss": 0.7417, "step": 1458 }, { "epoch": 0.16, "learning_rate": 1.9142610975716076e-05, "loss": 0.7939, "step": 1459 }, { "epoch": 0.16, "learning_rate": 1.9141181968383248e-05, "loss": 0.7954, "step": 1460 }, { "epoch": 0.16, "learning_rate": 1.913975182460996e-05, "loss": 0.7087, "step": 1461 }, { "epoch": 0.16, "learning_rate": 1.9138320544574006e-05, "loss": 0.7388, "step": 1462 }, { "epoch": 0.16, "learning_rate": 1.913688812845333e-05, "loss": 0.7114, "step": 1463 }, { "epoch": 0.16, "learning_rate": 1.913545457642601e-05, "loss": 0.8384, "step": 1464 }, { "epoch": 0.16, "learning_rate": 1.9134019888670267e-05, "loss": 0.7329, "step": 1465 }, { "epoch": 0.16, "learning_rate": 1.9132584065364455e-05, "loss": 0.8501, "step": 1466 }, { "epoch": 0.16, "learning_rate": 1.9131147106687085e-05, "loss": 0.7249, "step": 1467 }, { "epoch": 0.16, "learning_rate": 1.9129709012816803e-05, "loss": 0.8848, "step": 1468 }, { "epoch": 0.16, "learning_rate": 1.9128269783932384e-05, "loss": 0.7437, "step": 1469 }, { "epoch": 0.16, "learning_rate": 1.9126829420212764e-05, "loss": 0.9355, "step": 1470 }, { "epoch": 0.16, "learning_rate": 1.9125387921837008e-05, "loss": 0.6497, "step": 1471 }, { "epoch": 0.16, "learning_rate": 1.912394528898432e-05, "loss": 0.71, "step": 1472 }, { "epoch": 0.16, "learning_rate": 1.9122501521834052e-05, "loss": 0.738, "step": 1473 }, { "epoch": 0.16, "learning_rate": 1.91210566205657e-05, "loss": 0.7188, "step": 1474 }, { "epoch": 0.16, "learning_rate": 1.911961058535889e-05, "loss": 0.7686, "step": 1475 }, { "epoch": 0.16, "learning_rate": 1.9118163416393392e-05, "loss": 0.8193, "step": 1476 }, { "epoch": 0.16, "learning_rate": 1.9116715113849126e-05, "loss": 0.8413, "step": 1477 }, { "epoch": 0.16, "learning_rate": 1.911526567790614e-05, "loss": 0.8096, "step": 1478 }, { "epoch": 0.16, "learning_rate": 1.9113815108744635e-05, "loss": 0.7898, "step": 1479 }, { "epoch": 0.16, "learning_rate": 1.911236340654494e-05, "loss": 0.7551, "step": 1480 }, { "epoch": 0.16, "learning_rate": 1.9110910571487543e-05, "loss": 0.7583, "step": 1481 }, { "epoch": 0.16, "learning_rate": 1.910945660375305e-05, "loss": 0.7168, "step": 1482 }, { "epoch": 0.16, "learning_rate": 1.910800150352223e-05, "loss": 0.7986, "step": 1483 }, { "epoch": 0.16, "learning_rate": 1.9106545270975974e-05, "loss": 0.8472, "step": 1484 }, { "epoch": 0.16, "learning_rate": 1.910508790629533e-05, "loss": 0.812, "step": 1485 }, { "epoch": 0.16, "learning_rate": 1.9103629409661468e-05, "loss": 0.8301, "step": 1486 }, { "epoch": 0.16, "learning_rate": 1.910216978125572e-05, "loss": 0.856, "step": 1487 }, { "epoch": 0.16, "learning_rate": 1.9100709021259544e-05, "loss": 0.7505, "step": 1488 }, { "epoch": 0.16, "learning_rate": 1.9099247129854542e-05, "loss": 0.7419, "step": 1489 }, { "epoch": 0.16, "learning_rate": 1.9097784107222463e-05, "loss": 0.896, "step": 1490 }, { "epoch": 0.16, "learning_rate": 1.9096319953545186e-05, "loss": 0.6963, "step": 1491 }, { "epoch": 0.16, "learning_rate": 1.9094854669004738e-05, "loss": 0.7302, "step": 1492 }, { "epoch": 0.16, "learning_rate": 1.9093388253783285e-05, "loss": 0.6621, "step": 1493 }, { "epoch": 0.16, "learning_rate": 1.909192070806313e-05, "loss": 0.7214, "step": 1494 }, { "epoch": 0.16, "learning_rate": 1.9090452032026724e-05, "loss": 0.6582, "step": 1495 }, { "epoch": 0.16, "learning_rate": 1.9088982225856653e-05, "loss": 0.7148, "step": 1496 }, { "epoch": 0.16, "learning_rate": 1.9087511289735646e-05, "loss": 0.6362, "step": 1497 }, { "epoch": 0.16, "learning_rate": 1.9086039223846566e-05, "loss": 0.7139, "step": 1498 }, { "epoch": 0.16, "learning_rate": 1.9084566028372426e-05, "loss": 0.6873, "step": 1499 }, { "epoch": 0.16, "learning_rate": 1.9083091703496373e-05, "loss": 0.7725, "step": 1500 }, { "epoch": 0.16, "learning_rate": 1.9081616249401696e-05, "loss": 0.729, "step": 1501 }, { "epoch": 0.16, "learning_rate": 1.9080139666271834e-05, "loss": 0.7593, "step": 1502 }, { "epoch": 0.16, "learning_rate": 1.907866195429034e-05, "loss": 0.8491, "step": 1503 }, { "epoch": 0.16, "learning_rate": 1.9077183113640943e-05, "loss": 0.8594, "step": 1504 }, { "epoch": 0.16, "learning_rate": 1.907570314450748e-05, "loss": 0.7693, "step": 1505 }, { "epoch": 0.16, "learning_rate": 1.9074222047073945e-05, "loss": 0.7534, "step": 1506 }, { "epoch": 0.16, "learning_rate": 1.9072739821524477e-05, "loss": 0.6904, "step": 1507 }, { "epoch": 0.16, "learning_rate": 1.907125646804334e-05, "loss": 0.8037, "step": 1508 }, { "epoch": 0.16, "learning_rate": 1.9069771986814948e-05, "loss": 0.7007, "step": 1509 }, { "epoch": 0.16, "learning_rate": 1.9068286378023855e-05, "loss": 0.7566, "step": 1510 }, { "epoch": 0.16, "learning_rate": 1.906679964185475e-05, "loss": 0.7544, "step": 1511 }, { "epoch": 0.16, "learning_rate": 1.906531177849247e-05, "loss": 0.7666, "step": 1512 }, { "epoch": 0.16, "learning_rate": 1.906382278812198e-05, "loss": 0.813, "step": 1513 }, { "epoch": 0.16, "learning_rate": 1.9062332670928397e-05, "loss": 0.8096, "step": 1514 }, { "epoch": 0.16, "learning_rate": 1.9060841427096978e-05, "loss": 0.7432, "step": 1515 }, { "epoch": 0.17, "learning_rate": 1.905934905681311e-05, "loss": 0.7544, "step": 1516 }, { "epoch": 0.17, "learning_rate": 1.905785556026233e-05, "loss": 0.832, "step": 1517 }, { "epoch": 0.17, "learning_rate": 1.905636093763031e-05, "loss": 0.613, "step": 1518 }, { "epoch": 0.17, "learning_rate": 1.905486518910286e-05, "loss": 0.7527, "step": 1519 }, { "epoch": 0.17, "learning_rate": 1.9053368314865933e-05, "loss": 0.656, "step": 1520 }, { "epoch": 0.17, "learning_rate": 1.9051870315105626e-05, "loss": 0.7715, "step": 1521 }, { "epoch": 0.17, "learning_rate": 1.905037119000817e-05, "loss": 0.7349, "step": 1522 }, { "epoch": 0.17, "learning_rate": 1.9048870939759932e-05, "loss": 0.7451, "step": 1523 }, { "epoch": 0.17, "learning_rate": 1.9047369564547434e-05, "loss": 0.6323, "step": 1524 }, { "epoch": 0.17, "learning_rate": 1.9045867064557324e-05, "loss": 0.8223, "step": 1525 }, { "epoch": 0.17, "learning_rate": 1.9044363439976393e-05, "loss": 0.7312, "step": 1526 }, { "epoch": 0.17, "learning_rate": 1.9042858690991574e-05, "loss": 0.8354, "step": 1527 }, { "epoch": 0.17, "learning_rate": 1.9041352817789937e-05, "loss": 0.7354, "step": 1528 }, { "epoch": 0.17, "learning_rate": 1.90398458205587e-05, "loss": 0.7759, "step": 1529 }, { "epoch": 0.17, "learning_rate": 1.9038337699485207e-05, "loss": 0.7734, "step": 1530 }, { "epoch": 0.17, "learning_rate": 1.9036828454756953e-05, "loss": 0.7832, "step": 1531 }, { "epoch": 0.17, "learning_rate": 1.9035318086561566e-05, "loss": 0.7856, "step": 1532 }, { "epoch": 0.17, "learning_rate": 1.903380659508682e-05, "loss": 0.7756, "step": 1533 }, { "epoch": 0.17, "learning_rate": 1.903229398052062e-05, "loss": 0.6846, "step": 1534 }, { "epoch": 0.17, "learning_rate": 1.9030780243051025e-05, "loss": 0.7505, "step": 1535 }, { "epoch": 0.17, "learning_rate": 1.9029265382866216e-05, "loss": 0.6555, "step": 1536 }, { "epoch": 0.17, "learning_rate": 1.902774940015452e-05, "loss": 0.8159, "step": 1537 }, { "epoch": 0.17, "learning_rate": 1.9026232295104414e-05, "loss": 0.7676, "step": 1538 }, { "epoch": 0.17, "learning_rate": 1.9024714067904496e-05, "loss": 0.8721, "step": 1539 }, { "epoch": 0.17, "learning_rate": 1.9023194718743524e-05, "loss": 0.7649, "step": 1540 }, { "epoch": 0.17, "learning_rate": 1.902167424781038e-05, "loss": 0.687, "step": 1541 }, { "epoch": 0.17, "learning_rate": 1.9020152655294087e-05, "loss": 0.7239, "step": 1542 }, { "epoch": 0.17, "learning_rate": 1.9018629941383816e-05, "loss": 0.7734, "step": 1543 }, { "epoch": 0.17, "learning_rate": 1.901710610626887e-05, "loss": 0.7463, "step": 1544 }, { "epoch": 0.17, "learning_rate": 1.9015581150138693e-05, "loss": 0.7439, "step": 1545 }, { "epoch": 0.17, "learning_rate": 1.9014055073182872e-05, "loss": 0.7427, "step": 1546 }, { "epoch": 0.17, "learning_rate": 1.9012527875591122e-05, "loss": 0.73, "step": 1547 }, { "epoch": 0.17, "learning_rate": 1.9010999557553317e-05, "loss": 0.874, "step": 1548 }, { "epoch": 0.17, "learning_rate": 1.9009470119259453e-05, "loss": 0.7266, "step": 1549 }, { "epoch": 0.17, "learning_rate": 1.9007939560899676e-05, "loss": 0.8188, "step": 1550 }, { "epoch": 0.17, "learning_rate": 1.9006407882664256e-05, "loss": 0.7947, "step": 1551 }, { "epoch": 0.17, "learning_rate": 1.9004875084743624e-05, "loss": 0.8325, "step": 1552 }, { "epoch": 0.17, "learning_rate": 1.9003341167328333e-05, "loss": 0.8096, "step": 1553 }, { "epoch": 0.17, "learning_rate": 1.900180613060908e-05, "loss": 0.7554, "step": 1554 }, { "epoch": 0.17, "learning_rate": 1.9000269974776707e-05, "loss": 0.6531, "step": 1555 }, { "epoch": 0.17, "learning_rate": 1.8998732700022186e-05, "loss": 0.616, "step": 1556 }, { "epoch": 0.17, "learning_rate": 1.8997194306536635e-05, "loss": 0.7327, "step": 1557 }, { "epoch": 0.17, "learning_rate": 1.899565479451131e-05, "loss": 0.6772, "step": 1558 }, { "epoch": 0.17, "learning_rate": 1.8994114164137597e-05, "loss": 0.8716, "step": 1559 }, { "epoch": 0.17, "learning_rate": 1.899257241560704e-05, "loss": 0.8936, "step": 1560 }, { "epoch": 0.17, "learning_rate": 1.8991029549111298e-05, "loss": 0.7402, "step": 1561 }, { "epoch": 0.17, "learning_rate": 1.8989485564842197e-05, "loss": 0.7773, "step": 1562 }, { "epoch": 0.17, "learning_rate": 1.8987940462991673e-05, "loss": 0.7437, "step": 1563 }, { "epoch": 0.17, "learning_rate": 1.898639424375182e-05, "loss": 0.6467, "step": 1564 }, { "epoch": 0.17, "learning_rate": 1.8984846907314863e-05, "loss": 0.8008, "step": 1565 }, { "epoch": 0.17, "learning_rate": 1.8983298453873172e-05, "loss": 0.8037, "step": 1566 }, { "epoch": 0.17, "learning_rate": 1.898174888361925e-05, "loss": 0.7798, "step": 1567 }, { "epoch": 0.17, "learning_rate": 1.8980198196745743e-05, "loss": 0.6843, "step": 1568 }, { "epoch": 0.17, "learning_rate": 1.897864639344543e-05, "loss": 0.7417, "step": 1569 }, { "epoch": 0.17, "learning_rate": 1.897709347391124e-05, "loss": 0.7812, "step": 1570 }, { "epoch": 0.17, "learning_rate": 1.8975539438336225e-05, "loss": 0.7083, "step": 1571 }, { "epoch": 0.17, "learning_rate": 1.8973984286913584e-05, "loss": 0.7871, "step": 1572 }, { "epoch": 0.17, "learning_rate": 1.8972428019836663e-05, "loss": 0.8555, "step": 1573 }, { "epoch": 0.17, "learning_rate": 1.8970870637298936e-05, "loss": 0.6846, "step": 1574 }, { "epoch": 0.17, "learning_rate": 1.8969312139494015e-05, "loss": 0.8735, "step": 1575 }, { "epoch": 0.17, "learning_rate": 1.896775252661565e-05, "loss": 0.7043, "step": 1576 }, { "epoch": 0.17, "learning_rate": 1.896619179885775e-05, "loss": 0.7769, "step": 1577 }, { "epoch": 0.17, "learning_rate": 1.896462995641432e-05, "loss": 0.8662, "step": 1578 }, { "epoch": 0.17, "learning_rate": 1.8963066999479557e-05, "loss": 0.7449, "step": 1579 }, { "epoch": 0.17, "learning_rate": 1.8961502928247754e-05, "loss": 0.8188, "step": 1580 }, { "epoch": 0.17, "learning_rate": 1.895993774291336e-05, "loss": 0.7224, "step": 1581 }, { "epoch": 0.17, "learning_rate": 1.895837144367096e-05, "loss": 0.8027, "step": 1582 }, { "epoch": 0.17, "learning_rate": 1.8956804030715284e-05, "loss": 0.6758, "step": 1583 }, { "epoch": 0.17, "learning_rate": 1.8955235504241187e-05, "loss": 0.7988, "step": 1584 }, { "epoch": 0.17, "learning_rate": 1.895366586444367e-05, "loss": 0.6421, "step": 1585 }, { "epoch": 0.17, "learning_rate": 1.8952095111517875e-05, "loss": 0.7405, "step": 1586 }, { "epoch": 0.17, "learning_rate": 1.895052324565908e-05, "loss": 0.7793, "step": 1587 }, { "epoch": 0.17, "learning_rate": 1.89489502670627e-05, "loss": 0.7725, "step": 1588 }, { "epoch": 0.17, "learning_rate": 1.894737617592429e-05, "loss": 0.7781, "step": 1589 }, { "epoch": 0.17, "learning_rate": 1.894580097243954e-05, "loss": 0.7778, "step": 1590 }, { "epoch": 0.17, "learning_rate": 1.894422465680428e-05, "loss": 0.7637, "step": 1591 }, { "epoch": 0.17, "learning_rate": 1.8942647229214484e-05, "loss": 0.6353, "step": 1592 }, { "epoch": 0.17, "learning_rate": 1.8941068689866255e-05, "loss": 0.7556, "step": 1593 }, { "epoch": 0.17, "learning_rate": 1.893948903895584e-05, "loss": 0.8984, "step": 1594 }, { "epoch": 0.17, "learning_rate": 1.893790827667962e-05, "loss": 0.6587, "step": 1595 }, { "epoch": 0.17, "learning_rate": 1.8936326403234125e-05, "loss": 0.759, "step": 1596 }, { "epoch": 0.17, "learning_rate": 1.8934743418816008e-05, "loss": 0.7205, "step": 1597 }, { "epoch": 0.17, "learning_rate": 1.8933159323622065e-05, "loss": 0.6882, "step": 1598 }, { "epoch": 0.17, "learning_rate": 1.893157411784924e-05, "loss": 0.6494, "step": 1599 }, { "epoch": 0.17, "learning_rate": 1.8929987801694602e-05, "loss": 0.8857, "step": 1600 }, { "epoch": 0.17, "learning_rate": 1.8928400375355366e-05, "loss": 0.8379, "step": 1601 }, { "epoch": 0.17, "learning_rate": 1.892681183902888e-05, "loss": 0.6985, "step": 1602 }, { "epoch": 0.17, "learning_rate": 1.892522219291263e-05, "loss": 0.8271, "step": 1603 }, { "epoch": 0.17, "learning_rate": 1.892363143720425e-05, "loss": 0.6741, "step": 1604 }, { "epoch": 0.17, "learning_rate": 1.89220395721015e-05, "loss": 0.7229, "step": 1605 }, { "epoch": 0.17, "learning_rate": 1.8920446597802276e-05, "loss": 0.7097, "step": 1606 }, { "epoch": 0.17, "learning_rate": 1.8918852514504632e-05, "loss": 0.8013, "step": 1607 }, { "epoch": 0.18, "learning_rate": 1.8917257322406735e-05, "loss": 0.7444, "step": 1608 }, { "epoch": 0.18, "learning_rate": 1.8915661021706902e-05, "loss": 0.8223, "step": 1609 }, { "epoch": 0.18, "learning_rate": 1.891406361260359e-05, "loss": 0.8477, "step": 1610 }, { "epoch": 0.18, "learning_rate": 1.891246509529539e-05, "loss": 0.7825, "step": 1611 }, { "epoch": 0.18, "learning_rate": 1.891086546998103e-05, "loss": 0.7417, "step": 1612 }, { "epoch": 0.18, "learning_rate": 1.8909264736859375e-05, "loss": 0.7686, "step": 1613 }, { "epoch": 0.18, "learning_rate": 1.8907662896129435e-05, "loss": 0.8198, "step": 1614 }, { "epoch": 0.18, "learning_rate": 1.8906059947990346e-05, "loss": 0.5967, "step": 1615 }, { "epoch": 0.18, "learning_rate": 1.8904455892641394e-05, "loss": 0.7869, "step": 1616 }, { "epoch": 0.18, "learning_rate": 1.8902850730281993e-05, "loss": 0.8306, "step": 1617 }, { "epoch": 0.18, "learning_rate": 1.8901244461111697e-05, "loss": 0.7334, "step": 1618 }, { "epoch": 0.18, "learning_rate": 1.8899637085330203e-05, "loss": 0.8081, "step": 1619 }, { "epoch": 0.18, "learning_rate": 1.8898028603137343e-05, "loss": 0.7676, "step": 1620 }, { "epoch": 0.18, "learning_rate": 1.8896419014733074e-05, "loss": 0.7126, "step": 1621 }, { "epoch": 0.18, "learning_rate": 1.8894808320317516e-05, "loss": 0.7847, "step": 1622 }, { "epoch": 0.18, "learning_rate": 1.88931965200909e-05, "loss": 0.8145, "step": 1623 }, { "epoch": 0.18, "learning_rate": 1.8891583614253613e-05, "loss": 0.676, "step": 1624 }, { "epoch": 0.18, "learning_rate": 1.8889969603006176e-05, "loss": 0.7588, "step": 1625 }, { "epoch": 0.18, "learning_rate": 1.8888354486549238e-05, "loss": 0.8237, "step": 1626 }, { "epoch": 0.18, "learning_rate": 1.888673826508359e-05, "loss": 0.8203, "step": 1627 }, { "epoch": 0.18, "learning_rate": 1.888512093881017e-05, "loss": 0.77, "step": 1628 }, { "epoch": 0.18, "learning_rate": 1.8883502507930044e-05, "loss": 0.6802, "step": 1629 }, { "epoch": 0.18, "learning_rate": 1.888188297264441e-05, "loss": 0.7627, "step": 1630 }, { "epoch": 0.18, "learning_rate": 1.8880262333154618e-05, "loss": 0.7056, "step": 1631 }, { "epoch": 0.18, "learning_rate": 1.8878640589662144e-05, "loss": 0.7559, "step": 1632 }, { "epoch": 0.18, "learning_rate": 1.88770177423686e-05, "loss": 0.7612, "step": 1633 }, { "epoch": 0.18, "learning_rate": 1.887539379147575e-05, "loss": 0.7788, "step": 1634 }, { "epoch": 0.18, "learning_rate": 1.887376873718548e-05, "loss": 0.8159, "step": 1635 }, { "epoch": 0.18, "learning_rate": 1.8872142579699818e-05, "loss": 0.8594, "step": 1636 }, { "epoch": 0.18, "learning_rate": 1.8870515319220927e-05, "loss": 0.8154, "step": 1637 }, { "epoch": 0.18, "learning_rate": 1.8868886955951115e-05, "loss": 0.7739, "step": 1638 }, { "epoch": 0.18, "learning_rate": 1.886725749009282e-05, "loss": 0.6953, "step": 1639 }, { "epoch": 0.18, "learning_rate": 1.8865626921848615e-05, "loss": 0.7483, "step": 1640 }, { "epoch": 0.18, "learning_rate": 1.886399525142122e-05, "loss": 0.7183, "step": 1641 }, { "epoch": 0.18, "learning_rate": 1.886236247901348e-05, "loss": 0.8389, "step": 1642 }, { "epoch": 0.18, "learning_rate": 1.8860728604828383e-05, "loss": 0.7253, "step": 1643 }, { "epoch": 0.18, "learning_rate": 1.8859093629069057e-05, "loss": 0.8516, "step": 1644 }, { "epoch": 0.18, "learning_rate": 1.8857457551938763e-05, "loss": 0.7632, "step": 1645 }, { "epoch": 0.18, "learning_rate": 1.88558203736409e-05, "loss": 0.811, "step": 1646 }, { "epoch": 0.18, "learning_rate": 1.8854182094379007e-05, "loss": 0.7295, "step": 1647 }, { "epoch": 0.18, "learning_rate": 1.8852542714356747e-05, "loss": 0.8135, "step": 1648 }, { "epoch": 0.18, "learning_rate": 1.8850902233777937e-05, "loss": 0.8396, "step": 1649 }, { "epoch": 0.18, "learning_rate": 1.884926065284652e-05, "loss": 0.718, "step": 1650 }, { "epoch": 0.18, "learning_rate": 1.8847617971766577e-05, "loss": 0.7655, "step": 1651 }, { "epoch": 0.18, "learning_rate": 1.8845974190742334e-05, "loss": 0.8335, "step": 1652 }, { "epoch": 0.18, "learning_rate": 1.8844329309978146e-05, "loss": 0.7671, "step": 1653 }, { "epoch": 0.18, "learning_rate": 1.88426833296785e-05, "loss": 0.8145, "step": 1654 }, { "epoch": 0.18, "learning_rate": 1.8841036250048032e-05, "loss": 0.8259, "step": 1655 }, { "epoch": 0.18, "learning_rate": 1.8839388071291506e-05, "loss": 0.7688, "step": 1656 }, { "epoch": 0.18, "learning_rate": 1.8837738793613823e-05, "loss": 0.8, "step": 1657 }, { "epoch": 0.18, "learning_rate": 1.8836088417220025e-05, "loss": 0.8164, "step": 1658 }, { "epoch": 0.18, "learning_rate": 1.8834436942315293e-05, "loss": 0.7632, "step": 1659 }, { "epoch": 0.18, "learning_rate": 1.8832784369104934e-05, "loss": 0.6594, "step": 1660 }, { "epoch": 0.18, "learning_rate": 1.8831130697794397e-05, "loss": 0.7927, "step": 1661 }, { "epoch": 0.18, "learning_rate": 1.8829475928589272e-05, "loss": 0.7546, "step": 1662 }, { "epoch": 0.18, "learning_rate": 1.882782006169528e-05, "loss": 0.7207, "step": 1663 }, { "epoch": 0.18, "learning_rate": 1.8826163097318277e-05, "loss": 0.7676, "step": 1664 }, { "epoch": 0.18, "learning_rate": 1.882450503566426e-05, "loss": 0.6716, "step": 1665 }, { "epoch": 0.18, "learning_rate": 1.8822845876939365e-05, "loss": 0.8462, "step": 1666 }, { "epoch": 0.18, "learning_rate": 1.8821185621349856e-05, "loss": 0.6084, "step": 1667 }, { "epoch": 0.18, "learning_rate": 1.8819524269102138e-05, "loss": 0.7556, "step": 1668 }, { "epoch": 0.18, "learning_rate": 1.881786182040275e-05, "loss": 0.6267, "step": 1669 }, { "epoch": 0.18, "learning_rate": 1.8816198275458376e-05, "loss": 0.771, "step": 1670 }, { "epoch": 0.18, "learning_rate": 1.881453363447582e-05, "loss": 0.8093, "step": 1671 }, { "epoch": 0.18, "learning_rate": 1.881286789766204e-05, "loss": 0.7429, "step": 1672 }, { "epoch": 0.18, "learning_rate": 1.8811201065224122e-05, "loss": 0.8318, "step": 1673 }, { "epoch": 0.18, "learning_rate": 1.880953313736928e-05, "loss": 0.7227, "step": 1674 }, { "epoch": 0.18, "learning_rate": 1.8807864114304875e-05, "loss": 0.7109, "step": 1675 }, { "epoch": 0.18, "learning_rate": 1.880619399623841e-05, "loss": 0.7358, "step": 1676 }, { "epoch": 0.18, "learning_rate": 1.880452278337751e-05, "loss": 0.6245, "step": 1677 }, { "epoch": 0.18, "learning_rate": 1.8802850475929933e-05, "loss": 0.77, "step": 1678 }, { "epoch": 0.18, "learning_rate": 1.8801177074103598e-05, "loss": 0.6602, "step": 1679 }, { "epoch": 0.18, "learning_rate": 1.8799502578106533e-05, "loss": 0.7461, "step": 1680 }, { "epoch": 0.18, "learning_rate": 1.8797826988146918e-05, "loss": 0.7461, "step": 1681 }, { "epoch": 0.18, "learning_rate": 1.879615030443306e-05, "loss": 0.9663, "step": 1682 }, { "epoch": 0.18, "learning_rate": 1.879447252717341e-05, "loss": 0.7871, "step": 1683 }, { "epoch": 0.18, "learning_rate": 1.8792793656576544e-05, "loss": 0.6938, "step": 1684 }, { "epoch": 0.18, "learning_rate": 1.879111369285119e-05, "loss": 0.6389, "step": 1685 }, { "epoch": 0.18, "learning_rate": 1.8789432636206197e-05, "loss": 0.7402, "step": 1686 }, { "epoch": 0.18, "learning_rate": 1.8787750486850557e-05, "loss": 0.8374, "step": 1687 }, { "epoch": 0.18, "learning_rate": 1.8786067244993397e-05, "loss": 0.8379, "step": 1688 }, { "epoch": 0.18, "learning_rate": 1.8784382910843978e-05, "loss": 0.8296, "step": 1689 }, { "epoch": 0.18, "learning_rate": 1.8782697484611697e-05, "loss": 0.7773, "step": 1690 }, { "epoch": 0.18, "learning_rate": 1.878101096650609e-05, "loss": 0.7815, "step": 1691 }, { "epoch": 0.18, "learning_rate": 1.8779323356736824e-05, "loss": 0.8599, "step": 1692 }, { "epoch": 0.18, "learning_rate": 1.8777634655513706e-05, "loss": 0.7078, "step": 1693 }, { "epoch": 0.18, "learning_rate": 1.8775944863046682e-05, "loss": 0.8496, "step": 1694 }, { "epoch": 0.18, "learning_rate": 1.877425397954582e-05, "loss": 0.8164, "step": 1695 }, { "epoch": 0.18, "learning_rate": 1.8772562005221338e-05, "loss": 0.8066, "step": 1696 }, { "epoch": 0.18, "learning_rate": 1.877086894028358e-05, "loss": 0.7009, "step": 1697 }, { "epoch": 0.18, "learning_rate": 1.8769174784943032e-05, "loss": 0.7808, "step": 1698 }, { "epoch": 0.18, "learning_rate": 1.8767479539410312e-05, "loss": 0.7502, "step": 1699 }, { "epoch": 0.19, "learning_rate": 1.8765783203896175e-05, "loss": 0.7822, "step": 1700 }, { "epoch": 0.19, "learning_rate": 1.8764085778611507e-05, "loss": 0.9258, "step": 1701 }, { "epoch": 0.19, "learning_rate": 1.8762387263767343e-05, "loss": 0.7461, "step": 1702 }, { "epoch": 0.19, "learning_rate": 1.8760687659574835e-05, "loss": 0.74, "step": 1703 }, { "epoch": 0.19, "learning_rate": 1.8758986966245282e-05, "loss": 0.6934, "step": 1704 }, { "epoch": 0.19, "learning_rate": 1.8757285183990118e-05, "loss": 0.6743, "step": 1705 }, { "epoch": 0.19, "learning_rate": 1.8755582313020912e-05, "loss": 0.8276, "step": 1706 }, { "epoch": 0.19, "learning_rate": 1.8753878353549357e-05, "loss": 0.593, "step": 1707 }, { "epoch": 0.19, "learning_rate": 1.87521733057873e-05, "loss": 0.7598, "step": 1708 }, { "epoch": 0.19, "learning_rate": 1.875046716994671e-05, "loss": 0.8398, "step": 1709 }, { "epoch": 0.19, "learning_rate": 1.87487599462397e-05, "loss": 0.8525, "step": 1710 }, { "epoch": 0.19, "learning_rate": 1.874705163487851e-05, "loss": 0.6919, "step": 1711 }, { "epoch": 0.19, "learning_rate": 1.874534223607552e-05, "loss": 0.9346, "step": 1712 }, { "epoch": 0.19, "learning_rate": 1.874363175004324e-05, "loss": 0.7175, "step": 1713 }, { "epoch": 0.19, "learning_rate": 1.8741920176994323e-05, "loss": 0.856, "step": 1714 }, { "epoch": 0.19, "learning_rate": 1.8740207517141553e-05, "loss": 0.7246, "step": 1715 }, { "epoch": 0.19, "learning_rate": 1.873849377069785e-05, "loss": 0.6296, "step": 1716 }, { "epoch": 0.19, "learning_rate": 1.873677893787627e-05, "loss": 0.7568, "step": 1717 }, { "epoch": 0.19, "learning_rate": 1.8735063018890002e-05, "loss": 0.8086, "step": 1718 }, { "epoch": 0.19, "learning_rate": 1.8733346013952362e-05, "loss": 0.7808, "step": 1719 }, { "epoch": 0.19, "learning_rate": 1.8731627923276825e-05, "loss": 0.7739, "step": 1720 }, { "epoch": 0.19, "learning_rate": 1.872990874707697e-05, "loss": 0.7498, "step": 1721 }, { "epoch": 0.19, "learning_rate": 1.8728188485566545e-05, "loss": 0.73, "step": 1722 }, { "epoch": 0.19, "learning_rate": 1.8726467138959398e-05, "loss": 0.9409, "step": 1723 }, { "epoch": 0.19, "learning_rate": 1.8724744707469535e-05, "loss": 0.8611, "step": 1724 }, { "epoch": 0.19, "learning_rate": 1.872302119131109e-05, "loss": 0.7764, "step": 1725 }, { "epoch": 0.19, "learning_rate": 1.872129659069833e-05, "loss": 0.7485, "step": 1726 }, { "epoch": 0.19, "learning_rate": 1.8719570905845664e-05, "loss": 0.8491, "step": 1727 }, { "epoch": 0.19, "learning_rate": 1.8717844136967626e-05, "loss": 0.687, "step": 1728 }, { "epoch": 0.19, "learning_rate": 1.8716116284278893e-05, "loss": 0.7788, "step": 1729 }, { "epoch": 0.19, "learning_rate": 1.8714387347994267e-05, "loss": 0.6826, "step": 1730 }, { "epoch": 0.19, "learning_rate": 1.87126573283287e-05, "loss": 0.8193, "step": 1731 }, { "epoch": 0.19, "learning_rate": 1.8710926225497266e-05, "loss": 0.7222, "step": 1732 }, { "epoch": 0.19, "learning_rate": 1.8709194039715173e-05, "loss": 0.6948, "step": 1733 }, { "epoch": 0.19, "learning_rate": 1.8707460771197773e-05, "loss": 0.6868, "step": 1734 }, { "epoch": 0.19, "learning_rate": 1.8705726420160547e-05, "loss": 0.748, "step": 1735 }, { "epoch": 0.19, "learning_rate": 1.870399098681911e-05, "loss": 0.748, "step": 1736 }, { "epoch": 0.19, "learning_rate": 1.8702254471389214e-05, "loss": 0.7678, "step": 1737 }, { "epoch": 0.19, "learning_rate": 1.870051687408674e-05, "loss": 0.7661, "step": 1738 }, { "epoch": 0.19, "learning_rate": 1.8698778195127715e-05, "loss": 0.6917, "step": 1739 }, { "epoch": 0.19, "learning_rate": 1.869703843472829e-05, "loss": 0.696, "step": 1740 }, { "epoch": 0.19, "learning_rate": 1.869529759310475e-05, "loss": 0.8071, "step": 1741 }, { "epoch": 0.19, "learning_rate": 1.869355567047352e-05, "loss": 0.7773, "step": 1742 }, { "epoch": 0.19, "learning_rate": 1.8691812667051164e-05, "loss": 0.7913, "step": 1743 }, { "epoch": 0.19, "learning_rate": 1.8690068583054365e-05, "loss": 0.7129, "step": 1744 }, { "epoch": 0.19, "learning_rate": 1.8688323418699954e-05, "loss": 0.7036, "step": 1745 }, { "epoch": 0.19, "learning_rate": 1.8686577174204887e-05, "loss": 0.8027, "step": 1746 }, { "epoch": 0.19, "learning_rate": 1.8684829849786266e-05, "loss": 0.7168, "step": 1747 }, { "epoch": 0.19, "learning_rate": 1.8683081445661312e-05, "loss": 0.6794, "step": 1748 }, { "epoch": 0.19, "learning_rate": 1.8681331962047396e-05, "loss": 0.7805, "step": 1749 }, { "epoch": 0.19, "learning_rate": 1.8679581399162008e-05, "loss": 0.7927, "step": 1750 }, { "epoch": 0.19, "learning_rate": 1.8677829757222788e-05, "loss": 0.7729, "step": 1751 }, { "epoch": 0.19, "learning_rate": 1.867607703644749e-05, "loss": 0.7803, "step": 1752 }, { "epoch": 0.19, "learning_rate": 1.8674323237054027e-05, "loss": 0.8354, "step": 1753 }, { "epoch": 0.19, "learning_rate": 1.867256835926043e-05, "loss": 0.7483, "step": 1754 }, { "epoch": 0.19, "learning_rate": 1.8670812403284858e-05, "loss": 0.7876, "step": 1755 }, { "epoch": 0.19, "learning_rate": 1.8669055369345617e-05, "loss": 0.7705, "step": 1756 }, { "epoch": 0.19, "learning_rate": 1.8667297257661153e-05, "loss": 0.8652, "step": 1757 }, { "epoch": 0.19, "learning_rate": 1.8665538068450023e-05, "loss": 0.7141, "step": 1758 }, { "epoch": 0.19, "learning_rate": 1.866377780193094e-05, "loss": 0.6892, "step": 1759 }, { "epoch": 0.19, "learning_rate": 1.8662016458322737e-05, "loss": 0.7339, "step": 1760 }, { "epoch": 0.19, "learning_rate": 1.866025403784439e-05, "loss": 0.7769, "step": 1761 }, { "epoch": 0.19, "learning_rate": 1.8658490540715e-05, "loss": 0.7178, "step": 1762 }, { "epoch": 0.19, "learning_rate": 1.865672596715381e-05, "loss": 0.8125, "step": 1763 }, { "epoch": 0.19, "learning_rate": 1.865496031738019e-05, "loss": 0.7537, "step": 1764 }, { "epoch": 0.19, "learning_rate": 1.8653193591613652e-05, "loss": 0.8174, "step": 1765 }, { "epoch": 0.19, "learning_rate": 1.865142579007383e-05, "loss": 0.7979, "step": 1766 }, { "epoch": 0.19, "learning_rate": 1.8649656912980508e-05, "loss": 0.7485, "step": 1767 }, { "epoch": 0.19, "learning_rate": 1.864788696055359e-05, "loss": 0.7725, "step": 1768 }, { "epoch": 0.19, "learning_rate": 1.864611593301312e-05, "loss": 0.7148, "step": 1769 }, { "epoch": 0.19, "learning_rate": 1.864434383057927e-05, "loss": 0.7573, "step": 1770 }, { "epoch": 0.19, "learning_rate": 1.864257065347235e-05, "loss": 0.7422, "step": 1771 }, { "epoch": 0.19, "learning_rate": 1.8640796401912805e-05, "loss": 0.7295, "step": 1772 }, { "epoch": 0.19, "learning_rate": 1.8639021076121214e-05, "loss": 0.8232, "step": 1773 }, { "epoch": 0.19, "learning_rate": 1.863724467631828e-05, "loss": 0.8223, "step": 1774 }, { "epoch": 0.19, "learning_rate": 1.8635467202724855e-05, "loss": 0.8042, "step": 1775 }, { "epoch": 0.19, "learning_rate": 1.863368865556191e-05, "loss": 0.7278, "step": 1776 }, { "epoch": 0.19, "learning_rate": 1.863190903505056e-05, "loss": 0.9062, "step": 1777 }, { "epoch": 0.19, "learning_rate": 1.8630128341412045e-05, "loss": 0.7258, "step": 1778 }, { "epoch": 0.19, "learning_rate": 1.8628346574867748e-05, "loss": 0.7783, "step": 1779 }, { "epoch": 0.19, "learning_rate": 1.862656373563917e-05, "loss": 0.7542, "step": 1780 }, { "epoch": 0.19, "learning_rate": 1.862477982394797e-05, "loss": 0.7095, "step": 1781 }, { "epoch": 0.19, "learning_rate": 1.862299484001591e-05, "loss": 0.9316, "step": 1782 }, { "epoch": 0.19, "learning_rate": 1.8621208784064913e-05, "loss": 0.6655, "step": 1783 }, { "epoch": 0.19, "learning_rate": 1.861942165631702e-05, "loss": 0.7759, "step": 1784 }, { "epoch": 0.19, "learning_rate": 1.86176334569944e-05, "loss": 0.7881, "step": 1785 }, { "epoch": 0.19, "learning_rate": 1.8615844186319377e-05, "loss": 0.7251, "step": 1786 }, { "epoch": 0.19, "learning_rate": 1.8614053844514386e-05, "loss": 0.7275, "step": 1787 }, { "epoch": 0.19, "learning_rate": 1.861226243180201e-05, "loss": 0.7856, "step": 1788 }, { "epoch": 0.19, "learning_rate": 1.861046994840495e-05, "loss": 0.6948, "step": 1789 }, { "epoch": 0.19, "learning_rate": 1.8608676394546058e-05, "loss": 0.7422, "step": 1790 }, { "epoch": 0.19, "learning_rate": 1.8606881770448305e-05, "loss": 0.6567, "step": 1791 }, { "epoch": 0.2, "learning_rate": 1.8605086076334803e-05, "loss": 0.7581, "step": 1792 }, { "epoch": 0.2, "learning_rate": 1.8603289312428792e-05, "loss": 0.79, "step": 1793 }, { "epoch": 0.2, "learning_rate": 1.860149147895366e-05, "loss": 0.7354, "step": 1794 }, { "epoch": 0.2, "learning_rate": 1.859969257613289e-05, "loss": 0.7224, "step": 1795 }, { "epoch": 0.2, "learning_rate": 1.8597892604190148e-05, "loss": 0.8088, "step": 1796 }, { "epoch": 0.2, "learning_rate": 1.859609156334919e-05, "loss": 0.6929, "step": 1797 }, { "epoch": 0.2, "learning_rate": 1.859428945383394e-05, "loss": 0.7458, "step": 1798 }, { "epoch": 0.2, "learning_rate": 1.8592486275868426e-05, "loss": 0.9131, "step": 1799 }, { "epoch": 0.2, "learning_rate": 1.8590682029676825e-05, "loss": 0.7581, "step": 1800 }, { "epoch": 0.2, "learning_rate": 1.858887671548344e-05, "loss": 0.7458, "step": 1801 }, { "epoch": 0.2, "learning_rate": 1.8587070333512713e-05, "loss": 0.8066, "step": 1802 }, { "epoch": 0.2, "learning_rate": 1.858526288398921e-05, "loss": 0.77, "step": 1803 }, { "epoch": 0.2, "learning_rate": 1.858345436713764e-05, "loss": 0.7549, "step": 1804 }, { "epoch": 0.2, "learning_rate": 1.8581644783182837e-05, "loss": 0.7178, "step": 1805 }, { "epoch": 0.2, "learning_rate": 1.8579834132349773e-05, "loss": 0.7422, "step": 1806 }, { "epoch": 0.2, "learning_rate": 1.8578022414863545e-05, "loss": 0.6636, "step": 1807 }, { "epoch": 0.2, "learning_rate": 1.8576209630949392e-05, "loss": 0.7556, "step": 1808 }, { "epoch": 0.2, "learning_rate": 1.857439578083268e-05, "loss": 0.8926, "step": 1809 }, { "epoch": 0.2, "learning_rate": 1.85725808647389e-05, "loss": 0.7585, "step": 1810 }, { "epoch": 0.2, "learning_rate": 1.85707648828937e-05, "loss": 0.8132, "step": 1811 }, { "epoch": 0.2, "learning_rate": 1.8568947835522836e-05, "loss": 0.7, "step": 1812 }, { "epoch": 0.2, "learning_rate": 1.8567129722852205e-05, "loss": 0.75, "step": 1813 }, { "epoch": 0.2, "learning_rate": 1.8565310545107834e-05, "loss": 0.7344, "step": 1814 }, { "epoch": 0.2, "learning_rate": 1.856349030251589e-05, "loss": 0.7891, "step": 1815 }, { "epoch": 0.2, "learning_rate": 1.8561668995302668e-05, "loss": 0.7886, "step": 1816 }, { "epoch": 0.2, "learning_rate": 1.8559846623694588e-05, "loss": 0.6606, "step": 1817 }, { "epoch": 0.2, "learning_rate": 1.8558023187918214e-05, "loss": 0.8994, "step": 1818 }, { "epoch": 0.2, "learning_rate": 1.8556198688200234e-05, "loss": 0.5271, "step": 1819 }, { "epoch": 0.2, "learning_rate": 1.8554373124767475e-05, "loss": 0.8359, "step": 1820 }, { "epoch": 0.2, "learning_rate": 1.8552546497846893e-05, "loss": 0.719, "step": 1821 }, { "epoch": 0.2, "learning_rate": 1.8550718807665574e-05, "loss": 0.7148, "step": 1822 }, { "epoch": 0.2, "learning_rate": 1.8548890054450738e-05, "loss": 0.7866, "step": 1823 }, { "epoch": 0.2, "learning_rate": 1.8547060238429737e-05, "loss": 0.7925, "step": 1824 }, { "epoch": 0.2, "learning_rate": 1.8545229359830058e-05, "loss": 0.7759, "step": 1825 }, { "epoch": 0.2, "learning_rate": 1.8543397418879315e-05, "loss": 0.7603, "step": 1826 }, { "epoch": 0.2, "learning_rate": 1.854156441580526e-05, "loss": 0.7891, "step": 1827 }, { "epoch": 0.2, "learning_rate": 1.8539730350835768e-05, "loss": 0.7515, "step": 1828 }, { "epoch": 0.2, "learning_rate": 1.8537895224198858e-05, "loss": 0.7686, "step": 1829 }, { "epoch": 0.2, "learning_rate": 1.853605903612267e-05, "loss": 0.686, "step": 1830 }, { "epoch": 0.2, "learning_rate": 1.8534221786835478e-05, "loss": 0.6951, "step": 1831 }, { "epoch": 0.2, "learning_rate": 1.8532383476565702e-05, "loss": 0.7939, "step": 1832 }, { "epoch": 0.2, "learning_rate": 1.8530544105541872e-05, "loss": 0.7312, "step": 1833 }, { "epoch": 0.2, "learning_rate": 1.8528703673992664e-05, "loss": 0.7437, "step": 1834 }, { "epoch": 0.2, "learning_rate": 1.8526862182146883e-05, "loss": 0.6936, "step": 1835 }, { "epoch": 0.2, "learning_rate": 1.8525019630233463e-05, "loss": 0.7766, "step": 1836 }, { "epoch": 0.2, "learning_rate": 1.8523176018481473e-05, "loss": 0.6584, "step": 1837 }, { "epoch": 0.2, "learning_rate": 1.8521331347120116e-05, "loss": 0.7861, "step": 1838 }, { "epoch": 0.2, "learning_rate": 1.8519485616378717e-05, "loss": 0.6609, "step": 1839 }, { "epoch": 0.2, "learning_rate": 1.8517638826486738e-05, "loss": 0.8042, "step": 1840 }, { "epoch": 0.2, "learning_rate": 1.8515790977673786e-05, "loss": 0.7144, "step": 1841 }, { "epoch": 0.2, "learning_rate": 1.8513942070169572e-05, "loss": 0.7383, "step": 1842 }, { "epoch": 0.2, "learning_rate": 1.851209210420396e-05, "loss": 0.75, "step": 1843 }, { "epoch": 0.2, "learning_rate": 1.8510241080006944e-05, "loss": 0.7883, "step": 1844 }, { "epoch": 0.2, "learning_rate": 1.8508388997808638e-05, "loss": 0.7661, "step": 1845 }, { "epoch": 0.2, "learning_rate": 1.8506535857839304e-05, "loss": 0.6909, "step": 1846 }, { "epoch": 0.2, "learning_rate": 1.8504681660329312e-05, "loss": 0.6987, "step": 1847 }, { "epoch": 0.2, "learning_rate": 1.850282640550919e-05, "loss": 0.7527, "step": 1848 }, { "epoch": 0.2, "learning_rate": 1.850097009360958e-05, "loss": 0.6882, "step": 1849 }, { "epoch": 0.2, "learning_rate": 1.8499112724861262e-05, "loss": 0.8008, "step": 1850 }, { "epoch": 0.2, "learning_rate": 1.8497254299495147e-05, "loss": 0.7856, "step": 1851 }, { "epoch": 0.2, "learning_rate": 1.849539481774227e-05, "loss": 0.7195, "step": 1852 }, { "epoch": 0.2, "learning_rate": 1.8493534279833812e-05, "loss": 0.8628, "step": 1853 }, { "epoch": 0.2, "learning_rate": 1.849167268600107e-05, "loss": 0.6648, "step": 1854 }, { "epoch": 0.2, "learning_rate": 1.848981003647548e-05, "loss": 0.8164, "step": 1855 }, { "epoch": 0.2, "learning_rate": 1.8487946331488613e-05, "loss": 0.7349, "step": 1856 }, { "epoch": 0.2, "learning_rate": 1.8486081571272163e-05, "loss": 0.877, "step": 1857 }, { "epoch": 0.2, "learning_rate": 1.8484215756057956e-05, "loss": 0.7319, "step": 1858 }, { "epoch": 0.2, "learning_rate": 1.848234888607796e-05, "loss": 0.6731, "step": 1859 }, { "epoch": 0.2, "learning_rate": 1.848048096156426e-05, "loss": 0.697, "step": 1860 }, { "epoch": 0.2, "learning_rate": 1.8478611982749082e-05, "loss": 0.7314, "step": 1861 }, { "epoch": 0.2, "learning_rate": 1.8476741949864774e-05, "loss": 0.7808, "step": 1862 }, { "epoch": 0.2, "learning_rate": 1.8474870863143822e-05, "loss": 0.8027, "step": 1863 }, { "epoch": 0.2, "learning_rate": 1.8472998722818847e-05, "loss": 0.7537, "step": 1864 }, { "epoch": 0.2, "learning_rate": 1.8471125529122585e-05, "loss": 0.8228, "step": 1865 }, { "epoch": 0.2, "learning_rate": 1.8469251282287925e-05, "loss": 0.8145, "step": 1866 }, { "epoch": 0.2, "learning_rate": 1.8467375982547865e-05, "loss": 0.7524, "step": 1867 }, { "epoch": 0.2, "learning_rate": 1.8465499630135547e-05, "loss": 0.729, "step": 1868 }, { "epoch": 0.2, "learning_rate": 1.8463622225284242e-05, "loss": 0.8379, "step": 1869 }, { "epoch": 0.2, "learning_rate": 1.8461743768227357e-05, "loss": 0.8408, "step": 1870 }, { "epoch": 0.2, "learning_rate": 1.845986425919841e-05, "loss": 0.7063, "step": 1871 }, { "epoch": 0.2, "learning_rate": 1.8457983698431078e-05, "loss": 0.7163, "step": 1872 }, { "epoch": 0.2, "learning_rate": 1.845610208615914e-05, "loss": 0.6206, "step": 1873 }, { "epoch": 0.2, "learning_rate": 1.845421942261653e-05, "loss": 0.6433, "step": 1874 }, { "epoch": 0.2, "learning_rate": 1.84523357080373e-05, "loss": 0.8074, "step": 1875 }, { "epoch": 0.2, "learning_rate": 1.845045094265563e-05, "loss": 0.7781, "step": 1876 }, { "epoch": 0.2, "learning_rate": 1.8448565126705845e-05, "loss": 0.8062, "step": 1877 }, { "epoch": 0.2, "learning_rate": 1.8446678260422388e-05, "loss": 0.8384, "step": 1878 }, { "epoch": 0.2, "learning_rate": 1.8444790344039825e-05, "loss": 0.6917, "step": 1879 }, { "epoch": 0.2, "learning_rate": 1.844290137779288e-05, "loss": 0.6951, "step": 1880 }, { "epoch": 0.2, "learning_rate": 1.8441011361916387e-05, "loss": 0.7874, "step": 1881 }, { "epoch": 0.2, "learning_rate": 1.843912029664531e-05, "loss": 0.7207, "step": 1882 }, { "epoch": 0.2, "learning_rate": 1.8437228182214748e-05, "loss": 0.79, "step": 1883 }, { "epoch": 0.21, "learning_rate": 1.8435335018859933e-05, "loss": 0.6702, "step": 1884 }, { "epoch": 0.21, "learning_rate": 1.8433440806816224e-05, "loss": 0.8062, "step": 1885 }, { "epoch": 0.21, "learning_rate": 1.843154554631911e-05, "loss": 0.855, "step": 1886 }, { "epoch": 0.21, "learning_rate": 1.8429649237604215e-05, "loss": 0.728, "step": 1887 }, { "epoch": 0.21, "learning_rate": 1.8427751880907288e-05, "loss": 0.7646, "step": 1888 }, { "epoch": 0.21, "learning_rate": 1.8425853476464212e-05, "loss": 0.792, "step": 1889 }, { "epoch": 0.21, "learning_rate": 1.8423954024510995e-05, "loss": 0.7004, "step": 1890 }, { "epoch": 0.21, "learning_rate": 1.842205352528378e-05, "loss": 0.7681, "step": 1891 }, { "epoch": 0.21, "learning_rate": 1.842015197901884e-05, "loss": 0.7246, "step": 1892 }, { "epoch": 0.21, "learning_rate": 1.8418249385952575e-05, "loss": 0.656, "step": 1893 }, { "epoch": 0.21, "learning_rate": 1.841634574632152e-05, "loss": 0.7871, "step": 1894 }, { "epoch": 0.21, "learning_rate": 1.8414441060362332e-05, "loss": 0.7905, "step": 1895 }, { "epoch": 0.21, "learning_rate": 1.8412535328311813e-05, "loss": 0.6892, "step": 1896 }, { "epoch": 0.21, "learning_rate": 1.8410628550406877e-05, "loss": 0.8154, "step": 1897 }, { "epoch": 0.21, "learning_rate": 1.8408720726884576e-05, "loss": 0.7993, "step": 1898 }, { "epoch": 0.21, "learning_rate": 1.84068118579821e-05, "loss": 0.7615, "step": 1899 }, { "epoch": 0.21, "learning_rate": 1.8404901943936755e-05, "loss": 0.8501, "step": 1900 }, { "epoch": 0.21, "learning_rate": 1.8402990984985987e-05, "loss": 0.7271, "step": 1901 }, { "epoch": 0.21, "learning_rate": 1.8401078981367364e-05, "loss": 0.8555, "step": 1902 }, { "epoch": 0.21, "learning_rate": 1.839916593331859e-05, "loss": 0.8032, "step": 1903 }, { "epoch": 0.21, "learning_rate": 1.83972518410775e-05, "loss": 0.656, "step": 1904 }, { "epoch": 0.21, "learning_rate": 1.839533670488205e-05, "loss": 0.7534, "step": 1905 }, { "epoch": 0.21, "learning_rate": 1.8393420524970337e-05, "loss": 0.7817, "step": 1906 }, { "epoch": 0.21, "learning_rate": 1.839150330158058e-05, "loss": 0.7188, "step": 1907 }, { "epoch": 0.21, "learning_rate": 1.838958503495113e-05, "loss": 0.791, "step": 1908 }, { "epoch": 0.21, "learning_rate": 1.8387665725320467e-05, "loss": 0.7852, "step": 1909 }, { "epoch": 0.21, "learning_rate": 1.8385745372927203e-05, "loss": 0.7456, "step": 1910 }, { "epoch": 0.21, "learning_rate": 1.8383823978010077e-05, "loss": 0.6984, "step": 1911 }, { "epoch": 0.21, "learning_rate": 1.838190154080796e-05, "loss": 0.7473, "step": 1912 }, { "epoch": 0.21, "learning_rate": 1.8379978061559847e-05, "loss": 0.7092, "step": 1913 }, { "epoch": 0.21, "learning_rate": 1.8378053540504874e-05, "loss": 0.7329, "step": 1914 }, { "epoch": 0.21, "learning_rate": 1.8376127977882294e-05, "loss": 0.7048, "step": 1915 }, { "epoch": 0.21, "learning_rate": 1.8374201373931497e-05, "loss": 0.7495, "step": 1916 }, { "epoch": 0.21, "learning_rate": 1.8372273728891997e-05, "loss": 0.7449, "step": 1917 }, { "epoch": 0.21, "learning_rate": 1.8370345043003445e-05, "loss": 0.6904, "step": 1918 }, { "epoch": 0.21, "learning_rate": 1.8368415316505614e-05, "loss": 0.646, "step": 1919 }, { "epoch": 0.21, "learning_rate": 1.836648454963841e-05, "loss": 0.7754, "step": 1920 }, { "epoch": 0.21, "learning_rate": 1.836455274264187e-05, "loss": 0.7563, "step": 1921 }, { "epoch": 0.21, "learning_rate": 1.8362619895756154e-05, "loss": 0.8062, "step": 1922 }, { "epoch": 0.21, "learning_rate": 1.836068600922156e-05, "loss": 0.6909, "step": 1923 }, { "epoch": 0.21, "learning_rate": 1.8358751083278508e-05, "loss": 0.7336, "step": 1924 }, { "epoch": 0.21, "learning_rate": 1.8356815118167552e-05, "loss": 0.7002, "step": 1925 }, { "epoch": 0.21, "learning_rate": 1.8354878114129368e-05, "loss": 0.7817, "step": 1926 }, { "epoch": 0.21, "learning_rate": 1.8352940071404767e-05, "loss": 0.8188, "step": 1927 }, { "epoch": 0.21, "learning_rate": 1.8351000990234696e-05, "loss": 0.7329, "step": 1928 }, { "epoch": 0.21, "learning_rate": 1.8349060870860215e-05, "loss": 0.7268, "step": 1929 }, { "epoch": 0.21, "learning_rate": 1.8347119713522524e-05, "loss": 0.6953, "step": 1930 }, { "epoch": 0.21, "learning_rate": 1.8345177518462954e-05, "loss": 0.6868, "step": 1931 }, { "epoch": 0.21, "learning_rate": 1.8343234285922955e-05, "loss": 0.5742, "step": 1932 }, { "epoch": 0.21, "learning_rate": 1.8341290016144112e-05, "loss": 0.7598, "step": 1933 }, { "epoch": 0.21, "learning_rate": 1.8339344709368138e-05, "loss": 0.6625, "step": 1934 }, { "epoch": 0.21, "learning_rate": 1.8337398365836884e-05, "loss": 0.7847, "step": 1935 }, { "epoch": 0.21, "learning_rate": 1.8335450985792307e-05, "loss": 0.793, "step": 1936 }, { "epoch": 0.21, "learning_rate": 1.8333502569476516e-05, "loss": 0.7671, "step": 1937 }, { "epoch": 0.21, "learning_rate": 1.833155311713174e-05, "loss": 0.6797, "step": 1938 }, { "epoch": 0.21, "learning_rate": 1.8329602629000334e-05, "loss": 0.7336, "step": 1939 }, { "epoch": 0.21, "learning_rate": 1.832765110532479e-05, "loss": 0.7083, "step": 1940 }, { "epoch": 0.21, "learning_rate": 1.8325698546347714e-05, "loss": 0.646, "step": 1941 }, { "epoch": 0.21, "learning_rate": 1.8323744952311857e-05, "loss": 0.8101, "step": 1942 }, { "epoch": 0.21, "learning_rate": 1.832179032346009e-05, "loss": 0.7393, "step": 1943 }, { "epoch": 0.21, "learning_rate": 1.8319834660035415e-05, "loss": 0.644, "step": 1944 }, { "epoch": 0.21, "learning_rate": 1.8317877962280958e-05, "loss": 0.6951, "step": 1945 }, { "epoch": 0.21, "learning_rate": 1.8315920230439985e-05, "loss": 0.7361, "step": 1946 }, { "epoch": 0.21, "learning_rate": 1.8313961464755876e-05, "loss": 0.6277, "step": 1947 }, { "epoch": 0.21, "learning_rate": 1.8312001665472146e-05, "loss": 0.812, "step": 1948 }, { "epoch": 0.21, "learning_rate": 1.831004083283245e-05, "loss": 0.7495, "step": 1949 }, { "epoch": 0.21, "learning_rate": 1.8308078967080547e-05, "loss": 0.6672, "step": 1950 }, { "epoch": 0.21, "learning_rate": 1.8306116068460348e-05, "loss": 0.751, "step": 1951 }, { "epoch": 0.21, "learning_rate": 1.8304152137215877e-05, "loss": 0.7915, "step": 1952 }, { "epoch": 0.21, "learning_rate": 1.830218717359129e-05, "loss": 0.741, "step": 1953 }, { "epoch": 0.21, "learning_rate": 1.830022117783088e-05, "loss": 0.812, "step": 1954 }, { "epoch": 0.21, "learning_rate": 1.8298254150179055e-05, "loss": 0.7769, "step": 1955 }, { "epoch": 0.21, "learning_rate": 1.8296286090880362e-05, "loss": 0.8296, "step": 1956 }, { "epoch": 0.21, "learning_rate": 1.829431700017947e-05, "loss": 0.793, "step": 1957 }, { "epoch": 0.21, "learning_rate": 1.8292346878321182e-05, "loss": 0.7351, "step": 1958 }, { "epoch": 0.21, "learning_rate": 1.8290375725550417e-05, "loss": 0.8677, "step": 1959 }, { "epoch": 0.21, "learning_rate": 1.828840354211224e-05, "loss": 0.7402, "step": 1960 }, { "epoch": 0.21, "learning_rate": 1.828643032825183e-05, "loss": 0.7458, "step": 1961 }, { "epoch": 0.21, "learning_rate": 1.8284456084214496e-05, "loss": 0.894, "step": 1962 }, { "epoch": 0.21, "learning_rate": 1.8282480810245685e-05, "loss": 0.8159, "step": 1963 }, { "epoch": 0.21, "learning_rate": 1.828050450659096e-05, "loss": 0.6538, "step": 1964 }, { "epoch": 0.21, "learning_rate": 1.8278527173496022e-05, "loss": 0.7031, "step": 1965 }, { "epoch": 0.21, "learning_rate": 1.8276548811206684e-05, "loss": 0.7866, "step": 1966 }, { "epoch": 0.21, "learning_rate": 1.827456941996891e-05, "loss": 0.7661, "step": 1967 }, { "epoch": 0.21, "learning_rate": 1.8272589000028774e-05, "loss": 0.7109, "step": 1968 }, { "epoch": 0.21, "learning_rate": 1.8270607551632484e-05, "loss": 0.9341, "step": 1969 }, { "epoch": 0.21, "learning_rate": 1.8268625075026375e-05, "loss": 0.8359, "step": 1970 }, { "epoch": 0.21, "learning_rate": 1.8266641570456915e-05, "loss": 0.8169, "step": 1971 }, { "epoch": 0.21, "learning_rate": 1.8264657038170686e-05, "loss": 0.7466, "step": 1972 }, { "epoch": 0.21, "learning_rate": 1.8262671478414415e-05, "loss": 0.7212, "step": 1973 }, { "epoch": 0.21, "learning_rate": 1.826068489143495e-05, "loss": 0.7075, "step": 1974 }, { "epoch": 0.22, "learning_rate": 1.825869727747926e-05, "loss": 0.709, "step": 1975 }, { "epoch": 0.22, "learning_rate": 1.8256708636794446e-05, "loss": 0.7756, "step": 1976 }, { "epoch": 0.22, "learning_rate": 1.825471896962774e-05, "loss": 0.7952, "step": 1977 }, { "epoch": 0.22, "learning_rate": 1.8252728276226503e-05, "loss": 0.5884, "step": 1978 }, { "epoch": 0.22, "learning_rate": 1.8250736556838212e-05, "loss": 0.793, "step": 1979 }, { "epoch": 0.22, "learning_rate": 1.824874381171049e-05, "loss": 0.7451, "step": 1980 }, { "epoch": 0.22, "learning_rate": 1.824675004109107e-05, "loss": 0.7969, "step": 1981 }, { "epoch": 0.22, "learning_rate": 1.8244755245227818e-05, "loss": 0.7098, "step": 1982 }, { "epoch": 0.22, "learning_rate": 1.8242759424368733e-05, "loss": 0.7441, "step": 1983 }, { "epoch": 0.22, "learning_rate": 1.8240762578761935e-05, "loss": 0.7256, "step": 1984 }, { "epoch": 0.22, "learning_rate": 1.8238764708655676e-05, "loss": 0.7488, "step": 1985 }, { "epoch": 0.22, "learning_rate": 1.8236765814298328e-05, "loss": 0.7783, "step": 1986 }, { "epoch": 0.22, "learning_rate": 1.8234765895938405e-05, "loss": 0.7275, "step": 1987 }, { "epoch": 0.22, "learning_rate": 1.8232764953824528e-05, "loss": 0.8389, "step": 1988 }, { "epoch": 0.22, "learning_rate": 1.8230762988205463e-05, "loss": 0.7051, "step": 1989 }, { "epoch": 0.22, "learning_rate": 1.8228759999330093e-05, "loss": 0.6853, "step": 1990 }, { "epoch": 0.22, "learning_rate": 1.8226755987447432e-05, "loss": 0.7627, "step": 1991 }, { "epoch": 0.22, "learning_rate": 1.8224750952806626e-05, "loss": 0.7502, "step": 1992 }, { "epoch": 0.22, "learning_rate": 1.8222744895656932e-05, "loss": 0.7344, "step": 1993 }, { "epoch": 0.22, "learning_rate": 1.8220737816247756e-05, "loss": 0.8022, "step": 1994 }, { "epoch": 0.22, "learning_rate": 1.8218729714828612e-05, "loss": 0.7366, "step": 1995 }, { "epoch": 0.22, "learning_rate": 1.8216720591649152e-05, "loss": 0.896, "step": 1996 }, { "epoch": 0.22, "learning_rate": 1.8214710446959155e-05, "loss": 0.771, "step": 1997 }, { "epoch": 0.22, "learning_rate": 1.821269928100852e-05, "loss": 0.894, "step": 1998 }, { "epoch": 0.22, "learning_rate": 1.821068709404728e-05, "loss": 0.7756, "step": 1999 }, { "epoch": 0.22, "learning_rate": 1.820867388632559e-05, "loss": 0.8628, "step": 2000 }, { "epoch": 0.22, "learning_rate": 1.820665965809373e-05, "loss": 0.7942, "step": 2001 }, { "epoch": 0.22, "learning_rate": 1.8204644409602123e-05, "loss": 0.7424, "step": 2002 }, { "epoch": 0.22, "learning_rate": 1.8202628141101294e-05, "loss": 0.7104, "step": 2003 }, { "epoch": 0.22, "learning_rate": 1.8200610852841913e-05, "loss": 0.8242, "step": 2004 }, { "epoch": 0.22, "learning_rate": 1.8198592545074772e-05, "loss": 0.7124, "step": 2005 }, { "epoch": 0.22, "learning_rate": 1.8196573218050784e-05, "loss": 0.6992, "step": 2006 }, { "epoch": 0.22, "learning_rate": 1.8194552872020997e-05, "loss": 0.769, "step": 2007 }, { "epoch": 0.22, "learning_rate": 1.8192531507236587e-05, "loss": 0.6506, "step": 2008 }, { "epoch": 0.22, "learning_rate": 1.8190509123948845e-05, "loss": 0.7734, "step": 2009 }, { "epoch": 0.22, "learning_rate": 1.8188485722409196e-05, "loss": 0.8564, "step": 2010 }, { "epoch": 0.22, "learning_rate": 1.8186461302869193e-05, "loss": 0.75, "step": 2011 }, { "epoch": 0.22, "learning_rate": 1.818443586558052e-05, "loss": 0.7896, "step": 2012 }, { "epoch": 0.22, "learning_rate": 1.818240941079497e-05, "loss": 0.6013, "step": 2013 }, { "epoch": 0.22, "learning_rate": 1.818038193876448e-05, "loss": 0.8176, "step": 2014 }, { "epoch": 0.22, "learning_rate": 1.8178353449741105e-05, "loss": 0.7617, "step": 2015 }, { "epoch": 0.22, "learning_rate": 1.8176323943977034e-05, "loss": 0.6555, "step": 2016 }, { "epoch": 0.22, "learning_rate": 1.817429342172457e-05, "loss": 0.7896, "step": 2017 }, { "epoch": 0.22, "learning_rate": 1.817226188323615e-05, "loss": 0.7651, "step": 2018 }, { "epoch": 0.22, "learning_rate": 1.8170229328764343e-05, "loss": 0.8281, "step": 2019 }, { "epoch": 0.22, "learning_rate": 1.8168195758561836e-05, "loss": 0.5972, "step": 2020 }, { "epoch": 0.22, "learning_rate": 1.816616117288144e-05, "loss": 0.7974, "step": 2021 }, { "epoch": 0.22, "learning_rate": 1.81641255719761e-05, "loss": 0.801, "step": 2022 }, { "epoch": 0.22, "learning_rate": 1.8162088956098882e-05, "loss": 0.7419, "step": 2023 }, { "epoch": 0.22, "learning_rate": 1.8160051325502983e-05, "loss": 0.7014, "step": 2024 }, { "epoch": 0.22, "learning_rate": 1.8158012680441723e-05, "loss": 0.7153, "step": 2025 }, { "epoch": 0.22, "learning_rate": 1.8155973021168546e-05, "loss": 0.8315, "step": 2026 }, { "epoch": 0.22, "learning_rate": 1.815393234793702e-05, "loss": 0.814, "step": 2027 }, { "epoch": 0.22, "learning_rate": 1.8151890661000857e-05, "loss": 0.7612, "step": 2028 }, { "epoch": 0.22, "learning_rate": 1.8149847960613867e-05, "loss": 0.6824, "step": 2029 }, { "epoch": 0.22, "learning_rate": 1.814780424703001e-05, "loss": 0.781, "step": 2030 }, { "epoch": 0.22, "learning_rate": 1.814575952050336e-05, "loss": 0.731, "step": 2031 }, { "epoch": 0.22, "learning_rate": 1.8143713781288116e-05, "loss": 0.7952, "step": 2032 }, { "epoch": 0.22, "learning_rate": 1.8141667029638607e-05, "loss": 0.8169, "step": 2033 }, { "epoch": 0.22, "learning_rate": 1.8139619265809293e-05, "loss": 0.7451, "step": 2034 }, { "epoch": 0.22, "learning_rate": 1.813757049005475e-05, "loss": 0.7358, "step": 2035 }, { "epoch": 0.22, "learning_rate": 1.8135520702629677e-05, "loss": 0.759, "step": 2036 }, { "epoch": 0.22, "learning_rate": 1.8133469903788915e-05, "loss": 0.6973, "step": 2037 }, { "epoch": 0.22, "learning_rate": 1.813141809378742e-05, "loss": 0.7939, "step": 2038 }, { "epoch": 0.22, "learning_rate": 1.8129365272880274e-05, "loss": 0.6921, "step": 2039 }, { "epoch": 0.22, "learning_rate": 1.812731144132268e-05, "loss": 0.6694, "step": 2040 }, { "epoch": 0.22, "learning_rate": 1.8125256599369984e-05, "loss": 0.8562, "step": 2041 }, { "epoch": 0.22, "learning_rate": 1.8123200747277633e-05, "loss": 0.6895, "step": 2042 }, { "epoch": 0.22, "learning_rate": 1.812114388530122e-05, "loss": 0.8218, "step": 2043 }, { "epoch": 0.22, "learning_rate": 1.8119086013696457e-05, "loss": 0.7891, "step": 2044 }, { "epoch": 0.22, "learning_rate": 1.8117027132719177e-05, "loss": 0.7969, "step": 2045 }, { "epoch": 0.22, "learning_rate": 1.8114967242625342e-05, "loss": 0.7119, "step": 2046 }, { "epoch": 0.22, "learning_rate": 1.8112906343671045e-05, "loss": 0.7827, "step": 2047 }, { "epoch": 0.22, "learning_rate": 1.811084443611249e-05, "loss": 0.6611, "step": 2048 }, { "epoch": 0.22, "learning_rate": 1.810878152020602e-05, "loss": 0.658, "step": 2049 }, { "epoch": 0.22, "learning_rate": 1.81067175962081e-05, "loss": 0.7063, "step": 2050 }, { "epoch": 0.22, "learning_rate": 1.810465266437532e-05, "loss": 0.7549, "step": 2051 }, { "epoch": 0.22, "learning_rate": 1.8102586724964387e-05, "loss": 0.6855, "step": 2052 }, { "epoch": 0.22, "learning_rate": 1.810051977823215e-05, "loss": 0.7241, "step": 2053 }, { "epoch": 0.22, "learning_rate": 1.8098451824435564e-05, "loss": 0.6809, "step": 2054 }, { "epoch": 0.22, "learning_rate": 1.809638286383173e-05, "loss": 0.6815, "step": 2055 }, { "epoch": 0.22, "learning_rate": 1.8094312896677853e-05, "loss": 0.7561, "step": 2056 }, { "epoch": 0.22, "learning_rate": 1.809224192323128e-05, "loss": 0.7051, "step": 2057 }, { "epoch": 0.22, "learning_rate": 1.8090169943749477e-05, "loss": 0.8186, "step": 2058 }, { "epoch": 0.22, "learning_rate": 1.8088096958490028e-05, "loss": 0.7227, "step": 2059 }, { "epoch": 0.22, "learning_rate": 1.8086022967710652e-05, "loss": 0.7913, "step": 2060 }, { "epoch": 0.22, "learning_rate": 1.808394797166919e-05, "loss": 0.7969, "step": 2061 }, { "epoch": 0.22, "learning_rate": 1.8081871970623607e-05, "loss": 0.752, "step": 2062 }, { "epoch": 0.22, "learning_rate": 1.8079794964831994e-05, "loss": 0.5911, "step": 2063 }, { "epoch": 0.22, "learning_rate": 1.8077716954552564e-05, "loss": 0.7935, "step": 2064 }, { "epoch": 0.22, "learning_rate": 1.807563794004366e-05, "loss": 0.7036, "step": 2065 }, { "epoch": 0.22, "learning_rate": 1.8073557921563747e-05, "loss": 0.6953, "step": 2066 }, { "epoch": 0.23, "learning_rate": 1.8071476899371414e-05, "loss": 0.7749, "step": 2067 }, { "epoch": 0.23, "learning_rate": 1.8069394873725375e-05, "loss": 0.7012, "step": 2068 }, { "epoch": 0.23, "learning_rate": 1.806731184488447e-05, "loss": 0.7715, "step": 2069 }, { "epoch": 0.23, "learning_rate": 1.8065227813107667e-05, "loss": 0.751, "step": 2070 }, { "epoch": 0.23, "learning_rate": 1.8063142778654046e-05, "loss": 0.812, "step": 2071 }, { "epoch": 0.23, "learning_rate": 1.8061056741782827e-05, "loss": 0.8, "step": 2072 }, { "epoch": 0.23, "learning_rate": 1.8058969702753346e-05, "loss": 0.6409, "step": 2073 }, { "epoch": 0.23, "learning_rate": 1.805688166182507e-05, "loss": 0.7454, "step": 2074 }, { "epoch": 0.23, "learning_rate": 1.805479261925758e-05, "loss": 0.7832, "step": 2075 }, { "epoch": 0.23, "learning_rate": 1.8052702575310588e-05, "loss": 0.6575, "step": 2076 }, { "epoch": 0.23, "learning_rate": 1.8050611530243936e-05, "loss": 0.7329, "step": 2077 }, { "epoch": 0.23, "learning_rate": 1.804851948431758e-05, "loss": 0.7681, "step": 2078 }, { "epoch": 0.23, "learning_rate": 1.8046426437791603e-05, "loss": 0.7742, "step": 2079 }, { "epoch": 0.23, "learning_rate": 1.8044332390926224e-05, "loss": 0.8496, "step": 2080 }, { "epoch": 0.23, "learning_rate": 1.8042237343981767e-05, "loss": 0.7332, "step": 2081 }, { "epoch": 0.23, "learning_rate": 1.8040141297218693e-05, "loss": 0.8721, "step": 2082 }, { "epoch": 0.23, "learning_rate": 1.803804425089759e-05, "loss": 0.8325, "step": 2083 }, { "epoch": 0.23, "learning_rate": 1.8035946205279157e-05, "loss": 0.7576, "step": 2084 }, { "epoch": 0.23, "learning_rate": 1.803384716062423e-05, "loss": 0.7783, "step": 2085 }, { "epoch": 0.23, "learning_rate": 1.803174711719376e-05, "loss": 0.7573, "step": 2086 }, { "epoch": 0.23, "learning_rate": 1.802964607524883e-05, "loss": 0.8862, "step": 2087 }, { "epoch": 0.23, "learning_rate": 1.8027544035050647e-05, "loss": 0.8315, "step": 2088 }, { "epoch": 0.23, "learning_rate": 1.802544099686053e-05, "loss": 0.8467, "step": 2089 }, { "epoch": 0.23, "learning_rate": 1.8023336960939938e-05, "loss": 0.8789, "step": 2090 }, { "epoch": 0.23, "learning_rate": 1.802123192755044e-05, "loss": 0.8623, "step": 2091 }, { "epoch": 0.23, "learning_rate": 1.8019125896953742e-05, "loss": 0.7358, "step": 2092 }, { "epoch": 0.23, "learning_rate": 1.8017018869411666e-05, "loss": 0.7395, "step": 2093 }, { "epoch": 0.23, "learning_rate": 1.8014910845186154e-05, "loss": 0.7759, "step": 2094 }, { "epoch": 0.23, "learning_rate": 1.8012801824539287e-05, "loss": 0.8088, "step": 2095 }, { "epoch": 0.23, "learning_rate": 1.8010691807733253e-05, "loss": 0.6467, "step": 2096 }, { "epoch": 0.23, "learning_rate": 1.8008580795030377e-05, "loss": 0.7043, "step": 2097 }, { "epoch": 0.23, "learning_rate": 1.80064687866931e-05, "loss": 0.6309, "step": 2098 }, { "epoch": 0.23, "learning_rate": 1.8004355782983985e-05, "loss": 0.7024, "step": 2099 }, { "epoch": 0.23, "learning_rate": 1.800224178416573e-05, "loss": 0.7905, "step": 2100 }, { "epoch": 0.23, "learning_rate": 1.800012679050114e-05, "loss": 0.811, "step": 2101 }, { "epoch": 0.23, "learning_rate": 1.799801080225316e-05, "loss": 0.6909, "step": 2102 }, { "epoch": 0.23, "learning_rate": 1.799589381968485e-05, "loss": 0.8313, "step": 2103 }, { "epoch": 0.23, "learning_rate": 1.7993775843059396e-05, "loss": 0.7734, "step": 2104 }, { "epoch": 0.23, "learning_rate": 1.7991656872640107e-05, "loss": 0.6655, "step": 2105 }, { "epoch": 0.23, "learning_rate": 1.7989536908690413e-05, "loss": 0.7373, "step": 2106 }, { "epoch": 0.23, "learning_rate": 1.7987415951473872e-05, "loss": 0.8413, "step": 2107 }, { "epoch": 0.23, "learning_rate": 1.7985294001254163e-05, "loss": 0.6602, "step": 2108 }, { "epoch": 0.23, "learning_rate": 1.798317105829509e-05, "loss": 0.8032, "step": 2109 }, { "epoch": 0.23, "learning_rate": 1.798104712286058e-05, "loss": 0.7539, "step": 2110 }, { "epoch": 0.23, "learning_rate": 1.7978922195214675e-05, "loss": 0.7473, "step": 2111 }, { "epoch": 0.23, "learning_rate": 1.7976796275621556e-05, "loss": 0.8118, "step": 2112 }, { "epoch": 0.23, "learning_rate": 1.7974669364345518e-05, "loss": 0.6624, "step": 2113 }, { "epoch": 0.23, "learning_rate": 1.7972541461650978e-05, "loss": 0.7639, "step": 2114 }, { "epoch": 0.23, "learning_rate": 1.797041256780248e-05, "loss": 0.7061, "step": 2115 }, { "epoch": 0.23, "learning_rate": 1.796828268306469e-05, "loss": 0.801, "step": 2116 }, { "epoch": 0.23, "learning_rate": 1.7966151807702402e-05, "loss": 0.7412, "step": 2117 }, { "epoch": 0.23, "learning_rate": 1.7964019941980524e-05, "loss": 0.8159, "step": 2118 }, { "epoch": 0.23, "learning_rate": 1.796188708616409e-05, "loss": 0.7617, "step": 2119 }, { "epoch": 0.23, "learning_rate": 1.7959753240518263e-05, "loss": 0.689, "step": 2120 }, { "epoch": 0.23, "learning_rate": 1.7957618405308323e-05, "loss": 0.6985, "step": 2121 }, { "epoch": 0.23, "learning_rate": 1.7955482580799672e-05, "loss": 0.7007, "step": 2122 }, { "epoch": 0.23, "learning_rate": 1.7953345767257842e-05, "loss": 0.7173, "step": 2123 }, { "epoch": 0.23, "learning_rate": 1.795120796494848e-05, "loss": 0.6917, "step": 2124 }, { "epoch": 0.23, "learning_rate": 1.794906917413736e-05, "loss": 0.7627, "step": 2125 }, { "epoch": 0.23, "learning_rate": 1.7946929395090382e-05, "loss": 0.7095, "step": 2126 }, { "epoch": 0.23, "learning_rate": 1.794478862807356e-05, "loss": 0.8081, "step": 2127 }, { "epoch": 0.23, "learning_rate": 1.7942646873353045e-05, "loss": 0.7759, "step": 2128 }, { "epoch": 0.23, "learning_rate": 1.7940504131195093e-05, "loss": 0.7659, "step": 2129 }, { "epoch": 0.23, "learning_rate": 1.7938360401866096e-05, "loss": 0.7832, "step": 2130 }, { "epoch": 0.23, "learning_rate": 1.793621568563256e-05, "loss": 0.7202, "step": 2131 }, { "epoch": 0.23, "learning_rate": 1.7934069982761127e-05, "loss": 0.8384, "step": 2132 }, { "epoch": 0.23, "learning_rate": 1.7931923293518546e-05, "loss": 0.8398, "step": 2133 }, { "epoch": 0.23, "learning_rate": 1.7929775618171693e-05, "loss": 0.6636, "step": 2134 }, { "epoch": 0.23, "learning_rate": 1.7927626956987577e-05, "loss": 0.7734, "step": 2135 }, { "epoch": 0.23, "learning_rate": 1.792547731023332e-05, "loss": 0.7808, "step": 2136 }, { "epoch": 0.23, "learning_rate": 1.792332667817616e-05, "loss": 0.7759, "step": 2137 }, { "epoch": 0.23, "learning_rate": 1.7921175061083475e-05, "loss": 0.7671, "step": 2138 }, { "epoch": 0.23, "learning_rate": 1.7919022459222754e-05, "loss": 0.626, "step": 2139 }, { "epoch": 0.23, "learning_rate": 1.7916868872861605e-05, "loss": 0.7583, "step": 2140 }, { "epoch": 0.23, "learning_rate": 1.791471430226777e-05, "loss": 0.7754, "step": 2141 }, { "epoch": 0.23, "learning_rate": 1.7912558747709105e-05, "loss": 0.7607, "step": 2142 }, { "epoch": 0.23, "learning_rate": 1.791040220945359e-05, "loss": 0.7686, "step": 2143 }, { "epoch": 0.23, "learning_rate": 1.7908244687769333e-05, "loss": 0.811, "step": 2144 }, { "epoch": 0.23, "learning_rate": 1.790608618292455e-05, "loss": 0.8892, "step": 2145 }, { "epoch": 0.23, "learning_rate": 1.7903926695187595e-05, "loss": 0.8416, "step": 2146 }, { "epoch": 0.23, "learning_rate": 1.7901766224826934e-05, "loss": 0.6255, "step": 2147 }, { "epoch": 0.23, "learning_rate": 1.7899604772111163e-05, "loss": 0.7437, "step": 2148 }, { "epoch": 0.23, "learning_rate": 1.7897442337308995e-05, "loss": 0.7666, "step": 2149 }, { "epoch": 0.23, "learning_rate": 1.789527892068926e-05, "loss": 0.8066, "step": 2150 }, { "epoch": 0.23, "learning_rate": 1.789311452252092e-05, "loss": 0.7505, "step": 2151 }, { "epoch": 0.23, "learning_rate": 1.789094914307306e-05, "loss": 0.7524, "step": 2152 }, { "epoch": 0.23, "learning_rate": 1.7888782782614877e-05, "loss": 0.7539, "step": 2153 }, { "epoch": 0.23, "learning_rate": 1.7886615441415693e-05, "loss": 0.7437, "step": 2154 }, { "epoch": 0.23, "learning_rate": 1.7884447119744956e-05, "loss": 0.7349, "step": 2155 }, { "epoch": 0.23, "learning_rate": 1.7882277817872236e-05, "loss": 0.6611, "step": 2156 }, { "epoch": 0.23, "learning_rate": 1.788010753606722e-05, "loss": 0.7441, "step": 2157 }, { "epoch": 0.23, "learning_rate": 1.7877936274599722e-05, "loss": 0.7859, "step": 2158 }, { "epoch": 0.24, "learning_rate": 1.7875764033739674e-05, "loss": 0.8679, "step": 2159 }, { "epoch": 0.24, "learning_rate": 1.787359081375713e-05, "loss": 0.748, "step": 2160 }, { "epoch": 0.24, "learning_rate": 1.7871416614922267e-05, "loss": 0.5427, "step": 2161 }, { "epoch": 0.24, "learning_rate": 1.7869241437505382e-05, "loss": 0.8306, "step": 2162 }, { "epoch": 0.24, "learning_rate": 1.78670652817769e-05, "loss": 0.7627, "step": 2163 }, { "epoch": 0.24, "learning_rate": 1.786488814800736e-05, "loss": 0.7686, "step": 2164 }, { "epoch": 0.24, "learning_rate": 1.7862710036467423e-05, "loss": 0.7751, "step": 2165 }, { "epoch": 0.24, "learning_rate": 1.7860530947427878e-05, "loss": 0.6113, "step": 2166 }, { "epoch": 0.24, "learning_rate": 1.785835088115963e-05, "loss": 0.7607, "step": 2167 }, { "epoch": 0.24, "learning_rate": 1.78561698379337e-05, "loss": 0.7505, "step": 2168 }, { "epoch": 0.24, "learning_rate": 1.7853987818021252e-05, "loss": 0.7775, "step": 2169 }, { "epoch": 0.24, "learning_rate": 1.785180482169355e-05, "loss": 0.9458, "step": 2170 }, { "epoch": 0.24, "learning_rate": 1.7849620849221976e-05, "loss": 0.7629, "step": 2171 }, { "epoch": 0.24, "learning_rate": 1.784743590087806e-05, "loss": 0.8726, "step": 2172 }, { "epoch": 0.24, "learning_rate": 1.7845249976933426e-05, "loss": 0.8379, "step": 2173 }, { "epoch": 0.24, "learning_rate": 1.7843063077659834e-05, "loss": 0.7288, "step": 2174 }, { "epoch": 0.24, "learning_rate": 1.784087520332916e-05, "loss": 0.6323, "step": 2175 }, { "epoch": 0.24, "learning_rate": 1.78386863542134e-05, "loss": 0.7803, "step": 2176 }, { "epoch": 0.24, "learning_rate": 1.7836496530584684e-05, "loss": 0.7886, "step": 2177 }, { "epoch": 0.24, "learning_rate": 1.7834305732715243e-05, "loss": 0.7515, "step": 2178 }, { "epoch": 0.24, "learning_rate": 1.7832113960877445e-05, "loss": 0.8955, "step": 2179 }, { "epoch": 0.24, "learning_rate": 1.7829921215343766e-05, "loss": 0.6814, "step": 2180 }, { "epoch": 0.24, "learning_rate": 1.782772749638682e-05, "loss": 0.7297, "step": 2181 }, { "epoch": 0.24, "learning_rate": 1.7825532804279323e-05, "loss": 0.8457, "step": 2182 }, { "epoch": 0.24, "learning_rate": 1.7823337139294125e-05, "loss": 0.696, "step": 2183 }, { "epoch": 0.24, "learning_rate": 1.7821140501704195e-05, "loss": 0.8003, "step": 2184 }, { "epoch": 0.24, "learning_rate": 1.7818942891782617e-05, "loss": 0.7441, "step": 2185 }, { "epoch": 0.24, "learning_rate": 1.7816744309802604e-05, "loss": 0.6968, "step": 2186 }, { "epoch": 0.24, "learning_rate": 1.7814544756037486e-05, "loss": 0.916, "step": 2187 }, { "epoch": 0.24, "learning_rate": 1.781234423076071e-05, "loss": 0.7827, "step": 2188 }, { "epoch": 0.24, "learning_rate": 1.7810142734245847e-05, "loss": 0.7788, "step": 2189 }, { "epoch": 0.24, "learning_rate": 1.7807940266766595e-05, "loss": 0.6719, "step": 2190 }, { "epoch": 0.24, "learning_rate": 1.780573682859676e-05, "loss": 0.7485, "step": 2191 }, { "epoch": 0.24, "learning_rate": 1.780353242001028e-05, "loss": 0.7852, "step": 2192 }, { "epoch": 0.24, "learning_rate": 1.780132704128121e-05, "loss": 0.7581, "step": 2193 }, { "epoch": 0.24, "learning_rate": 1.779912069268372e-05, "loss": 0.812, "step": 2194 }, { "epoch": 0.24, "learning_rate": 1.7796913374492105e-05, "loss": 0.7192, "step": 2195 }, { "epoch": 0.24, "learning_rate": 1.779470508698079e-05, "loss": 0.7214, "step": 2196 }, { "epoch": 0.24, "learning_rate": 1.77924958304243e-05, "loss": 0.624, "step": 2197 }, { "epoch": 0.24, "learning_rate": 1.7790285605097305e-05, "loss": 0.8462, "step": 2198 }, { "epoch": 0.24, "learning_rate": 1.7788074411274566e-05, "loss": 0.8101, "step": 2199 }, { "epoch": 0.24, "learning_rate": 1.7785862249230996e-05, "loss": 0.7109, "step": 2200 }, { "epoch": 0.24, "learning_rate": 1.7783649119241603e-05, "loss": 0.7617, "step": 2201 }, { "epoch": 0.24, "learning_rate": 1.7781435021581527e-05, "loss": 0.6216, "step": 2202 }, { "epoch": 0.24, "learning_rate": 1.7779219956526033e-05, "loss": 0.7456, "step": 2203 }, { "epoch": 0.24, "learning_rate": 1.7777003924350492e-05, "loss": 0.7617, "step": 2204 }, { "epoch": 0.24, "learning_rate": 1.7774786925330406e-05, "loss": 0.7505, "step": 2205 }, { "epoch": 0.24, "learning_rate": 1.77725689597414e-05, "loss": 0.7441, "step": 2206 }, { "epoch": 0.24, "learning_rate": 1.7770350027859203e-05, "loss": 0.7224, "step": 2207 }, { "epoch": 0.24, "learning_rate": 1.7768130129959685e-05, "loss": 0.8137, "step": 2208 }, { "epoch": 0.24, "learning_rate": 1.7765909266318817e-05, "loss": 0.7358, "step": 2209 }, { "epoch": 0.24, "learning_rate": 1.7763687437212707e-05, "loss": 0.709, "step": 2210 }, { "epoch": 0.24, "learning_rate": 1.776146464291757e-05, "loss": 0.7227, "step": 2211 }, { "epoch": 0.24, "learning_rate": 1.7759240883709745e-05, "loss": 0.7329, "step": 2212 }, { "epoch": 0.24, "learning_rate": 1.7757016159865695e-05, "loss": 0.749, "step": 2213 }, { "epoch": 0.24, "learning_rate": 1.7754790471662003e-05, "loss": 0.6821, "step": 2214 }, { "epoch": 0.24, "learning_rate": 1.7752563819375362e-05, "loss": 0.6506, "step": 2215 }, { "epoch": 0.24, "learning_rate": 1.7750336203282588e-05, "loss": 0.835, "step": 2216 }, { "epoch": 0.24, "learning_rate": 1.7748107623660635e-05, "loss": 0.7266, "step": 2217 }, { "epoch": 0.24, "learning_rate": 1.774587808078655e-05, "loss": 0.7207, "step": 2218 }, { "epoch": 0.24, "learning_rate": 1.7743647574937514e-05, "loss": 0.6931, "step": 2219 }, { "epoch": 0.24, "learning_rate": 1.7741416106390828e-05, "loss": 0.8428, "step": 2220 }, { "epoch": 0.24, "learning_rate": 1.7739183675423904e-05, "loss": 0.7922, "step": 2221 }, { "epoch": 0.24, "learning_rate": 1.7736950282314292e-05, "loss": 0.6582, "step": 2222 }, { "epoch": 0.24, "learning_rate": 1.7734715927339642e-05, "loss": 0.7827, "step": 2223 }, { "epoch": 0.24, "learning_rate": 1.773248061077773e-05, "loss": 0.7136, "step": 2224 }, { "epoch": 0.24, "learning_rate": 1.7730244332906458e-05, "loss": 0.8677, "step": 2225 }, { "epoch": 0.24, "learning_rate": 1.772800709400383e-05, "loss": 0.7581, "step": 2226 }, { "epoch": 0.24, "learning_rate": 1.7725768894348002e-05, "loss": 0.7319, "step": 2227 }, { "epoch": 0.24, "learning_rate": 1.772352973421721e-05, "loss": 0.688, "step": 2228 }, { "epoch": 0.24, "learning_rate": 1.7721289613889835e-05, "loss": 0.6777, "step": 2229 }, { "epoch": 0.24, "learning_rate": 1.7719048533644376e-05, "loss": 0.6882, "step": 2230 }, { "epoch": 0.24, "learning_rate": 1.771680649375944e-05, "loss": 0.7061, "step": 2231 }, { "epoch": 0.24, "learning_rate": 1.7714563494513766e-05, "loss": 0.7458, "step": 2232 }, { "epoch": 0.24, "learning_rate": 1.7712319536186196e-05, "loss": 0.709, "step": 2233 }, { "epoch": 0.24, "learning_rate": 1.7710074619055707e-05, "loss": 0.6882, "step": 2234 }, { "epoch": 0.24, "learning_rate": 1.770782874340139e-05, "loss": 0.7859, "step": 2235 }, { "epoch": 0.24, "learning_rate": 1.7705581909502457e-05, "loss": 0.678, "step": 2236 }, { "epoch": 0.24, "learning_rate": 1.770333411763823e-05, "loss": 0.7534, "step": 2237 }, { "epoch": 0.24, "learning_rate": 1.7701085368088157e-05, "loss": 0.6699, "step": 2238 }, { "epoch": 0.24, "learning_rate": 1.769883566113181e-05, "loss": 0.7712, "step": 2239 }, { "epoch": 0.24, "learning_rate": 1.769658499704887e-05, "loss": 0.8906, "step": 2240 }, { "epoch": 0.24, "learning_rate": 1.7694333376119144e-05, "loss": 0.9194, "step": 2241 }, { "epoch": 0.24, "learning_rate": 1.7692080798622556e-05, "loss": 0.6477, "step": 2242 }, { "epoch": 0.24, "learning_rate": 1.7689827264839147e-05, "loss": 0.6873, "step": 2243 }, { "epoch": 0.24, "learning_rate": 1.768757277504908e-05, "loss": 0.771, "step": 2244 }, { "epoch": 0.24, "learning_rate": 1.7685317329532633e-05, "loss": 0.729, "step": 2245 }, { "epoch": 0.24, "learning_rate": 1.768306092857021e-05, "loss": 0.7131, "step": 2246 }, { "epoch": 0.24, "learning_rate": 1.768080357244232e-05, "loss": 0.793, "step": 2247 }, { "epoch": 0.24, "learning_rate": 1.767854526142961e-05, "loss": 0.6428, "step": 2248 }, { "epoch": 0.24, "learning_rate": 1.767628599581283e-05, "loss": 0.7773, "step": 2249 }, { "epoch": 0.24, "learning_rate": 1.767402577587285e-05, "loss": 0.7837, "step": 2250 }, { "epoch": 0.25, "learning_rate": 1.7671764601890673e-05, "loss": 0.7361, "step": 2251 }, { "epoch": 0.25, "learning_rate": 1.76695024741474e-05, "loss": 0.71, "step": 2252 }, { "epoch": 0.25, "learning_rate": 1.766723939292427e-05, "loss": 0.6018, "step": 2253 }, { "epoch": 0.25, "learning_rate": 1.7664975358502622e-05, "loss": 0.8286, "step": 2254 }, { "epoch": 0.25, "learning_rate": 1.7662710371163932e-05, "loss": 0.729, "step": 2255 }, { "epoch": 0.25, "learning_rate": 1.766044443118978e-05, "loss": 0.6465, "step": 2256 }, { "epoch": 0.25, "learning_rate": 1.7658177538861873e-05, "loss": 0.8057, "step": 2257 }, { "epoch": 0.25, "learning_rate": 1.765590969446203e-05, "loss": 0.6172, "step": 2258 }, { "epoch": 0.25, "learning_rate": 1.7653640898272192e-05, "loss": 0.7417, "step": 2259 }, { "epoch": 0.25, "learning_rate": 1.765137115057442e-05, "loss": 0.7856, "step": 2260 }, { "epoch": 0.25, "learning_rate": 1.764910045165089e-05, "loss": 0.677, "step": 2261 }, { "epoch": 0.25, "learning_rate": 1.7646828801783897e-05, "loss": 0.7534, "step": 2262 }, { "epoch": 0.25, "learning_rate": 1.7644556201255855e-05, "loss": 0.7822, "step": 2263 }, { "epoch": 0.25, "learning_rate": 1.7642282650349294e-05, "loss": 0.7925, "step": 2264 }, { "epoch": 0.25, "learning_rate": 1.7640008149346866e-05, "loss": 0.7651, "step": 2265 }, { "epoch": 0.25, "learning_rate": 1.763773269853134e-05, "loss": 0.6729, "step": 2266 }, { "epoch": 0.25, "learning_rate": 1.7635456298185607e-05, "loss": 0.7429, "step": 2267 }, { "epoch": 0.25, "learning_rate": 1.763317894859266e-05, "loss": 0.6816, "step": 2268 }, { "epoch": 0.25, "learning_rate": 1.7630900650035626e-05, "loss": 0.875, "step": 2269 }, { "epoch": 0.25, "learning_rate": 1.7628621402797746e-05, "loss": 0.6526, "step": 2270 }, { "epoch": 0.25, "learning_rate": 1.762634120716238e-05, "loss": 0.7495, "step": 2271 }, { "epoch": 0.25, "learning_rate": 1.7624060063413003e-05, "loss": 0.8228, "step": 2272 }, { "epoch": 0.25, "learning_rate": 1.762177797183321e-05, "loss": 0.7915, "step": 2273 }, { "epoch": 0.25, "learning_rate": 1.761949493270671e-05, "loss": 0.8579, "step": 2274 }, { "epoch": 0.25, "learning_rate": 1.7617210946317333e-05, "loss": 0.8423, "step": 2275 }, { "epoch": 0.25, "learning_rate": 1.7614926012949027e-05, "loss": 0.6653, "step": 2276 }, { "epoch": 0.25, "learning_rate": 1.7612640132885857e-05, "loss": 0.802, "step": 2277 }, { "epoch": 0.25, "learning_rate": 1.761035330641201e-05, "loss": 0.686, "step": 2278 }, { "epoch": 0.25, "learning_rate": 1.7608065533811777e-05, "loss": 0.6714, "step": 2279 }, { "epoch": 0.25, "learning_rate": 1.7605776815369583e-05, "loss": 0.6094, "step": 2280 }, { "epoch": 0.25, "learning_rate": 1.760348715136996e-05, "loss": 0.6572, "step": 2281 }, { "epoch": 0.25, "learning_rate": 1.760119654209757e-05, "loss": 0.8525, "step": 2282 }, { "epoch": 0.25, "learning_rate": 1.759890498783717e-05, "loss": 0.6248, "step": 2283 }, { "epoch": 0.25, "learning_rate": 1.759661248887366e-05, "loss": 0.6848, "step": 2284 }, { "epoch": 0.25, "learning_rate": 1.759431904549204e-05, "loss": 0.813, "step": 2285 }, { "epoch": 0.25, "learning_rate": 1.7592024657977432e-05, "loss": 0.7434, "step": 2286 }, { "epoch": 0.25, "learning_rate": 1.7589729326615082e-05, "loss": 0.7371, "step": 2287 }, { "epoch": 0.25, "learning_rate": 1.7587433051690342e-05, "loss": 0.7739, "step": 2288 }, { "epoch": 0.25, "learning_rate": 1.7585135833488692e-05, "loss": 0.6086, "step": 2289 }, { "epoch": 0.25, "learning_rate": 1.7582837672295717e-05, "loss": 0.7474, "step": 2290 }, { "epoch": 0.25, "learning_rate": 1.7580538568397135e-05, "loss": 0.8745, "step": 2291 }, { "epoch": 0.25, "learning_rate": 1.757823852207877e-05, "loss": 0.7915, "step": 2292 }, { "epoch": 0.25, "learning_rate": 1.7575937533626562e-05, "loss": 0.7039, "step": 2293 }, { "epoch": 0.25, "learning_rate": 1.757363560332658e-05, "loss": 0.7268, "step": 2294 }, { "epoch": 0.25, "learning_rate": 1.757133273146499e-05, "loss": 0.8882, "step": 2295 }, { "epoch": 0.25, "learning_rate": 1.75690289183281e-05, "loss": 0.6936, "step": 2296 }, { "epoch": 0.25, "learning_rate": 1.7566724164202315e-05, "loss": 0.7998, "step": 2297 }, { "epoch": 0.25, "learning_rate": 1.7564418469374167e-05, "loss": 0.8223, "step": 2298 }, { "epoch": 0.25, "learning_rate": 1.7562111834130304e-05, "loss": 0.665, "step": 2299 }, { "epoch": 0.25, "learning_rate": 1.755980425875748e-05, "loss": 0.7473, "step": 2300 }, { "epoch": 0.25, "learning_rate": 1.7557495743542586e-05, "loss": 0.7561, "step": 2301 }, { "epoch": 0.25, "learning_rate": 1.755518628877261e-05, "loss": 0.7947, "step": 2302 }, { "epoch": 0.25, "learning_rate": 1.7552875894734672e-05, "loss": 0.7964, "step": 2303 }, { "epoch": 0.25, "learning_rate": 1.7550564561716e-05, "loss": 0.8047, "step": 2304 }, { "epoch": 0.25, "learning_rate": 1.7548252290003943e-05, "loss": 0.7803, "step": 2305 }, { "epoch": 0.25, "learning_rate": 1.7545939079885962e-05, "loss": 0.7615, "step": 2306 }, { "epoch": 0.25, "learning_rate": 1.7543624931649636e-05, "loss": 0.7363, "step": 2307 }, { "epoch": 0.25, "learning_rate": 1.754130984558267e-05, "loss": 0.7498, "step": 2308 }, { "epoch": 0.25, "learning_rate": 1.7538993821972868e-05, "loss": 0.6331, "step": 2309 }, { "epoch": 0.25, "learning_rate": 1.7536676861108167e-05, "loss": 0.7659, "step": 2310 }, { "epoch": 0.25, "learning_rate": 1.7534358963276606e-05, "loss": 0.7744, "step": 2311 }, { "epoch": 0.25, "learning_rate": 1.7532040128766362e-05, "loss": 0.76, "step": 2312 }, { "epoch": 0.25, "learning_rate": 1.75297203578657e-05, "loss": 0.8276, "step": 2313 }, { "epoch": 0.25, "learning_rate": 1.7527399650863025e-05, "loss": 0.7119, "step": 2314 }, { "epoch": 0.25, "learning_rate": 1.752507800804685e-05, "loss": 0.8184, "step": 2315 }, { "epoch": 0.25, "learning_rate": 1.75227554297058e-05, "loss": 0.7861, "step": 2316 }, { "epoch": 0.25, "learning_rate": 1.7520431916128614e-05, "loss": 0.6997, "step": 2317 }, { "epoch": 0.25, "learning_rate": 1.7518107467604166e-05, "loss": 0.7358, "step": 2318 }, { "epoch": 0.25, "learning_rate": 1.7515782084421426e-05, "loss": 0.7576, "step": 2319 }, { "epoch": 0.25, "learning_rate": 1.7513455766869496e-05, "loss": 0.7092, "step": 2320 }, { "epoch": 0.25, "learning_rate": 1.7511128515237574e-05, "loss": 0.8037, "step": 2321 }, { "epoch": 0.25, "learning_rate": 1.7508800329814993e-05, "loss": 0.8037, "step": 2322 }, { "epoch": 0.25, "learning_rate": 1.7506471210891197e-05, "loss": 0.8091, "step": 2323 }, { "epoch": 0.25, "learning_rate": 1.750414115875574e-05, "loss": 0.7947, "step": 2324 }, { "epoch": 0.25, "learning_rate": 1.75018101736983e-05, "loss": 0.7041, "step": 2325 }, { "epoch": 0.25, "learning_rate": 1.7499478256008658e-05, "loss": 0.7393, "step": 2326 }, { "epoch": 0.25, "learning_rate": 1.7497145405976734e-05, "loss": 0.7329, "step": 2327 }, { "epoch": 0.25, "learning_rate": 1.7494811623892543e-05, "loss": 0.7034, "step": 2328 }, { "epoch": 0.25, "learning_rate": 1.7492476910046222e-05, "loss": 0.7979, "step": 2329 }, { "epoch": 0.25, "learning_rate": 1.7490141264728028e-05, "loss": 0.7368, "step": 2330 }, { "epoch": 0.25, "learning_rate": 1.7487804688228327e-05, "loss": 0.7307, "step": 2331 }, { "epoch": 0.25, "learning_rate": 1.7485467180837608e-05, "loss": 0.7969, "step": 2332 }, { "epoch": 0.25, "learning_rate": 1.748312874284647e-05, "loss": 0.8149, "step": 2333 }, { "epoch": 0.25, "learning_rate": 1.7480789374545633e-05, "loss": 0.6702, "step": 2334 }, { "epoch": 0.25, "learning_rate": 1.7478449076225924e-05, "loss": 0.656, "step": 2335 }, { "epoch": 0.25, "learning_rate": 1.7476107848178298e-05, "loss": 0.7478, "step": 2336 }, { "epoch": 0.25, "learning_rate": 1.7473765690693812e-05, "loss": 0.7285, "step": 2337 }, { "epoch": 0.25, "learning_rate": 1.7471422604063647e-05, "loss": 0.6086, "step": 2338 }, { "epoch": 0.25, "learning_rate": 1.74690785885791e-05, "loss": 0.6682, "step": 2339 }, { "epoch": 0.25, "learning_rate": 1.7466733644531578e-05, "loss": 0.7349, "step": 2340 }, { "epoch": 0.25, "learning_rate": 1.7464387772212616e-05, "loss": 0.835, "step": 2341 }, { "epoch": 0.25, "learning_rate": 1.746204097191384e-05, "loss": 0.7686, "step": 2342 }, { "epoch": 0.26, "learning_rate": 1.745969324392702e-05, "loss": 0.7993, "step": 2343 }, { "epoch": 0.26, "learning_rate": 1.7457344588544018e-05, "loss": 0.7988, "step": 2344 }, { "epoch": 0.26, "learning_rate": 1.745499500605683e-05, "loss": 0.7903, "step": 2345 }, { "epoch": 0.26, "learning_rate": 1.745264449675755e-05, "loss": 0.7739, "step": 2346 }, { "epoch": 0.26, "learning_rate": 1.74502930609384e-05, "loss": 0.792, "step": 2347 }, { "epoch": 0.26, "learning_rate": 1.744794069889171e-05, "loss": 0.8521, "step": 2348 }, { "epoch": 0.26, "learning_rate": 1.7445587410909932e-05, "loss": 0.813, "step": 2349 }, { "epoch": 0.26, "learning_rate": 1.7443233197285625e-05, "loss": 0.6731, "step": 2350 }, { "epoch": 0.26, "learning_rate": 1.7440878058311467e-05, "loss": 0.8564, "step": 2351 }, { "epoch": 0.26, "learning_rate": 1.7438521994280257e-05, "loss": 0.8289, "step": 2352 }, { "epoch": 0.26, "learning_rate": 1.7436165005484896e-05, "loss": 0.7568, "step": 2353 }, { "epoch": 0.26, "learning_rate": 1.7433807092218417e-05, "loss": 0.7004, "step": 2354 }, { "epoch": 0.26, "learning_rate": 1.7431448254773943e-05, "loss": 0.7559, "step": 2355 }, { "epoch": 0.26, "learning_rate": 1.7429088493444738e-05, "loss": 0.8174, "step": 2356 }, { "epoch": 0.26, "learning_rate": 1.7426727808524167e-05, "loss": 0.8696, "step": 2357 }, { "epoch": 0.26, "learning_rate": 1.7424366200305717e-05, "loss": 0.7273, "step": 2358 }, { "epoch": 0.26, "learning_rate": 1.7422003669082972e-05, "loss": 0.7231, "step": 2359 }, { "epoch": 0.26, "learning_rate": 1.741964021514966e-05, "loss": 0.7302, "step": 2360 }, { "epoch": 0.26, "learning_rate": 1.7417275838799596e-05, "loss": 0.707, "step": 2361 }, { "epoch": 0.26, "learning_rate": 1.741491054032673e-05, "loss": 0.7805, "step": 2362 }, { "epoch": 0.26, "learning_rate": 1.7412544320025114e-05, "loss": 0.5706, "step": 2363 }, { "epoch": 0.26, "learning_rate": 1.7410177178188917e-05, "loss": 0.7949, "step": 2364 }, { "epoch": 0.26, "learning_rate": 1.7407809115112432e-05, "loss": 0.7771, "step": 2365 }, { "epoch": 0.26, "learning_rate": 1.740544013109005e-05, "loss": 0.7139, "step": 2366 }, { "epoch": 0.26, "learning_rate": 1.740307022641629e-05, "loss": 0.7998, "step": 2367 }, { "epoch": 0.26, "learning_rate": 1.7400699401385774e-05, "loss": 0.8018, "step": 2368 }, { "epoch": 0.26, "learning_rate": 1.7398327656293257e-05, "loss": 0.7197, "step": 2369 }, { "epoch": 0.26, "learning_rate": 1.7395954991433588e-05, "loss": 0.7285, "step": 2370 }, { "epoch": 0.26, "learning_rate": 1.739358140710174e-05, "loss": 0.771, "step": 2371 }, { "epoch": 0.26, "learning_rate": 1.7391206903592803e-05, "loss": 0.7686, "step": 2372 }, { "epoch": 0.26, "learning_rate": 1.738883148120198e-05, "loss": 0.7512, "step": 2373 }, { "epoch": 0.26, "learning_rate": 1.738645514022457e-05, "loss": 0.759, "step": 2374 }, { "epoch": 0.26, "learning_rate": 1.7384077880956023e-05, "loss": 0.7761, "step": 2375 }, { "epoch": 0.26, "learning_rate": 1.7381699703691866e-05, "loss": 0.7432, "step": 2376 }, { "epoch": 0.26, "learning_rate": 1.7379320608727766e-05, "loss": 0.7715, "step": 2377 }, { "epoch": 0.26, "learning_rate": 1.737694059635949e-05, "loss": 0.7175, "step": 2378 }, { "epoch": 0.26, "learning_rate": 1.7374559666882923e-05, "loss": 0.5592, "step": 2379 }, { "epoch": 0.26, "learning_rate": 1.7372177820594067e-05, "loss": 0.7393, "step": 2380 }, { "epoch": 0.26, "learning_rate": 1.7369795057789034e-05, "loss": 0.7708, "step": 2381 }, { "epoch": 0.26, "learning_rate": 1.736741137876405e-05, "loss": 0.7593, "step": 2382 }, { "epoch": 0.26, "learning_rate": 1.7365026783815458e-05, "loss": 0.8657, "step": 2383 }, { "epoch": 0.26, "learning_rate": 1.7362641273239714e-05, "loss": 0.6458, "step": 2384 }, { "epoch": 0.26, "learning_rate": 1.7360254847333388e-05, "loss": 0.77, "step": 2385 }, { "epoch": 0.26, "learning_rate": 1.7357867506393154e-05, "loss": 0.6716, "step": 2386 }, { "epoch": 0.26, "learning_rate": 1.735547925071582e-05, "loss": 0.6162, "step": 2387 }, { "epoch": 0.26, "learning_rate": 1.735309008059829e-05, "loss": 0.8403, "step": 2388 }, { "epoch": 0.26, "learning_rate": 1.735069999633759e-05, "loss": 0.6836, "step": 2389 }, { "epoch": 0.26, "learning_rate": 1.7348308998230852e-05, "loss": 0.8599, "step": 2390 }, { "epoch": 0.26, "learning_rate": 1.734591708657533e-05, "loss": 0.7661, "step": 2391 }, { "epoch": 0.26, "learning_rate": 1.73435242616684e-05, "loss": 0.7031, "step": 2392 }, { "epoch": 0.26, "learning_rate": 1.7341130523807527e-05, "loss": 0.8115, "step": 2393 }, { "epoch": 0.26, "learning_rate": 1.7338735873290304e-05, "loss": 0.7385, "step": 2394 }, { "epoch": 0.26, "learning_rate": 1.7336340310414442e-05, "loss": 0.7522, "step": 2395 }, { "epoch": 0.26, "learning_rate": 1.7333943835477752e-05, "loss": 0.8003, "step": 2396 }, { "epoch": 0.26, "learning_rate": 1.7331546448778175e-05, "loss": 0.7163, "step": 2397 }, { "epoch": 0.26, "learning_rate": 1.7329148150613752e-05, "loss": 0.8232, "step": 2398 }, { "epoch": 0.26, "learning_rate": 1.7326748941282638e-05, "loss": 0.7461, "step": 2399 }, { "epoch": 0.26, "learning_rate": 1.732434882108311e-05, "loss": 0.7852, "step": 2400 }, { "epoch": 0.26, "learning_rate": 1.7321947790313554e-05, "loss": 0.6609, "step": 2401 }, { "epoch": 0.26, "learning_rate": 1.7319545849272464e-05, "loss": 0.7661, "step": 2402 }, { "epoch": 0.26, "learning_rate": 1.7317142998258454e-05, "loss": 0.7842, "step": 2403 }, { "epoch": 0.26, "learning_rate": 1.731473923757025e-05, "loss": 0.7817, "step": 2404 }, { "epoch": 0.26, "learning_rate": 1.7312334567506684e-05, "loss": 0.6958, "step": 2405 }, { "epoch": 0.26, "learning_rate": 1.730992898836672e-05, "loss": 0.8423, "step": 2406 }, { "epoch": 0.26, "learning_rate": 1.7307522500449407e-05, "loss": 0.7627, "step": 2407 }, { "epoch": 0.26, "learning_rate": 1.7305115104053927e-05, "loss": 0.7781, "step": 2408 }, { "epoch": 0.26, "learning_rate": 1.7302706799479575e-05, "loss": 0.7778, "step": 2409 }, { "epoch": 0.26, "learning_rate": 1.7300297587025748e-05, "loss": 0.7837, "step": 2410 }, { "epoch": 0.26, "learning_rate": 1.729788746699196e-05, "loss": 0.7556, "step": 2411 }, { "epoch": 0.26, "learning_rate": 1.7295476439677847e-05, "loss": 0.825, "step": 2412 }, { "epoch": 0.26, "learning_rate": 1.7293064505383147e-05, "loss": 0.748, "step": 2413 }, { "epoch": 0.26, "learning_rate": 1.729065166440771e-05, "loss": 0.7859, "step": 2414 }, { "epoch": 0.26, "learning_rate": 1.7288237917051506e-05, "loss": 0.7861, "step": 2415 }, { "epoch": 0.26, "learning_rate": 1.7285823263614613e-05, "loss": 0.7339, "step": 2416 }, { "epoch": 0.26, "learning_rate": 1.7283407704397224e-05, "loss": 0.7449, "step": 2417 }, { "epoch": 0.26, "learning_rate": 1.7280991239699643e-05, "loss": 0.873, "step": 2418 }, { "epoch": 0.26, "learning_rate": 1.7278573869822288e-05, "loss": 0.7852, "step": 2419 }, { "epoch": 0.26, "learning_rate": 1.727615559506569e-05, "loss": 0.8181, "step": 2420 }, { "epoch": 0.26, "learning_rate": 1.7273736415730488e-05, "loss": 0.8726, "step": 2421 }, { "epoch": 0.26, "learning_rate": 1.727131633211744e-05, "loss": 0.7734, "step": 2422 }, { "epoch": 0.26, "learning_rate": 1.726889534452741e-05, "loss": 0.5654, "step": 2423 }, { "epoch": 0.26, "learning_rate": 1.7266473453261378e-05, "loss": 0.7419, "step": 2424 }, { "epoch": 0.26, "learning_rate": 1.7264050658620442e-05, "loss": 0.7786, "step": 2425 }, { "epoch": 0.26, "learning_rate": 1.7261626960905795e-05, "loss": 0.6978, "step": 2426 }, { "epoch": 0.26, "learning_rate": 1.7259202360418765e-05, "loss": 0.7019, "step": 2427 }, { "epoch": 0.26, "learning_rate": 1.7256776857460768e-05, "loss": 0.7676, "step": 2428 }, { "epoch": 0.26, "learning_rate": 1.7254350452333356e-05, "loss": 0.8418, "step": 2429 }, { "epoch": 0.26, "learning_rate": 1.7251923145338175e-05, "loss": 0.7661, "step": 2430 }, { "epoch": 0.26, "learning_rate": 1.7249494936776994e-05, "loss": 0.7388, "step": 2431 }, { "epoch": 0.26, "learning_rate": 1.7247065826951694e-05, "loss": 0.7698, "step": 2432 }, { "epoch": 0.26, "learning_rate": 1.7244635816164254e-05, "loss": 0.7241, "step": 2433 }, { "epoch": 0.26, "learning_rate": 1.7242204904716785e-05, "loss": 0.6079, "step": 2434 }, { "epoch": 0.27, "learning_rate": 1.7239773092911488e-05, "loss": 0.7395, "step": 2435 }, { "epoch": 0.27, "learning_rate": 1.72373403810507e-05, "loss": 0.7212, "step": 2436 }, { "epoch": 0.27, "learning_rate": 1.723490676943686e-05, "loss": 0.6274, "step": 2437 }, { "epoch": 0.27, "learning_rate": 1.7232472258372504e-05, "loss": 0.6819, "step": 2438 }, { "epoch": 0.27, "learning_rate": 1.7230036848160302e-05, "loss": 0.8018, "step": 2439 }, { "epoch": 0.27, "learning_rate": 1.7227600539103024e-05, "loss": 0.6541, "step": 2440 }, { "epoch": 0.27, "learning_rate": 1.7225163331503557e-05, "loss": 0.7522, "step": 2441 }, { "epoch": 0.27, "learning_rate": 1.722272522566489e-05, "loss": 0.78, "step": 2442 }, { "epoch": 0.27, "learning_rate": 1.7220286221890137e-05, "loss": 0.6179, "step": 2443 }, { "epoch": 0.27, "learning_rate": 1.7217846320482517e-05, "loss": 0.8091, "step": 2444 }, { "epoch": 0.27, "learning_rate": 1.7215405521745358e-05, "loss": 0.8467, "step": 2445 }, { "epoch": 0.27, "learning_rate": 1.7212963825982103e-05, "loss": 0.8931, "step": 2446 }, { "epoch": 0.27, "learning_rate": 1.721052123349631e-05, "loss": 0.8486, "step": 2447 }, { "epoch": 0.27, "learning_rate": 1.7208077744591633e-05, "loss": 0.7754, "step": 2448 }, { "epoch": 0.27, "learning_rate": 1.7205633359571866e-05, "loss": 0.7148, "step": 2449 }, { "epoch": 0.27, "learning_rate": 1.7203188078740883e-05, "loss": 0.7461, "step": 2450 }, { "epoch": 0.27, "learning_rate": 1.720074190240269e-05, "loss": 0.8081, "step": 2451 }, { "epoch": 0.27, "learning_rate": 1.71982948308614e-05, "loss": 0.6885, "step": 2452 }, { "epoch": 0.27, "learning_rate": 1.7195846864421227e-05, "loss": 0.7305, "step": 2453 }, { "epoch": 0.27, "learning_rate": 1.7193398003386514e-05, "loss": 0.6714, "step": 2454 }, { "epoch": 0.27, "learning_rate": 1.71909482480617e-05, "loss": 0.7227, "step": 2455 }, { "epoch": 0.27, "learning_rate": 1.7188497598751343e-05, "loss": 0.6901, "step": 2456 }, { "epoch": 0.27, "learning_rate": 1.7186046055760105e-05, "loss": 0.7515, "step": 2457 }, { "epoch": 0.27, "learning_rate": 1.718359361939277e-05, "loss": 0.7788, "step": 2458 }, { "epoch": 0.27, "learning_rate": 1.718114028995423e-05, "loss": 0.6565, "step": 2459 }, { "epoch": 0.27, "learning_rate": 1.717868606774948e-05, "loss": 0.7412, "step": 2460 }, { "epoch": 0.27, "learning_rate": 1.717623095308363e-05, "loss": 0.5754, "step": 2461 }, { "epoch": 0.27, "learning_rate": 1.7173774946261902e-05, "loss": 0.8193, "step": 2462 }, { "epoch": 0.27, "learning_rate": 1.7171318047589637e-05, "loss": 0.7764, "step": 2463 }, { "epoch": 0.27, "learning_rate": 1.716886025737227e-05, "loss": 0.8135, "step": 2464 }, { "epoch": 0.27, "learning_rate": 1.716640157591536e-05, "loss": 0.8281, "step": 2465 }, { "epoch": 0.27, "learning_rate": 1.7163942003524574e-05, "loss": 0.6641, "step": 2466 }, { "epoch": 0.27, "learning_rate": 1.7161481540505686e-05, "loss": 0.752, "step": 2467 }, { "epoch": 0.27, "learning_rate": 1.7159020187164582e-05, "loss": 0.7563, "step": 2468 }, { "epoch": 0.27, "learning_rate": 1.715655794380726e-05, "loss": 0.6987, "step": 2469 }, { "epoch": 0.27, "learning_rate": 1.715409481073983e-05, "loss": 0.6729, "step": 2470 }, { "epoch": 0.27, "learning_rate": 1.7151630788268514e-05, "loss": 0.8267, "step": 2471 }, { "epoch": 0.27, "learning_rate": 1.7149165876699635e-05, "loss": 0.8286, "step": 2472 }, { "epoch": 0.27, "learning_rate": 1.714670007633964e-05, "loss": 0.7903, "step": 2473 }, { "epoch": 0.27, "learning_rate": 1.7144233387495074e-05, "loss": 0.7327, "step": 2474 }, { "epoch": 0.27, "learning_rate": 1.7141765810472603e-05, "loss": 0.7397, "step": 2475 }, { "epoch": 0.27, "learning_rate": 1.7139297345578992e-05, "loss": 0.6592, "step": 2476 }, { "epoch": 0.27, "learning_rate": 1.713682799312113e-05, "loss": 0.7922, "step": 2477 }, { "epoch": 0.27, "learning_rate": 1.7134357753406003e-05, "loss": 0.7441, "step": 2478 }, { "epoch": 0.27, "learning_rate": 1.7131886626740717e-05, "loss": 0.5745, "step": 2479 }, { "epoch": 0.27, "learning_rate": 1.7129414613432486e-05, "loss": 0.6982, "step": 2480 }, { "epoch": 0.27, "learning_rate": 1.7126941713788633e-05, "loss": 0.6887, "step": 2481 }, { "epoch": 0.27, "learning_rate": 1.7124467928116587e-05, "loss": 0.7625, "step": 2482 }, { "epoch": 0.27, "learning_rate": 1.7121993256723893e-05, "loss": 0.7563, "step": 2483 }, { "epoch": 0.27, "learning_rate": 1.7119517699918206e-05, "loss": 0.707, "step": 2484 }, { "epoch": 0.27, "learning_rate": 1.711704125800729e-05, "loss": 0.8481, "step": 2485 }, { "epoch": 0.27, "learning_rate": 1.7114563931299016e-05, "loss": 0.6438, "step": 2486 }, { "epoch": 0.27, "learning_rate": 1.711208572010137e-05, "loss": 0.7231, "step": 2487 }, { "epoch": 0.27, "learning_rate": 1.7109606624722448e-05, "loss": 0.8218, "step": 2488 }, { "epoch": 0.27, "learning_rate": 1.710712664547045e-05, "loss": 0.7109, "step": 2489 }, { "epoch": 0.27, "learning_rate": 1.710464578265369e-05, "loss": 0.7585, "step": 2490 }, { "epoch": 0.27, "learning_rate": 1.710216403658059e-05, "loss": 0.6865, "step": 2491 }, { "epoch": 0.27, "learning_rate": 1.7099681407559684e-05, "loss": 0.7412, "step": 2492 }, { "epoch": 0.27, "learning_rate": 1.7097197895899614e-05, "loss": 0.7166, "step": 2493 }, { "epoch": 0.27, "learning_rate": 1.7094713501909135e-05, "loss": 0.7771, "step": 2494 }, { "epoch": 0.27, "learning_rate": 1.7092228225897106e-05, "loss": 0.7351, "step": 2495 }, { "epoch": 0.27, "learning_rate": 1.70897420681725e-05, "loss": 0.7051, "step": 2496 }, { "epoch": 0.27, "learning_rate": 1.7087255029044402e-05, "loss": 0.5601, "step": 2497 }, { "epoch": 0.27, "learning_rate": 1.7084767108822e-05, "loss": 0.7227, "step": 2498 }, { "epoch": 0.27, "learning_rate": 1.7082278307814593e-05, "loss": 0.6477, "step": 2499 }, { "epoch": 0.27, "learning_rate": 1.7079788626331593e-05, "loss": 0.6501, "step": 2500 }, { "epoch": 0.27, "learning_rate": 1.707729806468252e-05, "loss": 0.8103, "step": 2501 }, { "epoch": 0.27, "learning_rate": 1.7074806623177004e-05, "loss": 0.7686, "step": 2502 }, { "epoch": 0.27, "learning_rate": 1.707231430212478e-05, "loss": 0.6541, "step": 2503 }, { "epoch": 0.27, "learning_rate": 1.70698211018357e-05, "loss": 0.6492, "step": 2504 }, { "epoch": 0.27, "learning_rate": 1.7067327022619716e-05, "loss": 0.8853, "step": 2505 }, { "epoch": 0.27, "learning_rate": 1.7064832064786894e-05, "loss": 0.7759, "step": 2506 }, { "epoch": 0.27, "learning_rate": 1.706233622864742e-05, "loss": 0.7646, "step": 2507 }, { "epoch": 0.27, "learning_rate": 1.7059839514511565e-05, "loss": 0.6868, "step": 2508 }, { "epoch": 0.27, "learning_rate": 1.7057341922689733e-05, "loss": 0.6797, "step": 2509 }, { "epoch": 0.27, "learning_rate": 1.705484345349242e-05, "loss": 0.9092, "step": 2510 }, { "epoch": 0.27, "learning_rate": 1.7052344107230244e-05, "loss": 0.8037, "step": 2511 }, { "epoch": 0.27, "learning_rate": 1.704984388421392e-05, "loss": 0.7798, "step": 2512 }, { "epoch": 0.27, "learning_rate": 1.7047342784754284e-05, "loss": 0.698, "step": 2513 }, { "epoch": 0.27, "learning_rate": 1.704484080916227e-05, "loss": 0.7588, "step": 2514 }, { "epoch": 0.27, "learning_rate": 1.7042337957748934e-05, "loss": 0.8696, "step": 2515 }, { "epoch": 0.27, "learning_rate": 1.703983423082542e-05, "loss": 0.672, "step": 2516 }, { "epoch": 0.27, "learning_rate": 1.7037329628703005e-05, "loss": 0.8311, "step": 2517 }, { "epoch": 0.27, "learning_rate": 1.7034824151693058e-05, "loss": 0.7744, "step": 2518 }, { "epoch": 0.27, "learning_rate": 1.7032317800107067e-05, "loss": 0.7039, "step": 2519 }, { "epoch": 0.27, "learning_rate": 1.702981057425662e-05, "loss": 0.6628, "step": 2520 }, { "epoch": 0.27, "learning_rate": 1.7027302474453414e-05, "loss": 0.8306, "step": 2521 }, { "epoch": 0.27, "learning_rate": 1.702479350100927e-05, "loss": 0.7231, "step": 2522 }, { "epoch": 0.27, "learning_rate": 1.7022283654236093e-05, "loss": 0.8311, "step": 2523 }, { "epoch": 0.27, "learning_rate": 1.7019772934445917e-05, "loss": 0.5957, "step": 2524 }, { "epoch": 0.27, "learning_rate": 1.7017261341950877e-05, "loss": 0.8662, "step": 2525 }, { "epoch": 0.27, "learning_rate": 1.7014748877063212e-05, "loss": 0.7834, "step": 2526 }, { "epoch": 0.28, "learning_rate": 1.7012235540095284e-05, "loss": 0.8027, "step": 2527 }, { "epoch": 0.28, "learning_rate": 1.700972133135954e-05, "loss": 0.6333, "step": 2528 }, { "epoch": 0.28, "learning_rate": 1.7007206251168557e-05, "loss": 0.7156, "step": 2529 }, { "epoch": 0.28, "learning_rate": 1.7004690299835012e-05, "loss": 0.7178, "step": 2530 }, { "epoch": 0.28, "learning_rate": 1.7002173477671685e-05, "loss": 0.7937, "step": 2531 }, { "epoch": 0.28, "learning_rate": 1.699965578499148e-05, "loss": 0.675, "step": 2532 }, { "epoch": 0.28, "learning_rate": 1.699713722210739e-05, "loss": 0.832, "step": 2533 }, { "epoch": 0.28, "learning_rate": 1.6994617789332526e-05, "loss": 0.7971, "step": 2534 }, { "epoch": 0.28, "learning_rate": 1.6992097486980107e-05, "loss": 0.7446, "step": 2535 }, { "epoch": 0.28, "learning_rate": 1.6989576315363467e-05, "loss": 0.7336, "step": 2536 }, { "epoch": 0.28, "learning_rate": 1.6987054274796027e-05, "loss": 0.699, "step": 2537 }, { "epoch": 0.28, "learning_rate": 1.698453136559134e-05, "loss": 0.7395, "step": 2538 }, { "epoch": 0.28, "learning_rate": 1.6982007588063052e-05, "loss": 0.8403, "step": 2539 }, { "epoch": 0.28, "learning_rate": 1.6979482942524924e-05, "loss": 0.8594, "step": 2540 }, { "epoch": 0.28, "learning_rate": 1.697695742929082e-05, "loss": 0.738, "step": 2541 }, { "epoch": 0.28, "learning_rate": 1.6974431048674714e-05, "loss": 0.5696, "step": 2542 }, { "epoch": 0.28, "learning_rate": 1.697190380099069e-05, "loss": 0.8633, "step": 2543 }, { "epoch": 0.28, "learning_rate": 1.696937568655294e-05, "loss": 0.7988, "step": 2544 }, { "epoch": 0.28, "learning_rate": 1.696684670567575e-05, "loss": 0.7239, "step": 2545 }, { "epoch": 0.28, "learning_rate": 1.6964316858673538e-05, "loss": 0.6133, "step": 2546 }, { "epoch": 0.28, "learning_rate": 1.6961786145860814e-05, "loss": 0.7849, "step": 2547 }, { "epoch": 0.28, "learning_rate": 1.69592545675522e-05, "loss": 0.7832, "step": 2548 }, { "epoch": 0.28, "learning_rate": 1.6956722124062415e-05, "loss": 0.6982, "step": 2549 }, { "epoch": 0.28, "learning_rate": 1.6954188815706306e-05, "loss": 0.7559, "step": 2550 }, { "epoch": 0.28, "learning_rate": 1.6951654642798812e-05, "loss": 0.7241, "step": 2551 }, { "epoch": 0.28, "learning_rate": 1.694911960565498e-05, "loss": 0.7568, "step": 2552 }, { "epoch": 0.28, "learning_rate": 1.6946583704589973e-05, "loss": 0.8149, "step": 2553 }, { "epoch": 0.28, "learning_rate": 1.694404693991906e-05, "loss": 0.7754, "step": 2554 }, { "epoch": 0.28, "learning_rate": 1.69415093119576e-05, "loss": 0.7034, "step": 2555 }, { "epoch": 0.28, "learning_rate": 1.693897082102109e-05, "loss": 0.7808, "step": 2556 }, { "epoch": 0.28, "learning_rate": 1.693643146742511e-05, "loss": 0.8242, "step": 2557 }, { "epoch": 0.28, "learning_rate": 1.6933891251485355e-05, "loss": 0.6987, "step": 2558 }, { "epoch": 0.28, "learning_rate": 1.6931350173517625e-05, "loss": 0.7861, "step": 2559 }, { "epoch": 0.28, "learning_rate": 1.6928808233837833e-05, "loss": 0.708, "step": 2560 }, { "epoch": 0.28, "learning_rate": 1.6926265432761993e-05, "loss": 0.8208, "step": 2561 }, { "epoch": 0.28, "learning_rate": 1.692372177060623e-05, "loss": 0.6992, "step": 2562 }, { "epoch": 0.28, "learning_rate": 1.6921177247686773e-05, "loss": 0.8164, "step": 2563 }, { "epoch": 0.28, "learning_rate": 1.691863186431996e-05, "loss": 0.8096, "step": 2564 }, { "epoch": 0.28, "learning_rate": 1.6916085620822236e-05, "loss": 0.7793, "step": 2565 }, { "epoch": 0.28, "learning_rate": 1.6913538517510155e-05, "loss": 0.6096, "step": 2566 }, { "epoch": 0.28, "learning_rate": 1.691099055470037e-05, "loss": 0.7439, "step": 2567 }, { "epoch": 0.28, "learning_rate": 1.690844173270965e-05, "loss": 0.7671, "step": 2568 }, { "epoch": 0.28, "learning_rate": 1.690589205185486e-05, "loss": 0.791, "step": 2569 }, { "epoch": 0.28, "learning_rate": 1.6903341512452992e-05, "loss": 0.7275, "step": 2570 }, { "epoch": 0.28, "learning_rate": 1.6900790114821122e-05, "loss": 0.8542, "step": 2571 }, { "epoch": 0.28, "learning_rate": 1.6898237859276444e-05, "loss": 0.6641, "step": 2572 }, { "epoch": 0.28, "learning_rate": 1.6895684746136254e-05, "loss": 0.8325, "step": 2573 }, { "epoch": 0.28, "learning_rate": 1.689313077571796e-05, "loss": 0.7627, "step": 2574 }, { "epoch": 0.28, "learning_rate": 1.689057594833908e-05, "loss": 0.8599, "step": 2575 }, { "epoch": 0.28, "learning_rate": 1.6888020264317227e-05, "loss": 0.7412, "step": 2576 }, { "epoch": 0.28, "learning_rate": 1.688546372397012e-05, "loss": 0.8066, "step": 2577 }, { "epoch": 0.28, "learning_rate": 1.68829063276156e-05, "loss": 0.6494, "step": 2578 }, { "epoch": 0.28, "learning_rate": 1.6880348075571605e-05, "loss": 0.7173, "step": 2579 }, { "epoch": 0.28, "learning_rate": 1.6877788968156172e-05, "loss": 0.7798, "step": 2580 }, { "epoch": 0.28, "learning_rate": 1.6875229005687454e-05, "loss": 0.7554, "step": 2581 }, { "epoch": 0.28, "learning_rate": 1.687266818848371e-05, "loss": 0.656, "step": 2582 }, { "epoch": 0.28, "learning_rate": 1.687010651686331e-05, "loss": 0.7416, "step": 2583 }, { "epoch": 0.28, "learning_rate": 1.686754399114471e-05, "loss": 0.6978, "step": 2584 }, { "epoch": 0.28, "learning_rate": 1.686498061164649e-05, "loss": 0.6309, "step": 2585 }, { "epoch": 0.28, "learning_rate": 1.686241637868734e-05, "loss": 0.8472, "step": 2586 }, { "epoch": 0.28, "learning_rate": 1.6859851292586034e-05, "loss": 0.7471, "step": 2587 }, { "epoch": 0.28, "learning_rate": 1.6857285353661478e-05, "loss": 0.6858, "step": 2588 }, { "epoch": 0.28, "learning_rate": 1.685471856223267e-05, "loss": 0.7749, "step": 2589 }, { "epoch": 0.28, "learning_rate": 1.685215091861871e-05, "loss": 0.6934, "step": 2590 }, { "epoch": 0.28, "learning_rate": 1.6849582423138815e-05, "loss": 0.8149, "step": 2591 }, { "epoch": 0.28, "learning_rate": 1.68470130761123e-05, "loss": 0.7358, "step": 2592 }, { "epoch": 0.28, "learning_rate": 1.684444287785859e-05, "loss": 0.7656, "step": 2593 }, { "epoch": 0.28, "learning_rate": 1.6841871828697214e-05, "loss": 0.7034, "step": 2594 }, { "epoch": 0.28, "learning_rate": 1.6839299928947807e-05, "loss": 0.7417, "step": 2595 }, { "epoch": 0.28, "learning_rate": 1.683672717893011e-05, "loss": 0.7983, "step": 2596 }, { "epoch": 0.28, "learning_rate": 1.683415357896397e-05, "loss": 0.708, "step": 2597 }, { "epoch": 0.28, "learning_rate": 1.6831579129369347e-05, "loss": 0.8066, "step": 2598 }, { "epoch": 0.28, "learning_rate": 1.6829003830466286e-05, "loss": 0.7432, "step": 2599 }, { "epoch": 0.28, "learning_rate": 1.6826427682574957e-05, "loss": 0.6587, "step": 2600 }, { "epoch": 0.28, "learning_rate": 1.682385068601563e-05, "loss": 0.7605, "step": 2601 }, { "epoch": 0.28, "learning_rate": 1.6821272841108675e-05, "loss": 0.7271, "step": 2602 }, { "epoch": 0.28, "learning_rate": 1.681869414817458e-05, "loss": 0.7466, "step": 2603 }, { "epoch": 0.28, "learning_rate": 1.6816114607533922e-05, "loss": 0.7974, "step": 2604 }, { "epoch": 0.28, "learning_rate": 1.68135342195074e-05, "loss": 0.6836, "step": 2605 }, { "epoch": 0.28, "learning_rate": 1.6810952984415804e-05, "loss": 0.6533, "step": 2606 }, { "epoch": 0.28, "learning_rate": 1.6808370902580034e-05, "loss": 0.833, "step": 2607 }, { "epoch": 0.28, "learning_rate": 1.6805787974321107e-05, "loss": 0.7998, "step": 2608 }, { "epoch": 0.28, "learning_rate": 1.6803204199960125e-05, "loss": 0.8525, "step": 2609 }, { "epoch": 0.28, "learning_rate": 1.680061957981831e-05, "loss": 0.7688, "step": 2610 }, { "epoch": 0.28, "learning_rate": 1.6798034114216983e-05, "loss": 0.7593, "step": 2611 }, { "epoch": 0.28, "learning_rate": 1.6795447803477575e-05, "loss": 0.7283, "step": 2612 }, { "epoch": 0.28, "learning_rate": 1.6792860647921614e-05, "loss": 0.7629, "step": 2613 }, { "epoch": 0.28, "learning_rate": 1.679027264787074e-05, "loss": 0.8877, "step": 2614 }, { "epoch": 0.28, "learning_rate": 1.6787683803646692e-05, "loss": 0.7803, "step": 2615 }, { "epoch": 0.28, "learning_rate": 1.6785094115571323e-05, "loss": 0.6785, "step": 2616 }, { "epoch": 0.28, "learning_rate": 1.6782503583966583e-05, "loss": 0.7019, "step": 2617 }, { "epoch": 0.28, "learning_rate": 1.677991220915453e-05, "loss": 0.8669, "step": 2618 }, { "epoch": 0.29, "learning_rate": 1.6777319991457325e-05, "loss": 0.67, "step": 2619 }, { "epoch": 0.29, "learning_rate": 1.6774726931197233e-05, "loss": 0.6782, "step": 2620 }, { "epoch": 0.29, "learning_rate": 1.6772133028696634e-05, "loss": 0.8452, "step": 2621 }, { "epoch": 0.29, "learning_rate": 1.6769538284277996e-05, "loss": 0.7368, "step": 2622 }, { "epoch": 0.29, "learning_rate": 1.67669426982639e-05, "loss": 0.9673, "step": 2623 }, { "epoch": 0.29, "learning_rate": 1.6764346270977038e-05, "loss": 0.8037, "step": 2624 }, { "epoch": 0.29, "learning_rate": 1.6761749002740195e-05, "loss": 0.8101, "step": 2625 }, { "epoch": 0.29, "learning_rate": 1.6759150893876272e-05, "loss": 0.6929, "step": 2626 }, { "epoch": 0.29, "learning_rate": 1.6756551944708258e-05, "loss": 0.7949, "step": 2627 }, { "epoch": 0.29, "learning_rate": 1.6753952155559266e-05, "loss": 0.9141, "step": 2628 }, { "epoch": 0.29, "learning_rate": 1.6751351526752503e-05, "loss": 0.8369, "step": 2629 }, { "epoch": 0.29, "learning_rate": 1.674875005861128e-05, "loss": 0.7908, "step": 2630 }, { "epoch": 0.29, "learning_rate": 1.674614775145901e-05, "loss": 0.8555, "step": 2631 }, { "epoch": 0.29, "learning_rate": 1.6743544605619216e-05, "loss": 0.7725, "step": 2632 }, { "epoch": 0.29, "learning_rate": 1.6740940621415534e-05, "loss": 0.7405, "step": 2633 }, { "epoch": 0.29, "learning_rate": 1.673833579917168e-05, "loss": 0.8369, "step": 2634 }, { "epoch": 0.29, "learning_rate": 1.6735730139211493e-05, "loss": 0.7671, "step": 2635 }, { "epoch": 0.29, "learning_rate": 1.6733123641858915e-05, "loss": 0.6736, "step": 2636 }, { "epoch": 0.29, "learning_rate": 1.6730516307437986e-05, "loss": 0.7441, "step": 2637 }, { "epoch": 0.29, "learning_rate": 1.6727908136272847e-05, "loss": 0.7822, "step": 2638 }, { "epoch": 0.29, "learning_rate": 1.6725299128687755e-05, "loss": 0.7412, "step": 2639 }, { "epoch": 0.29, "learning_rate": 1.6722689285007063e-05, "loss": 0.8413, "step": 2640 }, { "epoch": 0.29, "learning_rate": 1.6720078605555227e-05, "loss": 0.7847, "step": 2641 }, { "epoch": 0.29, "learning_rate": 1.6717467090656808e-05, "loss": 0.7393, "step": 2642 }, { "epoch": 0.29, "learning_rate": 1.6714854740636477e-05, "loss": 0.707, "step": 2643 }, { "epoch": 0.29, "learning_rate": 1.6712241555819e-05, "loss": 0.7251, "step": 2644 }, { "epoch": 0.29, "learning_rate": 1.670962753652925e-05, "loss": 0.6353, "step": 2645 }, { "epoch": 0.29, "learning_rate": 1.670701268309221e-05, "loss": 0.7515, "step": 2646 }, { "epoch": 0.29, "learning_rate": 1.6704396995832954e-05, "loss": 0.6851, "step": 2647 }, { "epoch": 0.29, "learning_rate": 1.6701780475076675e-05, "loss": 0.7209, "step": 2648 }, { "epoch": 0.29, "learning_rate": 1.6699163121148652e-05, "loss": 0.5837, "step": 2649 }, { "epoch": 0.29, "learning_rate": 1.669654493437428e-05, "loss": 0.7524, "step": 2650 }, { "epoch": 0.29, "learning_rate": 1.669392591507906e-05, "loss": 0.7659, "step": 2651 }, { "epoch": 0.29, "learning_rate": 1.6691306063588583e-05, "loss": 0.7822, "step": 2652 }, { "epoch": 0.29, "learning_rate": 1.6688685380228557e-05, "loss": 0.7578, "step": 2653 }, { "epoch": 0.29, "learning_rate": 1.6686063865324788e-05, "loss": 0.6606, "step": 2654 }, { "epoch": 0.29, "learning_rate": 1.668344151920318e-05, "loss": 0.8628, "step": 2655 }, { "epoch": 0.29, "learning_rate": 1.6680818342189748e-05, "loss": 0.791, "step": 2656 }, { "epoch": 0.29, "learning_rate": 1.667819433461061e-05, "loss": 0.7405, "step": 2657 }, { "epoch": 0.29, "learning_rate": 1.6675569496791985e-05, "loss": 0.7141, "step": 2658 }, { "epoch": 0.29, "learning_rate": 1.6672943829060194e-05, "loss": 0.8062, "step": 2659 }, { "epoch": 0.29, "learning_rate": 1.6670317331741662e-05, "loss": 0.7139, "step": 2660 }, { "epoch": 0.29, "learning_rate": 1.666769000516292e-05, "loss": 0.7427, "step": 2661 }, { "epoch": 0.29, "learning_rate": 1.6665061849650595e-05, "loss": 0.7256, "step": 2662 }, { "epoch": 0.29, "learning_rate": 1.6662432865531428e-05, "loss": 0.7437, "step": 2663 }, { "epoch": 0.29, "learning_rate": 1.665980305313225e-05, "loss": 0.6321, "step": 2664 }, { "epoch": 0.29, "learning_rate": 1.6657172412780006e-05, "loss": 0.7261, "step": 2665 }, { "epoch": 0.29, "learning_rate": 1.665454094480174e-05, "loss": 0.7993, "step": 2666 }, { "epoch": 0.29, "learning_rate": 1.66519086495246e-05, "loss": 0.7061, "step": 2667 }, { "epoch": 0.29, "learning_rate": 1.664927552727583e-05, "loss": 0.7952, "step": 2668 }, { "epoch": 0.29, "learning_rate": 1.6646641578382787e-05, "loss": 0.8037, "step": 2669 }, { "epoch": 0.29, "learning_rate": 1.6644006803172926e-05, "loss": 0.6499, "step": 2670 }, { "epoch": 0.29, "learning_rate": 1.66413712019738e-05, "loss": 0.6814, "step": 2671 }, { "epoch": 0.29, "learning_rate": 1.6638734775113077e-05, "loss": 0.6584, "step": 2672 }, { "epoch": 0.29, "learning_rate": 1.6636097522918514e-05, "loss": 0.6335, "step": 2673 }, { "epoch": 0.29, "learning_rate": 1.6633459445717973e-05, "loss": 0.8716, "step": 2674 }, { "epoch": 0.29, "learning_rate": 1.6630820543839433e-05, "loss": 0.667, "step": 2675 }, { "epoch": 0.29, "learning_rate": 1.6628180817610963e-05, "loss": 0.7993, "step": 2676 }, { "epoch": 0.29, "learning_rate": 1.662554026736073e-05, "loss": 0.6709, "step": 2677 }, { "epoch": 0.29, "learning_rate": 1.662289889341701e-05, "loss": 0.636, "step": 2678 }, { "epoch": 0.29, "learning_rate": 1.6620256696108187e-05, "loss": 0.7388, "step": 2679 }, { "epoch": 0.29, "learning_rate": 1.6617613675762737e-05, "loss": 0.7148, "step": 2680 }, { "epoch": 0.29, "learning_rate": 1.6614969832709245e-05, "loss": 0.6626, "step": 2681 }, { "epoch": 0.29, "learning_rate": 1.6612325167276395e-05, "loss": 0.7593, "step": 2682 }, { "epoch": 0.29, "learning_rate": 1.660967967979297e-05, "loss": 0.5972, "step": 2683 }, { "epoch": 0.29, "learning_rate": 1.660703337058787e-05, "loss": 0.7366, "step": 2684 }, { "epoch": 0.29, "learning_rate": 1.6604386239990077e-05, "loss": 0.7373, "step": 2685 }, { "epoch": 0.29, "learning_rate": 1.6601738288328692e-05, "loss": 0.8506, "step": 2686 }, { "epoch": 0.29, "learning_rate": 1.6599089515932906e-05, "loss": 0.7358, "step": 2687 }, { "epoch": 0.29, "learning_rate": 1.6596439923132016e-05, "loss": 0.7891, "step": 2688 }, { "epoch": 0.29, "learning_rate": 1.6593789510255426e-05, "loss": 0.676, "step": 2689 }, { "epoch": 0.29, "learning_rate": 1.6591138277632638e-05, "loss": 0.8013, "step": 2690 }, { "epoch": 0.29, "learning_rate": 1.658848622559325e-05, "loss": 0.7795, "step": 2691 }, { "epoch": 0.29, "learning_rate": 1.6585833354466975e-05, "loss": 0.7021, "step": 2692 }, { "epoch": 0.29, "learning_rate": 1.6583179664583612e-05, "loss": 0.7329, "step": 2693 }, { "epoch": 0.29, "learning_rate": 1.6580525156273083e-05, "loss": 0.7104, "step": 2694 }, { "epoch": 0.29, "learning_rate": 1.6577869829865386e-05, "loss": 0.6648, "step": 2695 }, { "epoch": 0.29, "learning_rate": 1.657521368569064e-05, "loss": 0.7681, "step": 2696 }, { "epoch": 0.29, "learning_rate": 1.6572556724079055e-05, "loss": 0.8027, "step": 2697 }, { "epoch": 0.29, "learning_rate": 1.6569898945360953e-05, "loss": 0.8257, "step": 2698 }, { "epoch": 0.29, "learning_rate": 1.656724034986675e-05, "loss": 0.7129, "step": 2699 }, { "epoch": 0.29, "learning_rate": 1.656458093792696e-05, "loss": 0.6897, "step": 2700 }, { "epoch": 0.29, "learning_rate": 1.6561920709872214e-05, "loss": 0.7429, "step": 2701 }, { "epoch": 0.29, "learning_rate": 1.655925966603322e-05, "loss": 0.771, "step": 2702 }, { "epoch": 0.29, "learning_rate": 1.6556597806740815e-05, "loss": 0.7383, "step": 2703 }, { "epoch": 0.29, "learning_rate": 1.6553935132325916e-05, "loss": 0.8044, "step": 2704 }, { "epoch": 0.29, "learning_rate": 1.6551271643119556e-05, "loss": 0.8037, "step": 2705 }, { "epoch": 0.29, "learning_rate": 1.6548607339452853e-05, "loss": 0.637, "step": 2706 }, { "epoch": 0.29, "learning_rate": 1.6545942221657042e-05, "loss": 0.8472, "step": 2707 }, { "epoch": 0.29, "learning_rate": 1.6543276290063447e-05, "loss": 0.7656, "step": 2708 }, { "epoch": 0.29, "learning_rate": 1.6540609545003513e-05, "loss": 0.6848, "step": 2709 }, { "epoch": 0.3, "learning_rate": 1.6537941986808754e-05, "loss": 0.6277, "step": 2710 }, { "epoch": 0.3, "learning_rate": 1.653527361581082e-05, "loss": 0.8408, "step": 2711 }, { "epoch": 0.3, "learning_rate": 1.653260443234143e-05, "loss": 0.8513, "step": 2712 }, { "epoch": 0.3, "learning_rate": 1.6529934436732433e-05, "loss": 0.7153, "step": 2713 }, { "epoch": 0.3, "learning_rate": 1.6527263629315758e-05, "loss": 0.812, "step": 2714 }, { "epoch": 0.3, "learning_rate": 1.6524592010423444e-05, "loss": 0.7725, "step": 2715 }, { "epoch": 0.3, "learning_rate": 1.652191958038763e-05, "loss": 0.7358, "step": 2716 }, { "epoch": 0.3, "learning_rate": 1.651924633954055e-05, "loss": 0.8618, "step": 2717 }, { "epoch": 0.3, "learning_rate": 1.6516572288214555e-05, "loss": 0.7625, "step": 2718 }, { "epoch": 0.3, "learning_rate": 1.6513897426742073e-05, "loss": 0.7686, "step": 2719 }, { "epoch": 0.3, "learning_rate": 1.6511221755455654e-05, "loss": 0.7703, "step": 2720 }, { "epoch": 0.3, "learning_rate": 1.6508545274687936e-05, "loss": 0.7837, "step": 2721 }, { "epoch": 0.3, "learning_rate": 1.6505867984771665e-05, "loss": 0.7603, "step": 2722 }, { "epoch": 0.3, "learning_rate": 1.650318988603968e-05, "loss": 0.9263, "step": 2723 }, { "epoch": 0.3, "learning_rate": 1.6500510978824928e-05, "loss": 0.7529, "step": 2724 }, { "epoch": 0.3, "learning_rate": 1.649783126346045e-05, "loss": 0.791, "step": 2725 }, { "epoch": 0.3, "learning_rate": 1.649515074027939e-05, "loss": 0.7383, "step": 2726 }, { "epoch": 0.3, "learning_rate": 1.6492469409615003e-05, "loss": 0.7483, "step": 2727 }, { "epoch": 0.3, "learning_rate": 1.6489787271800625e-05, "loss": 0.6877, "step": 2728 }, { "epoch": 0.3, "learning_rate": 1.6487104327169702e-05, "loss": 0.7764, "step": 2729 }, { "epoch": 0.3, "learning_rate": 1.6484420576055787e-05, "loss": 0.8174, "step": 2730 }, { "epoch": 0.3, "learning_rate": 1.6481736018792517e-05, "loss": 0.7583, "step": 2731 }, { "epoch": 0.3, "learning_rate": 1.6479050655713645e-05, "loss": 0.7283, "step": 2732 }, { "epoch": 0.3, "learning_rate": 1.6476364487153024e-05, "loss": 0.7261, "step": 2733 }, { "epoch": 0.3, "learning_rate": 1.6473677513444588e-05, "loss": 0.6987, "step": 2734 }, { "epoch": 0.3, "learning_rate": 1.647098973492239e-05, "loss": 0.8101, "step": 2735 }, { "epoch": 0.3, "learning_rate": 1.6468301151920576e-05, "loss": 0.7275, "step": 2736 }, { "epoch": 0.3, "learning_rate": 1.6465611764773397e-05, "loss": 0.6848, "step": 2737 }, { "epoch": 0.3, "learning_rate": 1.6462921573815194e-05, "loss": 0.7388, "step": 2738 }, { "epoch": 0.3, "learning_rate": 1.6460230579380423e-05, "loss": 0.8716, "step": 2739 }, { "epoch": 0.3, "learning_rate": 1.6457538781803625e-05, "loss": 0.6775, "step": 2740 }, { "epoch": 0.3, "learning_rate": 1.6454846181419444e-05, "loss": 0.6816, "step": 2741 }, { "epoch": 0.3, "learning_rate": 1.6452152778562633e-05, "loss": 0.6978, "step": 2742 }, { "epoch": 0.3, "learning_rate": 1.6449458573568032e-05, "loss": 0.7949, "step": 2743 }, { "epoch": 0.3, "learning_rate": 1.6446763566770598e-05, "loss": 0.6887, "step": 2744 }, { "epoch": 0.3, "learning_rate": 1.644406775850536e-05, "loss": 0.7041, "step": 2745 }, { "epoch": 0.3, "learning_rate": 1.6441371149107478e-05, "loss": 0.6228, "step": 2746 }, { "epoch": 0.3, "learning_rate": 1.6438673738912195e-05, "loss": 0.7864, "step": 2747 }, { "epoch": 0.3, "learning_rate": 1.6435975528254847e-05, "loss": 0.7456, "step": 2748 }, { "epoch": 0.3, "learning_rate": 1.6433276517470888e-05, "loss": 0.7363, "step": 2749 }, { "epoch": 0.3, "learning_rate": 1.6430576706895855e-05, "loss": 0.8398, "step": 2750 }, { "epoch": 0.3, "learning_rate": 1.6427876096865394e-05, "loss": 0.7993, "step": 2751 }, { "epoch": 0.3, "learning_rate": 1.6425174687715247e-05, "loss": 0.7366, "step": 2752 }, { "epoch": 0.3, "learning_rate": 1.6422472479781258e-05, "loss": 0.6758, "step": 2753 }, { "epoch": 0.3, "learning_rate": 1.6419769473399362e-05, "loss": 0.8149, "step": 2754 }, { "epoch": 0.3, "learning_rate": 1.6417065668905605e-05, "loss": 0.6519, "step": 2755 }, { "epoch": 0.3, "learning_rate": 1.6414361066636123e-05, "loss": 0.814, "step": 2756 }, { "epoch": 0.3, "learning_rate": 1.6411655666927157e-05, "loss": 0.7554, "step": 2757 }, { "epoch": 0.3, "learning_rate": 1.6408949470115045e-05, "loss": 0.655, "step": 2758 }, { "epoch": 0.3, "learning_rate": 1.640624247653622e-05, "loss": 0.8604, "step": 2759 }, { "epoch": 0.3, "learning_rate": 1.6403534686527223e-05, "loss": 0.79, "step": 2760 }, { "epoch": 0.3, "learning_rate": 1.640082610042469e-05, "loss": 0.6938, "step": 2761 }, { "epoch": 0.3, "learning_rate": 1.639811671856535e-05, "loss": 0.7285, "step": 2762 }, { "epoch": 0.3, "learning_rate": 1.6395406541286036e-05, "loss": 0.8184, "step": 2763 }, { "epoch": 0.3, "learning_rate": 1.6392695568923685e-05, "loss": 0.7847, "step": 2764 }, { "epoch": 0.3, "learning_rate": 1.6389983801815324e-05, "loss": 0.7334, "step": 2765 }, { "epoch": 0.3, "learning_rate": 1.6387271240298082e-05, "loss": 0.7207, "step": 2766 }, { "epoch": 0.3, "learning_rate": 1.6384557884709188e-05, "loss": 0.8218, "step": 2767 }, { "epoch": 0.3, "learning_rate": 1.6381843735385975e-05, "loss": 0.7783, "step": 2768 }, { "epoch": 0.3, "learning_rate": 1.6379128792665853e-05, "loss": 0.5896, "step": 2769 }, { "epoch": 0.3, "learning_rate": 1.6376413056886364e-05, "loss": 0.7322, "step": 2770 }, { "epoch": 0.3, "learning_rate": 1.637369652838512e-05, "loss": 0.7778, "step": 2771 }, { "epoch": 0.3, "learning_rate": 1.6370979207499845e-05, "loss": 0.8115, "step": 2772 }, { "epoch": 0.3, "learning_rate": 1.636826109456836e-05, "loss": 0.7419, "step": 2773 }, { "epoch": 0.3, "learning_rate": 1.6365542189928584e-05, "loss": 0.8135, "step": 2774 }, { "epoch": 0.3, "learning_rate": 1.636282249391853e-05, "loss": 0.6682, "step": 2775 }, { "epoch": 0.3, "learning_rate": 1.6360102006876317e-05, "loss": 0.6809, "step": 2776 }, { "epoch": 0.3, "learning_rate": 1.6357380729140156e-05, "loss": 0.5408, "step": 2777 }, { "epoch": 0.3, "learning_rate": 1.6354658661048364e-05, "loss": 0.7644, "step": 2778 }, { "epoch": 0.3, "learning_rate": 1.6351935802939344e-05, "loss": 0.7578, "step": 2779 }, { "epoch": 0.3, "learning_rate": 1.6349212155151606e-05, "loss": 0.6648, "step": 2780 }, { "epoch": 0.3, "learning_rate": 1.6346487718023762e-05, "loss": 0.6377, "step": 2781 }, { "epoch": 0.3, "learning_rate": 1.6343762491894513e-05, "loss": 0.8223, "step": 2782 }, { "epoch": 0.3, "learning_rate": 1.634103647710266e-05, "loss": 0.8003, "step": 2783 }, { "epoch": 0.3, "learning_rate": 1.63383096739871e-05, "loss": 0.7524, "step": 2784 }, { "epoch": 0.3, "learning_rate": 1.6335582082886843e-05, "loss": 0.7979, "step": 2785 }, { "epoch": 0.3, "learning_rate": 1.633285370414098e-05, "loss": 0.7158, "step": 2786 }, { "epoch": 0.3, "learning_rate": 1.6330124538088705e-05, "loss": 0.7412, "step": 2787 }, { "epoch": 0.3, "learning_rate": 1.632739458506931e-05, "loss": 0.708, "step": 2788 }, { "epoch": 0.3, "learning_rate": 1.6324663845422187e-05, "loss": 0.7654, "step": 2789 }, { "epoch": 0.3, "learning_rate": 1.6321932319486822e-05, "loss": 0.635, "step": 2790 }, { "epoch": 0.3, "learning_rate": 1.6319200007602803e-05, "loss": 0.7461, "step": 2791 }, { "epoch": 0.3, "learning_rate": 1.6316466910109813e-05, "loss": 0.7817, "step": 2792 }, { "epoch": 0.3, "learning_rate": 1.631373302734763e-05, "loss": 0.8628, "step": 2793 }, { "epoch": 0.3, "learning_rate": 1.6310998359656137e-05, "loss": 0.7847, "step": 2794 }, { "epoch": 0.3, "learning_rate": 1.6308262907375314e-05, "loss": 0.8564, "step": 2795 }, { "epoch": 0.3, "learning_rate": 1.6305526670845225e-05, "loss": 0.6643, "step": 2796 }, { "epoch": 0.3, "learning_rate": 1.630278965040605e-05, "loss": 0.6621, "step": 2797 }, { "epoch": 0.3, "learning_rate": 1.6300051846398055e-05, "loss": 0.8086, "step": 2798 }, { "epoch": 0.3, "learning_rate": 1.6297313259161605e-05, "loss": 0.7839, "step": 2799 }, { "epoch": 0.3, "learning_rate": 1.629457388903717e-05, "loss": 0.8291, "step": 2800 }, { "epoch": 0.3, "learning_rate": 1.6291833736365303e-05, "loss": 0.7529, "step": 2801 }, { "epoch": 0.31, "learning_rate": 1.628909280148667e-05, "loss": 0.6594, "step": 2802 }, { "epoch": 0.31, "learning_rate": 1.6286351084742014e-05, "loss": 0.6758, "step": 2803 }, { "epoch": 0.31, "learning_rate": 1.6283608586472202e-05, "loss": 0.7703, "step": 2804 }, { "epoch": 0.31, "learning_rate": 1.6280865307018177e-05, "loss": 0.73, "step": 2805 }, { "epoch": 0.31, "learning_rate": 1.627812124672099e-05, "loss": 0.7925, "step": 2806 }, { "epoch": 0.31, "learning_rate": 1.6275376405921778e-05, "loss": 0.7988, "step": 2807 }, { "epoch": 0.31, "learning_rate": 1.6272630784961786e-05, "loss": 0.7812, "step": 2808 }, { "epoch": 0.31, "learning_rate": 1.626988438418236e-05, "loss": 0.7002, "step": 2809 }, { "epoch": 0.31, "learning_rate": 1.6267137203924924e-05, "loss": 0.7832, "step": 2810 }, { "epoch": 0.31, "learning_rate": 1.6264389244531015e-05, "loss": 0.8999, "step": 2811 }, { "epoch": 0.31, "learning_rate": 1.626164050634226e-05, "loss": 0.772, "step": 2812 }, { "epoch": 0.31, "learning_rate": 1.6258890989700384e-05, "loss": 0.8472, "step": 2813 }, { "epoch": 0.31, "learning_rate": 1.6256140694947217e-05, "loss": 0.689, "step": 2814 }, { "epoch": 0.31, "learning_rate": 1.6253389622424668e-05, "loss": 0.7623, "step": 2815 }, { "epoch": 0.31, "learning_rate": 1.6250637772474764e-05, "loss": 0.7075, "step": 2816 }, { "epoch": 0.31, "learning_rate": 1.6247885145439602e-05, "loss": 0.6533, "step": 2817 }, { "epoch": 0.31, "learning_rate": 1.6245131741661408e-05, "loss": 0.8447, "step": 2818 }, { "epoch": 0.31, "learning_rate": 1.6242377561482477e-05, "loss": 0.7593, "step": 2819 }, { "epoch": 0.31, "learning_rate": 1.6239622605245217e-05, "loss": 0.7239, "step": 2820 }, { "epoch": 0.31, "learning_rate": 1.623686687329212e-05, "loss": 0.7241, "step": 2821 }, { "epoch": 0.31, "learning_rate": 1.623411036596579e-05, "loss": 0.6794, "step": 2822 }, { "epoch": 0.31, "learning_rate": 1.623135308360891e-05, "loss": 0.7949, "step": 2823 }, { "epoch": 0.31, "learning_rate": 1.6228595026564277e-05, "loss": 0.6716, "step": 2824 }, { "epoch": 0.31, "learning_rate": 1.622583619517477e-05, "loss": 0.8506, "step": 2825 }, { "epoch": 0.31, "learning_rate": 1.6223076589783368e-05, "loss": 0.8035, "step": 2826 }, { "epoch": 0.31, "learning_rate": 1.6220316210733152e-05, "loss": 0.7378, "step": 2827 }, { "epoch": 0.31, "learning_rate": 1.6217555058367288e-05, "loss": 0.7805, "step": 2828 }, { "epoch": 0.31, "learning_rate": 1.6214793133029055e-05, "loss": 0.6523, "step": 2829 }, { "epoch": 0.31, "learning_rate": 1.6212030435061813e-05, "loss": 0.813, "step": 2830 }, { "epoch": 0.31, "learning_rate": 1.620926696480902e-05, "loss": 0.7275, "step": 2831 }, { "epoch": 0.31, "learning_rate": 1.620650272261424e-05, "loss": 0.5918, "step": 2832 }, { "epoch": 0.31, "learning_rate": 1.6203737708821118e-05, "loss": 0.8286, "step": 2833 }, { "epoch": 0.31, "learning_rate": 1.6200971923773414e-05, "loss": 0.7578, "step": 2834 }, { "epoch": 0.31, "learning_rate": 1.6198205367814964e-05, "loss": 0.832, "step": 2835 }, { "epoch": 0.31, "learning_rate": 1.619543804128971e-05, "loss": 0.8071, "step": 2836 }, { "epoch": 0.31, "learning_rate": 1.6192669944541693e-05, "loss": 0.7715, "step": 2837 }, { "epoch": 0.31, "learning_rate": 1.6189901077915046e-05, "loss": 0.7905, "step": 2838 }, { "epoch": 0.31, "learning_rate": 1.618713144175399e-05, "loss": 0.7759, "step": 2839 }, { "epoch": 0.31, "learning_rate": 1.6184361036402854e-05, "loss": 0.6035, "step": 2840 }, { "epoch": 0.31, "learning_rate": 1.6181589862206053e-05, "loss": 0.8579, "step": 2841 }, { "epoch": 0.31, "learning_rate": 1.617881791950811e-05, "loss": 0.7053, "step": 2842 }, { "epoch": 0.31, "learning_rate": 1.617604520865363e-05, "loss": 0.7, "step": 2843 }, { "epoch": 0.31, "learning_rate": 1.617327172998732e-05, "loss": 0.6365, "step": 2844 }, { "epoch": 0.31, "learning_rate": 1.617049748385398e-05, "loss": 0.6194, "step": 2845 }, { "epoch": 0.31, "learning_rate": 1.6167722470598506e-05, "loss": 0.7185, "step": 2846 }, { "epoch": 0.31, "learning_rate": 1.6164946690565898e-05, "loss": 0.9014, "step": 2847 }, { "epoch": 0.31, "learning_rate": 1.6162170144101237e-05, "loss": 0.6633, "step": 2848 }, { "epoch": 0.31, "learning_rate": 1.6159392831549708e-05, "loss": 0.7678, "step": 2849 }, { "epoch": 0.31, "learning_rate": 1.6156614753256583e-05, "loss": 0.7625, "step": 2850 }, { "epoch": 0.31, "learning_rate": 1.6153835909567245e-05, "loss": 0.7827, "step": 2851 }, { "epoch": 0.31, "learning_rate": 1.6151056300827158e-05, "loss": 0.7832, "step": 2852 }, { "epoch": 0.31, "learning_rate": 1.6148275927381887e-05, "loss": 0.7856, "step": 2853 }, { "epoch": 0.31, "learning_rate": 1.614549478957709e-05, "loss": 0.8706, "step": 2854 }, { "epoch": 0.31, "learning_rate": 1.6142712887758515e-05, "loss": 0.7563, "step": 2855 }, { "epoch": 0.31, "learning_rate": 1.613993022227202e-05, "loss": 0.7754, "step": 2856 }, { "epoch": 0.31, "learning_rate": 1.6137146793463545e-05, "loss": 0.6248, "step": 2857 }, { "epoch": 0.31, "learning_rate": 1.613436260167913e-05, "loss": 0.6455, "step": 2858 }, { "epoch": 0.31, "learning_rate": 1.6131577647264903e-05, "loss": 0.7734, "step": 2859 }, { "epoch": 0.31, "learning_rate": 1.6128791930567095e-05, "loss": 0.6592, "step": 2860 }, { "epoch": 0.31, "learning_rate": 1.6126005451932028e-05, "loss": 0.6372, "step": 2861 }, { "epoch": 0.31, "learning_rate": 1.6123218211706125e-05, "loss": 0.6658, "step": 2862 }, { "epoch": 0.31, "learning_rate": 1.6120430210235896e-05, "loss": 0.7764, "step": 2863 }, { "epoch": 0.31, "learning_rate": 1.611764144786794e-05, "loss": 0.7188, "step": 2864 }, { "epoch": 0.31, "learning_rate": 1.611485192494897e-05, "loss": 0.8491, "step": 2865 }, { "epoch": 0.31, "learning_rate": 1.611206164182578e-05, "loss": 0.6765, "step": 2866 }, { "epoch": 0.31, "learning_rate": 1.6109270598845256e-05, "loss": 0.7529, "step": 2867 }, { "epoch": 0.31, "learning_rate": 1.6106478796354382e-05, "loss": 0.658, "step": 2868 }, { "epoch": 0.31, "learning_rate": 1.6103686234700244e-05, "loss": 0.7317, "step": 2869 }, { "epoch": 0.31, "learning_rate": 1.610089291423001e-05, "loss": 0.8745, "step": 2870 }, { "epoch": 0.31, "learning_rate": 1.6098098835290955e-05, "loss": 0.7336, "step": 2871 }, { "epoch": 0.31, "learning_rate": 1.6095303998230432e-05, "loss": 0.7625, "step": 2872 }, { "epoch": 0.31, "learning_rate": 1.6092508403395908e-05, "loss": 0.7422, "step": 2873 }, { "epoch": 0.31, "learning_rate": 1.6089712051134927e-05, "loss": 0.7715, "step": 2874 }, { "epoch": 0.31, "learning_rate": 1.6086914941795136e-05, "loss": 0.7788, "step": 2875 }, { "epoch": 0.31, "learning_rate": 1.608411707572428e-05, "loss": 0.72, "step": 2876 }, { "epoch": 0.31, "learning_rate": 1.608131845327018e-05, "loss": 0.7241, "step": 2877 }, { "epoch": 0.31, "learning_rate": 1.6078519074780775e-05, "loss": 0.918, "step": 2878 }, { "epoch": 0.31, "learning_rate": 1.6075718940604076e-05, "loss": 0.7568, "step": 2879 }, { "epoch": 0.31, "learning_rate": 1.6072918051088212e-05, "loss": 0.7307, "step": 2880 }, { "epoch": 0.31, "learning_rate": 1.6070116406581382e-05, "loss": 0.8076, "step": 2881 }, { "epoch": 0.31, "learning_rate": 1.606731400743189e-05, "loss": 0.7744, "step": 2882 }, { "epoch": 0.31, "learning_rate": 1.6064510853988137e-05, "loss": 0.7666, "step": 2883 }, { "epoch": 0.31, "learning_rate": 1.606170694659861e-05, "loss": 0.6533, "step": 2884 }, { "epoch": 0.31, "learning_rate": 1.6058902285611892e-05, "loss": 0.7825, "step": 2885 }, { "epoch": 0.31, "learning_rate": 1.6056096871376667e-05, "loss": 0.7979, "step": 2886 }, { "epoch": 0.31, "learning_rate": 1.6053290704241705e-05, "loss": 0.708, "step": 2887 }, { "epoch": 0.31, "learning_rate": 1.6050483784555867e-05, "loss": 0.7305, "step": 2888 }, { "epoch": 0.31, "learning_rate": 1.6047676112668118e-05, "loss": 0.7397, "step": 2889 }, { "epoch": 0.31, "learning_rate": 1.6044867688927504e-05, "loss": 0.7212, "step": 2890 }, { "epoch": 0.31, "learning_rate": 1.6042058513683177e-05, "loss": 0.7202, "step": 2891 }, { "epoch": 0.31, "learning_rate": 1.6039248587284373e-05, "loss": 0.8208, "step": 2892 }, { "epoch": 0.31, "learning_rate": 1.6036437910080427e-05, "loss": 0.7856, "step": 2893 }, { "epoch": 0.32, "learning_rate": 1.603362648242076e-05, "loss": 0.7256, "step": 2894 }, { "epoch": 0.32, "learning_rate": 1.6030814304654895e-05, "loss": 0.7915, "step": 2895 }, { "epoch": 0.32, "learning_rate": 1.6028001377132447e-05, "loss": 0.6289, "step": 2896 }, { "epoch": 0.32, "learning_rate": 1.602518770020312e-05, "loss": 0.7354, "step": 2897 }, { "epoch": 0.32, "learning_rate": 1.602237327421671e-05, "loss": 0.7969, "step": 2898 }, { "epoch": 0.32, "learning_rate": 1.6019558099523115e-05, "loss": 0.7229, "step": 2899 }, { "epoch": 0.32, "learning_rate": 1.601674217647231e-05, "loss": 0.7368, "step": 2900 }, { "epoch": 0.32, "learning_rate": 1.6013925505414386e-05, "loss": 0.8306, "step": 2901 }, { "epoch": 0.32, "learning_rate": 1.6011108086699506e-05, "loss": 0.74, "step": 2902 }, { "epoch": 0.32, "learning_rate": 1.6008289920677933e-05, "loss": 0.6057, "step": 2903 }, { "epoch": 0.32, "learning_rate": 1.6005471007700033e-05, "loss": 0.8103, "step": 2904 }, { "epoch": 0.32, "learning_rate": 1.6002651348116248e-05, "loss": 0.7319, "step": 2905 }, { "epoch": 0.32, "learning_rate": 1.5999830942277124e-05, "loss": 0.9102, "step": 2906 }, { "epoch": 0.32, "learning_rate": 1.5997009790533292e-05, "loss": 0.6868, "step": 2907 }, { "epoch": 0.32, "learning_rate": 1.5994187893235485e-05, "loss": 0.8103, "step": 2908 }, { "epoch": 0.32, "learning_rate": 1.5991365250734524e-05, "loss": 0.7642, "step": 2909 }, { "epoch": 0.32, "learning_rate": 1.5988541863381323e-05, "loss": 0.7554, "step": 2910 }, { "epoch": 0.32, "learning_rate": 1.5985717731526888e-05, "loss": 0.7161, "step": 2911 }, { "epoch": 0.32, "learning_rate": 1.5982892855522312e-05, "loss": 0.771, "step": 2912 }, { "epoch": 0.32, "learning_rate": 1.5980067235718793e-05, "loss": 0.6858, "step": 2913 }, { "epoch": 0.32, "learning_rate": 1.597724087246761e-05, "loss": 0.8477, "step": 2914 }, { "epoch": 0.32, "learning_rate": 1.5974413766120145e-05, "loss": 0.6543, "step": 2915 }, { "epoch": 0.32, "learning_rate": 1.5971585917027864e-05, "loss": 0.8564, "step": 2916 }, { "epoch": 0.32, "learning_rate": 1.5968757325542322e-05, "loss": 0.7649, "step": 2917 }, { "epoch": 0.32, "learning_rate": 1.5965927992015182e-05, "loss": 0.7734, "step": 2918 }, { "epoch": 0.32, "learning_rate": 1.5963097916798184e-05, "loss": 0.7324, "step": 2919 }, { "epoch": 0.32, "learning_rate": 1.5960267100243165e-05, "loss": 0.7681, "step": 2920 }, { "epoch": 0.32, "learning_rate": 1.595743554270206e-05, "loss": 0.843, "step": 2921 }, { "epoch": 0.32, "learning_rate": 1.595460324452688e-05, "loss": 0.7146, "step": 2922 }, { "epoch": 0.32, "learning_rate": 1.595177020606975e-05, "loss": 0.7705, "step": 2923 }, { "epoch": 0.32, "learning_rate": 1.5948936427682874e-05, "loss": 0.7607, "step": 2924 }, { "epoch": 0.32, "learning_rate": 1.5946101909718548e-05, "loss": 0.73, "step": 2925 }, { "epoch": 0.32, "learning_rate": 1.5943266652529162e-05, "loss": 0.6948, "step": 2926 }, { "epoch": 0.32, "learning_rate": 1.5940430656467193e-05, "loss": 0.7627, "step": 2927 }, { "epoch": 0.32, "learning_rate": 1.5937593921885227e-05, "loss": 0.5625, "step": 2928 }, { "epoch": 0.32, "learning_rate": 1.593475644913592e-05, "loss": 0.8911, "step": 2929 }, { "epoch": 0.32, "learning_rate": 1.5931918238572025e-05, "loss": 0.7085, "step": 2930 }, { "epoch": 0.32, "learning_rate": 1.5929079290546408e-05, "loss": 0.7153, "step": 2931 }, { "epoch": 0.32, "learning_rate": 1.592623960541199e-05, "loss": 0.7571, "step": 2932 }, { "epoch": 0.32, "learning_rate": 1.592339918352182e-05, "loss": 0.7524, "step": 2933 }, { "epoch": 0.32, "learning_rate": 1.5920558025229015e-05, "loss": 0.7671, "step": 2934 }, { "epoch": 0.32, "learning_rate": 1.5917716130886786e-05, "loss": 0.7456, "step": 2935 }, { "epoch": 0.32, "learning_rate": 1.5914873500848446e-05, "loss": 0.7568, "step": 2936 }, { "epoch": 0.32, "learning_rate": 1.591203013546739e-05, "loss": 0.7251, "step": 2937 }, { "epoch": 0.32, "learning_rate": 1.5909186035097114e-05, "loss": 0.7021, "step": 2938 }, { "epoch": 0.32, "learning_rate": 1.5906341200091194e-05, "loss": 0.7607, "step": 2939 }, { "epoch": 0.32, "learning_rate": 1.5903495630803302e-05, "loss": 0.6978, "step": 2940 }, { "epoch": 0.32, "learning_rate": 1.59006493275872e-05, "loss": 0.6731, "step": 2941 }, { "epoch": 0.32, "learning_rate": 1.5897802290796752e-05, "loss": 0.738, "step": 2942 }, { "epoch": 0.32, "learning_rate": 1.5894954520785895e-05, "loss": 0.7556, "step": 2943 }, { "epoch": 0.32, "learning_rate": 1.5892106017908675e-05, "loss": 0.7588, "step": 2944 }, { "epoch": 0.32, "learning_rate": 1.588925678251921e-05, "loss": 0.6023, "step": 2945 }, { "epoch": 0.32, "learning_rate": 1.5886406814971728e-05, "loss": 0.7373, "step": 2946 }, { "epoch": 0.32, "learning_rate": 1.588355611562054e-05, "loss": 0.6523, "step": 2947 }, { "epoch": 0.32, "learning_rate": 1.5880704684820046e-05, "loss": 0.8267, "step": 2948 }, { "epoch": 0.32, "learning_rate": 1.5877852522924733e-05, "loss": 0.7827, "step": 2949 }, { "epoch": 0.32, "learning_rate": 1.5874999630289193e-05, "loss": 0.7061, "step": 2950 }, { "epoch": 0.32, "learning_rate": 1.587214600726809e-05, "loss": 0.814, "step": 2951 }, { "epoch": 0.32, "learning_rate": 1.5869291654216203e-05, "loss": 0.6711, "step": 2952 }, { "epoch": 0.32, "learning_rate": 1.5866436571488376e-05, "loss": 0.8184, "step": 2953 }, { "epoch": 0.32, "learning_rate": 1.5863580759439563e-05, "loss": 0.7112, "step": 2954 }, { "epoch": 0.32, "learning_rate": 1.5860724218424794e-05, "loss": 0.7874, "step": 2955 }, { "epoch": 0.32, "learning_rate": 1.5857866948799202e-05, "loss": 0.6841, "step": 2956 }, { "epoch": 0.32, "learning_rate": 1.585500895091801e-05, "loss": 0.824, "step": 2957 }, { "epoch": 0.32, "learning_rate": 1.585215022513652e-05, "loss": 0.8198, "step": 2958 }, { "epoch": 0.32, "learning_rate": 1.5849290771810127e-05, "loss": 0.6675, "step": 2959 }, { "epoch": 0.32, "learning_rate": 1.5846430591294334e-05, "loss": 0.7219, "step": 2960 }, { "epoch": 0.32, "learning_rate": 1.584356968394471e-05, "loss": 0.8955, "step": 2961 }, { "epoch": 0.32, "learning_rate": 1.5840708050116935e-05, "loss": 0.635, "step": 2962 }, { "epoch": 0.32, "learning_rate": 1.583784569016676e-05, "loss": 0.7344, "step": 2963 }, { "epoch": 0.32, "learning_rate": 1.5834982604450044e-05, "loss": 0.7974, "step": 2964 }, { "epoch": 0.32, "learning_rate": 1.5832118793322727e-05, "loss": 0.8074, "step": 2965 }, { "epoch": 0.32, "learning_rate": 1.582925425714084e-05, "loss": 0.615, "step": 2966 }, { "epoch": 0.32, "learning_rate": 1.5826388996260503e-05, "loss": 0.7554, "step": 2967 }, { "epoch": 0.32, "learning_rate": 1.5823523011037932e-05, "loss": 0.6792, "step": 2968 }, { "epoch": 0.32, "learning_rate": 1.5820656301829425e-05, "loss": 0.7217, "step": 2969 }, { "epoch": 0.32, "learning_rate": 1.581778886899138e-05, "loss": 0.7422, "step": 2970 }, { "epoch": 0.32, "learning_rate": 1.5814920712880267e-05, "loss": 0.8, "step": 2971 }, { "epoch": 0.32, "learning_rate": 1.581205183385267e-05, "loss": 0.7871, "step": 2972 }, { "epoch": 0.32, "learning_rate": 1.580918223226525e-05, "loss": 0.8218, "step": 2973 }, { "epoch": 0.32, "learning_rate": 1.580631190847475e-05, "loss": 0.7832, "step": 2974 }, { "epoch": 0.32, "learning_rate": 1.5803440862838018e-05, "loss": 0.7393, "step": 2975 }, { "epoch": 0.32, "learning_rate": 1.5800569095711983e-05, "loss": 0.7168, "step": 2976 }, { "epoch": 0.32, "learning_rate": 1.5797696607453668e-05, "loss": 0.7422, "step": 2977 }, { "epoch": 0.32, "learning_rate": 1.579482339842018e-05, "loss": 0.7341, "step": 2978 }, { "epoch": 0.32, "learning_rate": 1.5791949468968723e-05, "loss": 0.8071, "step": 2979 }, { "epoch": 0.32, "learning_rate": 1.5789074819456583e-05, "loss": 0.7178, "step": 2980 }, { "epoch": 0.32, "learning_rate": 1.578619945024114e-05, "loss": 0.6548, "step": 2981 }, { "epoch": 0.32, "learning_rate": 1.5783323361679865e-05, "loss": 0.8735, "step": 2982 }, { "epoch": 0.32, "learning_rate": 1.5780446554130318e-05, "loss": 0.6418, "step": 2983 }, { "epoch": 0.32, "learning_rate": 1.5777569027950137e-05, "loss": 0.6616, "step": 2984 }, { "epoch": 0.32, "learning_rate": 1.5774690783497066e-05, "loss": 0.9058, "step": 2985 }, { "epoch": 0.33, "learning_rate": 1.5771811821128932e-05, "loss": 0.7363, "step": 2986 }, { "epoch": 0.33, "learning_rate": 1.5768932141203647e-05, "loss": 0.7144, "step": 2987 }, { "epoch": 0.33, "learning_rate": 1.5766051744079217e-05, "loss": 0.8096, "step": 2988 }, { "epoch": 0.33, "learning_rate": 1.5763170630113735e-05, "loss": 0.7834, "step": 2989 }, { "epoch": 0.33, "learning_rate": 1.5760288799665387e-05, "loss": 0.5786, "step": 2990 }, { "epoch": 0.33, "learning_rate": 1.575740625309244e-05, "loss": 0.7722, "step": 2991 }, { "epoch": 0.33, "learning_rate": 1.575452299075326e-05, "loss": 0.7839, "step": 2992 }, { "epoch": 0.33, "learning_rate": 1.575163901300629e-05, "loss": 0.7998, "step": 2993 }, { "epoch": 0.33, "learning_rate": 1.5748754320210074e-05, "loss": 0.6736, "step": 2994 }, { "epoch": 0.33, "learning_rate": 1.5745868912723236e-05, "loss": 0.7561, "step": 2995 }, { "epoch": 0.33, "learning_rate": 1.57429827909045e-05, "loss": 0.6719, "step": 2996 }, { "epoch": 0.33, "learning_rate": 1.574009595511267e-05, "loss": 0.7815, "step": 2997 }, { "epoch": 0.33, "learning_rate": 1.5737208405706628e-05, "loss": 0.7449, "step": 2998 }, { "epoch": 0.33, "learning_rate": 1.5734320143045373e-05, "loss": 0.7422, "step": 2999 }, { "epoch": 0.33, "learning_rate": 1.5731431167487966e-05, "loss": 0.856, "step": 3000 }, { "epoch": 0.33, "learning_rate": 1.572854147939357e-05, "loss": 0.8149, "step": 3001 }, { "epoch": 0.33, "learning_rate": 1.5725651079121432e-05, "loss": 0.7124, "step": 3002 }, { "epoch": 0.33, "learning_rate": 1.5722759967030898e-05, "loss": 0.7163, "step": 3003 }, { "epoch": 0.33, "learning_rate": 1.5719868143481385e-05, "loss": 0.7251, "step": 3004 }, { "epoch": 0.33, "learning_rate": 1.571697560883241e-05, "loss": 0.6497, "step": 3005 }, { "epoch": 0.33, "learning_rate": 1.5714082363443576e-05, "loss": 0.7539, "step": 3006 }, { "epoch": 0.33, "learning_rate": 1.5711188407674572e-05, "loss": 0.6805, "step": 3007 }, { "epoch": 0.33, "learning_rate": 1.570829374188518e-05, "loss": 0.7744, "step": 3008 }, { "epoch": 0.33, "learning_rate": 1.5705398366435264e-05, "loss": 0.646, "step": 3009 }, { "epoch": 0.33, "learning_rate": 1.570250228168478e-05, "loss": 0.7227, "step": 3010 }, { "epoch": 0.33, "learning_rate": 1.5699605487993782e-05, "loss": 0.6428, "step": 3011 }, { "epoch": 0.33, "learning_rate": 1.569670798572239e-05, "loss": 0.7979, "step": 3012 }, { "epoch": 0.33, "learning_rate": 1.569380977523083e-05, "loss": 0.8423, "step": 3013 }, { "epoch": 0.33, "learning_rate": 1.5690910856879407e-05, "loss": 0.7236, "step": 3014 }, { "epoch": 0.33, "learning_rate": 1.568801123102852e-05, "loss": 0.8223, "step": 3015 }, { "epoch": 0.33, "learning_rate": 1.5685110898038653e-05, "loss": 0.8242, "step": 3016 }, { "epoch": 0.33, "learning_rate": 1.5682209858270376e-05, "loss": 0.7124, "step": 3017 }, { "epoch": 0.33, "learning_rate": 1.5679308112084352e-05, "loss": 0.7202, "step": 3018 }, { "epoch": 0.33, "learning_rate": 1.567640565984133e-05, "loss": 0.6089, "step": 3019 }, { "epoch": 0.33, "learning_rate": 1.567350250190214e-05, "loss": 0.7524, "step": 3020 }, { "epoch": 0.33, "learning_rate": 1.5670598638627707e-05, "loss": 0.7593, "step": 3021 }, { "epoch": 0.33, "learning_rate": 1.566769407037905e-05, "loss": 0.7327, "step": 3022 }, { "epoch": 0.33, "learning_rate": 1.5664788797517254e-05, "loss": 0.7458, "step": 3023 }, { "epoch": 0.33, "learning_rate": 1.5661882820403516e-05, "loss": 0.9209, "step": 3024 }, { "epoch": 0.33, "learning_rate": 1.5658976139399107e-05, "loss": 0.7349, "step": 3025 }, { "epoch": 0.33, "learning_rate": 1.5656068754865388e-05, "loss": 0.7156, "step": 3026 }, { "epoch": 0.33, "learning_rate": 1.565316066716381e-05, "loss": 0.6792, "step": 3027 }, { "epoch": 0.33, "learning_rate": 1.56502518766559e-05, "loss": 0.7861, "step": 3028 }, { "epoch": 0.33, "learning_rate": 1.564734238370329e-05, "loss": 0.7285, "step": 3029 }, { "epoch": 0.33, "learning_rate": 1.5644432188667695e-05, "loss": 0.7429, "step": 3030 }, { "epoch": 0.33, "learning_rate": 1.5641521291910905e-05, "loss": 0.7495, "step": 3031 }, { "epoch": 0.33, "learning_rate": 1.5638609693794805e-05, "loss": 0.7749, "step": 3032 }, { "epoch": 0.33, "learning_rate": 1.5635697394681373e-05, "loss": 0.7368, "step": 3033 }, { "epoch": 0.33, "learning_rate": 1.5632784394932666e-05, "loss": 0.7625, "step": 3034 }, { "epoch": 0.33, "learning_rate": 1.5629870694910833e-05, "loss": 0.7761, "step": 3035 }, { "epoch": 0.33, "learning_rate": 1.5626956294978103e-05, "loss": 0.7778, "step": 3036 }, { "epoch": 0.33, "learning_rate": 1.56240411954968e-05, "loss": 0.7822, "step": 3037 }, { "epoch": 0.33, "learning_rate": 1.562112539682934e-05, "loss": 0.752, "step": 3038 }, { "epoch": 0.33, "learning_rate": 1.56182088993382e-05, "loss": 0.7412, "step": 3039 }, { "epoch": 0.33, "learning_rate": 1.561529170338598e-05, "loss": 0.8213, "step": 3040 }, { "epoch": 0.33, "learning_rate": 1.561237380933534e-05, "loss": 0.7307, "step": 3041 }, { "epoch": 0.33, "learning_rate": 1.5609455217549032e-05, "loss": 0.7527, "step": 3042 }, { "epoch": 0.33, "learning_rate": 1.5606535928389902e-05, "loss": 0.7263, "step": 3043 }, { "epoch": 0.33, "learning_rate": 1.560361594222088e-05, "loss": 0.6855, "step": 3044 }, { "epoch": 0.33, "learning_rate": 1.5600695259404983e-05, "loss": 0.7302, "step": 3045 }, { "epoch": 0.33, "learning_rate": 1.5597773880305307e-05, "loss": 0.7847, "step": 3046 }, { "epoch": 0.33, "learning_rate": 1.5594851805285043e-05, "loss": 0.8154, "step": 3047 }, { "epoch": 0.33, "learning_rate": 1.5591929034707468e-05, "loss": 0.7415, "step": 3048 }, { "epoch": 0.33, "learning_rate": 1.5589005568935947e-05, "loss": 0.7122, "step": 3049 }, { "epoch": 0.33, "learning_rate": 1.558608140833392e-05, "loss": 0.7468, "step": 3050 }, { "epoch": 0.33, "learning_rate": 1.5583156553264923e-05, "loss": 0.7595, "step": 3051 }, { "epoch": 0.33, "learning_rate": 1.5580231004092584e-05, "loss": 0.7466, "step": 3052 }, { "epoch": 0.33, "learning_rate": 1.5577304761180607e-05, "loss": 0.7319, "step": 3053 }, { "epoch": 0.33, "learning_rate": 1.5574377824892778e-05, "loss": 0.7405, "step": 3054 }, { "epoch": 0.33, "learning_rate": 1.557145019559298e-05, "loss": 0.7761, "step": 3055 }, { "epoch": 0.33, "learning_rate": 1.5568521873645183e-05, "loss": 0.7373, "step": 3056 }, { "epoch": 0.33, "learning_rate": 1.5565592859413442e-05, "loss": 0.7598, "step": 3057 }, { "epoch": 0.33, "learning_rate": 1.5562663153261882e-05, "loss": 0.6592, "step": 3058 }, { "epoch": 0.33, "learning_rate": 1.5559732755554734e-05, "loss": 0.7944, "step": 3059 }, { "epoch": 0.33, "learning_rate": 1.5556801666656315e-05, "loss": 0.6919, "step": 3060 }, { "epoch": 0.33, "learning_rate": 1.5553869886931007e-05, "loss": 0.6484, "step": 3061 }, { "epoch": 0.33, "learning_rate": 1.55509374167433e-05, "loss": 0.7329, "step": 3062 }, { "epoch": 0.33, "learning_rate": 1.554800425645776e-05, "loss": 0.7092, "step": 3063 }, { "epoch": 0.33, "learning_rate": 1.5545070406439042e-05, "loss": 0.658, "step": 3064 }, { "epoch": 0.33, "learning_rate": 1.554213586705188e-05, "loss": 0.7939, "step": 3065 }, { "epoch": 0.33, "learning_rate": 1.5539200638661106e-05, "loss": 0.7393, "step": 3066 }, { "epoch": 0.33, "learning_rate": 1.553626472163162e-05, "loss": 0.7446, "step": 3067 }, { "epoch": 0.33, "learning_rate": 1.553332811632843e-05, "loss": 0.7695, "step": 3068 }, { "epoch": 0.33, "learning_rate": 1.5530390823116612e-05, "loss": 0.7734, "step": 3069 }, { "epoch": 0.33, "learning_rate": 1.552745284236133e-05, "loss": 0.7402, "step": 3070 }, { "epoch": 0.33, "learning_rate": 1.552451417442784e-05, "loss": 0.6445, "step": 3071 }, { "epoch": 0.33, "learning_rate": 1.552157481968148e-05, "loss": 0.8477, "step": 3072 }, { "epoch": 0.33, "learning_rate": 1.551863477848767e-05, "loss": 0.7346, "step": 3073 }, { "epoch": 0.33, "learning_rate": 1.5515694051211925e-05, "loss": 0.6714, "step": 3074 }, { "epoch": 0.33, "learning_rate": 1.5512752638219834e-05, "loss": 0.6426, "step": 3075 }, { "epoch": 0.33, "learning_rate": 1.550981053987708e-05, "loss": 0.761, "step": 3076 }, { "epoch": 0.33, "learning_rate": 1.5506867756549424e-05, "loss": 0.6804, "step": 3077 }, { "epoch": 0.34, "learning_rate": 1.5503924288602717e-05, "loss": 0.7966, "step": 3078 }, { "epoch": 0.34, "learning_rate": 1.550098013640289e-05, "loss": 0.6787, "step": 3079 }, { "epoch": 0.34, "learning_rate": 1.549803530031597e-05, "loss": 0.7158, "step": 3080 }, { "epoch": 0.34, "learning_rate": 1.5495089780708062e-05, "loss": 0.6653, "step": 3081 }, { "epoch": 0.34, "learning_rate": 1.549214357794535e-05, "loss": 0.7734, "step": 3082 }, { "epoch": 0.34, "learning_rate": 1.548919669239411e-05, "loss": 0.7432, "step": 3083 }, { "epoch": 0.34, "learning_rate": 1.5486249124420702e-05, "loss": 0.812, "step": 3084 }, { "epoch": 0.34, "learning_rate": 1.548330087439157e-05, "loss": 0.7493, "step": 3085 }, { "epoch": 0.34, "learning_rate": 1.5480351942673248e-05, "loss": 0.7539, "step": 3086 }, { "epoch": 0.34, "learning_rate": 1.5477402329632342e-05, "loss": 0.7998, "step": 3087 }, { "epoch": 0.34, "learning_rate": 1.5474452035635558e-05, "loss": 0.7424, "step": 3088 }, { "epoch": 0.34, "learning_rate": 1.5471501061049675e-05, "loss": 0.7263, "step": 3089 }, { "epoch": 0.34, "learning_rate": 1.546854940624156e-05, "loss": 0.7087, "step": 3090 }, { "epoch": 0.34, "learning_rate": 1.5465597071578172e-05, "loss": 0.6431, "step": 3091 }, { "epoch": 0.34, "learning_rate": 1.546264405742654e-05, "loss": 0.8062, "step": 3092 }, { "epoch": 0.34, "learning_rate": 1.5459690364153792e-05, "loss": 0.8159, "step": 3093 }, { "epoch": 0.34, "learning_rate": 1.5456735992127133e-05, "loss": 0.8687, "step": 3094 }, { "epoch": 0.34, "learning_rate": 1.545378094171385e-05, "loss": 0.8438, "step": 3095 }, { "epoch": 0.34, "learning_rate": 1.5450825213281317e-05, "loss": 0.7368, "step": 3096 }, { "epoch": 0.34, "learning_rate": 1.5447868807197e-05, "loss": 0.6887, "step": 3097 }, { "epoch": 0.34, "learning_rate": 1.5444911723828436e-05, "loss": 0.8228, "step": 3098 }, { "epoch": 0.34, "learning_rate": 1.544195396354325e-05, "loss": 0.7444, "step": 3099 }, { "epoch": 0.34, "learning_rate": 1.543899552670916e-05, "loss": 0.6401, "step": 3100 }, { "epoch": 0.34, "learning_rate": 1.5436036413693962e-05, "loss": 0.8167, "step": 3101 }, { "epoch": 0.34, "learning_rate": 1.5433076624865533e-05, "loss": 0.6506, "step": 3102 }, { "epoch": 0.34, "learning_rate": 1.5430116160591836e-05, "loss": 0.7429, "step": 3103 }, { "epoch": 0.34, "learning_rate": 1.5427155021240917e-05, "loss": 0.792, "step": 3104 }, { "epoch": 0.34, "learning_rate": 1.542419320718091e-05, "loss": 0.6426, "step": 3105 }, { "epoch": 0.34, "learning_rate": 1.5421230718780036e-05, "loss": 0.655, "step": 3106 }, { "epoch": 0.34, "learning_rate": 1.5418267556406586e-05, "loss": 0.6221, "step": 3107 }, { "epoch": 0.34, "learning_rate": 1.5415303720428948e-05, "loss": 0.8247, "step": 3108 }, { "epoch": 0.34, "learning_rate": 1.5412339211215585e-05, "loss": 0.6792, "step": 3109 }, { "epoch": 0.34, "learning_rate": 1.5409374029135047e-05, "loss": 0.6675, "step": 3110 }, { "epoch": 0.34, "learning_rate": 1.5406408174555978e-05, "loss": 0.7251, "step": 3111 }, { "epoch": 0.34, "learning_rate": 1.5403441647847083e-05, "loss": 0.8257, "step": 3112 }, { "epoch": 0.34, "learning_rate": 1.5400474449377174e-05, "loss": 0.6724, "step": 3113 }, { "epoch": 0.34, "learning_rate": 1.539750657951513e-05, "loss": 0.677, "step": 3114 }, { "epoch": 0.34, "learning_rate": 1.5394538038629924e-05, "loss": 0.6924, "step": 3115 }, { "epoch": 0.34, "learning_rate": 1.53915688270906e-05, "loss": 0.7974, "step": 3116 }, { "epoch": 0.34, "learning_rate": 1.5388598945266297e-05, "loss": 0.678, "step": 3117 }, { "epoch": 0.34, "learning_rate": 1.5385628393526236e-05, "loss": 0.7744, "step": 3118 }, { "epoch": 0.34, "learning_rate": 1.5382657172239718e-05, "loss": 0.7246, "step": 3119 }, { "epoch": 0.34, "learning_rate": 1.5379685281776125e-05, "loss": 0.749, "step": 3120 }, { "epoch": 0.34, "learning_rate": 1.5376712722504932e-05, "loss": 0.7354, "step": 3121 }, { "epoch": 0.34, "learning_rate": 1.5373739494795687e-05, "loss": 0.7117, "step": 3122 }, { "epoch": 0.34, "learning_rate": 1.5370765599018014e-05, "loss": 0.7764, "step": 3123 }, { "epoch": 0.34, "learning_rate": 1.5367791035541646e-05, "loss": 0.7856, "step": 3124 }, { "epoch": 0.34, "learning_rate": 1.536481580473638e-05, "loss": 0.7402, "step": 3125 }, { "epoch": 0.34, "learning_rate": 1.5361839906972095e-05, "loss": 0.6355, "step": 3126 }, { "epoch": 0.34, "learning_rate": 1.5358863342618757e-05, "loss": 0.8481, "step": 3127 }, { "epoch": 0.34, "learning_rate": 1.535588611204642e-05, "loss": 0.7839, "step": 3128 }, { "epoch": 0.34, "learning_rate": 1.5352908215625215e-05, "loss": 0.8423, "step": 3129 }, { "epoch": 0.34, "learning_rate": 1.5349929653725358e-05, "loss": 0.7542, "step": 3130 }, { "epoch": 0.34, "learning_rate": 1.534695042671714e-05, "loss": 0.6611, "step": 3131 }, { "epoch": 0.34, "learning_rate": 1.5343970534970948e-05, "loss": 0.7554, "step": 3132 }, { "epoch": 0.34, "learning_rate": 1.534098997885724e-05, "loss": 0.686, "step": 3133 }, { "epoch": 0.34, "learning_rate": 1.5338008758746567e-05, "loss": 0.8184, "step": 3134 }, { "epoch": 0.34, "learning_rate": 1.5335026875009557e-05, "loss": 0.709, "step": 3135 }, { "epoch": 0.34, "learning_rate": 1.5332044328016916e-05, "loss": 0.6665, "step": 3136 }, { "epoch": 0.34, "learning_rate": 1.5329061118139438e-05, "loss": 0.8325, "step": 3137 }, { "epoch": 0.34, "learning_rate": 1.5326077245747998e-05, "loss": 0.8232, "step": 3138 }, { "epoch": 0.34, "learning_rate": 1.532309271121356e-05, "loss": 0.7637, "step": 3139 }, { "epoch": 0.34, "learning_rate": 1.532010751490716e-05, "loss": 0.7671, "step": 3140 }, { "epoch": 0.34, "learning_rate": 1.531712165719992e-05, "loss": 0.665, "step": 3141 }, { "epoch": 0.34, "learning_rate": 1.531413513846304e-05, "loss": 0.6821, "step": 3142 }, { "epoch": 0.34, "learning_rate": 1.531114795906782e-05, "loss": 0.7051, "step": 3143 }, { "epoch": 0.34, "learning_rate": 1.5308160119385615e-05, "loss": 0.7463, "step": 3144 }, { "epoch": 0.34, "learning_rate": 1.5305171619787883e-05, "loss": 0.6851, "step": 3145 }, { "epoch": 0.34, "learning_rate": 1.5302182460646158e-05, "loss": 0.7986, "step": 3146 }, { "epoch": 0.34, "learning_rate": 1.529919264233205e-05, "loss": 0.6716, "step": 3147 }, { "epoch": 0.34, "learning_rate": 1.5296202165217263e-05, "loss": 0.7539, "step": 3148 }, { "epoch": 0.34, "learning_rate": 1.5293211029673568e-05, "loss": 0.8076, "step": 3149 }, { "epoch": 0.34, "learning_rate": 1.5290219236072833e-05, "loss": 0.6304, "step": 3150 }, { "epoch": 0.34, "learning_rate": 1.5287226784786996e-05, "loss": 0.6885, "step": 3151 }, { "epoch": 0.34, "learning_rate": 1.5284233676188084e-05, "loss": 0.728, "step": 3152 }, { "epoch": 0.34, "learning_rate": 1.5281239910648203e-05, "loss": 0.7744, "step": 3153 }, { "epoch": 0.34, "learning_rate": 1.527824548853954e-05, "loss": 0.7874, "step": 3154 }, { "epoch": 0.34, "learning_rate": 1.5275250410234366e-05, "loss": 0.6562, "step": 3155 }, { "epoch": 0.34, "learning_rate": 1.5272254676105026e-05, "loss": 0.8022, "step": 3156 }, { "epoch": 0.34, "learning_rate": 1.5269258286523956e-05, "loss": 0.7468, "step": 3157 }, { "epoch": 0.34, "learning_rate": 1.5266261241863675e-05, "loss": 0.7502, "step": 3158 }, { "epoch": 0.34, "learning_rate": 1.5263263542496775e-05, "loss": 0.7119, "step": 3159 }, { "epoch": 0.34, "learning_rate": 1.526026518879593e-05, "loss": 0.8301, "step": 3160 }, { "epoch": 0.34, "learning_rate": 1.5257266181133899e-05, "loss": 0.7542, "step": 3161 }, { "epoch": 0.34, "learning_rate": 1.5254266519883525e-05, "loss": 0.679, "step": 3162 }, { "epoch": 0.34, "learning_rate": 1.5251266205417727e-05, "loss": 0.6633, "step": 3163 }, { "epoch": 0.34, "learning_rate": 1.5248265238109508e-05, "loss": 0.7627, "step": 3164 }, { "epoch": 0.34, "learning_rate": 1.5245263618331944e-05, "loss": 0.7444, "step": 3165 }, { "epoch": 0.34, "learning_rate": 1.524226134645821e-05, "loss": 0.6865, "step": 3166 }, { "epoch": 0.34, "learning_rate": 1.5239258422861544e-05, "loss": 0.7166, "step": 3167 }, { "epoch": 0.34, "learning_rate": 1.5236254847915275e-05, "loss": 0.7336, "step": 3168 }, { "epoch": 0.34, "learning_rate": 1.523325062199281e-05, "loss": 0.7729, "step": 3169 }, { "epoch": 0.35, "learning_rate": 1.5230245745467637e-05, "loss": 0.6895, "step": 3170 }, { "epoch": 0.35, "learning_rate": 1.5227240218713326e-05, "loss": 0.6995, "step": 3171 }, { "epoch": 0.35, "learning_rate": 1.5224234042103528e-05, "loss": 0.7654, "step": 3172 }, { "epoch": 0.35, "learning_rate": 1.5221227216011967e-05, "loss": 0.7378, "step": 3173 }, { "epoch": 0.35, "learning_rate": 1.521821974081246e-05, "loss": 0.6671, "step": 3174 }, { "epoch": 0.35, "learning_rate": 1.5215211616878903e-05, "loss": 0.7161, "step": 3175 }, { "epoch": 0.35, "learning_rate": 1.5212202844585258e-05, "loss": 0.7637, "step": 3176 }, { "epoch": 0.35, "learning_rate": 1.520919342430559e-05, "loss": 0.7173, "step": 3177 }, { "epoch": 0.35, "learning_rate": 1.5206183356414026e-05, "loss": 0.6558, "step": 3178 }, { "epoch": 0.35, "learning_rate": 1.5203172641284787e-05, "loss": 0.7988, "step": 3179 }, { "epoch": 0.35, "learning_rate": 1.5200161279292154e-05, "loss": 0.7095, "step": 3180 }, { "epoch": 0.35, "learning_rate": 1.5197149270810519e-05, "loss": 0.6338, "step": 3181 }, { "epoch": 0.35, "learning_rate": 1.519413661621433e-05, "loss": 0.8584, "step": 3182 }, { "epoch": 0.35, "learning_rate": 1.5191123315878123e-05, "loss": 0.6538, "step": 3183 }, { "epoch": 0.35, "learning_rate": 1.5188109370176511e-05, "loss": 0.6716, "step": 3184 }, { "epoch": 0.35, "learning_rate": 1.5185094779484196e-05, "loss": 0.6919, "step": 3185 }, { "epoch": 0.35, "learning_rate": 1.5182079544175957e-05, "loss": 0.7886, "step": 3186 }, { "epoch": 0.35, "learning_rate": 1.5179063664626646e-05, "loss": 0.7937, "step": 3187 }, { "epoch": 0.35, "learning_rate": 1.5176047141211199e-05, "loss": 0.7249, "step": 3188 }, { "epoch": 0.35, "learning_rate": 1.5173029974304636e-05, "loss": 0.6782, "step": 3189 }, { "epoch": 0.35, "learning_rate": 1.5170012164282055e-05, "loss": 0.8564, "step": 3190 }, { "epoch": 0.35, "learning_rate": 1.5166993711518631e-05, "loss": 0.7739, "step": 3191 }, { "epoch": 0.35, "learning_rate": 1.5163974616389621e-05, "loss": 0.6487, "step": 3192 }, { "epoch": 0.35, "learning_rate": 1.5160954879270362e-05, "loss": 0.7886, "step": 3193 }, { "epoch": 0.35, "learning_rate": 1.5157934500536274e-05, "loss": 0.7668, "step": 3194 }, { "epoch": 0.35, "learning_rate": 1.5154913480562845e-05, "loss": 0.7117, "step": 3195 }, { "epoch": 0.35, "learning_rate": 1.5151891819725657e-05, "loss": 0.6458, "step": 3196 }, { "epoch": 0.35, "learning_rate": 1.514886951840037e-05, "loss": 0.604, "step": 3197 }, { "epoch": 0.35, "learning_rate": 1.514584657696271e-05, "loss": 0.6504, "step": 3198 }, { "epoch": 0.35, "learning_rate": 1.5142822995788493e-05, "loss": 0.7891, "step": 3199 }, { "epoch": 0.35, "learning_rate": 1.5139798775253622e-05, "loss": 0.752, "step": 3200 }, { "epoch": 0.35, "learning_rate": 1.5136773915734067e-05, "loss": 0.6887, "step": 3201 }, { "epoch": 0.35, "learning_rate": 1.5133748417605878e-05, "loss": 0.7205, "step": 3202 }, { "epoch": 0.35, "learning_rate": 1.5130722281245187e-05, "loss": 0.6362, "step": 3203 }, { "epoch": 0.35, "learning_rate": 1.5127695507028212e-05, "loss": 0.7268, "step": 3204 }, { "epoch": 0.35, "learning_rate": 1.5124668095331243e-05, "loss": 0.7676, "step": 3205 }, { "epoch": 0.35, "learning_rate": 1.5121640046530651e-05, "loss": 0.6924, "step": 3206 }, { "epoch": 0.35, "learning_rate": 1.5118611361002877e-05, "loss": 0.7817, "step": 3207 }, { "epoch": 0.35, "learning_rate": 1.5115582039124464e-05, "loss": 0.8457, "step": 3208 }, { "epoch": 0.35, "learning_rate": 1.5112552081272009e-05, "loss": 0.8062, "step": 3209 }, { "epoch": 0.35, "learning_rate": 1.5109521487822208e-05, "loss": 0.7891, "step": 3210 }, { "epoch": 0.35, "learning_rate": 1.510649025915182e-05, "loss": 0.7578, "step": 3211 }, { "epoch": 0.35, "learning_rate": 1.5103458395637694e-05, "loss": 0.8164, "step": 3212 }, { "epoch": 0.35, "learning_rate": 1.5100425897656754e-05, "loss": 0.6694, "step": 3213 }, { "epoch": 0.35, "learning_rate": 1.5097392765586003e-05, "loss": 0.8071, "step": 3214 }, { "epoch": 0.35, "learning_rate": 1.5094358999802521e-05, "loss": 0.813, "step": 3215 }, { "epoch": 0.35, "learning_rate": 1.5091324600683472e-05, "loss": 0.833, "step": 3216 }, { "epoch": 0.35, "learning_rate": 1.5088289568606091e-05, "loss": 0.854, "step": 3217 }, { "epoch": 0.35, "learning_rate": 1.5085253903947699e-05, "loss": 0.7493, "step": 3218 }, { "epoch": 0.35, "learning_rate": 1.5082217607085692e-05, "loss": 0.749, "step": 3219 }, { "epoch": 0.35, "learning_rate": 1.5079180678397547e-05, "loss": 0.6624, "step": 3220 }, { "epoch": 0.35, "learning_rate": 1.5076143118260818e-05, "loss": 0.7358, "step": 3221 }, { "epoch": 0.35, "learning_rate": 1.507310492705313e-05, "loss": 0.6228, "step": 3222 }, { "epoch": 0.35, "learning_rate": 1.5070066105152203e-05, "loss": 0.7573, "step": 3223 }, { "epoch": 0.35, "learning_rate": 1.5067026652935823e-05, "loss": 0.8584, "step": 3224 }, { "epoch": 0.35, "learning_rate": 1.5063986570781859e-05, "loss": 0.7092, "step": 3225 }, { "epoch": 0.35, "learning_rate": 1.5060945859068252e-05, "loss": 0.752, "step": 3226 }, { "epoch": 0.35, "learning_rate": 1.5057904518173034e-05, "loss": 0.7563, "step": 3227 }, { "epoch": 0.35, "learning_rate": 1.5054862548474298e-05, "loss": 0.6353, "step": 3228 }, { "epoch": 0.35, "learning_rate": 1.5051819950350232e-05, "loss": 0.7261, "step": 3229 }, { "epoch": 0.35, "learning_rate": 1.504877672417909e-05, "loss": 0.7451, "step": 3230 }, { "epoch": 0.35, "learning_rate": 1.5045732870339213e-05, "loss": 0.832, "step": 3231 }, { "epoch": 0.35, "learning_rate": 1.5042688389209017e-05, "loss": 0.7256, "step": 3232 }, { "epoch": 0.35, "learning_rate": 1.5039643281166986e-05, "loss": 0.7329, "step": 3233 }, { "epoch": 0.35, "learning_rate": 1.5036597546591699e-05, "loss": 0.7085, "step": 3234 }, { "epoch": 0.35, "learning_rate": 1.50335511858618e-05, "loss": 0.72, "step": 3235 }, { "epoch": 0.35, "learning_rate": 1.5030504199356022e-05, "loss": 0.7124, "step": 3236 }, { "epoch": 0.35, "learning_rate": 1.5027456587453159e-05, "loss": 0.678, "step": 3237 }, { "epoch": 0.35, "learning_rate": 1.5024408350532103e-05, "loss": 0.8135, "step": 3238 }, { "epoch": 0.35, "learning_rate": 1.5021359488971808e-05, "loss": 0.7563, "step": 3239 }, { "epoch": 0.35, "learning_rate": 1.5018310003151312e-05, "loss": 0.6821, "step": 3240 }, { "epoch": 0.35, "learning_rate": 1.5015259893449732e-05, "loss": 0.6799, "step": 3241 }, { "epoch": 0.35, "learning_rate": 1.501220916024626e-05, "loss": 0.6694, "step": 3242 }, { "epoch": 0.35, "learning_rate": 1.5009157803920162e-05, "loss": 0.6941, "step": 3243 }, { "epoch": 0.35, "learning_rate": 1.5006105824850791e-05, "loss": 0.9097, "step": 3244 }, { "epoch": 0.35, "learning_rate": 1.500305322341757e-05, "loss": 0.8506, "step": 3245 }, { "epoch": 0.35, "learning_rate": 1.5000000000000002e-05, "loss": 0.6685, "step": 3246 }, { "epoch": 0.35, "learning_rate": 1.4996946154977666e-05, "loss": 0.7935, "step": 3247 }, { "epoch": 0.35, "learning_rate": 1.4993891688730217e-05, "loss": 0.7063, "step": 3248 }, { "epoch": 0.35, "learning_rate": 1.4990836601637391e-05, "loss": 0.7527, "step": 3249 }, { "epoch": 0.35, "learning_rate": 1.4987780894079e-05, "loss": 0.7368, "step": 3250 }, { "epoch": 0.35, "learning_rate": 1.4984724566434935e-05, "loss": 0.7715, "step": 3251 }, { "epoch": 0.35, "learning_rate": 1.4981667619085152e-05, "loss": 0.8506, "step": 3252 }, { "epoch": 0.35, "learning_rate": 1.4978610052409703e-05, "loss": 0.6631, "step": 3253 }, { "epoch": 0.35, "learning_rate": 1.4975551866788705e-05, "loss": 0.696, "step": 3254 }, { "epoch": 0.35, "learning_rate": 1.4972493062602355e-05, "loss": 0.7769, "step": 3255 }, { "epoch": 0.35, "learning_rate": 1.4969433640230922e-05, "loss": 0.6919, "step": 3256 }, { "epoch": 0.35, "learning_rate": 1.4966373600054763e-05, "loss": 0.6555, "step": 3257 }, { "epoch": 0.35, "learning_rate": 1.49633129424543e-05, "loss": 0.8843, "step": 3258 }, { "epoch": 0.35, "learning_rate": 1.4960251667810041e-05, "loss": 0.78, "step": 3259 }, { "epoch": 0.35, "learning_rate": 1.4957189776502563e-05, "loss": 0.812, "step": 3260 }, { "epoch": 0.35, "learning_rate": 1.4954127268912525e-05, "loss": 0.6826, "step": 3261 }, { "epoch": 0.36, "learning_rate": 1.495106414542066e-05, "loss": 0.7168, "step": 3262 }, { "epoch": 0.36, "learning_rate": 1.4948000406407782e-05, "loss": 0.7188, "step": 3263 }, { "epoch": 0.36, "learning_rate": 1.494493605225477e-05, "loss": 0.7305, "step": 3264 }, { "epoch": 0.36, "learning_rate": 1.4941871083342596e-05, "loss": 0.8408, "step": 3265 }, { "epoch": 0.36, "learning_rate": 1.4938805500052294e-05, "loss": 0.7881, "step": 3266 }, { "epoch": 0.36, "learning_rate": 1.4935739302764981e-05, "loss": 0.8853, "step": 3267 }, { "epoch": 0.36, "learning_rate": 1.4932672491861855e-05, "loss": 0.8662, "step": 3268 }, { "epoch": 0.36, "learning_rate": 1.492960506772418e-05, "loss": 0.8086, "step": 3269 }, { "epoch": 0.36, "learning_rate": 1.4926537030733301e-05, "loss": 0.8691, "step": 3270 }, { "epoch": 0.36, "learning_rate": 1.492346838127064e-05, "loss": 0.7817, "step": 3271 }, { "epoch": 0.36, "learning_rate": 1.4920399119717695e-05, "loss": 0.8228, "step": 3272 }, { "epoch": 0.36, "learning_rate": 1.491732924645604e-05, "loss": 0.8022, "step": 3273 }, { "epoch": 0.36, "learning_rate": 1.4914258761867324e-05, "loss": 0.7087, "step": 3274 }, { "epoch": 0.36, "learning_rate": 1.4911187666333269e-05, "loss": 0.7676, "step": 3275 }, { "epoch": 0.36, "learning_rate": 1.4908115960235683e-05, "loss": 0.6851, "step": 3276 }, { "epoch": 0.36, "learning_rate": 1.490504364395644e-05, "loss": 0.7395, "step": 3277 }, { "epoch": 0.36, "learning_rate": 1.4901970717877494e-05, "loss": 0.7986, "step": 3278 }, { "epoch": 0.36, "learning_rate": 1.4898897182380872e-05, "loss": 0.6038, "step": 3279 }, { "epoch": 0.36, "learning_rate": 1.4895823037848683e-05, "loss": 0.825, "step": 3280 }, { "epoch": 0.36, "learning_rate": 1.4892748284663101e-05, "loss": 0.6514, "step": 3281 }, { "epoch": 0.36, "learning_rate": 1.488967292320639e-05, "loss": 0.7681, "step": 3282 }, { "epoch": 0.36, "learning_rate": 1.4886596953860876e-05, "loss": 0.751, "step": 3283 }, { "epoch": 0.36, "learning_rate": 1.4883520377008971e-05, "loss": 0.7571, "step": 3284 }, { "epoch": 0.36, "learning_rate": 1.4880443193033156e-05, "loss": 0.7158, "step": 3285 }, { "epoch": 0.36, "learning_rate": 1.4877365402315986e-05, "loss": 0.6499, "step": 3286 }, { "epoch": 0.36, "learning_rate": 1.4874287005240098e-05, "loss": 0.7505, "step": 3287 }, { "epoch": 0.36, "learning_rate": 1.4871208002188204e-05, "loss": 0.6953, "step": 3288 }, { "epoch": 0.36, "learning_rate": 1.4868128393543087e-05, "loss": 0.7012, "step": 3289 }, { "epoch": 0.36, "learning_rate": 1.48650481796876e-05, "loss": 0.7974, "step": 3290 }, { "epoch": 0.36, "learning_rate": 1.4861967361004687e-05, "loss": 0.811, "step": 3291 }, { "epoch": 0.36, "learning_rate": 1.4858885937877356e-05, "loss": 0.7593, "step": 3292 }, { "epoch": 0.36, "learning_rate": 1.4855803910688694e-05, "loss": 0.6211, "step": 3293 }, { "epoch": 0.36, "learning_rate": 1.4852721279821854e-05, "loss": 0.8643, "step": 3294 }, { "epoch": 0.36, "learning_rate": 1.4849638045660078e-05, "loss": 0.7988, "step": 3295 }, { "epoch": 0.36, "learning_rate": 1.4846554208586676e-05, "loss": 0.6904, "step": 3296 }, { "epoch": 0.36, "learning_rate": 1.4843469768985036e-05, "loss": 0.6104, "step": 3297 }, { "epoch": 0.36, "learning_rate": 1.484038472723861e-05, "loss": 0.6458, "step": 3298 }, { "epoch": 0.36, "learning_rate": 1.4837299083730945e-05, "loss": 0.7627, "step": 3299 }, { "epoch": 0.36, "learning_rate": 1.4834212838845639e-05, "loss": 0.7319, "step": 3300 }, { "epoch": 0.36, "learning_rate": 1.4831125992966386e-05, "loss": 0.666, "step": 3301 }, { "epoch": 0.36, "learning_rate": 1.4828038546476941e-05, "loss": 0.7639, "step": 3302 }, { "epoch": 0.36, "learning_rate": 1.4824950499761141e-05, "loss": 0.7227, "step": 3303 }, { "epoch": 0.36, "learning_rate": 1.4821861853202894e-05, "loss": 0.7886, "step": 3304 }, { "epoch": 0.36, "learning_rate": 1.4818772607186183e-05, "loss": 0.8208, "step": 3305 }, { "epoch": 0.36, "learning_rate": 1.4815682762095065e-05, "loss": 0.7075, "step": 3306 }, { "epoch": 0.36, "learning_rate": 1.4812592318313675e-05, "loss": 0.7427, "step": 3307 }, { "epoch": 0.36, "learning_rate": 1.480950127622622e-05, "loss": 0.678, "step": 3308 }, { "epoch": 0.36, "learning_rate": 1.4806409636216974e-05, "loss": 0.7617, "step": 3309 }, { "epoch": 0.36, "learning_rate": 1.4803317398670301e-05, "loss": 0.7852, "step": 3310 }, { "epoch": 0.36, "learning_rate": 1.4800224563970632e-05, "loss": 0.7842, "step": 3311 }, { "epoch": 0.36, "learning_rate": 1.4797131132502464e-05, "loss": 0.7051, "step": 3312 }, { "epoch": 0.36, "learning_rate": 1.479403710465038e-05, "loss": 0.7407, "step": 3313 }, { "epoch": 0.36, "learning_rate": 1.479094248079903e-05, "loss": 0.8738, "step": 3314 }, { "epoch": 0.36, "learning_rate": 1.4787847261333143e-05, "loss": 0.7334, "step": 3315 }, { "epoch": 0.36, "learning_rate": 1.4784751446637522e-05, "loss": 0.7043, "step": 3316 }, { "epoch": 0.36, "learning_rate": 1.4781655037097034e-05, "loss": 0.771, "step": 3317 }, { "epoch": 0.36, "learning_rate": 1.4778558033096633e-05, "loss": 0.6921, "step": 3318 }, { "epoch": 0.36, "learning_rate": 1.4775460435021341e-05, "loss": 0.832, "step": 3319 }, { "epoch": 0.36, "learning_rate": 1.4772362243256253e-05, "loss": 0.7368, "step": 3320 }, { "epoch": 0.36, "learning_rate": 1.476926345818654e-05, "loss": 0.6497, "step": 3321 }, { "epoch": 0.36, "learning_rate": 1.4766164080197446e-05, "loss": 0.7837, "step": 3322 }, { "epoch": 0.36, "learning_rate": 1.476306410967429e-05, "loss": 0.7427, "step": 3323 }, { "epoch": 0.36, "learning_rate": 1.4759963547002459e-05, "loss": 0.8667, "step": 3324 }, { "epoch": 0.36, "learning_rate": 1.475686239256742e-05, "loss": 0.7666, "step": 3325 }, { "epoch": 0.36, "learning_rate": 1.4753760646754714e-05, "loss": 0.7183, "step": 3326 }, { "epoch": 0.36, "learning_rate": 1.4750658309949953e-05, "loss": 0.75, "step": 3327 }, { "epoch": 0.36, "learning_rate": 1.4747555382538816e-05, "loss": 0.79, "step": 3328 }, { "epoch": 0.36, "learning_rate": 1.4744451864907067e-05, "loss": 0.7053, "step": 3329 }, { "epoch": 0.36, "learning_rate": 1.474134775744054e-05, "loss": 0.749, "step": 3330 }, { "epoch": 0.36, "learning_rate": 1.4738243060525139e-05, "loss": 0.8286, "step": 3331 }, { "epoch": 0.36, "learning_rate": 1.473513777454684e-05, "loss": 0.8892, "step": 3332 }, { "epoch": 0.36, "learning_rate": 1.4732031899891696e-05, "loss": 0.6807, "step": 3333 }, { "epoch": 0.36, "learning_rate": 1.4728925436945838e-05, "loss": 0.73, "step": 3334 }, { "epoch": 0.36, "learning_rate": 1.4725818386095459e-05, "loss": 0.8418, "step": 3335 }, { "epoch": 0.36, "learning_rate": 1.472271074772683e-05, "loss": 0.6868, "step": 3336 }, { "epoch": 0.36, "learning_rate": 1.4719602522226298e-05, "loss": 0.7588, "step": 3337 }, { "epoch": 0.36, "learning_rate": 1.4716493709980277e-05, "loss": 0.7764, "step": 3338 }, { "epoch": 0.36, "learning_rate": 1.4713384311375263e-05, "loss": 0.7144, "step": 3339 }, { "epoch": 0.36, "learning_rate": 1.4710274326797816e-05, "loss": 0.738, "step": 3340 }, { "epoch": 0.36, "learning_rate": 1.4707163756634573e-05, "loss": 0.696, "step": 3341 }, { "epoch": 0.36, "learning_rate": 1.4704052601272242e-05, "loss": 0.771, "step": 3342 }, { "epoch": 0.36, "learning_rate": 1.4700940861097605e-05, "loss": 0.7764, "step": 3343 }, { "epoch": 0.36, "learning_rate": 1.4697828536497518e-05, "loss": 0.7107, "step": 3344 }, { "epoch": 0.36, "learning_rate": 1.469471562785891e-05, "loss": 0.7573, "step": 3345 }, { "epoch": 0.36, "learning_rate": 1.4691602135568776e-05, "loss": 0.8057, "step": 3346 }, { "epoch": 0.36, "learning_rate": 1.468848806001419e-05, "loss": 0.6934, "step": 3347 }, { "epoch": 0.36, "learning_rate": 1.4685373401582297e-05, "loss": 0.7354, "step": 3348 }, { "epoch": 0.36, "learning_rate": 1.4682258160660317e-05, "loss": 0.688, "step": 3349 }, { "epoch": 0.36, "learning_rate": 1.4679142337635535e-05, "loss": 0.7673, "step": 3350 }, { "epoch": 0.36, "learning_rate": 1.4676025932895315e-05, "loss": 0.7812, "step": 3351 }, { "epoch": 0.36, "learning_rate": 1.4672908946827091e-05, "loss": 0.7471, "step": 3352 }, { "epoch": 0.37, "learning_rate": 1.4669791379818374e-05, "loss": 0.7993, "step": 3353 }, { "epoch": 0.37, "learning_rate": 1.4666673232256738e-05, "loss": 0.7944, "step": 3354 }, { "epoch": 0.37, "learning_rate": 1.4663554504529836e-05, "loss": 0.8081, "step": 3355 }, { "epoch": 0.37, "learning_rate": 1.4660435197025391e-05, "loss": 0.6814, "step": 3356 }, { "epoch": 0.37, "learning_rate": 1.4657315310131195e-05, "loss": 0.6538, "step": 3357 }, { "epoch": 0.37, "learning_rate": 1.465419484423512e-05, "loss": 0.7363, "step": 3358 }, { "epoch": 0.37, "learning_rate": 1.4651073799725104e-05, "loss": 0.7292, "step": 3359 }, { "epoch": 0.37, "learning_rate": 1.464795217698916e-05, "loss": 0.8413, "step": 3360 }, { "epoch": 0.37, "learning_rate": 1.4644829976415367e-05, "loss": 0.7056, "step": 3361 }, { "epoch": 0.37, "learning_rate": 1.464170719839188e-05, "loss": 0.6816, "step": 3362 }, { "epoch": 0.37, "learning_rate": 1.4638583843306928e-05, "loss": 0.8286, "step": 3363 }, { "epoch": 0.37, "learning_rate": 1.4635459911548811e-05, "loss": 0.728, "step": 3364 }, { "epoch": 0.37, "learning_rate": 1.4632335403505897e-05, "loss": 0.7698, "step": 3365 }, { "epoch": 0.37, "learning_rate": 1.4629210319566626e-05, "loss": 0.7119, "step": 3366 }, { "epoch": 0.37, "learning_rate": 1.4626084660119515e-05, "loss": 0.6582, "step": 3367 }, { "epoch": 0.37, "learning_rate": 1.4622958425553148e-05, "loss": 0.7915, "step": 3368 }, { "epoch": 0.37, "learning_rate": 1.4619831616256181e-05, "loss": 0.6038, "step": 3369 }, { "epoch": 0.37, "learning_rate": 1.461670423261734e-05, "loss": 0.7229, "step": 3370 }, { "epoch": 0.37, "learning_rate": 1.461357627502543e-05, "loss": 0.8164, "step": 3371 }, { "epoch": 0.37, "learning_rate": 1.4610447743869313e-05, "loss": 0.7139, "step": 3372 }, { "epoch": 0.37, "learning_rate": 1.460731863953794e-05, "loss": 0.8525, "step": 3373 }, { "epoch": 0.37, "learning_rate": 1.4604188962420318e-05, "loss": 0.6636, "step": 3374 }, { "epoch": 0.37, "learning_rate": 1.4601058712905536e-05, "loss": 0.728, "step": 3375 }, { "epoch": 0.37, "learning_rate": 1.4597927891382742e-05, "loss": 0.79, "step": 3376 }, { "epoch": 0.37, "learning_rate": 1.4594796498241173e-05, "loss": 0.8018, "step": 3377 }, { "epoch": 0.37, "learning_rate": 1.4591664533870118e-05, "loss": 0.5845, "step": 3378 }, { "epoch": 0.37, "learning_rate": 1.458853199865895e-05, "loss": 0.6899, "step": 3379 }, { "epoch": 0.37, "learning_rate": 1.4585398892997111e-05, "loss": 0.8179, "step": 3380 }, { "epoch": 0.37, "learning_rate": 1.4582265217274105e-05, "loss": 0.7258, "step": 3381 }, { "epoch": 0.37, "learning_rate": 1.4579130971879518e-05, "loss": 0.7373, "step": 3382 }, { "epoch": 0.37, "learning_rate": 1.4575996157203004e-05, "loss": 0.6575, "step": 3383 }, { "epoch": 0.37, "learning_rate": 1.4572860773634286e-05, "loss": 0.7046, "step": 3384 }, { "epoch": 0.37, "learning_rate": 1.4569724821563149e-05, "loss": 0.741, "step": 3385 }, { "epoch": 0.37, "learning_rate": 1.456658830137947e-05, "loss": 0.7314, "step": 3386 }, { "epoch": 0.37, "learning_rate": 1.4563451213473177e-05, "loss": 0.6902, "step": 3387 }, { "epoch": 0.37, "learning_rate": 1.4560313558234276e-05, "loss": 0.8306, "step": 3388 }, { "epoch": 0.37, "learning_rate": 1.4557175336052844e-05, "loss": 0.6648, "step": 3389 }, { "epoch": 0.37, "learning_rate": 1.4554036547319033e-05, "loss": 0.8623, "step": 3390 }, { "epoch": 0.37, "learning_rate": 1.455089719242305e-05, "loss": 0.6685, "step": 3391 }, { "epoch": 0.37, "learning_rate": 1.4547757271755192e-05, "loss": 0.666, "step": 3392 }, { "epoch": 0.37, "learning_rate": 1.454461678570581e-05, "loss": 0.699, "step": 3393 }, { "epoch": 0.37, "learning_rate": 1.4541475734665337e-05, "loss": 0.772, "step": 3394 }, { "epoch": 0.37, "learning_rate": 1.453833411902427e-05, "loss": 0.7944, "step": 3395 }, { "epoch": 0.37, "learning_rate": 1.4535191939173179e-05, "loss": 0.7539, "step": 3396 }, { "epoch": 0.37, "learning_rate": 1.4532049195502697e-05, "loss": 0.6848, "step": 3397 }, { "epoch": 0.37, "learning_rate": 1.4528905888403542e-05, "loss": 0.748, "step": 3398 }, { "epoch": 0.37, "learning_rate": 1.4525762018266484e-05, "loss": 0.6379, "step": 3399 }, { "epoch": 0.37, "learning_rate": 1.4522617585482377e-05, "loss": 0.7012, "step": 3400 }, { "epoch": 0.37, "learning_rate": 1.4519472590442138e-05, "loss": 0.6951, "step": 3401 }, { "epoch": 0.37, "learning_rate": 1.4516327033536761e-05, "loss": 0.6814, "step": 3402 }, { "epoch": 0.37, "learning_rate": 1.4513180915157299e-05, "loss": 0.7524, "step": 3403 }, { "epoch": 0.37, "learning_rate": 1.451003423569488e-05, "loss": 0.6709, "step": 3404 }, { "epoch": 0.37, "learning_rate": 1.4506886995540701e-05, "loss": 0.5896, "step": 3405 }, { "epoch": 0.37, "learning_rate": 1.4503739195086038e-05, "loss": 0.813, "step": 3406 }, { "epoch": 0.37, "learning_rate": 1.4500590834722222e-05, "loss": 0.6987, "step": 3407 }, { "epoch": 0.37, "learning_rate": 1.449744191484066e-05, "loss": 0.8672, "step": 3408 }, { "epoch": 0.37, "learning_rate": 1.449429243583283e-05, "loss": 0.6353, "step": 3409 }, { "epoch": 0.37, "learning_rate": 1.4491142398090278e-05, "loss": 0.6978, "step": 3410 }, { "epoch": 0.37, "learning_rate": 1.4487991802004625e-05, "loss": 0.8022, "step": 3411 }, { "epoch": 0.37, "learning_rate": 1.4484840647967547e-05, "loss": 0.6653, "step": 3412 }, { "epoch": 0.37, "learning_rate": 1.4481688936370804e-05, "loss": 0.7039, "step": 3413 }, { "epoch": 0.37, "learning_rate": 1.4478536667606218e-05, "loss": 0.6499, "step": 3414 }, { "epoch": 0.37, "learning_rate": 1.4475383842065682e-05, "loss": 0.6995, "step": 3415 }, { "epoch": 0.37, "learning_rate": 1.4472230460141159e-05, "loss": 0.7542, "step": 3416 }, { "epoch": 0.37, "learning_rate": 1.4469076522224683e-05, "loss": 0.7209, "step": 3417 }, { "epoch": 0.37, "learning_rate": 1.446592202870835e-05, "loss": 0.6829, "step": 3418 }, { "epoch": 0.37, "learning_rate": 1.4462766979984331e-05, "loss": 0.7864, "step": 3419 }, { "epoch": 0.37, "learning_rate": 1.4459611376444864e-05, "loss": 0.7739, "step": 3420 }, { "epoch": 0.37, "learning_rate": 1.4456455218482262e-05, "loss": 0.5745, "step": 3421 }, { "epoch": 0.37, "learning_rate": 1.4453298506488896e-05, "loss": 0.6897, "step": 3422 }, { "epoch": 0.37, "learning_rate": 1.445014124085721e-05, "loss": 0.7544, "step": 3423 }, { "epoch": 0.37, "learning_rate": 1.4446983421979723e-05, "loss": 0.6367, "step": 3424 }, { "epoch": 0.37, "learning_rate": 1.4443825050249016e-05, "loss": 0.7524, "step": 3425 }, { "epoch": 0.37, "learning_rate": 1.4440666126057743e-05, "loss": 0.7349, "step": 3426 }, { "epoch": 0.37, "learning_rate": 1.443750664979862e-05, "loss": 0.686, "step": 3427 }, { "epoch": 0.37, "learning_rate": 1.4434346621864442e-05, "loss": 0.7058, "step": 3428 }, { "epoch": 0.37, "learning_rate": 1.4431186042648058e-05, "loss": 0.7161, "step": 3429 }, { "epoch": 0.37, "learning_rate": 1.4428024912542405e-05, "loss": 0.8003, "step": 3430 }, { "epoch": 0.37, "learning_rate": 1.4424863231940467e-05, "loss": 0.655, "step": 3431 }, { "epoch": 0.37, "learning_rate": 1.4421701001235315e-05, "loss": 0.6914, "step": 3432 }, { "epoch": 0.37, "learning_rate": 1.441853822082008e-05, "loss": 0.7969, "step": 3433 }, { "epoch": 0.37, "learning_rate": 1.4415374891087954e-05, "loss": 0.7393, "step": 3434 }, { "epoch": 0.37, "learning_rate": 1.4412211012432213e-05, "loss": 0.75, "step": 3435 }, { "epoch": 0.37, "learning_rate": 1.4409046585246193e-05, "loss": 0.7197, "step": 3436 }, { "epoch": 0.37, "learning_rate": 1.4405881609923297e-05, "loss": 0.689, "step": 3437 }, { "epoch": 0.37, "learning_rate": 1.4402716086856999e-05, "loss": 0.7505, "step": 3438 }, { "epoch": 0.37, "learning_rate": 1.4399550016440835e-05, "loss": 0.7856, "step": 3439 }, { "epoch": 0.37, "learning_rate": 1.439638339906842e-05, "loss": 0.7156, "step": 3440 }, { "epoch": 0.37, "learning_rate": 1.4393216235133427e-05, "loss": 0.8125, "step": 3441 }, { "epoch": 0.37, "learning_rate": 1.43900485250296e-05, "loss": 0.73, "step": 3442 }, { "epoch": 0.37, "learning_rate": 1.4386880269150756e-05, "loss": 0.8496, "step": 3443 }, { "epoch": 0.37, "learning_rate": 1.4383711467890776e-05, "loss": 0.675, "step": 3444 }, { "epoch": 0.38, "learning_rate": 1.4380542121643603e-05, "loss": 0.7593, "step": 3445 }, { "epoch": 0.38, "learning_rate": 1.4377372230803257e-05, "loss": 0.7822, "step": 3446 }, { "epoch": 0.38, "learning_rate": 1.4374201795763823e-05, "loss": 0.7751, "step": 3447 }, { "epoch": 0.38, "learning_rate": 1.4371030816919444e-05, "loss": 0.7695, "step": 3448 }, { "epoch": 0.38, "learning_rate": 1.4367859294664351e-05, "loss": 0.8335, "step": 3449 }, { "epoch": 0.38, "learning_rate": 1.4364687229392823e-05, "loss": 0.8198, "step": 3450 }, { "epoch": 0.38, "learning_rate": 1.4361514621499217e-05, "loss": 0.6782, "step": 3451 }, { "epoch": 0.38, "learning_rate": 1.4358341471377957e-05, "loss": 0.7837, "step": 3452 }, { "epoch": 0.38, "learning_rate": 1.4355167779423525e-05, "loss": 0.7788, "step": 3453 }, { "epoch": 0.38, "learning_rate": 1.435199354603048e-05, "loss": 0.8091, "step": 3454 }, { "epoch": 0.38, "learning_rate": 1.4348818771593452e-05, "loss": 0.8281, "step": 3455 }, { "epoch": 0.38, "learning_rate": 1.4345643456507126e-05, "loss": 0.6953, "step": 3456 }, { "epoch": 0.38, "learning_rate": 1.4342467601166257e-05, "loss": 0.7231, "step": 3457 }, { "epoch": 0.38, "learning_rate": 1.4339291205965677e-05, "loss": 0.6384, "step": 3458 }, { "epoch": 0.38, "learning_rate": 1.4336114271300279e-05, "loss": 0.7874, "step": 3459 }, { "epoch": 0.38, "learning_rate": 1.4332936797565018e-05, "loss": 0.7205, "step": 3460 }, { "epoch": 0.38, "learning_rate": 1.4329758785154922e-05, "loss": 0.7104, "step": 3461 }, { "epoch": 0.38, "learning_rate": 1.4326580234465084e-05, "loss": 0.8062, "step": 3462 }, { "epoch": 0.38, "learning_rate": 1.4323401145890668e-05, "loss": 0.7803, "step": 3463 }, { "epoch": 0.38, "learning_rate": 1.4320221519826896e-05, "loss": 0.6782, "step": 3464 }, { "epoch": 0.38, "learning_rate": 1.4317041356669066e-05, "loss": 0.7773, "step": 3465 }, { "epoch": 0.38, "learning_rate": 1.4313860656812537e-05, "loss": 0.7017, "step": 3466 }, { "epoch": 0.38, "learning_rate": 1.4310679420652736e-05, "loss": 0.8081, "step": 3467 }, { "epoch": 0.38, "learning_rate": 1.4307497648585162e-05, "loss": 0.7842, "step": 3468 }, { "epoch": 0.38, "learning_rate": 1.4304315341005369e-05, "loss": 0.7354, "step": 3469 }, { "epoch": 0.38, "learning_rate": 1.4301132498308992e-05, "loss": 0.635, "step": 3470 }, { "epoch": 0.38, "learning_rate": 1.4297949120891718e-05, "loss": 0.7644, "step": 3471 }, { "epoch": 0.38, "learning_rate": 1.4294765209149311e-05, "loss": 0.7329, "step": 3472 }, { "epoch": 0.38, "learning_rate": 1.4291580763477596e-05, "loss": 0.792, "step": 3473 }, { "epoch": 0.38, "learning_rate": 1.4288395784272473e-05, "loss": 0.873, "step": 3474 }, { "epoch": 0.38, "learning_rate": 1.4285210271929895e-05, "loss": 0.686, "step": 3475 }, { "epoch": 0.38, "learning_rate": 1.4282024226845885e-05, "loss": 0.7832, "step": 3476 }, { "epoch": 0.38, "learning_rate": 1.4278837649416543e-05, "loss": 0.7515, "step": 3477 }, { "epoch": 0.38, "learning_rate": 1.4275650540038023e-05, "loss": 0.7329, "step": 3478 }, { "epoch": 0.38, "learning_rate": 1.4272462899106555e-05, "loss": 0.6931, "step": 3479 }, { "epoch": 0.38, "learning_rate": 1.4269274727018419e-05, "loss": 0.7317, "step": 3480 }, { "epoch": 0.38, "learning_rate": 1.426608602416998e-05, "loss": 0.6833, "step": 3481 }, { "epoch": 0.38, "learning_rate": 1.426289679095766e-05, "loss": 0.7329, "step": 3482 }, { "epoch": 0.38, "learning_rate": 1.4259707027777943e-05, "loss": 0.7012, "step": 3483 }, { "epoch": 0.38, "learning_rate": 1.4256516735027385e-05, "loss": 0.7139, "step": 3484 }, { "epoch": 0.38, "learning_rate": 1.4253325913102611e-05, "loss": 0.7644, "step": 3485 }, { "epoch": 0.38, "learning_rate": 1.4250134562400301e-05, "loss": 0.8276, "step": 3486 }, { "epoch": 0.38, "learning_rate": 1.424694268331721e-05, "loss": 0.7378, "step": 3487 }, { "epoch": 0.38, "learning_rate": 1.4243750276250154e-05, "loss": 0.7134, "step": 3488 }, { "epoch": 0.38, "learning_rate": 1.424055734159602e-05, "loss": 0.7817, "step": 3489 }, { "epoch": 0.38, "learning_rate": 1.423736387975175e-05, "loss": 0.8359, "step": 3490 }, { "epoch": 0.38, "learning_rate": 1.4234169891114361e-05, "loss": 0.7034, "step": 3491 }, { "epoch": 0.38, "learning_rate": 1.4230975376080936e-05, "loss": 0.8296, "step": 3492 }, { "epoch": 0.38, "learning_rate": 1.4227780335048615e-05, "loss": 0.7119, "step": 3493 }, { "epoch": 0.38, "learning_rate": 1.4224584768414612e-05, "loss": 0.6521, "step": 3494 }, { "epoch": 0.38, "learning_rate": 1.4221388676576203e-05, "loss": 0.6836, "step": 3495 }, { "epoch": 0.38, "learning_rate": 1.4218192059930724e-05, "loss": 0.7117, "step": 3496 }, { "epoch": 0.38, "learning_rate": 1.421499491887559e-05, "loss": 0.7202, "step": 3497 }, { "epoch": 0.38, "learning_rate": 1.4211797253808268e-05, "loss": 0.7524, "step": 3498 }, { "epoch": 0.38, "learning_rate": 1.4208599065126292e-05, "loss": 0.6863, "step": 3499 }, { "epoch": 0.38, "learning_rate": 1.420540035322727e-05, "loss": 0.7429, "step": 3500 }, { "epoch": 0.38, "learning_rate": 1.4202201118508863e-05, "loss": 0.7761, "step": 3501 }, { "epoch": 0.38, "learning_rate": 1.4199001361368808e-05, "loss": 0.6855, "step": 3502 }, { "epoch": 0.38, "learning_rate": 1.4195801082204896e-05, "loss": 0.7417, "step": 3503 }, { "epoch": 0.38, "learning_rate": 1.4192600281414994e-05, "loss": 0.7485, "step": 3504 }, { "epoch": 0.38, "learning_rate": 1.4189398959397027e-05, "loss": 0.812, "step": 3505 }, { "epoch": 0.38, "learning_rate": 1.4186197116548987e-05, "loss": 0.6592, "step": 3506 }, { "epoch": 0.38, "learning_rate": 1.4182994753268929e-05, "loss": 0.5979, "step": 3507 }, { "epoch": 0.38, "learning_rate": 1.4179791869954975e-05, "loss": 0.752, "step": 3508 }, { "epoch": 0.38, "learning_rate": 1.417658846700531e-05, "loss": 0.7471, "step": 3509 }, { "epoch": 0.38, "learning_rate": 1.417338454481818e-05, "loss": 0.7612, "step": 3510 }, { "epoch": 0.38, "learning_rate": 1.4170180103791906e-05, "loss": 0.8406, "step": 3511 }, { "epoch": 0.38, "learning_rate": 1.4166975144324866e-05, "loss": 0.6396, "step": 3512 }, { "epoch": 0.38, "learning_rate": 1.4163769666815502e-05, "loss": 0.6465, "step": 3513 }, { "epoch": 0.38, "learning_rate": 1.416056367166232e-05, "loss": 0.7244, "step": 3514 }, { "epoch": 0.38, "learning_rate": 1.4157357159263895e-05, "loss": 0.7549, "step": 3515 }, { "epoch": 0.38, "learning_rate": 1.4154150130018867e-05, "loss": 0.7786, "step": 3516 }, { "epoch": 0.38, "learning_rate": 1.4150942584325931e-05, "loss": 0.6731, "step": 3517 }, { "epoch": 0.38, "learning_rate": 1.4147734522583853e-05, "loss": 0.77, "step": 3518 }, { "epoch": 0.38, "learning_rate": 1.4144525945191465e-05, "loss": 0.6367, "step": 3519 }, { "epoch": 0.38, "learning_rate": 1.414131685254766e-05, "loss": 0.6565, "step": 3520 }, { "epoch": 0.38, "learning_rate": 1.4138107245051394e-05, "loss": 0.7727, "step": 3521 }, { "epoch": 0.38, "learning_rate": 1.4134897123101688e-05, "loss": 0.8091, "step": 3522 }, { "epoch": 0.38, "learning_rate": 1.4131686487097632e-05, "loss": 0.6738, "step": 3523 }, { "epoch": 0.38, "learning_rate": 1.4128475337438368e-05, "loss": 0.8257, "step": 3524 }, { "epoch": 0.38, "learning_rate": 1.4125263674523113e-05, "loss": 0.7476, "step": 3525 }, { "epoch": 0.38, "learning_rate": 1.4122051498751144e-05, "loss": 0.8062, "step": 3526 }, { "epoch": 0.38, "learning_rate": 1.4118838810521804e-05, "loss": 0.8594, "step": 3527 }, { "epoch": 0.38, "learning_rate": 1.4115625610234496e-05, "loss": 0.7568, "step": 3528 }, { "epoch": 0.38, "learning_rate": 1.4112411898288682e-05, "loss": 0.7695, "step": 3529 }, { "epoch": 0.38, "learning_rate": 1.4109197675083903e-05, "loss": 0.6316, "step": 3530 }, { "epoch": 0.38, "learning_rate": 1.4105982941019751e-05, "loss": 0.7109, "step": 3531 }, { "epoch": 0.38, "learning_rate": 1.4102767696495885e-05, "loss": 0.6641, "step": 3532 }, { "epoch": 0.38, "learning_rate": 1.4099551941912024e-05, "loss": 0.7158, "step": 3533 }, { "epoch": 0.38, "learning_rate": 1.4096335677667954e-05, "loss": 0.7559, "step": 3534 }, { "epoch": 0.38, "learning_rate": 1.4093118904163532e-05, "loss": 0.7532, "step": 3535 }, { "epoch": 0.38, "learning_rate": 1.4089901621798663e-05, "loss": 0.731, "step": 3536 }, { "epoch": 0.39, "learning_rate": 1.408668383097332e-05, "loss": 0.7979, "step": 3537 }, { "epoch": 0.39, "learning_rate": 1.408346553208755e-05, "loss": 0.7549, "step": 3538 }, { "epoch": 0.39, "learning_rate": 1.4080246725541448e-05, "loss": 0.7573, "step": 3539 }, { "epoch": 0.39, "learning_rate": 1.4077027411735185e-05, "loss": 0.8369, "step": 3540 }, { "epoch": 0.39, "learning_rate": 1.4073807591068982e-05, "loss": 0.7705, "step": 3541 }, { "epoch": 0.39, "learning_rate": 1.4070587263943139e-05, "loss": 0.7788, "step": 3542 }, { "epoch": 0.39, "learning_rate": 1.4067366430758004e-05, "loss": 0.6729, "step": 3543 }, { "epoch": 0.39, "learning_rate": 1.4064145091913994e-05, "loss": 0.8208, "step": 3544 }, { "epoch": 0.39, "learning_rate": 1.406092324781159e-05, "loss": 0.7217, "step": 3545 }, { "epoch": 0.39, "learning_rate": 1.405770089885134e-05, "loss": 0.7495, "step": 3546 }, { "epoch": 0.39, "learning_rate": 1.4054478045433842e-05, "loss": 0.6873, "step": 3547 }, { "epoch": 0.39, "learning_rate": 1.4051254687959766e-05, "loss": 0.7336, "step": 3548 }, { "epoch": 0.39, "learning_rate": 1.4048030826829843e-05, "loss": 0.6587, "step": 3549 }, { "epoch": 0.39, "learning_rate": 1.4044806462444869e-05, "loss": 0.7842, "step": 3550 }, { "epoch": 0.39, "learning_rate": 1.40415815952057e-05, "loss": 0.6672, "step": 3551 }, { "epoch": 0.39, "learning_rate": 1.403835622551325e-05, "loss": 0.6633, "step": 3552 }, { "epoch": 0.39, "learning_rate": 1.4035130353768502e-05, "loss": 0.5874, "step": 3553 }, { "epoch": 0.39, "learning_rate": 1.4031903980372503e-05, "loss": 0.6206, "step": 3554 }, { "epoch": 0.39, "learning_rate": 1.4028677105726356e-05, "loss": 0.7363, "step": 3555 }, { "epoch": 0.39, "learning_rate": 1.402544973023123e-05, "loss": 0.7573, "step": 3556 }, { "epoch": 0.39, "learning_rate": 1.4022221854288352e-05, "loss": 0.7058, "step": 3557 }, { "epoch": 0.39, "learning_rate": 1.4018993478299019e-05, "loss": 0.7773, "step": 3558 }, { "epoch": 0.39, "learning_rate": 1.4015764602664586e-05, "loss": 0.8433, "step": 3559 }, { "epoch": 0.39, "learning_rate": 1.4012535227786464e-05, "loss": 0.7515, "step": 3560 }, { "epoch": 0.39, "learning_rate": 1.4009305354066138e-05, "loss": 0.833, "step": 3561 }, { "epoch": 0.39, "learning_rate": 1.4006074981905148e-05, "loss": 0.7837, "step": 3562 }, { "epoch": 0.39, "learning_rate": 1.4002844111705094e-05, "loss": 0.6995, "step": 3563 }, { "epoch": 0.39, "learning_rate": 1.3999612743867643e-05, "loss": 0.7646, "step": 3564 }, { "epoch": 0.39, "learning_rate": 1.3996380878794524e-05, "loss": 0.6685, "step": 3565 }, { "epoch": 0.39, "learning_rate": 1.3993148516887522e-05, "loss": 0.7034, "step": 3566 }, { "epoch": 0.39, "learning_rate": 1.3989915658548488e-05, "loss": 0.8301, "step": 3567 }, { "epoch": 0.39, "learning_rate": 1.3986682304179332e-05, "loss": 0.6807, "step": 3568 }, { "epoch": 0.39, "learning_rate": 1.3983448454182033e-05, "loss": 0.6365, "step": 3569 }, { "epoch": 0.39, "learning_rate": 1.3980214108958626e-05, "loss": 0.7673, "step": 3570 }, { "epoch": 0.39, "learning_rate": 1.39769792689112e-05, "loss": 0.6982, "step": 3571 }, { "epoch": 0.39, "learning_rate": 1.3973743934441918e-05, "loss": 0.6655, "step": 3572 }, { "epoch": 0.39, "learning_rate": 1.3970508105953005e-05, "loss": 0.7439, "step": 3573 }, { "epoch": 0.39, "learning_rate": 1.3967271783846739e-05, "loss": 0.7932, "step": 3574 }, { "epoch": 0.39, "learning_rate": 1.3964034968525458e-05, "loss": 0.8804, "step": 3575 }, { "epoch": 0.39, "learning_rate": 1.396079766039157e-05, "loss": 0.7141, "step": 3576 }, { "epoch": 0.39, "learning_rate": 1.3957559859847539e-05, "loss": 0.7275, "step": 3577 }, { "epoch": 0.39, "learning_rate": 1.3954321567295894e-05, "loss": 0.7158, "step": 3578 }, { "epoch": 0.39, "learning_rate": 1.3951082783139221e-05, "loss": 0.6992, "step": 3579 }, { "epoch": 0.39, "learning_rate": 1.3947843507780168e-05, "loss": 0.7249, "step": 3580 }, { "epoch": 0.39, "learning_rate": 1.3944603741621445e-05, "loss": 0.7139, "step": 3581 }, { "epoch": 0.39, "learning_rate": 1.3941363485065822e-05, "loss": 0.6787, "step": 3582 }, { "epoch": 0.39, "learning_rate": 1.393812273851613e-05, "loss": 0.7732, "step": 3583 }, { "epoch": 0.39, "learning_rate": 1.393488150237527e-05, "loss": 0.759, "step": 3584 }, { "epoch": 0.39, "learning_rate": 1.3931639777046187e-05, "loss": 0.6328, "step": 3585 }, { "epoch": 0.39, "learning_rate": 1.3928397562931895e-05, "loss": 0.8442, "step": 3586 }, { "epoch": 0.39, "learning_rate": 1.3925154860435473e-05, "loss": 0.7078, "step": 3587 }, { "epoch": 0.39, "learning_rate": 1.3921911669960055e-05, "loss": 0.75, "step": 3588 }, { "epoch": 0.39, "learning_rate": 1.391866799190884e-05, "loss": 0.8184, "step": 3589 }, { "epoch": 0.39, "learning_rate": 1.3915423826685082e-05, "loss": 0.7407, "step": 3590 }, { "epoch": 0.39, "learning_rate": 1.39121791746921e-05, "loss": 0.8052, "step": 3591 }, { "epoch": 0.39, "learning_rate": 1.3908934036333273e-05, "loss": 0.7537, "step": 3592 }, { "epoch": 0.39, "learning_rate": 1.390568841201204e-05, "loss": 0.689, "step": 3593 }, { "epoch": 0.39, "learning_rate": 1.3902442302131896e-05, "loss": 0.7542, "step": 3594 }, { "epoch": 0.39, "learning_rate": 1.3899195707096405e-05, "loss": 0.6431, "step": 3595 }, { "epoch": 0.39, "learning_rate": 1.3895948627309184e-05, "loss": 0.6948, "step": 3596 }, { "epoch": 0.39, "learning_rate": 1.3892701063173917e-05, "loss": 0.853, "step": 3597 }, { "epoch": 0.39, "learning_rate": 1.3889453015094338e-05, "loss": 0.8813, "step": 3598 }, { "epoch": 0.39, "learning_rate": 1.3886204483474255e-05, "loss": 0.7256, "step": 3599 }, { "epoch": 0.39, "learning_rate": 1.3882955468717526e-05, "loss": 0.8306, "step": 3600 }, { "epoch": 0.39, "learning_rate": 1.3879705971228063e-05, "loss": 0.7415, "step": 3601 }, { "epoch": 0.39, "learning_rate": 1.3876455991409859e-05, "loss": 0.731, "step": 3602 }, { "epoch": 0.39, "learning_rate": 1.3873205529666949e-05, "loss": 0.8057, "step": 3603 }, { "epoch": 0.39, "learning_rate": 1.3869954586403434e-05, "loss": 0.7234, "step": 3604 }, { "epoch": 0.39, "learning_rate": 1.3866703162023471e-05, "loss": 0.6953, "step": 3605 }, { "epoch": 0.39, "learning_rate": 1.3863451256931286e-05, "loss": 0.8054, "step": 3606 }, { "epoch": 0.39, "learning_rate": 1.3860198871531159e-05, "loss": 0.7468, "step": 3607 }, { "epoch": 0.39, "learning_rate": 1.3856946006227425e-05, "loss": 0.646, "step": 3608 }, { "epoch": 0.39, "learning_rate": 1.3853692661424485e-05, "loss": 0.7234, "step": 3609 }, { "epoch": 0.39, "learning_rate": 1.38504388375268e-05, "loss": 0.7354, "step": 3610 }, { "epoch": 0.39, "learning_rate": 1.3847184534938882e-05, "loss": 0.6899, "step": 3611 }, { "epoch": 0.39, "learning_rate": 1.3843929754065319e-05, "loss": 0.7358, "step": 3612 }, { "epoch": 0.39, "learning_rate": 1.3840674495310739e-05, "loss": 0.6516, "step": 3613 }, { "epoch": 0.39, "learning_rate": 1.3837418759079848e-05, "loss": 0.791, "step": 3614 }, { "epoch": 0.39, "learning_rate": 1.3834162545777394e-05, "loss": 0.6423, "step": 3615 }, { "epoch": 0.39, "learning_rate": 1.3830905855808197e-05, "loss": 0.7861, "step": 3616 }, { "epoch": 0.39, "learning_rate": 1.382764868957713e-05, "loss": 0.759, "step": 3617 }, { "epoch": 0.39, "learning_rate": 1.3824391047489129e-05, "loss": 0.7739, "step": 3618 }, { "epoch": 0.39, "learning_rate": 1.3821132929949185e-05, "loss": 0.7473, "step": 3619 }, { "epoch": 0.39, "learning_rate": 1.3817874337362351e-05, "loss": 0.8311, "step": 3620 }, { "epoch": 0.39, "learning_rate": 1.381461527013374e-05, "loss": 0.7241, "step": 3621 }, { "epoch": 0.39, "learning_rate": 1.381135572866852e-05, "loss": 0.7219, "step": 3622 }, { "epoch": 0.39, "learning_rate": 1.3808095713371923e-05, "loss": 0.6643, "step": 3623 }, { "epoch": 0.39, "learning_rate": 1.380483522464923e-05, "loss": 0.6768, "step": 3624 }, { "epoch": 0.39, "learning_rate": 1.3801574262905799e-05, "loss": 0.813, "step": 3625 }, { "epoch": 0.39, "learning_rate": 1.3798312828547028e-05, "loss": 0.7065, "step": 3626 }, { "epoch": 0.39, "learning_rate": 1.3795050921978386e-05, "loss": 0.7856, "step": 3627 }, { "epoch": 0.39, "learning_rate": 1.379178854360539e-05, "loss": 0.6846, "step": 3628 }, { "epoch": 0.4, "learning_rate": 1.378852569383363e-05, "loss": 0.6812, "step": 3629 }, { "epoch": 0.4, "learning_rate": 1.3785262373068742e-05, "loss": 0.6421, "step": 3630 }, { "epoch": 0.4, "learning_rate": 1.3781998581716427e-05, "loss": 0.6768, "step": 3631 }, { "epoch": 0.4, "learning_rate": 1.3778734320182439e-05, "loss": 0.7769, "step": 3632 }, { "epoch": 0.4, "learning_rate": 1.3775469588872601e-05, "loss": 0.7354, "step": 3633 }, { "epoch": 0.4, "learning_rate": 1.3772204388192778e-05, "loss": 0.7126, "step": 3634 }, { "epoch": 0.4, "learning_rate": 1.3768938718548912e-05, "loss": 0.7126, "step": 3635 }, { "epoch": 0.4, "learning_rate": 1.3765672580346986e-05, "loss": 0.6562, "step": 3636 }, { "epoch": 0.4, "learning_rate": 1.376240597399306e-05, "loss": 0.7827, "step": 3637 }, { "epoch": 0.4, "learning_rate": 1.3759138899893233e-05, "loss": 0.6511, "step": 3638 }, { "epoch": 0.4, "learning_rate": 1.3755871358453671e-05, "loss": 0.7544, "step": 3639 }, { "epoch": 0.4, "learning_rate": 1.37526033500806e-05, "loss": 0.7871, "step": 3640 }, { "epoch": 0.4, "learning_rate": 1.3749334875180305e-05, "loss": 0.7166, "step": 3641 }, { "epoch": 0.4, "learning_rate": 1.3746065934159123e-05, "loss": 0.7842, "step": 3642 }, { "epoch": 0.4, "learning_rate": 1.3742796527423448e-05, "loss": 0.658, "step": 3643 }, { "epoch": 0.4, "learning_rate": 1.3739526655379743e-05, "loss": 0.7634, "step": 3644 }, { "epoch": 0.4, "learning_rate": 1.3736256318434515e-05, "loss": 0.8682, "step": 3645 }, { "epoch": 0.4, "learning_rate": 1.3732985516994341e-05, "loss": 0.6614, "step": 3646 }, { "epoch": 0.4, "learning_rate": 1.3729714251465847e-05, "loss": 0.7866, "step": 3647 }, { "epoch": 0.4, "learning_rate": 1.372644252225572e-05, "loss": 0.9175, "step": 3648 }, { "epoch": 0.4, "learning_rate": 1.3723170329770703e-05, "loss": 0.8647, "step": 3649 }, { "epoch": 0.4, "learning_rate": 1.3719897674417605e-05, "loss": 0.667, "step": 3650 }, { "epoch": 0.4, "learning_rate": 1.3716624556603275e-05, "loss": 0.8701, "step": 3651 }, { "epoch": 0.4, "learning_rate": 1.371335097673464e-05, "loss": 0.7253, "step": 3652 }, { "epoch": 0.4, "learning_rate": 1.3710076935218671e-05, "loss": 0.8286, "step": 3653 }, { "epoch": 0.4, "learning_rate": 1.3706802432462396e-05, "loss": 0.7129, "step": 3654 }, { "epoch": 0.4, "learning_rate": 1.3703527468872908e-05, "loss": 0.7007, "step": 3655 }, { "epoch": 0.4, "learning_rate": 1.3700252044857356e-05, "loss": 0.7456, "step": 3656 }, { "epoch": 0.4, "learning_rate": 1.3696976160822941e-05, "loss": 0.7346, "step": 3657 }, { "epoch": 0.4, "learning_rate": 1.3693699817176923e-05, "loss": 1.0493, "step": 3658 }, { "epoch": 0.4, "learning_rate": 1.3690423014326619e-05, "loss": 0.7593, "step": 3659 }, { "epoch": 0.4, "learning_rate": 1.3687145752679409e-05, "loss": 0.8403, "step": 3660 }, { "epoch": 0.4, "learning_rate": 1.3683868032642722e-05, "loss": 0.8232, "step": 3661 }, { "epoch": 0.4, "learning_rate": 1.3680589854624049e-05, "loss": 0.8213, "step": 3662 }, { "epoch": 0.4, "learning_rate": 1.3677311219030933e-05, "loss": 0.8389, "step": 3663 }, { "epoch": 0.4, "learning_rate": 1.3674032126270982e-05, "loss": 0.6572, "step": 3664 }, { "epoch": 0.4, "learning_rate": 1.3670752576751856e-05, "loss": 0.7595, "step": 3665 }, { "epoch": 0.4, "learning_rate": 1.3667472570881264e-05, "loss": 0.6589, "step": 3666 }, { "epoch": 0.4, "learning_rate": 1.3664192109066986e-05, "loss": 0.8184, "step": 3667 }, { "epoch": 0.4, "learning_rate": 1.366091119171685e-05, "loss": 0.657, "step": 3668 }, { "epoch": 0.4, "learning_rate": 1.3657629819238747e-05, "loss": 0.8291, "step": 3669 }, { "epoch": 0.4, "learning_rate": 1.3654347992040613e-05, "loss": 0.7456, "step": 3670 }, { "epoch": 0.4, "learning_rate": 1.3651065710530453e-05, "loss": 0.7524, "step": 3671 }, { "epoch": 0.4, "learning_rate": 1.3647782975116325e-05, "loss": 0.6638, "step": 3672 }, { "epoch": 0.4, "learning_rate": 1.3644499786206336e-05, "loss": 0.9072, "step": 3673 }, { "epoch": 0.4, "learning_rate": 1.3641216144208658e-05, "loss": 0.8457, "step": 3674 }, { "epoch": 0.4, "learning_rate": 1.3637932049531517e-05, "loss": 0.783, "step": 3675 }, { "epoch": 0.4, "learning_rate": 1.3634647502583196e-05, "loss": 0.6375, "step": 3676 }, { "epoch": 0.4, "learning_rate": 1.3631362503772028e-05, "loss": 0.7305, "step": 3677 }, { "epoch": 0.4, "learning_rate": 1.362807705350641e-05, "loss": 0.8257, "step": 3678 }, { "epoch": 0.4, "learning_rate": 1.3624791152194796e-05, "loss": 0.6433, "step": 3679 }, { "epoch": 0.4, "learning_rate": 1.362150480024569e-05, "loss": 0.7783, "step": 3680 }, { "epoch": 0.4, "learning_rate": 1.361821799806765e-05, "loss": 0.7466, "step": 3681 }, { "epoch": 0.4, "learning_rate": 1.36149307460693e-05, "loss": 0.7026, "step": 3682 }, { "epoch": 0.4, "learning_rate": 1.3611643044659314e-05, "loss": 0.687, "step": 3683 }, { "epoch": 0.4, "learning_rate": 1.360835489424642e-05, "loss": 0.8074, "step": 3684 }, { "epoch": 0.4, "learning_rate": 1.3605066295239402e-05, "loss": 0.8364, "step": 3685 }, { "epoch": 0.4, "learning_rate": 1.3601777248047105e-05, "loss": 0.6829, "step": 3686 }, { "epoch": 0.4, "learning_rate": 1.3598487753078426e-05, "loss": 0.6182, "step": 3687 }, { "epoch": 0.4, "learning_rate": 1.359519781074232e-05, "loss": 0.8022, "step": 3688 }, { "epoch": 0.4, "learning_rate": 1.3591907421447789e-05, "loss": 0.7744, "step": 3689 }, { "epoch": 0.4, "learning_rate": 1.3588616585603908e-05, "loss": 0.687, "step": 3690 }, { "epoch": 0.4, "learning_rate": 1.358532530361979e-05, "loss": 0.731, "step": 3691 }, { "epoch": 0.4, "learning_rate": 1.3582033575904608e-05, "loss": 0.6841, "step": 3692 }, { "epoch": 0.4, "learning_rate": 1.3578741402867594e-05, "loss": 0.6929, "step": 3693 }, { "epoch": 0.4, "learning_rate": 1.3575448784918041e-05, "loss": 0.7456, "step": 3694 }, { "epoch": 0.4, "learning_rate": 1.3572155722465286e-05, "loss": 0.6372, "step": 3695 }, { "epoch": 0.4, "learning_rate": 1.356886221591872e-05, "loss": 0.7578, "step": 3696 }, { "epoch": 0.4, "learning_rate": 1.3565568265687802e-05, "loss": 0.6194, "step": 3697 }, { "epoch": 0.4, "learning_rate": 1.356227387218204e-05, "loss": 0.8755, "step": 3698 }, { "epoch": 0.4, "learning_rate": 1.3558979035810989e-05, "loss": 0.7461, "step": 3699 }, { "epoch": 0.4, "learning_rate": 1.355568375698427e-05, "loss": 0.7, "step": 3700 }, { "epoch": 0.4, "learning_rate": 1.3552388036111557e-05, "loss": 0.7668, "step": 3701 }, { "epoch": 0.4, "learning_rate": 1.3549091873602578e-05, "loss": 0.8208, "step": 3702 }, { "epoch": 0.4, "learning_rate": 1.354579526986711e-05, "loss": 0.7266, "step": 3703 }, { "epoch": 0.4, "learning_rate": 1.3542498225314993e-05, "loss": 0.7651, "step": 3704 }, { "epoch": 0.4, "learning_rate": 1.353920074035612e-05, "loss": 0.6853, "step": 3705 }, { "epoch": 0.4, "learning_rate": 1.3535902815400435e-05, "loss": 0.8232, "step": 3706 }, { "epoch": 0.4, "learning_rate": 1.353260445085794e-05, "loss": 0.7939, "step": 3707 }, { "epoch": 0.4, "learning_rate": 1.3529305647138689e-05, "loss": 0.7122, "step": 3708 }, { "epoch": 0.4, "learning_rate": 1.3526006404652798e-05, "loss": 0.7705, "step": 3709 }, { "epoch": 0.4, "learning_rate": 1.3522706723810428e-05, "loss": 0.7729, "step": 3710 }, { "epoch": 0.4, "learning_rate": 1.3519406605021797e-05, "loss": 0.6602, "step": 3711 }, { "epoch": 0.4, "learning_rate": 1.3516106048697177e-05, "loss": 0.7629, "step": 3712 }, { "epoch": 0.4, "learning_rate": 1.3512805055246905e-05, "loss": 0.7339, "step": 3713 }, { "epoch": 0.4, "learning_rate": 1.350950362508136e-05, "loss": 0.7437, "step": 3714 }, { "epoch": 0.4, "learning_rate": 1.3506201758610974e-05, "loss": 0.6812, "step": 3715 }, { "epoch": 0.4, "learning_rate": 1.350289945624624e-05, "loss": 0.7554, "step": 3716 }, { "epoch": 0.4, "learning_rate": 1.3499596718397707e-05, "loss": 0.7476, "step": 3717 }, { "epoch": 0.4, "learning_rate": 1.3496293545475976e-05, "loss": 0.6008, "step": 3718 }, { "epoch": 0.4, "learning_rate": 1.3492989937891694e-05, "loss": 0.6699, "step": 3719 }, { "epoch": 0.4, "learning_rate": 1.3489685896055573e-05, "loss": 0.7646, "step": 3720 }, { "epoch": 0.41, "learning_rate": 1.3486381420378372e-05, "loss": 0.7153, "step": 3721 }, { "epoch": 0.41, "learning_rate": 1.3483076511270909e-05, "loss": 0.7285, "step": 3722 }, { "epoch": 0.41, "learning_rate": 1.3479771169144052e-05, "loss": 0.7666, "step": 3723 }, { "epoch": 0.41, "learning_rate": 1.3476465394408727e-05, "loss": 0.7288, "step": 3724 }, { "epoch": 0.41, "learning_rate": 1.3473159187475906e-05, "loss": 0.7273, "step": 3725 }, { "epoch": 0.41, "learning_rate": 1.3469852548756626e-05, "loss": 0.5725, "step": 3726 }, { "epoch": 0.41, "learning_rate": 1.3466545478661966e-05, "loss": 0.8362, "step": 3727 }, { "epoch": 0.41, "learning_rate": 1.3463237977603067e-05, "loss": 0.8069, "step": 3728 }, { "epoch": 0.41, "learning_rate": 1.3459930045991121e-05, "loss": 0.7632, "step": 3729 }, { "epoch": 0.41, "learning_rate": 1.3456621684237367e-05, "loss": 0.833, "step": 3730 }, { "epoch": 0.41, "learning_rate": 1.3453312892753114e-05, "loss": 0.7295, "step": 3731 }, { "epoch": 0.41, "learning_rate": 1.3450003671949707e-05, "loss": 0.7656, "step": 3732 }, { "epoch": 0.41, "learning_rate": 1.3446694022238555e-05, "loss": 0.8081, "step": 3733 }, { "epoch": 0.41, "learning_rate": 1.3443383944031114e-05, "loss": 0.8108, "step": 3734 }, { "epoch": 0.41, "learning_rate": 1.3440073437738899e-05, "loss": 0.6853, "step": 3735 }, { "epoch": 0.41, "learning_rate": 1.3436762503773473e-05, "loss": 0.7839, "step": 3736 }, { "epoch": 0.41, "learning_rate": 1.3433451142546455e-05, "loss": 0.7065, "step": 3737 }, { "epoch": 0.41, "learning_rate": 1.3430139354469516e-05, "loss": 0.7974, "step": 3738 }, { "epoch": 0.41, "learning_rate": 1.3426827139954382e-05, "loss": 0.7812, "step": 3739 }, { "epoch": 0.41, "learning_rate": 1.3423514499412829e-05, "loss": 0.8042, "step": 3740 }, { "epoch": 0.41, "learning_rate": 1.342020143325669e-05, "loss": 0.7393, "step": 3741 }, { "epoch": 0.41, "learning_rate": 1.3416887941897845e-05, "loss": 0.6802, "step": 3742 }, { "epoch": 0.41, "learning_rate": 1.3413574025748235e-05, "loss": 0.6392, "step": 3743 }, { "epoch": 0.41, "learning_rate": 1.3410259685219846e-05, "loss": 0.8467, "step": 3744 }, { "epoch": 0.41, "learning_rate": 1.3406944920724721e-05, "loss": 0.7729, "step": 3745 }, { "epoch": 0.41, "learning_rate": 1.3403629732674954e-05, "loss": 0.6565, "step": 3746 }, { "epoch": 0.41, "learning_rate": 1.3400314121482695e-05, "loss": 0.7236, "step": 3747 }, { "epoch": 0.41, "learning_rate": 1.3396998087560139e-05, "loss": 0.8066, "step": 3748 }, { "epoch": 0.41, "learning_rate": 1.3393681631319542e-05, "loss": 0.7139, "step": 3749 }, { "epoch": 0.41, "learning_rate": 1.3390364753173206e-05, "loss": 0.7163, "step": 3750 }, { "epoch": 0.41, "learning_rate": 1.3387047453533494e-05, "loss": 0.6963, "step": 3751 }, { "epoch": 0.41, "learning_rate": 1.3383729732812814e-05, "loss": 0.7705, "step": 3752 }, { "epoch": 0.41, "learning_rate": 1.3380411591423623e-05, "loss": 0.7463, "step": 3753 }, { "epoch": 0.41, "learning_rate": 1.3377093029778441e-05, "loss": 0.6985, "step": 3754 }, { "epoch": 0.41, "learning_rate": 1.3373774048289834e-05, "loss": 0.7612, "step": 3755 }, { "epoch": 0.41, "learning_rate": 1.3370454647370418e-05, "loss": 0.8779, "step": 3756 }, { "epoch": 0.41, "learning_rate": 1.3367134827432868e-05, "loss": 0.6924, "step": 3757 }, { "epoch": 0.41, "learning_rate": 1.3363814588889905e-05, "loss": 0.8408, "step": 3758 }, { "epoch": 0.41, "learning_rate": 1.3360493932154301e-05, "loss": 0.7734, "step": 3759 }, { "epoch": 0.41, "learning_rate": 1.3357172857638892e-05, "loss": 0.7065, "step": 3760 }, { "epoch": 0.41, "learning_rate": 1.3353851365756547e-05, "loss": 0.7573, "step": 3761 }, { "epoch": 0.41, "learning_rate": 1.3350529456920205e-05, "loss": 0.6543, "step": 3762 }, { "epoch": 0.41, "learning_rate": 1.3347207131542847e-05, "loss": 0.6543, "step": 3763 }, { "epoch": 0.41, "learning_rate": 1.3343884390037502e-05, "loss": 0.7112, "step": 3764 }, { "epoch": 0.41, "learning_rate": 1.3340561232817264e-05, "loss": 0.8486, "step": 3765 }, { "epoch": 0.41, "learning_rate": 1.3337237660295269e-05, "loss": 0.7036, "step": 3766 }, { "epoch": 0.41, "learning_rate": 1.3333913672884701e-05, "loss": 0.8259, "step": 3767 }, { "epoch": 0.41, "learning_rate": 1.3330589270998809e-05, "loss": 0.877, "step": 3768 }, { "epoch": 0.41, "learning_rate": 1.3327264455050882e-05, "loss": 0.8076, "step": 3769 }, { "epoch": 0.41, "learning_rate": 1.3323939225454266e-05, "loss": 0.749, "step": 3770 }, { "epoch": 0.41, "learning_rate": 1.3320613582622354e-05, "loss": 0.853, "step": 3771 }, { "epoch": 0.41, "learning_rate": 1.3317287526968597e-05, "loss": 0.7363, "step": 3772 }, { "epoch": 0.41, "learning_rate": 1.3313961058906486e-05, "loss": 0.6929, "step": 3773 }, { "epoch": 0.41, "learning_rate": 1.3310634178849583e-05, "loss": 0.8384, "step": 3774 }, { "epoch": 0.41, "learning_rate": 1.3307306887211478e-05, "loss": 0.7573, "step": 3775 }, { "epoch": 0.41, "learning_rate": 1.3303979184405826e-05, "loss": 0.8066, "step": 3776 }, { "epoch": 0.41, "learning_rate": 1.3300651070846333e-05, "loss": 0.8149, "step": 3777 }, { "epoch": 0.41, "learning_rate": 1.329732254694675e-05, "loss": 0.7515, "step": 3778 }, { "epoch": 0.41, "learning_rate": 1.3293993613120887e-05, "loss": 0.7979, "step": 3779 }, { "epoch": 0.41, "learning_rate": 1.3290664269782592e-05, "loss": 0.7661, "step": 3780 }, { "epoch": 0.41, "learning_rate": 1.3287334517345778e-05, "loss": 0.7317, "step": 3781 }, { "epoch": 0.41, "learning_rate": 1.3284004356224405e-05, "loss": 0.7017, "step": 3782 }, { "epoch": 0.41, "learning_rate": 1.3280673786832473e-05, "loss": 0.7351, "step": 3783 }, { "epoch": 0.41, "learning_rate": 1.3277342809584051e-05, "loss": 0.7117, "step": 3784 }, { "epoch": 0.41, "learning_rate": 1.3274011424893245e-05, "loss": 0.7388, "step": 3785 }, { "epoch": 0.41, "learning_rate": 1.3270679633174219e-05, "loss": 0.7087, "step": 3786 }, { "epoch": 0.41, "learning_rate": 1.3267347434841178e-05, "loss": 0.811, "step": 3787 }, { "epoch": 0.41, "learning_rate": 1.3264014830308389e-05, "loss": 0.7917, "step": 3788 }, { "epoch": 0.41, "learning_rate": 1.3260681819990166e-05, "loss": 0.7466, "step": 3789 }, { "epoch": 0.41, "learning_rate": 1.3257348404300868e-05, "loss": 0.7754, "step": 3790 }, { "epoch": 0.41, "learning_rate": 1.3254014583654909e-05, "loss": 0.5964, "step": 3791 }, { "epoch": 0.41, "learning_rate": 1.3250680358466754e-05, "loss": 0.7638, "step": 3792 }, { "epoch": 0.41, "learning_rate": 1.3247345729150917e-05, "loss": 0.7251, "step": 3793 }, { "epoch": 0.41, "learning_rate": 1.3244010696121966e-05, "loss": 0.6934, "step": 3794 }, { "epoch": 0.41, "learning_rate": 1.3240675259794507e-05, "loss": 0.7607, "step": 3795 }, { "epoch": 0.41, "learning_rate": 1.3237339420583213e-05, "loss": 0.6821, "step": 3796 }, { "epoch": 0.41, "learning_rate": 1.323400317890279e-05, "loss": 0.7227, "step": 3797 }, { "epoch": 0.41, "learning_rate": 1.3230666535168014e-05, "loss": 0.7603, "step": 3798 }, { "epoch": 0.41, "learning_rate": 1.3227329489793687e-05, "loss": 0.6328, "step": 3799 }, { "epoch": 0.41, "learning_rate": 1.3223992043194685e-05, "loss": 0.7075, "step": 3800 }, { "epoch": 0.41, "learning_rate": 1.3220654195785917e-05, "loss": 0.6633, "step": 3801 }, { "epoch": 0.41, "learning_rate": 1.3217315947982345e-05, "loss": 0.7292, "step": 3802 }, { "epoch": 0.41, "learning_rate": 1.3213977300198988e-05, "loss": 0.6892, "step": 3803 }, { "epoch": 0.41, "learning_rate": 1.321063825285091e-05, "loss": 0.8306, "step": 3804 }, { "epoch": 0.41, "learning_rate": 1.3207298806353222e-05, "loss": 0.7539, "step": 3805 }, { "epoch": 0.41, "learning_rate": 1.3203958961121087e-05, "loss": 0.8118, "step": 3806 }, { "epoch": 0.41, "learning_rate": 1.3200618717569716e-05, "loss": 0.6624, "step": 3807 }, { "epoch": 0.41, "learning_rate": 1.3197278076114377e-05, "loss": 0.7866, "step": 3808 }, { "epoch": 0.41, "learning_rate": 1.319393703717038e-05, "loss": 0.6746, "step": 3809 }, { "epoch": 0.41, "learning_rate": 1.319059560115308e-05, "loss": 0.7969, "step": 3810 }, { "epoch": 0.41, "learning_rate": 1.3187253768477895e-05, "loss": 0.6709, "step": 3811 }, { "epoch": 0.41, "learning_rate": 1.3183911539560282e-05, "loss": 0.708, "step": 3812 }, { "epoch": 0.42, "learning_rate": 1.3180568914815752e-05, "loss": 0.7405, "step": 3813 }, { "epoch": 0.42, "learning_rate": 1.3177225894659858e-05, "loss": 0.7273, "step": 3814 }, { "epoch": 0.42, "learning_rate": 1.3173882479508213e-05, "loss": 0.7563, "step": 3815 }, { "epoch": 0.42, "learning_rate": 1.3170538669776469e-05, "loss": 0.6455, "step": 3816 }, { "epoch": 0.42, "learning_rate": 1.3167194465880337e-05, "loss": 0.8408, "step": 3817 }, { "epoch": 0.42, "learning_rate": 1.3163849868235566e-05, "loss": 0.6648, "step": 3818 }, { "epoch": 0.42, "learning_rate": 1.3160504877257964e-05, "loss": 0.8677, "step": 3819 }, { "epoch": 0.42, "learning_rate": 1.3157159493363383e-05, "loss": 0.7812, "step": 3820 }, { "epoch": 0.42, "learning_rate": 1.3153813716967721e-05, "loss": 0.6565, "step": 3821 }, { "epoch": 0.42, "learning_rate": 1.3150467548486929e-05, "loss": 0.7439, "step": 3822 }, { "epoch": 0.42, "learning_rate": 1.314712098833701e-05, "loss": 0.7231, "step": 3823 }, { "epoch": 0.42, "learning_rate": 1.3143774036934008e-05, "loss": 0.6599, "step": 3824 }, { "epoch": 0.42, "learning_rate": 1.3140426694694017e-05, "loss": 0.7319, "step": 3825 }, { "epoch": 0.42, "learning_rate": 1.3137078962033186e-05, "loss": 0.6428, "step": 3826 }, { "epoch": 0.42, "learning_rate": 1.3133730839367707e-05, "loss": 0.6956, "step": 3827 }, { "epoch": 0.42, "learning_rate": 1.3130382327113824e-05, "loss": 0.707, "step": 3828 }, { "epoch": 0.42, "learning_rate": 1.312703342568782e-05, "loss": 0.7593, "step": 3829 }, { "epoch": 0.42, "learning_rate": 1.3123684135506041e-05, "loss": 0.7183, "step": 3830 }, { "epoch": 0.42, "learning_rate": 1.3120334456984871e-05, "loss": 0.7415, "step": 3831 }, { "epoch": 0.42, "learning_rate": 1.3116984390540749e-05, "loss": 0.6584, "step": 3832 }, { "epoch": 0.42, "learning_rate": 1.311363393659015e-05, "loss": 0.6631, "step": 3833 }, { "epoch": 0.42, "learning_rate": 1.3110283095549613e-05, "loss": 0.7278, "step": 3834 }, { "epoch": 0.42, "learning_rate": 1.3106931867835715e-05, "loss": 0.6333, "step": 3835 }, { "epoch": 0.42, "learning_rate": 1.3103580253865086e-05, "loss": 0.6936, "step": 3836 }, { "epoch": 0.42, "learning_rate": 1.3100228254054399e-05, "loss": 0.7632, "step": 3837 }, { "epoch": 0.42, "learning_rate": 1.309687586882038e-05, "loss": 0.7229, "step": 3838 }, { "epoch": 0.42, "learning_rate": 1.3093523098579799e-05, "loss": 0.7886, "step": 3839 }, { "epoch": 0.42, "learning_rate": 1.3090169943749475e-05, "loss": 0.7681, "step": 3840 }, { "epoch": 0.42, "learning_rate": 1.3086816404746276e-05, "loss": 0.7129, "step": 3841 }, { "epoch": 0.42, "learning_rate": 1.3083462481987121e-05, "loss": 0.635, "step": 3842 }, { "epoch": 0.42, "learning_rate": 1.308010817588897e-05, "loss": 0.709, "step": 3843 }, { "epoch": 0.42, "learning_rate": 1.3076753486868832e-05, "loss": 0.7305, "step": 3844 }, { "epoch": 0.42, "learning_rate": 1.3073398415343763e-05, "loss": 0.8018, "step": 3845 }, { "epoch": 0.42, "learning_rate": 1.3070042961730878e-05, "loss": 0.6787, "step": 3846 }, { "epoch": 0.42, "learning_rate": 1.3066687126447322e-05, "loss": 0.6646, "step": 3847 }, { "epoch": 0.42, "learning_rate": 1.3063330909910296e-05, "loss": 0.71, "step": 3848 }, { "epoch": 0.42, "learning_rate": 1.3059974312537054e-05, "loss": 0.6997, "step": 3849 }, { "epoch": 0.42, "learning_rate": 1.3056617334744883e-05, "loss": 0.8555, "step": 3850 }, { "epoch": 0.42, "learning_rate": 1.3053259976951134e-05, "loss": 0.6997, "step": 3851 }, { "epoch": 0.42, "learning_rate": 1.3049902239573188e-05, "loss": 0.7285, "step": 3852 }, { "epoch": 0.42, "learning_rate": 1.3046544123028493e-05, "loss": 0.6968, "step": 3853 }, { "epoch": 0.42, "learning_rate": 1.3043185627734523e-05, "loss": 0.8921, "step": 3854 }, { "epoch": 0.42, "learning_rate": 1.3039826754108814e-05, "loss": 0.6858, "step": 3855 }, { "epoch": 0.42, "learning_rate": 1.3036467502568945e-05, "loss": 0.8081, "step": 3856 }, { "epoch": 0.42, "learning_rate": 1.3033107873532542e-05, "loss": 0.7979, "step": 3857 }, { "epoch": 0.42, "learning_rate": 1.3029747867417275e-05, "loss": 0.7588, "step": 3858 }, { "epoch": 0.42, "learning_rate": 1.3026387484640864e-05, "loss": 0.7227, "step": 3859 }, { "epoch": 0.42, "learning_rate": 1.302302672562107e-05, "loss": 0.7593, "step": 3860 }, { "epoch": 0.42, "learning_rate": 1.3019665590775717e-05, "loss": 0.7178, "step": 3861 }, { "epoch": 0.42, "learning_rate": 1.3016304080522657e-05, "loss": 0.6743, "step": 3862 }, { "epoch": 0.42, "learning_rate": 1.3012942195279794e-05, "loss": 0.627, "step": 3863 }, { "epoch": 0.42, "learning_rate": 1.3009579935465087e-05, "loss": 0.7373, "step": 3864 }, { "epoch": 0.42, "learning_rate": 1.3006217301496532e-05, "loss": 0.7954, "step": 3865 }, { "epoch": 0.42, "learning_rate": 1.3002854293792175e-05, "loss": 0.7612, "step": 3866 }, { "epoch": 0.42, "learning_rate": 1.2999490912770108e-05, "loss": 0.6133, "step": 3867 }, { "epoch": 0.42, "learning_rate": 1.299612715884847e-05, "loss": 0.7476, "step": 3868 }, { "epoch": 0.42, "learning_rate": 1.2992763032445445e-05, "loss": 0.6804, "step": 3869 }, { "epoch": 0.42, "learning_rate": 1.2989398533979271e-05, "loss": 0.7285, "step": 3870 }, { "epoch": 0.42, "learning_rate": 1.2986033663868216e-05, "loss": 0.6868, "step": 3871 }, { "epoch": 0.42, "learning_rate": 1.2982668422530611e-05, "loss": 0.6555, "step": 3872 }, { "epoch": 0.42, "learning_rate": 1.297930281038482e-05, "loss": 0.6147, "step": 3873 }, { "epoch": 0.42, "learning_rate": 1.2975936827849268e-05, "loss": 0.7817, "step": 3874 }, { "epoch": 0.42, "learning_rate": 1.2972570475342406e-05, "loss": 0.6375, "step": 3875 }, { "epoch": 0.42, "learning_rate": 1.296920375328275e-05, "loss": 0.7192, "step": 3876 }, { "epoch": 0.42, "learning_rate": 1.2965836662088854e-05, "loss": 0.6587, "step": 3877 }, { "epoch": 0.42, "learning_rate": 1.296246920217931e-05, "loss": 0.7737, "step": 3878 }, { "epoch": 0.42, "learning_rate": 1.2959101373972773e-05, "loss": 0.7461, "step": 3879 }, { "epoch": 0.42, "learning_rate": 1.2955733177887933e-05, "loss": 0.8594, "step": 3880 }, { "epoch": 0.42, "learning_rate": 1.2952364614343527e-05, "loss": 0.7935, "step": 3881 }, { "epoch": 0.42, "learning_rate": 1.2948995683758331e-05, "loss": 0.7493, "step": 3882 }, { "epoch": 0.42, "learning_rate": 1.2945626386551183e-05, "loss": 0.6106, "step": 3883 }, { "epoch": 0.42, "learning_rate": 1.2942256723140951e-05, "loss": 0.6714, "step": 3884 }, { "epoch": 0.42, "learning_rate": 1.2938886693946563e-05, "loss": 0.7263, "step": 3885 }, { "epoch": 0.42, "learning_rate": 1.2935516299386972e-05, "loss": 0.7083, "step": 3886 }, { "epoch": 0.42, "learning_rate": 1.29321455398812e-05, "loss": 0.7446, "step": 3887 }, { "epoch": 0.42, "learning_rate": 1.2928774415848296e-05, "loss": 0.7031, "step": 3888 }, { "epoch": 0.42, "learning_rate": 1.2925402927707364e-05, "loss": 0.7537, "step": 3889 }, { "epoch": 0.42, "learning_rate": 1.2922031075877551e-05, "loss": 0.7297, "step": 3890 }, { "epoch": 0.42, "learning_rate": 1.2918658860778046e-05, "loss": 0.8545, "step": 3891 }, { "epoch": 0.42, "learning_rate": 1.2915286282828092e-05, "loss": 0.6843, "step": 3892 }, { "epoch": 0.42, "learning_rate": 1.2911913342446965e-05, "loss": 0.7773, "step": 3893 }, { "epoch": 0.42, "learning_rate": 1.2908540040053992e-05, "loss": 0.729, "step": 3894 }, { "epoch": 0.42, "learning_rate": 1.290516637606855e-05, "loss": 1.0825, "step": 3895 }, { "epoch": 0.42, "learning_rate": 1.2901792350910053e-05, "loss": 0.7686, "step": 3896 }, { "epoch": 0.42, "learning_rate": 1.2898417964997965e-05, "loss": 0.8564, "step": 3897 }, { "epoch": 0.42, "learning_rate": 1.2895043218751788e-05, "loss": 0.7832, "step": 3898 }, { "epoch": 0.42, "learning_rate": 1.2891668112591082e-05, "loss": 0.7334, "step": 3899 }, { "epoch": 0.42, "learning_rate": 1.2888292646935438e-05, "loss": 0.7915, "step": 3900 }, { "epoch": 0.42, "learning_rate": 1.2884916822204494e-05, "loss": 0.6702, "step": 3901 }, { "epoch": 0.42, "learning_rate": 1.2881540638817942e-05, "loss": 0.7798, "step": 3902 }, { "epoch": 0.42, "learning_rate": 1.287816409719551e-05, "loss": 0.7156, "step": 3903 }, { "epoch": 0.42, "learning_rate": 1.2874787197756976e-05, "loss": 0.6719, "step": 3904 }, { "epoch": 0.43, "learning_rate": 1.2871409940922148e-05, "loss": 0.8623, "step": 3905 }, { "epoch": 0.43, "learning_rate": 1.2868032327110904e-05, "loss": 0.8223, "step": 3906 }, { "epoch": 0.43, "learning_rate": 1.2864654356743143e-05, "loss": 0.7058, "step": 3907 }, { "epoch": 0.43, "learning_rate": 1.2861276030238825e-05, "loss": 0.6892, "step": 3908 }, { "epoch": 0.43, "learning_rate": 1.2857897348017936e-05, "loss": 0.729, "step": 3909 }, { "epoch": 0.43, "learning_rate": 1.285451831050053e-05, "loss": 0.7036, "step": 3910 }, { "epoch": 0.43, "learning_rate": 1.2851138918106683e-05, "loss": 0.7856, "step": 3911 }, { "epoch": 0.43, "learning_rate": 1.2847759171256523e-05, "loss": 0.7568, "step": 3912 }, { "epoch": 0.43, "learning_rate": 1.284437907037023e-05, "loss": 0.7268, "step": 3913 }, { "epoch": 0.43, "learning_rate": 1.284099861586802e-05, "loss": 0.7014, "step": 3914 }, { "epoch": 0.43, "learning_rate": 1.2837617808170153e-05, "loss": 0.6631, "step": 3915 }, { "epoch": 0.43, "learning_rate": 1.283423664769693e-05, "loss": 0.8076, "step": 3916 }, { "epoch": 0.43, "learning_rate": 1.2830855134868705e-05, "loss": 0.8374, "step": 3917 }, { "epoch": 0.43, "learning_rate": 1.2827473270105873e-05, "loss": 0.6624, "step": 3918 }, { "epoch": 0.43, "learning_rate": 1.282409105382887e-05, "loss": 0.6687, "step": 3919 }, { "epoch": 0.43, "learning_rate": 1.2820708486458166e-05, "loss": 0.6609, "step": 3920 }, { "epoch": 0.43, "learning_rate": 1.2817325568414299e-05, "loss": 0.6572, "step": 3921 }, { "epoch": 0.43, "learning_rate": 1.2813942300117828e-05, "loss": 0.8311, "step": 3922 }, { "epoch": 0.43, "learning_rate": 1.281055868198937e-05, "loss": 0.6423, "step": 3923 }, { "epoch": 0.43, "learning_rate": 1.2807174714449572e-05, "loss": 0.7231, "step": 3924 }, { "epoch": 0.43, "learning_rate": 1.280379039791914e-05, "loss": 0.6956, "step": 3925 }, { "epoch": 0.43, "learning_rate": 1.280040573281881e-05, "loss": 0.7322, "step": 3926 }, { "epoch": 0.43, "learning_rate": 1.279702071956937e-05, "loss": 0.7329, "step": 3927 }, { "epoch": 0.43, "learning_rate": 1.2793635358591645e-05, "loss": 0.5984, "step": 3928 }, { "epoch": 0.43, "learning_rate": 1.279024965030651e-05, "loss": 0.7603, "step": 3929 }, { "epoch": 0.43, "learning_rate": 1.278686359513488e-05, "loss": 0.7764, "step": 3930 }, { "epoch": 0.43, "learning_rate": 1.2783477193497705e-05, "loss": 0.6938, "step": 3931 }, { "epoch": 0.43, "learning_rate": 1.278009044581599e-05, "loss": 0.7505, "step": 3932 }, { "epoch": 0.43, "learning_rate": 1.2776703352510787e-05, "loss": 0.8154, "step": 3933 }, { "epoch": 0.43, "learning_rate": 1.277331591400317e-05, "loss": 0.7776, "step": 3934 }, { "epoch": 0.43, "learning_rate": 1.2769928130714275e-05, "loss": 0.8281, "step": 3935 }, { "epoch": 0.43, "learning_rate": 1.2766540003065272e-05, "loss": 0.7212, "step": 3936 }, { "epoch": 0.43, "learning_rate": 1.276315153147738e-05, "loss": 0.8398, "step": 3937 }, { "epoch": 0.43, "learning_rate": 1.2759762716371853e-05, "loss": 0.8191, "step": 3938 }, { "epoch": 0.43, "learning_rate": 1.2756373558169992e-05, "loss": 0.7891, "step": 3939 }, { "epoch": 0.43, "learning_rate": 1.2752984057293143e-05, "loss": 0.6157, "step": 3940 }, { "epoch": 0.43, "learning_rate": 1.2749594214162693e-05, "loss": 0.6528, "step": 3941 }, { "epoch": 0.43, "learning_rate": 1.2746204029200066e-05, "loss": 0.6997, "step": 3942 }, { "epoch": 0.43, "learning_rate": 1.2742813502826735e-05, "loss": 0.6504, "step": 3943 }, { "epoch": 0.43, "learning_rate": 1.2739422635464216e-05, "loss": 0.7554, "step": 3944 }, { "epoch": 0.43, "learning_rate": 1.2736031427534059e-05, "loss": 0.7275, "step": 3945 }, { "epoch": 0.43, "learning_rate": 1.2732639879457867e-05, "loss": 0.7451, "step": 3946 }, { "epoch": 0.43, "learning_rate": 1.2729247991657279e-05, "loss": 0.6626, "step": 3947 }, { "epoch": 0.43, "learning_rate": 1.2725855764553981e-05, "loss": 0.7754, "step": 3948 }, { "epoch": 0.43, "learning_rate": 1.2722463198569693e-05, "loss": 0.6626, "step": 3949 }, { "epoch": 0.43, "learning_rate": 1.2719070294126183e-05, "loss": 0.7241, "step": 3950 }, { "epoch": 0.43, "learning_rate": 1.2715677051645259e-05, "loss": 0.6414, "step": 3951 }, { "epoch": 0.43, "learning_rate": 1.2712283471548778e-05, "loss": 0.6084, "step": 3952 }, { "epoch": 0.43, "learning_rate": 1.270888955425863e-05, "loss": 0.7383, "step": 3953 }, { "epoch": 0.43, "learning_rate": 1.2705495300196745e-05, "loss": 0.6748, "step": 3954 }, { "epoch": 0.43, "learning_rate": 1.2702100709785105e-05, "loss": 0.7485, "step": 3955 }, { "epoch": 0.43, "learning_rate": 1.2698705783445733e-05, "loss": 0.8364, "step": 3956 }, { "epoch": 0.43, "learning_rate": 1.269531052160068e-05, "loss": 0.7881, "step": 3957 }, { "epoch": 0.43, "learning_rate": 1.2691914924672053e-05, "loss": 0.7339, "step": 3958 }, { "epoch": 0.43, "learning_rate": 1.2688518993081998e-05, "loss": 0.7202, "step": 3959 }, { "epoch": 0.43, "learning_rate": 1.2685122727252695e-05, "loss": 0.5833, "step": 3960 }, { "epoch": 0.43, "learning_rate": 1.2681726127606374e-05, "loss": 0.7065, "step": 3961 }, { "epoch": 0.43, "learning_rate": 1.2678329194565304e-05, "loss": 0.6423, "step": 3962 }, { "epoch": 0.43, "learning_rate": 1.2674931928551797e-05, "loss": 0.812, "step": 3963 }, { "epoch": 0.43, "learning_rate": 1.2671534329988197e-05, "loss": 0.738, "step": 3964 }, { "epoch": 0.43, "learning_rate": 1.2668136399296907e-05, "loss": 0.7102, "step": 3965 }, { "epoch": 0.43, "learning_rate": 1.266473813690035e-05, "loss": 0.8096, "step": 3966 }, { "epoch": 0.43, "learning_rate": 1.266133954322101e-05, "loss": 0.6628, "step": 3967 }, { "epoch": 0.43, "learning_rate": 1.2657940618681402e-05, "loss": 0.7422, "step": 3968 }, { "epoch": 0.43, "learning_rate": 1.2654541363704077e-05, "loss": 0.7188, "step": 3969 }, { "epoch": 0.43, "learning_rate": 1.2651141778711638e-05, "loss": 0.6631, "step": 3970 }, { "epoch": 0.43, "learning_rate": 1.2647741864126727e-05, "loss": 0.6821, "step": 3971 }, { "epoch": 0.43, "learning_rate": 1.2644341620372025e-05, "loss": 0.7822, "step": 3972 }, { "epoch": 0.43, "learning_rate": 1.2640941047870245e-05, "loss": 0.6958, "step": 3973 }, { "epoch": 0.43, "learning_rate": 1.263754014704416e-05, "loss": 0.6104, "step": 3974 }, { "epoch": 0.43, "learning_rate": 1.2634138918316567e-05, "loss": 0.7031, "step": 3975 }, { "epoch": 0.43, "learning_rate": 1.2630737362110314e-05, "loss": 0.7761, "step": 3976 }, { "epoch": 0.43, "learning_rate": 1.2627335478848282e-05, "loss": 0.7039, "step": 3977 }, { "epoch": 0.43, "learning_rate": 1.2623933268953396e-05, "loss": 0.653, "step": 3978 }, { "epoch": 0.43, "learning_rate": 1.2620530732848626e-05, "loss": 0.751, "step": 3979 }, { "epoch": 0.43, "learning_rate": 1.2617127870956975e-05, "loss": 0.7, "step": 3980 }, { "epoch": 0.43, "learning_rate": 1.2613724683701491e-05, "loss": 0.8032, "step": 3981 }, { "epoch": 0.43, "learning_rate": 1.2610321171505264e-05, "loss": 0.7043, "step": 3982 }, { "epoch": 0.43, "learning_rate": 1.2606917334791415e-05, "loss": 0.7988, "step": 3983 }, { "epoch": 0.43, "learning_rate": 1.2603513173983121e-05, "loss": 0.6711, "step": 3984 }, { "epoch": 0.43, "learning_rate": 1.2600108689503584e-05, "loss": 0.7087, "step": 3985 }, { "epoch": 0.43, "learning_rate": 1.259670388177606e-05, "loss": 1.0559, "step": 3986 }, { "epoch": 0.43, "learning_rate": 1.259329875122383e-05, "loss": 0.728, "step": 3987 }, { "epoch": 0.43, "learning_rate": 1.2589893298270223e-05, "loss": 0.72, "step": 3988 }, { "epoch": 0.43, "learning_rate": 1.2586487523338615e-05, "loss": 0.5984, "step": 3989 }, { "epoch": 0.43, "learning_rate": 1.2583081426852412e-05, "loss": 0.8052, "step": 3990 }, { "epoch": 0.43, "learning_rate": 1.2579675009235062e-05, "loss": 0.7607, "step": 3991 }, { "epoch": 0.43, "learning_rate": 1.2576268270910052e-05, "loss": 0.6631, "step": 3992 }, { "epoch": 0.43, "learning_rate": 1.2572861212300917e-05, "loss": 0.6702, "step": 3993 }, { "epoch": 0.43, "learning_rate": 1.2569453833831222e-05, "loss": 0.7085, "step": 3994 }, { "epoch": 0.43, "learning_rate": 1.2566046135924577e-05, "loss": 0.709, "step": 3995 }, { "epoch": 0.44, "learning_rate": 1.2562638119004627e-05, "loss": 0.8101, "step": 3996 }, { "epoch": 0.44, "learning_rate": 1.2559229783495064e-05, "loss": 0.7317, "step": 3997 }, { "epoch": 0.44, "learning_rate": 1.2555821129819612e-05, "loss": 0.7056, "step": 3998 }, { "epoch": 0.44, "learning_rate": 1.2552412158402044e-05, "loss": 0.8052, "step": 3999 }, { "epoch": 0.44, "learning_rate": 1.2549002869666156e-05, "loss": 0.7473, "step": 4000 }, { "epoch": 0.44, "learning_rate": 1.2545593264035804e-05, "loss": 0.6821, "step": 4001 }, { "epoch": 0.44, "learning_rate": 1.2542183341934873e-05, "loss": 0.7312, "step": 4002 }, { "epoch": 0.44, "learning_rate": 1.2538773103787278e-05, "loss": 0.8091, "step": 4003 }, { "epoch": 0.44, "learning_rate": 1.2535362550016993e-05, "loss": 0.7981, "step": 4004 }, { "epoch": 0.44, "learning_rate": 1.253195168104802e-05, "loss": 1.1033, "step": 4005 }, { "epoch": 0.44, "learning_rate": 1.2528540497304398e-05, "loss": 0.7083, "step": 4006 }, { "epoch": 0.44, "learning_rate": 1.2525128999210207e-05, "loss": 0.7729, "step": 4007 }, { "epoch": 0.44, "learning_rate": 1.2521717187189572e-05, "loss": 0.7598, "step": 4008 }, { "epoch": 0.44, "learning_rate": 1.2518305061666655e-05, "loss": 0.6575, "step": 4009 }, { "epoch": 0.44, "learning_rate": 1.2514892623065648e-05, "loss": 0.6448, "step": 4010 }, { "epoch": 0.44, "learning_rate": 1.2511479871810792e-05, "loss": 0.8345, "step": 4011 }, { "epoch": 0.44, "learning_rate": 1.2508066808326364e-05, "loss": 0.7544, "step": 4012 }, { "epoch": 0.44, "learning_rate": 1.250465343303668e-05, "loss": 0.7107, "step": 4013 }, { "epoch": 0.44, "learning_rate": 1.2501239746366092e-05, "loss": 0.7268, "step": 4014 }, { "epoch": 0.44, "learning_rate": 1.2497825748738991e-05, "loss": 0.7358, "step": 4015 }, { "epoch": 0.44, "learning_rate": 1.2494411440579814e-05, "loss": 0.7588, "step": 4016 }, { "epoch": 0.44, "learning_rate": 1.2490996822313026e-05, "loss": 0.6716, "step": 4017 }, { "epoch": 0.44, "learning_rate": 1.248758189436314e-05, "loss": 0.7354, "step": 4018 }, { "epoch": 0.44, "learning_rate": 1.2484166657154696e-05, "loss": 0.606, "step": 4019 }, { "epoch": 0.44, "learning_rate": 1.248075111111229e-05, "loss": 0.6875, "step": 4020 }, { "epoch": 0.44, "learning_rate": 1.2477335256660538e-05, "loss": 0.6233, "step": 4021 }, { "epoch": 0.44, "learning_rate": 1.2473919094224102e-05, "loss": 0.6887, "step": 4022 }, { "epoch": 0.44, "learning_rate": 1.2470502624227687e-05, "loss": 0.7307, "step": 4023 }, { "epoch": 0.44, "learning_rate": 1.246708584709603e-05, "loss": 0.6909, "step": 4024 }, { "epoch": 0.44, "learning_rate": 1.246366876325391e-05, "loss": 0.7529, "step": 4025 }, { "epoch": 0.44, "learning_rate": 1.2460251373126136e-05, "loss": 0.7073, "step": 4026 }, { "epoch": 0.44, "learning_rate": 1.2456833677137563e-05, "loss": 0.8774, "step": 4027 }, { "epoch": 0.44, "learning_rate": 1.245341567571309e-05, "loss": 0.7065, "step": 4028 }, { "epoch": 0.44, "learning_rate": 1.244999736927764e-05, "loss": 0.6665, "step": 4029 }, { "epoch": 0.44, "learning_rate": 1.2446578758256176e-05, "loss": 0.6936, "step": 4030 }, { "epoch": 0.44, "learning_rate": 1.2443159843073711e-05, "loss": 0.751, "step": 4031 }, { "epoch": 0.44, "learning_rate": 1.2439740624155285e-05, "loss": 0.637, "step": 4032 }, { "epoch": 0.44, "learning_rate": 1.2436321101925977e-05, "loss": 0.7075, "step": 4033 }, { "epoch": 0.44, "learning_rate": 1.2432901276810908e-05, "loss": 0.8018, "step": 4034 }, { "epoch": 0.44, "learning_rate": 1.242948114923523e-05, "loss": 0.8335, "step": 4035 }, { "epoch": 0.44, "learning_rate": 1.2426060719624139e-05, "loss": 0.6956, "step": 4036 }, { "epoch": 0.44, "learning_rate": 1.2422639988402865e-05, "loss": 0.6873, "step": 4037 }, { "epoch": 0.44, "learning_rate": 1.2419218955996677e-05, "loss": 0.7476, "step": 4038 }, { "epoch": 0.44, "learning_rate": 1.2415797622830886e-05, "loss": 0.7285, "step": 4039 }, { "epoch": 0.44, "learning_rate": 1.2412375989330826e-05, "loss": 0.7114, "step": 4040 }, { "epoch": 0.44, "learning_rate": 1.2408954055921884e-05, "loss": 0.6838, "step": 4041 }, { "epoch": 0.44, "learning_rate": 1.2405531823029475e-05, "loss": 0.717, "step": 4042 }, { "epoch": 0.44, "learning_rate": 1.2402109291079058e-05, "loss": 0.7344, "step": 4043 }, { "epoch": 0.44, "learning_rate": 1.2398686460496123e-05, "loss": 0.7061, "step": 4044 }, { "epoch": 0.44, "learning_rate": 1.2395263331706202e-05, "loss": 0.7217, "step": 4045 }, { "epoch": 0.44, "learning_rate": 1.2391839905134853e-05, "loss": 0.7998, "step": 4046 }, { "epoch": 0.44, "learning_rate": 1.238841618120769e-05, "loss": 0.73, "step": 4047 }, { "epoch": 0.44, "learning_rate": 1.2384992160350351e-05, "loss": 0.6685, "step": 4048 }, { "epoch": 0.44, "learning_rate": 1.238156784298851e-05, "loss": 0.7285, "step": 4049 }, { "epoch": 0.44, "learning_rate": 1.237814322954788e-05, "loss": 0.71, "step": 4050 }, { "epoch": 0.44, "learning_rate": 1.2374718320454222e-05, "loss": 0.7065, "step": 4051 }, { "epoch": 0.44, "learning_rate": 1.2371293116133318e-05, "loss": 0.8115, "step": 4052 }, { "epoch": 0.44, "learning_rate": 1.236786761701099e-05, "loss": 0.7371, "step": 4053 }, { "epoch": 0.44, "learning_rate": 1.2364441823513102e-05, "loss": 0.8247, "step": 4054 }, { "epoch": 0.44, "learning_rate": 1.2361015736065551e-05, "loss": 0.7104, "step": 4055 }, { "epoch": 0.44, "learning_rate": 1.2357589355094275e-05, "loss": 0.6948, "step": 4056 }, { "epoch": 0.44, "learning_rate": 1.2354162681025237e-05, "loss": 0.8032, "step": 4057 }, { "epoch": 0.44, "learning_rate": 1.2350735714284454e-05, "loss": 0.6472, "step": 4058 }, { "epoch": 0.44, "learning_rate": 1.2347308455297966e-05, "loss": 0.7354, "step": 4059 }, { "epoch": 0.44, "learning_rate": 1.2343880904491846e-05, "loss": 0.8083, "step": 4060 }, { "epoch": 0.44, "learning_rate": 1.2340453062292222e-05, "loss": 0.7744, "step": 4061 }, { "epoch": 0.44, "learning_rate": 1.233702492912524e-05, "loss": 0.6345, "step": 4062 }, { "epoch": 0.44, "learning_rate": 1.2333596505417093e-05, "loss": 0.8115, "step": 4063 }, { "epoch": 0.44, "learning_rate": 1.2330167791594001e-05, "loss": 0.8286, "step": 4064 }, { "epoch": 0.44, "learning_rate": 1.2326738788082225e-05, "loss": 0.8013, "step": 4065 }, { "epoch": 0.44, "learning_rate": 1.2323309495308066e-05, "loss": 0.6768, "step": 4066 }, { "epoch": 0.44, "learning_rate": 1.2319879913697857e-05, "loss": 0.6882, "step": 4067 }, { "epoch": 0.44, "learning_rate": 1.2316450043677962e-05, "loss": 0.6345, "step": 4068 }, { "epoch": 0.44, "learning_rate": 1.2313019885674786e-05, "loss": 0.7979, "step": 4069 }, { "epoch": 0.44, "learning_rate": 1.2309589440114775e-05, "loss": 0.7944, "step": 4070 }, { "epoch": 0.44, "learning_rate": 1.2306158707424402e-05, "loss": 0.729, "step": 4071 }, { "epoch": 0.44, "learning_rate": 1.2302727688030181e-05, "loss": 0.8062, "step": 4072 }, { "epoch": 0.44, "learning_rate": 1.2299296382358657e-05, "loss": 0.7798, "step": 4073 }, { "epoch": 0.44, "learning_rate": 1.2295864790836411e-05, "loss": 0.7749, "step": 4074 }, { "epoch": 0.44, "learning_rate": 1.229243291389007e-05, "loss": 0.6401, "step": 4075 }, { "epoch": 0.44, "learning_rate": 1.228900075194628e-05, "loss": 0.75, "step": 4076 }, { "epoch": 0.44, "learning_rate": 1.2285568305431735e-05, "loss": 0.7515, "step": 4077 }, { "epoch": 0.44, "learning_rate": 1.2282135574773157e-05, "loss": 0.7646, "step": 4078 }, { "epoch": 0.44, "learning_rate": 1.2278702560397307e-05, "loss": 0.5808, "step": 4079 }, { "epoch": 0.44, "learning_rate": 1.2275269262730982e-05, "loss": 0.8008, "step": 4080 }, { "epoch": 0.44, "learning_rate": 1.2271835682201016e-05, "loss": 0.6958, "step": 4081 }, { "epoch": 0.44, "learning_rate": 1.226840181923427e-05, "loss": 0.7249, "step": 4082 }, { "epoch": 0.44, "learning_rate": 1.2264967674257647e-05, "loss": 0.7161, "step": 4083 }, { "epoch": 0.44, "learning_rate": 1.2261533247698078e-05, "loss": 0.8159, "step": 4084 }, { "epoch": 0.44, "learning_rate": 1.2258098539982543e-05, "loss": 0.77, "step": 4085 }, { "epoch": 0.44, "learning_rate": 1.2254663551538047e-05, "loss": 0.7649, "step": 4086 }, { "epoch": 0.44, "learning_rate": 1.2251228282791625e-05, "loss": 0.7769, "step": 4087 }, { "epoch": 0.45, "learning_rate": 1.2247792734170357e-05, "loss": 0.8037, "step": 4088 }, { "epoch": 0.45, "learning_rate": 1.224435690610135e-05, "loss": 0.5754, "step": 4089 }, { "epoch": 0.45, "learning_rate": 1.2240920799011752e-05, "loss": 0.7456, "step": 4090 }, { "epoch": 0.45, "learning_rate": 1.2237484413328746e-05, "loss": 0.7783, "step": 4091 }, { "epoch": 0.45, "learning_rate": 1.2234047749479543e-05, "loss": 0.6714, "step": 4092 }, { "epoch": 0.45, "learning_rate": 1.2230610807891394e-05, "loss": 0.7639, "step": 4093 }, { "epoch": 0.45, "learning_rate": 1.2227173588991583e-05, "loss": 0.7783, "step": 4094 }, { "epoch": 0.45, "learning_rate": 1.2223736093207424e-05, "loss": 0.7043, "step": 4095 }, { "epoch": 0.45, "learning_rate": 1.2220298320966278e-05, "loss": 0.7476, "step": 4096 }, { "epoch": 0.45, "learning_rate": 1.2216860272695526e-05, "loss": 0.811, "step": 4097 }, { "epoch": 0.45, "learning_rate": 1.2213421948822589e-05, "loss": 0.8281, "step": 4098 }, { "epoch": 0.45, "learning_rate": 1.2209983349774924e-05, "loss": 0.877, "step": 4099 }, { "epoch": 0.45, "learning_rate": 1.2206544475980022e-05, "loss": 0.6318, "step": 4100 }, { "epoch": 0.45, "learning_rate": 1.2203105327865407e-05, "loss": 0.8647, "step": 4101 }, { "epoch": 0.45, "learning_rate": 1.219966590585864e-05, "loss": 0.7278, "step": 4102 }, { "epoch": 0.45, "learning_rate": 1.2196226210387303e-05, "loss": 0.6997, "step": 4103 }, { "epoch": 0.45, "learning_rate": 1.2192786241879033e-05, "loss": 0.6724, "step": 4104 }, { "epoch": 0.45, "learning_rate": 1.2189346000761489e-05, "loss": 0.7754, "step": 4105 }, { "epoch": 0.45, "learning_rate": 1.2185905487462359e-05, "loss": 0.8008, "step": 4106 }, { "epoch": 0.45, "learning_rate": 1.2182464702409375e-05, "loss": 0.7227, "step": 4107 }, { "epoch": 0.45, "learning_rate": 1.2179023646030297e-05, "loss": 0.6318, "step": 4108 }, { "epoch": 0.45, "learning_rate": 1.2175582318752923e-05, "loss": 0.6377, "step": 4109 }, { "epoch": 0.45, "learning_rate": 1.217214072100508e-05, "loss": 0.7273, "step": 4110 }, { "epoch": 0.45, "learning_rate": 1.2168698853214628e-05, "loss": 0.7188, "step": 4111 }, { "epoch": 0.45, "learning_rate": 1.216525671580947e-05, "loss": 0.8022, "step": 4112 }, { "epoch": 0.45, "learning_rate": 1.2161814309217532e-05, "loss": 0.6956, "step": 4113 }, { "epoch": 0.45, "learning_rate": 1.2158371633866777e-05, "loss": 0.7256, "step": 4114 }, { "epoch": 0.45, "learning_rate": 1.2154928690185201e-05, "loss": 0.6604, "step": 4115 }, { "epoch": 0.45, "learning_rate": 1.215148547860084e-05, "loss": 0.7097, "step": 4116 }, { "epoch": 0.45, "learning_rate": 1.2148041999541746e-05, "loss": 0.646, "step": 4117 }, { "epoch": 0.45, "learning_rate": 1.2144598253436024e-05, "loss": 0.7378, "step": 4118 }, { "epoch": 0.45, "learning_rate": 1.2141154240711806e-05, "loss": 0.7856, "step": 4119 }, { "epoch": 0.45, "learning_rate": 1.2137709961797248e-05, "loss": 0.7261, "step": 4120 }, { "epoch": 0.45, "learning_rate": 1.2134265417120549e-05, "loss": 0.7576, "step": 4121 }, { "epoch": 0.45, "learning_rate": 1.2130820607109937e-05, "loss": 0.7625, "step": 4122 }, { "epoch": 0.45, "learning_rate": 1.2127375532193674e-05, "loss": 0.6621, "step": 4123 }, { "epoch": 0.45, "learning_rate": 1.2123930192800062e-05, "loss": 0.8237, "step": 4124 }, { "epoch": 0.45, "learning_rate": 1.212048458935742e-05, "loss": 0.6665, "step": 4125 }, { "epoch": 0.45, "learning_rate": 1.211703872229411e-05, "loss": 0.7295, "step": 4126 }, { "epoch": 0.45, "learning_rate": 1.2113592592038525e-05, "loss": 0.7173, "step": 4127 }, { "epoch": 0.45, "learning_rate": 1.2110146199019099e-05, "loss": 0.6577, "step": 4128 }, { "epoch": 0.45, "learning_rate": 1.2106699543664282e-05, "loss": 0.6438, "step": 4129 }, { "epoch": 0.45, "learning_rate": 1.210325262640257e-05, "loss": 0.7014, "step": 4130 }, { "epoch": 0.45, "learning_rate": 1.2099805447662485e-05, "loss": 0.7029, "step": 4131 }, { "epoch": 0.45, "learning_rate": 1.2096358007872583e-05, "loss": 0.6726, "step": 4132 }, { "epoch": 0.45, "learning_rate": 1.2092910307461457e-05, "loss": 0.7183, "step": 4133 }, { "epoch": 0.45, "learning_rate": 1.2089462346857725e-05, "loss": 0.717, "step": 4134 }, { "epoch": 0.45, "learning_rate": 1.2086014126490041e-05, "loss": 0.6926, "step": 4135 }, { "epoch": 0.45, "learning_rate": 1.2082565646787092e-05, "loss": 0.7209, "step": 4136 }, { "epoch": 0.45, "learning_rate": 1.2079116908177592e-05, "loss": 0.7266, "step": 4137 }, { "epoch": 0.45, "learning_rate": 1.20756679110903e-05, "loss": 0.769, "step": 4138 }, { "epoch": 0.45, "learning_rate": 1.2072218655953995e-05, "loss": 0.7646, "step": 4139 }, { "epoch": 0.45, "learning_rate": 1.2068769143197488e-05, "loss": 0.8018, "step": 4140 }, { "epoch": 0.45, "learning_rate": 1.2065319373249627e-05, "loss": 0.7402, "step": 4141 }, { "epoch": 0.45, "learning_rate": 1.2061869346539292e-05, "loss": 0.7327, "step": 4142 }, { "epoch": 0.45, "learning_rate": 1.2058419063495397e-05, "loss": 0.7964, "step": 4143 }, { "epoch": 0.45, "learning_rate": 1.2054968524546879e-05, "loss": 0.7944, "step": 4144 }, { "epoch": 0.45, "learning_rate": 1.2051517730122715e-05, "loss": 0.6746, "step": 4145 }, { "epoch": 0.45, "learning_rate": 1.2048066680651908e-05, "loss": 0.6414, "step": 4146 }, { "epoch": 0.45, "learning_rate": 1.20446153765635e-05, "loss": 0.7144, "step": 4147 }, { "epoch": 0.45, "learning_rate": 1.2041163818286558e-05, "loss": 0.7656, "step": 4148 }, { "epoch": 0.45, "learning_rate": 1.2037712006250184e-05, "loss": 0.7539, "step": 4149 }, { "epoch": 0.45, "learning_rate": 1.2034259940883512e-05, "loss": 0.8452, "step": 4150 }, { "epoch": 0.45, "learning_rate": 1.20308076226157e-05, "loss": 0.8315, "step": 4151 }, { "epoch": 0.45, "learning_rate": 1.2027355051875951e-05, "loss": 0.79, "step": 4152 }, { "epoch": 0.45, "learning_rate": 1.2023902229093487e-05, "loss": 0.6357, "step": 4153 }, { "epoch": 0.45, "learning_rate": 1.2020449154697571e-05, "loss": 0.6372, "step": 4154 }, { "epoch": 0.45, "learning_rate": 1.2016995829117489e-05, "loss": 0.6411, "step": 4155 }, { "epoch": 0.45, "learning_rate": 1.2013542252782556e-05, "loss": 0.7371, "step": 4156 }, { "epoch": 0.45, "learning_rate": 1.2010088426122133e-05, "loss": 0.7402, "step": 4157 }, { "epoch": 0.45, "learning_rate": 1.2006634349565602e-05, "loss": 0.7126, "step": 4158 }, { "epoch": 0.45, "learning_rate": 1.2003180023542375e-05, "loss": 0.7778, "step": 4159 }, { "epoch": 0.45, "learning_rate": 1.1999725448481894e-05, "loss": 0.7827, "step": 4160 }, { "epoch": 0.45, "learning_rate": 1.1996270624813642e-05, "loss": 0.7681, "step": 4161 }, { "epoch": 0.45, "learning_rate": 1.199281555296712e-05, "loss": 0.8149, "step": 4162 }, { "epoch": 0.45, "learning_rate": 1.198936023337187e-05, "loss": 0.6528, "step": 4163 }, { "epoch": 0.45, "learning_rate": 1.1985904666457455e-05, "loss": 0.7151, "step": 4164 }, { "epoch": 0.45, "learning_rate": 1.198244885265348e-05, "loss": 0.752, "step": 4165 }, { "epoch": 0.45, "learning_rate": 1.1978992792389574e-05, "loss": 0.8003, "step": 4166 }, { "epoch": 0.45, "learning_rate": 1.1975536486095396e-05, "loss": 0.7969, "step": 4167 }, { "epoch": 0.45, "learning_rate": 1.197207993420064e-05, "loss": 0.8037, "step": 4168 }, { "epoch": 0.45, "learning_rate": 1.1968623137135024e-05, "loss": 0.6611, "step": 4169 }, { "epoch": 0.45, "learning_rate": 1.1965166095328302e-05, "loss": 0.8359, "step": 4170 }, { "epoch": 0.45, "learning_rate": 1.1961708809210258e-05, "loss": 0.717, "step": 4171 }, { "epoch": 0.45, "learning_rate": 1.1958251279210704e-05, "loss": 0.7842, "step": 4172 }, { "epoch": 0.45, "learning_rate": 1.1954793505759484e-05, "loss": 0.7942, "step": 4173 }, { "epoch": 0.45, "learning_rate": 1.195133548928647e-05, "loss": 0.7019, "step": 4174 }, { "epoch": 0.45, "learning_rate": 1.1947877230221565e-05, "loss": 0.8013, "step": 4175 }, { "epoch": 0.45, "learning_rate": 1.194441872899471e-05, "loss": 0.7954, "step": 4176 }, { "epoch": 0.45, "learning_rate": 1.1940959986035863e-05, "loss": 0.5474, "step": 4177 }, { "epoch": 0.45, "learning_rate": 1.193750100177502e-05, "loss": 0.6494, "step": 4178 }, { "epoch": 0.45, "learning_rate": 1.19340417766422e-05, "loss": 0.696, "step": 4179 }, { "epoch": 0.46, "learning_rate": 1.1930582311067468e-05, "loss": 0.7881, "step": 4180 }, { "epoch": 0.46, "learning_rate": 1.1927122605480899e-05, "loss": 0.7368, "step": 4181 }, { "epoch": 0.46, "learning_rate": 1.1923662660312611e-05, "loss": 0.6782, "step": 4182 }, { "epoch": 0.46, "learning_rate": 1.1920202475992743e-05, "loss": 0.7869, "step": 4183 }, { "epoch": 0.46, "learning_rate": 1.1916742052951476e-05, "loss": 0.7424, "step": 4184 }, { "epoch": 0.46, "learning_rate": 1.191328139161901e-05, "loss": 0.7244, "step": 4185 }, { "epoch": 0.46, "learning_rate": 1.1909820492425574e-05, "loss": 0.6519, "step": 4186 }, { "epoch": 0.46, "learning_rate": 1.1906359355801434e-05, "loss": 0.7241, "step": 4187 }, { "epoch": 0.46, "learning_rate": 1.1902897982176882e-05, "loss": 0.6663, "step": 4188 }, { "epoch": 0.46, "learning_rate": 1.1899436371982235e-05, "loss": 0.7258, "step": 4189 }, { "epoch": 0.46, "learning_rate": 1.1895974525647849e-05, "loss": 0.6558, "step": 4190 }, { "epoch": 0.46, "learning_rate": 1.1892512443604103e-05, "loss": 0.7549, "step": 4191 }, { "epoch": 0.46, "learning_rate": 1.1889050126281405e-05, "loss": 0.7549, "step": 4192 }, { "epoch": 0.46, "learning_rate": 1.1885587574110195e-05, "loss": 0.7285, "step": 4193 }, { "epoch": 0.46, "learning_rate": 1.1882124787520934e-05, "loss": 0.6951, "step": 4194 }, { "epoch": 0.46, "learning_rate": 1.187866176694413e-05, "loss": 0.6333, "step": 4195 }, { "epoch": 0.46, "learning_rate": 1.1875198512810301e-05, "loss": 0.7375, "step": 4196 }, { "epoch": 0.46, "learning_rate": 1.1871735025550008e-05, "loss": 0.6143, "step": 4197 }, { "epoch": 0.46, "learning_rate": 1.1868271305593828e-05, "loss": 0.689, "step": 4198 }, { "epoch": 0.46, "learning_rate": 1.1864807353372379e-05, "loss": 0.8347, "step": 4199 }, { "epoch": 0.46, "learning_rate": 1.1861343169316301e-05, "loss": 0.7788, "step": 4200 }, { "epoch": 0.46, "learning_rate": 1.1857878753856267e-05, "loss": 0.6846, "step": 4201 }, { "epoch": 0.46, "learning_rate": 1.1854414107422971e-05, "loss": 0.8376, "step": 4202 }, { "epoch": 0.46, "learning_rate": 1.1850949230447146e-05, "loss": 0.7051, "step": 4203 }, { "epoch": 0.46, "learning_rate": 1.184748412335955e-05, "loss": 0.6821, "step": 4204 }, { "epoch": 0.46, "learning_rate": 1.1844018786590964e-05, "loss": 0.7886, "step": 4205 }, { "epoch": 0.46, "learning_rate": 1.1840553220572204e-05, "loss": 0.6755, "step": 4206 }, { "epoch": 0.46, "learning_rate": 1.1837087425734114e-05, "loss": 0.7539, "step": 4207 }, { "epoch": 0.46, "learning_rate": 1.1833621402507562e-05, "loss": 0.6511, "step": 4208 }, { "epoch": 0.46, "learning_rate": 1.1830155151323447e-05, "loss": 0.7876, "step": 4209 }, { "epoch": 0.46, "learning_rate": 1.18266886726127e-05, "loss": 0.7002, "step": 4210 }, { "epoch": 0.46, "learning_rate": 1.1823221966806277e-05, "loss": 0.6531, "step": 4211 }, { "epoch": 0.46, "learning_rate": 1.181975503433516e-05, "loss": 0.7161, "step": 4212 }, { "epoch": 0.46, "learning_rate": 1.1816287875630357e-05, "loss": 0.8457, "step": 4213 }, { "epoch": 0.46, "learning_rate": 1.1812820491122918e-05, "loss": 0.6665, "step": 4214 }, { "epoch": 0.46, "learning_rate": 1.1809352881243904e-05, "loss": 0.6479, "step": 4215 }, { "epoch": 0.46, "learning_rate": 1.180588504642442e-05, "loss": 0.6614, "step": 4216 }, { "epoch": 0.46, "learning_rate": 1.1802416987095579e-05, "loss": 0.7424, "step": 4217 }, { "epoch": 0.46, "learning_rate": 1.179894870368854e-05, "loss": 0.8018, "step": 4218 }, { "epoch": 0.46, "learning_rate": 1.1795480196634483e-05, "loss": 0.7827, "step": 4219 }, { "epoch": 0.46, "learning_rate": 1.179201146636462e-05, "loss": 0.6296, "step": 4220 }, { "epoch": 0.46, "learning_rate": 1.1788542513310178e-05, "loss": 0.6953, "step": 4221 }, { "epoch": 0.46, "learning_rate": 1.1785073337902425e-05, "loss": 0.7915, "step": 4222 }, { "epoch": 0.46, "learning_rate": 1.1781603940572653e-05, "loss": 0.7422, "step": 4223 }, { "epoch": 0.46, "learning_rate": 1.1778134321752182e-05, "loss": 0.7087, "step": 4224 }, { "epoch": 0.46, "learning_rate": 1.1774664481872354e-05, "loss": 0.6785, "step": 4225 }, { "epoch": 0.46, "learning_rate": 1.1771194421364546e-05, "loss": 0.7175, "step": 4226 }, { "epoch": 0.46, "learning_rate": 1.1767724140660158e-05, "loss": 0.7834, "step": 4227 }, { "epoch": 0.46, "learning_rate": 1.1764253640190619e-05, "loss": 0.6929, "step": 4228 }, { "epoch": 0.46, "learning_rate": 1.1760782920387386e-05, "loss": 0.7461, "step": 4229 }, { "epoch": 0.46, "learning_rate": 1.1757311981681943e-05, "loss": 0.7505, "step": 4230 }, { "epoch": 0.46, "learning_rate": 1.1753840824505798e-05, "loss": 0.71, "step": 4231 }, { "epoch": 0.46, "learning_rate": 1.1750369449290484e-05, "loss": 0.6108, "step": 4232 }, { "epoch": 0.46, "learning_rate": 1.1746897856467574e-05, "loss": 0.7163, "step": 4233 }, { "epoch": 0.46, "learning_rate": 1.174342604646866e-05, "loss": 0.6841, "step": 4234 }, { "epoch": 0.46, "learning_rate": 1.1739954019725355e-05, "loss": 0.6873, "step": 4235 }, { "epoch": 0.46, "learning_rate": 1.1736481776669307e-05, "loss": 0.7451, "step": 4236 }, { "epoch": 0.46, "learning_rate": 1.1733009317732185e-05, "loss": 0.72, "step": 4237 }, { "epoch": 0.46, "learning_rate": 1.1729536643345696e-05, "loss": 0.7812, "step": 4238 }, { "epoch": 0.46, "learning_rate": 1.1726063753941563e-05, "loss": 0.7524, "step": 4239 }, { "epoch": 0.46, "learning_rate": 1.1722590649951534e-05, "loss": 0.7651, "step": 4240 }, { "epoch": 0.46, "learning_rate": 1.1719117331807397e-05, "loss": 0.832, "step": 4241 }, { "epoch": 0.46, "learning_rate": 1.171564379994095e-05, "loss": 0.7822, "step": 4242 }, { "epoch": 0.46, "learning_rate": 1.1712170054784033e-05, "loss": 0.7847, "step": 4243 }, { "epoch": 0.46, "learning_rate": 1.1708696096768499e-05, "loss": 0.7271, "step": 4244 }, { "epoch": 0.46, "learning_rate": 1.170522192632624e-05, "loss": 0.7251, "step": 4245 }, { "epoch": 0.46, "learning_rate": 1.1701747543889161e-05, "loss": 0.6929, "step": 4246 }, { "epoch": 0.46, "learning_rate": 1.1698272949889206e-05, "loss": 0.6855, "step": 4247 }, { "epoch": 0.46, "learning_rate": 1.1694798144758342e-05, "loss": 0.6438, "step": 4248 }, { "epoch": 0.46, "learning_rate": 1.1691323128928554e-05, "loss": 0.6982, "step": 4249 }, { "epoch": 0.46, "learning_rate": 1.1687847902831861e-05, "loss": 0.7749, "step": 4250 }, { "epoch": 0.46, "learning_rate": 1.1684372466900306e-05, "loss": 0.7998, "step": 4251 }, { "epoch": 0.46, "learning_rate": 1.168089682156596e-05, "loss": 0.7229, "step": 4252 }, { "epoch": 0.46, "learning_rate": 1.1677420967260921e-05, "loss": 0.6902, "step": 4253 }, { "epoch": 0.46, "learning_rate": 1.1673944904417309e-05, "loss": 0.6531, "step": 4254 }, { "epoch": 0.46, "learning_rate": 1.1670468633467266e-05, "loss": 0.7637, "step": 4255 }, { "epoch": 0.46, "learning_rate": 1.166699215484297e-05, "loss": 0.6929, "step": 4256 }, { "epoch": 0.46, "learning_rate": 1.166351546897662e-05, "loss": 0.6526, "step": 4257 }, { "epoch": 0.46, "learning_rate": 1.1660038576300444e-05, "loss": 0.73, "step": 4258 }, { "epoch": 0.46, "learning_rate": 1.1656561477246683e-05, "loss": 0.7305, "step": 4259 }, { "epoch": 0.46, "learning_rate": 1.1653084172247624e-05, "loss": 0.6855, "step": 4260 }, { "epoch": 0.46, "learning_rate": 1.1649606661735561e-05, "loss": 0.7954, "step": 4261 }, { "epoch": 0.46, "learning_rate": 1.1646128946142827e-05, "loss": 0.7109, "step": 4262 }, { "epoch": 0.46, "learning_rate": 1.1642651025901772e-05, "loss": 0.7839, "step": 4263 }, { "epoch": 0.46, "learning_rate": 1.1639172901444775e-05, "loss": 0.7346, "step": 4264 }, { "epoch": 0.46, "learning_rate": 1.1635694573204239e-05, "loss": 0.6252, "step": 4265 }, { "epoch": 0.46, "learning_rate": 1.1632216041612595e-05, "loss": 0.8169, "step": 4266 }, { "epoch": 0.46, "learning_rate": 1.1628737307102295e-05, "loss": 0.8076, "step": 4267 }, { "epoch": 0.46, "learning_rate": 1.162525837010582e-05, "loss": 0.6804, "step": 4268 }, { "epoch": 0.46, "learning_rate": 1.1621779231055677e-05, "loss": 0.7607, "step": 4269 }, { "epoch": 0.46, "learning_rate": 1.1618299890384387e-05, "loss": 0.7466, "step": 4270 }, { "epoch": 0.46, "learning_rate": 1.1614820348524517e-05, "loss": 0.7192, "step": 4271 }, { "epoch": 0.47, "learning_rate": 1.1611340605908643e-05, "loss": 0.6917, "step": 4272 }, { "epoch": 0.47, "learning_rate": 1.1607860662969366e-05, "loss": 0.6802, "step": 4273 }, { "epoch": 0.47, "learning_rate": 1.1604380520139315e-05, "loss": 0.6187, "step": 4274 }, { "epoch": 0.47, "learning_rate": 1.1600900177851152e-05, "loss": 0.7329, "step": 4275 }, { "epoch": 0.47, "learning_rate": 1.159741963653755e-05, "loss": 0.5293, "step": 4276 }, { "epoch": 0.47, "learning_rate": 1.1593938896631215e-05, "loss": 0.7483, "step": 4277 }, { "epoch": 0.47, "learning_rate": 1.1590457958564878e-05, "loss": 0.7124, "step": 4278 }, { "epoch": 0.47, "learning_rate": 1.158697682277129e-05, "loss": 0.7134, "step": 4279 }, { "epoch": 0.47, "learning_rate": 1.158349548968323e-05, "loss": 0.636, "step": 4280 }, { "epoch": 0.47, "learning_rate": 1.15800139597335e-05, "loss": 0.7256, "step": 4281 }, { "epoch": 0.47, "learning_rate": 1.1576532233354928e-05, "loss": 0.8125, "step": 4282 }, { "epoch": 0.47, "learning_rate": 1.1573050310980367e-05, "loss": 0.644, "step": 4283 }, { "epoch": 0.47, "learning_rate": 1.156956819304269e-05, "loss": 0.7664, "step": 4284 }, { "epoch": 0.47, "learning_rate": 1.1566085879974797e-05, "loss": 0.707, "step": 4285 }, { "epoch": 0.47, "learning_rate": 1.1562603372209616e-05, "loss": 0.8042, "step": 4286 }, { "epoch": 0.47, "learning_rate": 1.1559120670180095e-05, "loss": 0.6929, "step": 4287 }, { "epoch": 0.47, "learning_rate": 1.1555637774319203e-05, "loss": 0.7949, "step": 4288 }, { "epoch": 0.47, "learning_rate": 1.1552154685059938e-05, "loss": 0.7461, "step": 4289 }, { "epoch": 0.47, "learning_rate": 1.1548671402835325e-05, "loss": 0.8125, "step": 4290 }, { "epoch": 0.47, "learning_rate": 1.1545187928078407e-05, "loss": 0.6975, "step": 4291 }, { "epoch": 0.47, "learning_rate": 1.1541704261222251e-05, "loss": 1.1091, "step": 4292 }, { "epoch": 0.47, "learning_rate": 1.1538220402699952e-05, "loss": 0.8135, "step": 4293 }, { "epoch": 0.47, "learning_rate": 1.1534736352944623e-05, "loss": 0.7056, "step": 4294 }, { "epoch": 0.47, "learning_rate": 1.1531252112389408e-05, "loss": 0.8071, "step": 4295 }, { "epoch": 0.47, "learning_rate": 1.1527767681467472e-05, "loss": 0.8755, "step": 4296 }, { "epoch": 0.47, "learning_rate": 1.1524283060611998e-05, "loss": 0.8438, "step": 4297 }, { "epoch": 0.47, "learning_rate": 1.1520798250256204e-05, "loss": 0.7, "step": 4298 }, { "epoch": 0.47, "learning_rate": 1.1517313250833318e-05, "loss": 0.7118, "step": 4299 }, { "epoch": 0.47, "learning_rate": 1.1513828062776605e-05, "loss": 0.7573, "step": 4300 }, { "epoch": 0.47, "learning_rate": 1.1510342686519339e-05, "loss": 0.7656, "step": 4301 }, { "epoch": 0.47, "learning_rate": 1.1506857122494832e-05, "loss": 0.8159, "step": 4302 }, { "epoch": 0.47, "learning_rate": 1.1503371371136413e-05, "loss": 0.8008, "step": 4303 }, { "epoch": 0.47, "learning_rate": 1.1499885432877426e-05, "loss": 0.7261, "step": 4304 }, { "epoch": 0.47, "learning_rate": 1.1496399308151257e-05, "loss": 0.7095, "step": 4305 }, { "epoch": 0.47, "learning_rate": 1.1492912997391296e-05, "loss": 0.8037, "step": 4306 }, { "epoch": 0.47, "learning_rate": 1.1489426501030971e-05, "loss": 0.8259, "step": 4307 }, { "epoch": 0.47, "learning_rate": 1.1485939819503717e-05, "loss": 0.748, "step": 4308 }, { "epoch": 0.47, "learning_rate": 1.1482452953243013e-05, "loss": 0.748, "step": 4309 }, { "epoch": 0.47, "learning_rate": 1.1478965902682343e-05, "loss": 0.7593, "step": 4310 }, { "epoch": 0.47, "learning_rate": 1.1475478668255223e-05, "loss": 0.7925, "step": 4311 }, { "epoch": 0.47, "learning_rate": 1.1471991250395184e-05, "loss": 0.703, "step": 4312 }, { "epoch": 0.47, "learning_rate": 1.146850364953579e-05, "loss": 0.8315, "step": 4313 }, { "epoch": 0.47, "learning_rate": 1.1465015866110622e-05, "loss": 0.6987, "step": 4314 }, { "epoch": 0.47, "learning_rate": 1.1461527900553287e-05, "loss": 0.7012, "step": 4315 }, { "epoch": 0.47, "learning_rate": 1.1458039753297408e-05, "loss": 0.6858, "step": 4316 }, { "epoch": 0.47, "learning_rate": 1.1454551424776636e-05, "loss": 0.769, "step": 4317 }, { "epoch": 0.47, "learning_rate": 1.1451062915424643e-05, "loss": 0.7168, "step": 4318 }, { "epoch": 0.47, "learning_rate": 1.1447574225675126e-05, "loss": 0.7964, "step": 4319 }, { "epoch": 0.47, "learning_rate": 1.14440853559618e-05, "loss": 0.8279, "step": 4320 }, { "epoch": 0.47, "learning_rate": 1.1440596306718409e-05, "loss": 0.6343, "step": 4321 }, { "epoch": 0.47, "learning_rate": 1.1437107078378707e-05, "loss": 0.7998, "step": 4322 }, { "epoch": 0.47, "learning_rate": 1.1433617671376483e-05, "loss": 0.74, "step": 4323 }, { "epoch": 0.47, "learning_rate": 1.1430128086145542e-05, "loss": 0.6978, "step": 4324 }, { "epoch": 0.47, "learning_rate": 1.1426638323119716e-05, "loss": 0.7837, "step": 4325 }, { "epoch": 0.47, "learning_rate": 1.1423148382732854e-05, "loss": 0.7769, "step": 4326 }, { "epoch": 0.47, "learning_rate": 1.1419658265418825e-05, "loss": 0.7173, "step": 4327 }, { "epoch": 0.47, "learning_rate": 1.1416167971611526e-05, "loss": 0.6807, "step": 4328 }, { "epoch": 0.47, "learning_rate": 1.1412677501744878e-05, "loss": 0.7253, "step": 4329 }, { "epoch": 0.47, "learning_rate": 1.1409186856252817e-05, "loss": 0.7036, "step": 4330 }, { "epoch": 0.47, "learning_rate": 1.1405696035569296e-05, "loss": 0.772, "step": 4331 }, { "epoch": 0.47, "learning_rate": 1.1402205040128307e-05, "loss": 1.0051, "step": 4332 }, { "epoch": 0.47, "learning_rate": 1.1398713870363848e-05, "loss": 0.6794, "step": 4333 }, { "epoch": 0.47, "learning_rate": 1.1395222526709953e-05, "loss": 0.7607, "step": 4334 }, { "epoch": 0.47, "learning_rate": 1.1391731009600655e-05, "loss": 0.6821, "step": 4335 }, { "epoch": 0.47, "learning_rate": 1.1388239319470035e-05, "loss": 0.6873, "step": 4336 }, { "epoch": 0.47, "learning_rate": 1.138474745675218e-05, "loss": 0.7666, "step": 4337 }, { "epoch": 0.47, "learning_rate": 1.13812554218812e-05, "loss": 0.7856, "step": 4338 }, { "epoch": 0.47, "learning_rate": 1.1377763215291225e-05, "loss": 0.7188, "step": 4339 }, { "epoch": 0.47, "learning_rate": 1.1374270837416415e-05, "loss": 0.7029, "step": 4340 }, { "epoch": 0.47, "learning_rate": 1.1370778288690947e-05, "loss": 0.6953, "step": 4341 }, { "epoch": 0.47, "learning_rate": 1.1367285569549012e-05, "loss": 0.7354, "step": 4342 }, { "epoch": 0.47, "learning_rate": 1.136379268042483e-05, "loss": 0.6938, "step": 4343 }, { "epoch": 0.47, "learning_rate": 1.1360299621752644e-05, "loss": 0.6987, "step": 4344 }, { "epoch": 0.47, "learning_rate": 1.135680639396671e-05, "loss": 0.5996, "step": 4345 }, { "epoch": 0.47, "learning_rate": 1.1353312997501313e-05, "loss": 0.6714, "step": 4346 }, { "epoch": 0.47, "learning_rate": 1.1349819432790752e-05, "loss": 0.7114, "step": 4347 }, { "epoch": 0.47, "learning_rate": 1.1346325700269355e-05, "loss": 0.8105, "step": 4348 }, { "epoch": 0.47, "learning_rate": 1.1342831800371458e-05, "loss": 0.7915, "step": 4349 }, { "epoch": 0.47, "learning_rate": 1.1339337733531435e-05, "loss": 0.6716, "step": 4350 }, { "epoch": 0.47, "learning_rate": 1.1335843500183665e-05, "loss": 0.6797, "step": 4351 }, { "epoch": 0.47, "learning_rate": 1.1332349100762559e-05, "loss": 0.6902, "step": 4352 }, { "epoch": 0.47, "learning_rate": 1.1328854535702542e-05, "loss": 0.8081, "step": 4353 }, { "epoch": 0.47, "learning_rate": 1.132535980543806e-05, "loss": 0.7661, "step": 4354 }, { "epoch": 0.47, "learning_rate": 1.1321864910403586e-05, "loss": 0.7124, "step": 4355 }, { "epoch": 0.47, "learning_rate": 1.1318369851033604e-05, "loss": 0.7383, "step": 4356 }, { "epoch": 0.47, "learning_rate": 1.1314874627762627e-05, "loss": 1.1841, "step": 4357 }, { "epoch": 0.47, "learning_rate": 1.1311379241025179e-05, "loss": 0.6809, "step": 4358 }, { "epoch": 0.47, "learning_rate": 1.1307883691255817e-05, "loss": 0.7041, "step": 4359 }, { "epoch": 0.47, "learning_rate": 1.1304387978889107e-05, "loss": 0.7065, "step": 4360 }, { "epoch": 0.47, "learning_rate": 1.1300892104359635e-05, "loss": 0.7507, "step": 4361 }, { "epoch": 0.47, "learning_rate": 1.1297396068102019e-05, "loss": 0.7869, "step": 4362 }, { "epoch": 0.47, "learning_rate": 1.1293899870550886e-05, "loss": 0.7351, "step": 4363 }, { "epoch": 0.48, "learning_rate": 1.1290403512140888e-05, "loss": 0.7246, "step": 4364 }, { "epoch": 0.48, "learning_rate": 1.1286906993306694e-05, "loss": 0.7681, "step": 4365 }, { "epoch": 0.48, "learning_rate": 1.1283410314482994e-05, "loss": 0.729, "step": 4366 }, { "epoch": 0.48, "learning_rate": 1.1279913476104505e-05, "loss": 0.6458, "step": 4367 }, { "epoch": 0.48, "learning_rate": 1.127641647860595e-05, "loss": 0.6821, "step": 4368 }, { "epoch": 0.48, "learning_rate": 1.1272919322422077e-05, "loss": 0.748, "step": 4369 }, { "epoch": 0.48, "learning_rate": 1.1269422007987664e-05, "loss": 0.7866, "step": 4370 }, { "epoch": 0.48, "learning_rate": 1.1265924535737494e-05, "loss": 0.7656, "step": 4371 }, { "epoch": 0.48, "learning_rate": 1.126242690610638e-05, "loss": 0.7979, "step": 4372 }, { "epoch": 0.48, "learning_rate": 1.125892911952915e-05, "loss": 0.7729, "step": 4373 }, { "epoch": 0.48, "learning_rate": 1.125543117644065e-05, "loss": 0.7778, "step": 4374 }, { "epoch": 0.48, "learning_rate": 1.1251933077275748e-05, "loss": 0.7471, "step": 4375 }, { "epoch": 0.48, "learning_rate": 1.1248434822469334e-05, "loss": 0.7, "step": 4376 }, { "epoch": 0.48, "learning_rate": 1.1244936412456309e-05, "loss": 0.6609, "step": 4377 }, { "epoch": 0.48, "learning_rate": 1.1241437847671605e-05, "loss": 0.7725, "step": 4378 }, { "epoch": 0.48, "learning_rate": 1.1237939128550167e-05, "loss": 0.7334, "step": 4379 }, { "epoch": 0.48, "learning_rate": 1.1234440255526948e-05, "loss": 0.7676, "step": 4380 }, { "epoch": 0.48, "learning_rate": 1.1230941229036943e-05, "loss": 0.6624, "step": 4381 }, { "epoch": 0.48, "learning_rate": 1.1227442049515151e-05, "loss": 0.7302, "step": 4382 }, { "epoch": 0.48, "learning_rate": 1.1223942717396597e-05, "loss": 0.7593, "step": 4383 }, { "epoch": 0.48, "learning_rate": 1.122044323311631e-05, "loss": 0.6978, "step": 4384 }, { "epoch": 0.48, "learning_rate": 1.1216943597109358e-05, "loss": 0.6938, "step": 4385 }, { "epoch": 0.48, "learning_rate": 1.121344380981082e-05, "loss": 0.739, "step": 4386 }, { "epoch": 0.48, "learning_rate": 1.120994387165579e-05, "loss": 0.7939, "step": 4387 }, { "epoch": 0.48, "learning_rate": 1.1206443783079384e-05, "loss": 0.7393, "step": 4388 }, { "epoch": 0.48, "learning_rate": 1.1202943544516736e-05, "loss": 0.7925, "step": 4389 }, { "epoch": 0.48, "learning_rate": 1.1199443156402998e-05, "loss": 0.7466, "step": 4390 }, { "epoch": 0.48, "learning_rate": 1.1195942619173345e-05, "loss": 0.707, "step": 4391 }, { "epoch": 0.48, "learning_rate": 1.1192441933262963e-05, "loss": 0.7009, "step": 4392 }, { "epoch": 0.48, "learning_rate": 1.1188941099107064e-05, "loss": 0.7842, "step": 4393 }, { "epoch": 0.48, "learning_rate": 1.1185440117140876e-05, "loss": 0.7104, "step": 4394 }, { "epoch": 0.48, "learning_rate": 1.118193898779964e-05, "loss": 0.7375, "step": 4395 }, { "epoch": 0.48, "learning_rate": 1.117843771151862e-05, "loss": 0.6895, "step": 4396 }, { "epoch": 0.48, "learning_rate": 1.1174936288733102e-05, "loss": 0.7078, "step": 4397 }, { "epoch": 0.48, "learning_rate": 1.1171434719878385e-05, "loss": 0.7441, "step": 4398 }, { "epoch": 0.48, "learning_rate": 1.1167933005389785e-05, "loss": 0.7051, "step": 4399 }, { "epoch": 0.48, "learning_rate": 1.116443114570264e-05, "loss": 0.6929, "step": 4400 }, { "epoch": 0.48, "learning_rate": 1.1160929141252303e-05, "loss": 0.7822, "step": 4401 }, { "epoch": 0.48, "learning_rate": 1.1157426992474151e-05, "loss": 0.6626, "step": 4402 }, { "epoch": 0.48, "learning_rate": 1.1153924699803572e-05, "loss": 0.728, "step": 4403 }, { "epoch": 0.48, "learning_rate": 1.1150422263675969e-05, "loss": 0.7192, "step": 4404 }, { "epoch": 0.48, "learning_rate": 1.1146919684526778e-05, "loss": 0.7092, "step": 4405 }, { "epoch": 0.48, "learning_rate": 1.1143416962791437e-05, "loss": 0.7104, "step": 4406 }, { "epoch": 0.48, "learning_rate": 1.1139914098905406e-05, "loss": 0.6765, "step": 4407 }, { "epoch": 0.48, "learning_rate": 1.1136411093304171e-05, "loss": 0.7246, "step": 4408 }, { "epoch": 0.48, "learning_rate": 1.1132907946423223e-05, "loss": 0.772, "step": 4409 }, { "epoch": 0.48, "learning_rate": 1.1129404658698082e-05, "loss": 0.7056, "step": 4410 }, { "epoch": 0.48, "learning_rate": 1.1125901230564271e-05, "loss": 0.7441, "step": 4411 }, { "epoch": 0.48, "learning_rate": 1.1122397662457352e-05, "loss": 0.7104, "step": 4412 }, { "epoch": 0.48, "learning_rate": 1.111889395481288e-05, "loss": 0.7817, "step": 4413 }, { "epoch": 0.48, "learning_rate": 1.1115390108066447e-05, "loss": 0.7461, "step": 4414 }, { "epoch": 0.48, "learning_rate": 1.111188612265365e-05, "loss": 0.6506, "step": 4415 }, { "epoch": 0.48, "learning_rate": 1.1108381999010111e-05, "loss": 0.6243, "step": 4416 }, { "epoch": 0.48, "learning_rate": 1.1104877737571467e-05, "loss": 0.8354, "step": 4417 }, { "epoch": 0.48, "learning_rate": 1.1101373338773366e-05, "loss": 0.6987, "step": 4418 }, { "epoch": 0.48, "learning_rate": 1.1097868803051481e-05, "loss": 0.7312, "step": 4419 }, { "epoch": 0.48, "learning_rate": 1.1094364130841501e-05, "loss": 0.6975, "step": 4420 }, { "epoch": 0.48, "learning_rate": 1.109085932257913e-05, "loss": 0.6897, "step": 4421 }, { "epoch": 0.48, "learning_rate": 1.1087354378700087e-05, "loss": 0.7686, "step": 4422 }, { "epoch": 0.48, "learning_rate": 1.1083849299640109e-05, "loss": 0.6753, "step": 4423 }, { "epoch": 0.48, "learning_rate": 1.1080344085834953e-05, "loss": 0.6104, "step": 4424 }, { "epoch": 0.48, "learning_rate": 1.1076838737720392e-05, "loss": 0.7974, "step": 4425 }, { "epoch": 0.48, "learning_rate": 1.1073333255732208e-05, "loss": 0.6687, "step": 4426 }, { "epoch": 0.48, "learning_rate": 1.1069827640306214e-05, "loss": 0.7771, "step": 4427 }, { "epoch": 0.48, "learning_rate": 1.1066321891878226e-05, "loss": 0.6592, "step": 4428 }, { "epoch": 0.48, "learning_rate": 1.1062816010884086e-05, "loss": 0.7559, "step": 4429 }, { "epoch": 0.48, "learning_rate": 1.1059309997759642e-05, "loss": 0.6143, "step": 4430 }, { "epoch": 0.48, "learning_rate": 1.1055803852940772e-05, "loss": 0.7705, "step": 4431 }, { "epoch": 0.48, "learning_rate": 1.105229757686336e-05, "loss": 0.7432, "step": 4432 }, { "epoch": 0.48, "learning_rate": 1.1048791169963307e-05, "loss": 0.5681, "step": 4433 }, { "epoch": 0.48, "learning_rate": 1.1045284632676535e-05, "loss": 0.7197, "step": 4434 }, { "epoch": 0.48, "learning_rate": 1.1041777965438985e-05, "loss": 0.7483, "step": 4435 }, { "epoch": 0.48, "learning_rate": 1.1038271168686603e-05, "loss": 0.6921, "step": 4436 }, { "epoch": 0.48, "learning_rate": 1.1034764242855359e-05, "loss": 0.7695, "step": 4437 }, { "epoch": 0.48, "learning_rate": 1.1031257188381235e-05, "loss": 0.7771, "step": 4438 }, { "epoch": 0.48, "learning_rate": 1.1027750005700237e-05, "loss": 0.7266, "step": 4439 }, { "epoch": 0.48, "learning_rate": 1.1024242695248379e-05, "loss": 0.595, "step": 4440 }, { "epoch": 0.48, "learning_rate": 1.102073525746169e-05, "loss": 0.7061, "step": 4441 }, { "epoch": 0.48, "learning_rate": 1.101722769277622e-05, "loss": 0.7661, "step": 4442 }, { "epoch": 0.48, "learning_rate": 1.1013720001628034e-05, "loss": 0.8491, "step": 4443 }, { "epoch": 0.48, "learning_rate": 1.1010212184453213e-05, "loss": 0.7432, "step": 4444 }, { "epoch": 0.48, "learning_rate": 1.1006704241687846e-05, "loss": 0.7375, "step": 4445 }, { "epoch": 0.48, "learning_rate": 1.1003196173768051e-05, "loss": 0.6462, "step": 4446 }, { "epoch": 0.48, "learning_rate": 1.099968798112995e-05, "loss": 0.6211, "step": 4447 }, { "epoch": 0.48, "learning_rate": 1.0996179664209685e-05, "loss": 0.7192, "step": 4448 }, { "epoch": 0.48, "learning_rate": 1.0992671223443413e-05, "loss": 0.8257, "step": 4449 }, { "epoch": 0.48, "learning_rate": 1.0989162659267313e-05, "loss": 0.7163, "step": 4450 }, { "epoch": 0.48, "learning_rate": 1.0985653972117564e-05, "loss": 0.7112, "step": 4451 }, { "epoch": 0.48, "learning_rate": 1.0982145162430373e-05, "loss": 0.6311, "step": 4452 }, { "epoch": 0.48, "learning_rate": 1.097863623064196e-05, "loss": 0.7393, "step": 4453 }, { "epoch": 0.48, "learning_rate": 1.0975127177188555e-05, "loss": 0.6997, "step": 4454 }, { "epoch": 0.48, "learning_rate": 1.0971618002506414e-05, "loss": 0.6226, "step": 4455 }, { "epoch": 0.49, "learning_rate": 1.0968108707031792e-05, "loss": 0.752, "step": 4456 }, { "epoch": 0.49, "learning_rate": 1.0964599291200973e-05, "loss": 0.7266, "step": 4457 }, { "epoch": 0.49, "learning_rate": 1.0961089755450253e-05, "loss": 0.75, "step": 4458 }, { "epoch": 0.49, "learning_rate": 1.0957580100215936e-05, "loss": 0.7249, "step": 4459 }, { "epoch": 0.49, "learning_rate": 1.095407032593435e-05, "loss": 0.7598, "step": 4460 }, { "epoch": 0.49, "learning_rate": 1.0950560433041825e-05, "loss": 0.6963, "step": 4461 }, { "epoch": 0.49, "learning_rate": 1.0947050421974727e-05, "loss": 0.7488, "step": 4462 }, { "epoch": 0.49, "learning_rate": 1.0943540293169417e-05, "loss": 0.7368, "step": 4463 }, { "epoch": 0.49, "learning_rate": 1.0940030047062276e-05, "loss": 0.7773, "step": 4464 }, { "epoch": 0.49, "learning_rate": 1.0936519684089703e-05, "loss": 0.7915, "step": 4465 }, { "epoch": 0.49, "learning_rate": 1.093300920468811e-05, "loss": 0.7637, "step": 4466 }, { "epoch": 0.49, "learning_rate": 1.0929498609293925e-05, "loss": 0.6917, "step": 4467 }, { "epoch": 0.49, "learning_rate": 1.0925987898343582e-05, "loss": 0.7156, "step": 4468 }, { "epoch": 0.49, "learning_rate": 1.0922477072273545e-05, "loss": 0.7915, "step": 4469 }, { "epoch": 0.49, "learning_rate": 1.0918966131520276e-05, "loss": 0.7456, "step": 4470 }, { "epoch": 0.49, "learning_rate": 1.0915455076520263e-05, "loss": 0.6924, "step": 4471 }, { "epoch": 0.49, "learning_rate": 1.0911943907709999e-05, "loss": 0.8403, "step": 4472 }, { "epoch": 0.49, "learning_rate": 1.0908432625526001e-05, "loss": 0.6677, "step": 4473 }, { "epoch": 0.49, "learning_rate": 1.0904921230404795e-05, "loss": 0.7542, "step": 4474 }, { "epoch": 0.49, "learning_rate": 1.0901409722782914e-05, "loss": 0.6262, "step": 4475 }, { "epoch": 0.49, "learning_rate": 1.0897898103096917e-05, "loss": 0.8252, "step": 4476 }, { "epoch": 0.49, "learning_rate": 1.0894386371783374e-05, "loss": 0.6589, "step": 4477 }, { "epoch": 0.49, "learning_rate": 1.0890874529278866e-05, "loss": 0.7495, "step": 4478 }, { "epoch": 0.49, "learning_rate": 1.0887362576019981e-05, "loss": 0.7471, "step": 4479 }, { "epoch": 0.49, "learning_rate": 1.088385051244334e-05, "loss": 0.7378, "step": 4480 }, { "epoch": 0.49, "learning_rate": 1.0880338338985557e-05, "loss": 0.7473, "step": 4481 }, { "epoch": 0.49, "learning_rate": 1.0876826056083275e-05, "loss": 0.6196, "step": 4482 }, { "epoch": 0.49, "learning_rate": 1.0873313664173137e-05, "loss": 0.7915, "step": 4483 }, { "epoch": 0.49, "learning_rate": 1.0869801163691816e-05, "loss": 0.7573, "step": 4484 }, { "epoch": 0.49, "learning_rate": 1.0866288555075981e-05, "loss": 0.6687, "step": 4485 }, { "epoch": 0.49, "learning_rate": 1.0862775838762332e-05, "loss": 0.6982, "step": 4486 }, { "epoch": 0.49, "learning_rate": 1.0859263015187562e-05, "loss": 0.7646, "step": 4487 }, { "epoch": 0.49, "learning_rate": 1.08557500847884e-05, "loss": 0.6914, "step": 4488 }, { "epoch": 0.49, "learning_rate": 1.0852237048001568e-05, "loss": 0.8181, "step": 4489 }, { "epoch": 0.49, "learning_rate": 1.0848723905263814e-05, "loss": 0.7209, "step": 4490 }, { "epoch": 0.49, "learning_rate": 1.0845210657011893e-05, "loss": 0.7798, "step": 4491 }, { "epoch": 0.49, "learning_rate": 1.084169730368258e-05, "loss": 0.6794, "step": 4492 }, { "epoch": 0.49, "learning_rate": 1.0838183845712658e-05, "loss": 0.636, "step": 4493 }, { "epoch": 0.49, "learning_rate": 1.0834670283538915e-05, "loss": 0.6729, "step": 4494 }, { "epoch": 0.49, "learning_rate": 1.0831156617598168e-05, "loss": 0.7764, "step": 4495 }, { "epoch": 0.49, "learning_rate": 1.082764284832724e-05, "loss": 0.6807, "step": 4496 }, { "epoch": 0.49, "learning_rate": 1.0824128976162964e-05, "loss": 0.6841, "step": 4497 }, { "epoch": 0.49, "learning_rate": 1.0820615001542185e-05, "loss": 0.6245, "step": 4498 }, { "epoch": 0.49, "learning_rate": 1.0817100924901769e-05, "loss": 0.6909, "step": 4499 }, { "epoch": 0.49, "learning_rate": 1.0813586746678584e-05, "loss": 0.7385, "step": 4500 }, { "epoch": 0.49, "learning_rate": 1.081007246730952e-05, "loss": 0.7646, "step": 4501 }, { "epoch": 0.49, "learning_rate": 1.0806558087231476e-05, "loss": 0.7695, "step": 4502 }, { "epoch": 0.49, "learning_rate": 1.080304360688136e-05, "loss": 0.6497, "step": 4503 }, { "epoch": 0.49, "learning_rate": 1.0799529026696096e-05, "loss": 0.7339, "step": 4504 }, { "epoch": 0.49, "learning_rate": 1.0796014347112622e-05, "loss": 0.6802, "step": 4505 }, { "epoch": 0.49, "learning_rate": 1.0792499568567885e-05, "loss": 0.7651, "step": 4506 }, { "epoch": 0.49, "learning_rate": 1.0788984691498847e-05, "loss": 0.7034, "step": 4507 }, { "epoch": 0.49, "learning_rate": 1.0785469716342481e-05, "loss": 0.7529, "step": 4508 }, { "epoch": 0.49, "learning_rate": 1.0781954643535769e-05, "loss": 0.7249, "step": 4509 }, { "epoch": 0.49, "learning_rate": 1.0778439473515707e-05, "loss": 0.7402, "step": 4510 }, { "epoch": 0.49, "learning_rate": 1.077492420671931e-05, "loss": 0.6562, "step": 4511 }, { "epoch": 0.49, "learning_rate": 1.0771408843583599e-05, "loss": 0.6887, "step": 4512 }, { "epoch": 0.49, "learning_rate": 1.0767893384545602e-05, "loss": 0.7095, "step": 4513 }, { "epoch": 0.49, "learning_rate": 1.0764377830042364e-05, "loss": 0.6919, "step": 4514 }, { "epoch": 0.49, "learning_rate": 1.076086218051095e-05, "loss": 0.7239, "step": 4515 }, { "epoch": 0.49, "learning_rate": 1.0757346436388427e-05, "loss": 0.7671, "step": 4516 }, { "epoch": 0.49, "learning_rate": 1.0753830598111867e-05, "loss": 0.7861, "step": 4517 }, { "epoch": 0.49, "learning_rate": 1.0750314666118371e-05, "loss": 0.7366, "step": 4518 }, { "epoch": 0.49, "learning_rate": 1.0746798640845038e-05, "loss": 0.8276, "step": 4519 }, { "epoch": 0.49, "learning_rate": 1.0743282522728989e-05, "loss": 0.6284, "step": 4520 }, { "epoch": 0.49, "learning_rate": 1.0739766312207344e-05, "loss": 0.751, "step": 4521 }, { "epoch": 0.49, "learning_rate": 1.0736250009717249e-05, "loss": 0.5906, "step": 4522 }, { "epoch": 0.49, "learning_rate": 1.0732733615695852e-05, "loss": 0.7695, "step": 4523 }, { "epoch": 0.49, "learning_rate": 1.0729217130580309e-05, "loss": 0.6765, "step": 4524 }, { "epoch": 0.49, "learning_rate": 1.0725700554807796e-05, "loss": 0.6125, "step": 4525 }, { "epoch": 0.49, "learning_rate": 1.0722183888815503e-05, "loss": 0.6333, "step": 4526 }, { "epoch": 0.49, "learning_rate": 1.0718667133040618e-05, "loss": 0.7449, "step": 4527 }, { "epoch": 0.49, "learning_rate": 1.0715150287920348e-05, "loss": 0.6794, "step": 4528 }, { "epoch": 0.49, "learning_rate": 1.0711633353891913e-05, "loss": 0.75, "step": 4529 }, { "epoch": 0.49, "learning_rate": 1.0708116331392542e-05, "loss": 0.7749, "step": 4530 }, { "epoch": 0.49, "learning_rate": 1.0704599220859473e-05, "loss": 0.6333, "step": 4531 }, { "epoch": 0.49, "learning_rate": 1.0701082022729955e-05, "loss": 0.7004, "step": 4532 }, { "epoch": 0.49, "learning_rate": 1.0697564737441254e-05, "loss": 0.6831, "step": 4533 }, { "epoch": 0.49, "learning_rate": 1.069404736543064e-05, "loss": 0.6953, "step": 4534 }, { "epoch": 0.49, "learning_rate": 1.0690529907135395e-05, "loss": 0.709, "step": 4535 }, { "epoch": 0.49, "learning_rate": 1.068701236299281e-05, "loss": 0.6919, "step": 4536 }, { "epoch": 0.49, "learning_rate": 1.0683494733440198e-05, "loss": 0.771, "step": 4537 }, { "epoch": 0.49, "learning_rate": 1.0679977018914864e-05, "loss": 0.7622, "step": 4538 }, { "epoch": 0.49, "learning_rate": 1.0676459219854144e-05, "loss": 0.7861, "step": 4539 }, { "epoch": 0.49, "learning_rate": 1.0672941336695364e-05, "loss": 0.6272, "step": 4540 }, { "epoch": 0.49, "learning_rate": 1.0669423369875877e-05, "loss": 0.6724, "step": 4541 }, { "epoch": 0.49, "learning_rate": 1.066590531983304e-05, "loss": 0.6533, "step": 4542 }, { "epoch": 0.49, "learning_rate": 1.0662387187004217e-05, "loss": 0.8208, "step": 4543 }, { "epoch": 0.49, "learning_rate": 1.0658868971826785e-05, "loss": 0.8403, "step": 4544 }, { "epoch": 0.49, "learning_rate": 1.065535067473814e-05, "loss": 0.6812, "step": 4545 }, { "epoch": 0.49, "learning_rate": 1.0651832296175671e-05, "loss": 0.7158, "step": 4546 }, { "epoch": 0.49, "learning_rate": 1.0648313836576786e-05, "loss": 0.6482, "step": 4547 }, { "epoch": 0.5, "learning_rate": 1.0644795296378908e-05, "loss": 0.8018, "step": 4548 }, { "epoch": 0.5, "learning_rate": 1.0641276676019467e-05, "loss": 0.8296, "step": 4549 }, { "epoch": 0.5, "learning_rate": 1.0637757975935899e-05, "loss": 0.6318, "step": 4550 }, { "epoch": 0.5, "learning_rate": 1.0634239196565646e-05, "loss": 0.8462, "step": 4551 }, { "epoch": 0.5, "learning_rate": 1.0630720338346175e-05, "loss": 0.75, "step": 4552 }, { "epoch": 0.5, "learning_rate": 1.0627201401714948e-05, "loss": 0.791, "step": 4553 }, { "epoch": 0.5, "learning_rate": 1.0623682387109446e-05, "loss": 0.7209, "step": 4554 }, { "epoch": 0.5, "learning_rate": 1.0620163294967155e-05, "loss": 0.6062, "step": 4555 }, { "epoch": 0.5, "learning_rate": 1.0616644125725573e-05, "loss": 0.7744, "step": 4556 }, { "epoch": 0.5, "learning_rate": 1.0613124879822202e-05, "loss": 0.6904, "step": 4557 }, { "epoch": 0.5, "learning_rate": 1.0609605557694563e-05, "loss": 0.7334, "step": 4558 }, { "epoch": 0.5, "learning_rate": 1.0606086159780179e-05, "loss": 0.7212, "step": 4559 }, { "epoch": 0.5, "learning_rate": 1.0602566686516586e-05, "loss": 0.6665, "step": 4560 }, { "epoch": 0.5, "learning_rate": 1.0599047138341329e-05, "loss": 0.7021, "step": 4561 }, { "epoch": 0.5, "learning_rate": 1.0595527515691959e-05, "loss": 0.8643, "step": 4562 }, { "epoch": 0.5, "learning_rate": 1.0592007819006039e-05, "loss": 0.6492, "step": 4563 }, { "epoch": 0.5, "learning_rate": 1.0588488048721146e-05, "loss": 0.7505, "step": 4564 }, { "epoch": 0.5, "learning_rate": 1.0584968205274857e-05, "loss": 0.7935, "step": 4565 }, { "epoch": 0.5, "learning_rate": 1.0581448289104759e-05, "loss": 0.7241, "step": 4566 }, { "epoch": 0.5, "learning_rate": 1.0577928300648457e-05, "loss": 0.7, "step": 4567 }, { "epoch": 0.5, "learning_rate": 1.0574408240343561e-05, "loss": 0.6079, "step": 4568 }, { "epoch": 0.5, "learning_rate": 1.0570888108627682e-05, "loss": 0.771, "step": 4569 }, { "epoch": 0.5, "learning_rate": 1.0567367905938449e-05, "loss": 0.6685, "step": 4570 }, { "epoch": 0.5, "learning_rate": 1.0563847632713495e-05, "loss": 0.6963, "step": 4571 }, { "epoch": 0.5, "learning_rate": 1.0560327289390468e-05, "loss": 0.7661, "step": 4572 }, { "epoch": 0.5, "learning_rate": 1.055680687640702e-05, "loss": 0.6284, "step": 4573 }, { "epoch": 0.5, "learning_rate": 1.0553286394200805e-05, "loss": 0.6802, "step": 4574 }, { "epoch": 0.5, "learning_rate": 1.0549765843209503e-05, "loss": 0.6296, "step": 4575 }, { "epoch": 0.5, "learning_rate": 1.0546245223870783e-05, "loss": 0.7334, "step": 4576 }, { "epoch": 0.5, "learning_rate": 1.054272453662234e-05, "loss": 0.7295, "step": 4577 }, { "epoch": 0.5, "learning_rate": 1.053920378190186e-05, "loss": 0.7588, "step": 4578 }, { "epoch": 0.5, "learning_rate": 1.0535682960147056e-05, "loss": 0.7839, "step": 4579 }, { "epoch": 0.5, "learning_rate": 1.0532162071795636e-05, "loss": 0.7168, "step": 4580 }, { "epoch": 0.5, "learning_rate": 1.0528641117285315e-05, "loss": 0.7251, "step": 4581 }, { "epoch": 0.5, "learning_rate": 1.0525120097053826e-05, "loss": 0.666, "step": 4582 }, { "epoch": 0.5, "learning_rate": 1.0521599011538913e-05, "loss": 0.6851, "step": 4583 }, { "epoch": 0.5, "learning_rate": 1.0518077861178308e-05, "loss": 0.6521, "step": 4584 }, { "epoch": 0.5, "learning_rate": 1.0514556646409769e-05, "loss": 0.6362, "step": 4585 }, { "epoch": 0.5, "learning_rate": 1.0511035367671057e-05, "loss": 0.7231, "step": 4586 }, { "epoch": 0.5, "learning_rate": 1.0507514025399944e-05, "loss": 0.7837, "step": 4587 }, { "epoch": 0.5, "learning_rate": 1.0503992620034202e-05, "loss": 0.6321, "step": 4588 }, { "epoch": 0.5, "learning_rate": 1.0500471152011615e-05, "loss": 0.9038, "step": 4589 }, { "epoch": 0.5, "learning_rate": 1.0496949621769976e-05, "loss": 0.8574, "step": 4590 }, { "epoch": 0.5, "learning_rate": 1.049342802974709e-05, "loss": 0.6846, "step": 4591 }, { "epoch": 0.5, "learning_rate": 1.0489906376380761e-05, "loss": 0.6594, "step": 4592 }, { "epoch": 0.5, "learning_rate": 1.0486384662108802e-05, "loss": 0.6931, "step": 4593 }, { "epoch": 0.5, "learning_rate": 1.048286288736904e-05, "loss": 0.6499, "step": 4594 }, { "epoch": 0.5, "learning_rate": 1.04793410525993e-05, "loss": 0.6777, "step": 4595 }, { "epoch": 0.5, "learning_rate": 1.0475819158237426e-05, "loss": 0.8022, "step": 4596 }, { "epoch": 0.5, "learning_rate": 1.0472297204721258e-05, "loss": 0.6401, "step": 4597 }, { "epoch": 0.5, "learning_rate": 1.0468775192488651e-05, "loss": 0.7944, "step": 4598 }, { "epoch": 0.5, "learning_rate": 1.046525312197747e-05, "loss": 0.7241, "step": 4599 }, { "epoch": 0.5, "learning_rate": 1.0461730993625572e-05, "loss": 0.853, "step": 4600 }, { "epoch": 0.5, "learning_rate": 1.0458208807870837e-05, "loss": 0.7461, "step": 4601 }, { "epoch": 0.5, "learning_rate": 1.0454686565151148e-05, "loss": 0.7231, "step": 4602 }, { "epoch": 0.5, "learning_rate": 1.0451164265904392e-05, "loss": 0.7241, "step": 4603 }, { "epoch": 0.5, "learning_rate": 1.0447641910568462e-05, "loss": 0.6875, "step": 4604 }, { "epoch": 0.5, "learning_rate": 1.0444119499581263e-05, "loss": 0.7754, "step": 4605 }, { "epoch": 0.5, "learning_rate": 1.0440597033380706e-05, "loss": 0.7808, "step": 4606 }, { "epoch": 0.5, "learning_rate": 1.0437074512404705e-05, "loss": 0.7466, "step": 4607 }, { "epoch": 0.5, "learning_rate": 1.0433551937091185e-05, "loss": 0.6643, "step": 4608 }, { "epoch": 0.5, "learning_rate": 1.0430029307878073e-05, "loss": 0.7065, "step": 4609 }, { "epoch": 0.5, "learning_rate": 1.0426506625203308e-05, "loss": 0.7124, "step": 4610 }, { "epoch": 0.5, "learning_rate": 1.0422983889504831e-05, "loss": 0.8218, "step": 4611 }, { "epoch": 0.5, "learning_rate": 1.0419461101220596e-05, "loss": 0.8345, "step": 4612 }, { "epoch": 0.5, "learning_rate": 1.0415938260788556e-05, "loss": 0.769, "step": 4613 }, { "epoch": 0.5, "learning_rate": 1.0412415368646674e-05, "loss": 0.6926, "step": 4614 }, { "epoch": 0.5, "learning_rate": 1.0408892425232921e-05, "loss": 0.7131, "step": 4615 }, { "epoch": 0.5, "learning_rate": 1.040536943098527e-05, "loss": 0.636, "step": 4616 }, { "epoch": 0.5, "learning_rate": 1.0401846386341707e-05, "loss": 0.7275, "step": 4617 }, { "epoch": 0.5, "learning_rate": 1.039832329174022e-05, "loss": 0.6697, "step": 4618 }, { "epoch": 0.5, "learning_rate": 1.0394800147618797e-05, "loss": 0.7261, "step": 4619 }, { "epoch": 0.5, "learning_rate": 1.0391276954415443e-05, "loss": 0.6689, "step": 4620 }, { "epoch": 0.5, "learning_rate": 1.038775371256817e-05, "loss": 0.8047, "step": 4621 }, { "epoch": 0.5, "learning_rate": 1.0384230422514983e-05, "loss": 0.6428, "step": 4622 }, { "epoch": 0.5, "learning_rate": 1.0380707084693902e-05, "loss": 0.6777, "step": 4623 }, { "epoch": 0.5, "learning_rate": 1.0377183699542952e-05, "loss": 0.6096, "step": 4624 }, { "epoch": 0.5, "learning_rate": 1.0373660267500168e-05, "loss": 0.825, "step": 4625 }, { "epoch": 0.5, "learning_rate": 1.0370136789003582e-05, "loss": 0.7363, "step": 4626 }, { "epoch": 0.5, "learning_rate": 1.0366613264491236e-05, "loss": 0.8926, "step": 4627 }, { "epoch": 0.5, "learning_rate": 1.0363089694401182e-05, "loss": 0.7336, "step": 4628 }, { "epoch": 0.5, "learning_rate": 1.035956607917147e-05, "loss": 0.6562, "step": 4629 }, { "epoch": 0.5, "learning_rate": 1.035604241924016e-05, "loss": 0.7029, "step": 4630 }, { "epoch": 0.5, "learning_rate": 1.0352518715045316e-05, "loss": 0.5947, "step": 4631 }, { "epoch": 0.5, "learning_rate": 1.0348994967025012e-05, "loss": 0.6995, "step": 4632 }, { "epoch": 0.5, "learning_rate": 1.0345471175617318e-05, "loss": 0.6816, "step": 4633 }, { "epoch": 0.5, "learning_rate": 1.0341947341260318e-05, "loss": 0.7009, "step": 4634 }, { "epoch": 0.5, "learning_rate": 1.03384234643921e-05, "loss": 0.7368, "step": 4635 }, { "epoch": 0.5, "learning_rate": 1.0334899545450753e-05, "loss": 0.6345, "step": 4636 }, { "epoch": 0.5, "learning_rate": 1.0331375584874377e-05, "loss": 0.6001, "step": 4637 }, { "epoch": 0.5, "learning_rate": 1.0327851583101071e-05, "loss": 0.7324, "step": 4638 }, { "epoch": 0.51, "learning_rate": 1.0324327540568942e-05, "loss": 0.7163, "step": 4639 }, { "epoch": 0.51, "learning_rate": 1.0320803457716106e-05, "loss": 0.7046, "step": 4640 }, { "epoch": 0.51, "learning_rate": 1.031727933498068e-05, "loss": 0.7734, "step": 4641 }, { "epoch": 0.51, "learning_rate": 1.0313755172800779e-05, "loss": 0.6792, "step": 4642 }, { "epoch": 0.51, "learning_rate": 1.0310230971614538e-05, "loss": 0.6904, "step": 4643 }, { "epoch": 0.51, "learning_rate": 1.030670673186009e-05, "loss": 0.6907, "step": 4644 }, { "epoch": 0.51, "learning_rate": 1.0303182453975567e-05, "loss": 0.8789, "step": 4645 }, { "epoch": 0.51, "learning_rate": 1.029965813839911e-05, "loss": 0.7554, "step": 4646 }, { "epoch": 0.51, "learning_rate": 1.0296133785568869e-05, "loss": 0.7148, "step": 4647 }, { "epoch": 0.51, "learning_rate": 1.0292609395922993e-05, "loss": 0.6575, "step": 4648 }, { "epoch": 0.51, "learning_rate": 1.0289084969899639e-05, "loss": 0.7659, "step": 4649 }, { "epoch": 0.51, "learning_rate": 1.0285560507936962e-05, "loss": 0.7891, "step": 4650 }, { "epoch": 0.51, "learning_rate": 1.0282036010473135e-05, "loss": 0.6399, "step": 4651 }, { "epoch": 0.51, "learning_rate": 1.0278511477946323e-05, "loss": 0.5737, "step": 4652 }, { "epoch": 0.51, "learning_rate": 1.0274986910794693e-05, "loss": 0.7141, "step": 4653 }, { "epoch": 0.51, "learning_rate": 1.027146230945643e-05, "loss": 0.6743, "step": 4654 }, { "epoch": 0.51, "learning_rate": 1.0267937674369716e-05, "loss": 0.6919, "step": 4655 }, { "epoch": 0.51, "learning_rate": 1.0264413005972736e-05, "loss": 0.708, "step": 4656 }, { "epoch": 0.51, "learning_rate": 1.0260888304703676e-05, "loss": 0.6228, "step": 4657 }, { "epoch": 0.51, "learning_rate": 1.025736357100073e-05, "loss": 0.7405, "step": 4658 }, { "epoch": 0.51, "learning_rate": 1.0253838805302106e-05, "loss": 0.6873, "step": 4659 }, { "epoch": 0.51, "learning_rate": 1.0250314008045996e-05, "loss": 0.8169, "step": 4660 }, { "epoch": 0.51, "learning_rate": 1.0246789179670611e-05, "loss": 0.8174, "step": 4661 }, { "epoch": 0.51, "learning_rate": 1.0243264320614156e-05, "loss": 0.7712, "step": 4662 }, { "epoch": 0.51, "learning_rate": 1.0239739431314855e-05, "loss": 0.7439, "step": 4663 }, { "epoch": 0.51, "learning_rate": 1.0236214512210918e-05, "loss": 0.7837, "step": 4664 }, { "epoch": 0.51, "learning_rate": 1.0232689563740563e-05, "loss": 0.6589, "step": 4665 }, { "epoch": 0.51, "learning_rate": 1.0229164586342024e-05, "loss": 0.7329, "step": 4666 }, { "epoch": 0.51, "learning_rate": 1.0225639580453524e-05, "loss": 0.7803, "step": 4667 }, { "epoch": 0.51, "learning_rate": 1.0222114546513296e-05, "loss": 0.6553, "step": 4668 }, { "epoch": 0.51, "learning_rate": 1.0218589484959573e-05, "loss": 0.7012, "step": 4669 }, { "epoch": 0.51, "learning_rate": 1.0215064396230603e-05, "loss": 0.8137, "step": 4670 }, { "epoch": 0.51, "learning_rate": 1.0211539280764617e-05, "loss": 0.676, "step": 4671 }, { "epoch": 0.51, "learning_rate": 1.0208014138999866e-05, "loss": 0.7705, "step": 4672 }, { "epoch": 0.51, "learning_rate": 1.02044889713746e-05, "loss": 0.6768, "step": 4673 }, { "epoch": 0.51, "learning_rate": 1.020096377832707e-05, "loss": 0.8755, "step": 4674 }, { "epoch": 0.51, "learning_rate": 1.0197438560295534e-05, "loss": 0.7817, "step": 4675 }, { "epoch": 0.51, "learning_rate": 1.0193913317718245e-05, "loss": 0.72, "step": 4676 }, { "epoch": 0.51, "learning_rate": 1.0190388051033466e-05, "loss": 0.6719, "step": 4677 }, { "epoch": 0.51, "learning_rate": 1.0186862760679468e-05, "loss": 0.6731, "step": 4678 }, { "epoch": 0.51, "learning_rate": 1.018333744709451e-05, "loss": 0.8071, "step": 4679 }, { "epoch": 0.51, "learning_rate": 1.0179812110716864e-05, "loss": 0.7795, "step": 4680 }, { "epoch": 0.51, "learning_rate": 1.0176286751984808e-05, "loss": 0.717, "step": 4681 }, { "epoch": 0.51, "learning_rate": 1.0172761371336615e-05, "loss": 0.6821, "step": 4682 }, { "epoch": 0.51, "learning_rate": 1.0169235969210562e-05, "loss": 0.6816, "step": 4683 }, { "epoch": 0.51, "learning_rate": 1.0165710546044932e-05, "loss": 0.74, "step": 4684 }, { "epoch": 0.51, "learning_rate": 1.016218510227801e-05, "loss": 0.7188, "step": 4685 }, { "epoch": 0.51, "learning_rate": 1.015865963834808e-05, "loss": 0.7314, "step": 4686 }, { "epoch": 0.51, "learning_rate": 1.0155134154693434e-05, "loss": 0.8159, "step": 4687 }, { "epoch": 0.51, "learning_rate": 1.015160865175236e-05, "loss": 0.6748, "step": 4688 }, { "epoch": 0.51, "learning_rate": 1.0148083129963156e-05, "loss": 0.7153, "step": 4689 }, { "epoch": 0.51, "learning_rate": 1.0144557589764117e-05, "loss": 0.8032, "step": 4690 }, { "epoch": 0.51, "learning_rate": 1.0141032031593537e-05, "loss": 0.7629, "step": 4691 }, { "epoch": 0.51, "learning_rate": 1.0137506455889721e-05, "loss": 0.7773, "step": 4692 }, { "epoch": 0.51, "learning_rate": 1.0133980863090973e-05, "loss": 0.7441, "step": 4693 }, { "epoch": 0.51, "learning_rate": 1.0130455253635596e-05, "loss": 0.6194, "step": 4694 }, { "epoch": 0.51, "learning_rate": 1.0126929627961896e-05, "loss": 0.5867, "step": 4695 }, { "epoch": 0.51, "learning_rate": 1.0123403986508184e-05, "loss": 0.7388, "step": 4696 }, { "epoch": 0.51, "learning_rate": 1.0119878329712773e-05, "loss": 0.7021, "step": 4697 }, { "epoch": 0.51, "learning_rate": 1.0116352658013973e-05, "loss": 0.6404, "step": 4698 }, { "epoch": 0.51, "learning_rate": 1.0112826971850096e-05, "loss": 0.728, "step": 4699 }, { "epoch": 0.51, "learning_rate": 1.0109301271659464e-05, "loss": 0.6067, "step": 4700 }, { "epoch": 0.51, "learning_rate": 1.0105775557880398e-05, "loss": 0.8105, "step": 4701 }, { "epoch": 0.51, "learning_rate": 1.0102249830951209e-05, "loss": 0.636, "step": 4702 }, { "epoch": 0.51, "learning_rate": 1.0098724091310224e-05, "loss": 0.7656, "step": 4703 }, { "epoch": 0.51, "learning_rate": 1.0095198339395769e-05, "loss": 0.8064, "step": 4704 }, { "epoch": 0.51, "learning_rate": 1.0091672575646161e-05, "loss": 0.6709, "step": 4705 }, { "epoch": 0.51, "learning_rate": 1.0088146800499734e-05, "loss": 0.7949, "step": 4706 }, { "epoch": 0.51, "learning_rate": 1.008462101439481e-05, "loss": 0.6719, "step": 4707 }, { "epoch": 0.51, "learning_rate": 1.0081095217769725e-05, "loss": 0.72, "step": 4708 }, { "epoch": 0.51, "learning_rate": 1.0077569411062804e-05, "loss": 0.7507, "step": 4709 }, { "epoch": 0.51, "learning_rate": 1.007404359471238e-05, "loss": 0.6501, "step": 4710 }, { "epoch": 0.51, "learning_rate": 1.0070517769156783e-05, "loss": 0.6406, "step": 4711 }, { "epoch": 0.51, "learning_rate": 1.0066991934834352e-05, "loss": 0.8394, "step": 4712 }, { "epoch": 0.51, "learning_rate": 1.006346609218342e-05, "loss": 0.6973, "step": 4713 }, { "epoch": 0.51, "learning_rate": 1.0059940241642321e-05, "loss": 0.7817, "step": 4714 }, { "epoch": 0.51, "learning_rate": 1.0056414383649393e-05, "loss": 0.6309, "step": 4715 }, { "epoch": 0.51, "learning_rate": 1.0052888518642978e-05, "loss": 0.6631, "step": 4716 }, { "epoch": 0.51, "learning_rate": 1.0049362647061411e-05, "loss": 0.6941, "step": 4717 }, { "epoch": 0.51, "learning_rate": 1.0045836769343031e-05, "loss": 0.6865, "step": 4718 }, { "epoch": 0.51, "learning_rate": 1.0042310885926186e-05, "loss": 0.7554, "step": 4719 }, { "epoch": 0.51, "learning_rate": 1.0038784997249205e-05, "loss": 0.7227, "step": 4720 }, { "epoch": 0.51, "learning_rate": 1.0035259103750438e-05, "loss": 0.675, "step": 4721 }, { "epoch": 0.51, "learning_rate": 1.0031733205868223e-05, "loss": 0.6978, "step": 4722 }, { "epoch": 0.51, "learning_rate": 1.0028207304040912e-05, "loss": 0.6853, "step": 4723 }, { "epoch": 0.51, "learning_rate": 1.0024681398706837e-05, "loss": 0.8203, "step": 4724 }, { "epoch": 0.51, "learning_rate": 1.0021155490304349e-05, "loss": 0.7537, "step": 4725 }, { "epoch": 0.51, "learning_rate": 1.0017629579271789e-05, "loss": 0.7317, "step": 4726 }, { "epoch": 0.51, "learning_rate": 1.0014103666047503e-05, "loss": 0.814, "step": 4727 }, { "epoch": 0.51, "learning_rate": 1.001057775106984e-05, "loss": 0.8413, "step": 4728 }, { "epoch": 0.51, "learning_rate": 1.0007051834777135e-05, "loss": 0.7734, "step": 4729 }, { "epoch": 0.51, "learning_rate": 1.000352591760774e-05, "loss": 0.8154, "step": 4730 }, { "epoch": 0.52, "learning_rate": 1e-05, "loss": 0.7019, "step": 4731 }, { "epoch": 0.52, "learning_rate": 9.996474082392264e-06, "loss": 0.8081, "step": 4732 }, { "epoch": 0.52, "learning_rate": 9.992948165222869e-06, "loss": 0.7412, "step": 4733 }, { "epoch": 0.52, "learning_rate": 9.989422248930167e-06, "loss": 0.7681, "step": 4734 }, { "epoch": 0.52, "learning_rate": 9.985896333952502e-06, "loss": 0.79, "step": 4735 }, { "epoch": 0.52, "learning_rate": 9.982370420728213e-06, "loss": 0.6079, "step": 4736 }, { "epoch": 0.52, "learning_rate": 9.978844509695654e-06, "loss": 0.771, "step": 4737 }, { "epoch": 0.52, "learning_rate": 9.975318601293165e-06, "loss": 0.7327, "step": 4738 }, { "epoch": 0.52, "learning_rate": 9.971792695959091e-06, "loss": 0.6882, "step": 4739 }, { "epoch": 0.52, "learning_rate": 9.968266794131778e-06, "loss": 0.635, "step": 4740 }, { "epoch": 0.52, "learning_rate": 9.964740896249565e-06, "loss": 0.575, "step": 4741 }, { "epoch": 0.52, "learning_rate": 9.961215002750799e-06, "loss": 0.7021, "step": 4742 }, { "epoch": 0.52, "learning_rate": 9.957689114073821e-06, "loss": 0.6814, "step": 4743 }, { "epoch": 0.52, "learning_rate": 9.95416323065697e-06, "loss": 0.761, "step": 4744 }, { "epoch": 0.52, "learning_rate": 9.950637352938592e-06, "loss": 0.6208, "step": 4745 }, { "epoch": 0.52, "learning_rate": 9.947111481357023e-06, "loss": 0.7712, "step": 4746 }, { "epoch": 0.52, "learning_rate": 9.943585616350607e-06, "loss": 0.7449, "step": 4747 }, { "epoch": 0.52, "learning_rate": 9.940059758357682e-06, "loss": 0.834, "step": 4748 }, { "epoch": 0.52, "learning_rate": 9.936533907816583e-06, "loss": 0.8008, "step": 4749 }, { "epoch": 0.52, "learning_rate": 9.933008065165651e-06, "loss": 0.6096, "step": 4750 }, { "epoch": 0.52, "learning_rate": 9.92948223084322e-06, "loss": 0.7852, "step": 4751 }, { "epoch": 0.52, "learning_rate": 9.925956405287624e-06, "loss": 0.7302, "step": 4752 }, { "epoch": 0.52, "learning_rate": 9.9224305889372e-06, "loss": 0.6521, "step": 4753 }, { "epoch": 0.52, "learning_rate": 9.91890478223028e-06, "loss": 0.6938, "step": 4754 }, { "epoch": 0.52, "learning_rate": 9.91537898560519e-06, "loss": 0.7485, "step": 4755 }, { "epoch": 0.52, "learning_rate": 9.911853199500268e-06, "loss": 0.676, "step": 4756 }, { "epoch": 0.52, "learning_rate": 9.908327424353839e-06, "loss": 0.6628, "step": 4757 }, { "epoch": 0.52, "learning_rate": 9.904801660604234e-06, "loss": 0.7144, "step": 4758 }, { "epoch": 0.52, "learning_rate": 9.901275908689778e-06, "loss": 0.7896, "step": 4759 }, { "epoch": 0.52, "learning_rate": 9.897750169048793e-06, "loss": 0.8604, "step": 4760 }, { "epoch": 0.52, "learning_rate": 9.894224442119606e-06, "loss": 0.7046, "step": 4761 }, { "epoch": 0.52, "learning_rate": 9.890698728340537e-06, "loss": 0.6196, "step": 4762 }, { "epoch": 0.52, "learning_rate": 9.887173028149905e-06, "loss": 0.7808, "step": 4763 }, { "epoch": 0.52, "learning_rate": 9.883647341986032e-06, "loss": 0.7905, "step": 4764 }, { "epoch": 0.52, "learning_rate": 9.880121670287229e-06, "loss": 0.6462, "step": 4765 }, { "epoch": 0.52, "learning_rate": 9.876596013491817e-06, "loss": 0.6956, "step": 4766 }, { "epoch": 0.52, "learning_rate": 9.873070372038106e-06, "loss": 0.6709, "step": 4767 }, { "epoch": 0.52, "learning_rate": 9.869544746364408e-06, "loss": 0.7529, "step": 4768 }, { "epoch": 0.52, "learning_rate": 9.866019136909029e-06, "loss": 0.7358, "step": 4769 }, { "epoch": 0.52, "learning_rate": 9.862493544110282e-06, "loss": 0.7622, "step": 4770 }, { "epoch": 0.52, "learning_rate": 9.858967968406465e-06, "loss": 0.6494, "step": 4771 }, { "epoch": 0.52, "learning_rate": 9.855442410235889e-06, "loss": 0.7493, "step": 4772 }, { "epoch": 0.52, "learning_rate": 9.851916870036848e-06, "loss": 0.7468, "step": 4773 }, { "epoch": 0.52, "learning_rate": 9.848391348247643e-06, "loss": 0.5986, "step": 4774 }, { "epoch": 0.52, "learning_rate": 9.844865845306568e-06, "loss": 0.5459, "step": 4775 }, { "epoch": 0.52, "learning_rate": 9.841340361651921e-06, "loss": 0.7114, "step": 4776 }, { "epoch": 0.52, "learning_rate": 9.837814897721992e-06, "loss": 0.7192, "step": 4777 }, { "epoch": 0.52, "learning_rate": 9.83428945395507e-06, "loss": 0.7322, "step": 4778 }, { "epoch": 0.52, "learning_rate": 9.83076403078944e-06, "loss": 0.66, "step": 4779 }, { "epoch": 0.52, "learning_rate": 9.827238628663388e-06, "loss": 0.7441, "step": 4780 }, { "epoch": 0.52, "learning_rate": 9.823713248015195e-06, "loss": 0.7002, "step": 4781 }, { "epoch": 0.52, "learning_rate": 9.820187889283138e-06, "loss": 0.7139, "step": 4782 }, { "epoch": 0.52, "learning_rate": 9.816662552905494e-06, "loss": 0.793, "step": 4783 }, { "epoch": 0.52, "learning_rate": 9.813137239320534e-06, "loss": 0.6072, "step": 4784 }, { "epoch": 0.52, "learning_rate": 9.809611948966534e-06, "loss": 0.769, "step": 4785 }, { "epoch": 0.52, "learning_rate": 9.806086682281759e-06, "loss": 0.7024, "step": 4786 }, { "epoch": 0.52, "learning_rate": 9.802561439704468e-06, "loss": 0.6406, "step": 4787 }, { "epoch": 0.52, "learning_rate": 9.799036221672931e-06, "loss": 0.7329, "step": 4788 }, { "epoch": 0.52, "learning_rate": 9.795511028625402e-06, "loss": 0.7063, "step": 4789 }, { "epoch": 0.52, "learning_rate": 9.791985861000135e-06, "loss": 0.7139, "step": 4790 }, { "epoch": 0.52, "learning_rate": 9.788460719235386e-06, "loss": 0.6777, "step": 4791 }, { "epoch": 0.52, "learning_rate": 9.784935603769404e-06, "loss": 0.5908, "step": 4792 }, { "epoch": 0.52, "learning_rate": 9.781410515040428e-06, "loss": 0.7131, "step": 4793 }, { "epoch": 0.52, "learning_rate": 9.777885453486706e-06, "loss": 0.6863, "step": 4794 }, { "epoch": 0.52, "learning_rate": 9.774360419546477e-06, "loss": 0.7451, "step": 4795 }, { "epoch": 0.52, "learning_rate": 9.770835413657978e-06, "loss": 0.834, "step": 4796 }, { "epoch": 0.52, "learning_rate": 9.767310436259438e-06, "loss": 0.6699, "step": 4797 }, { "epoch": 0.52, "learning_rate": 9.763785487789087e-06, "loss": 0.7661, "step": 4798 }, { "epoch": 0.52, "learning_rate": 9.760260568685149e-06, "loss": 0.6897, "step": 4799 }, { "epoch": 0.52, "learning_rate": 9.756735679385845e-06, "loss": 0.8047, "step": 4800 }, { "epoch": 0.52, "learning_rate": 9.753210820329392e-06, "loss": 0.7583, "step": 4801 }, { "epoch": 0.52, "learning_rate": 9.749685991954008e-06, "loss": 0.6807, "step": 4802 }, { "epoch": 0.52, "learning_rate": 9.746161194697895e-06, "loss": 0.6165, "step": 4803 }, { "epoch": 0.52, "learning_rate": 9.74263642899927e-06, "loss": 0.7695, "step": 4804 }, { "epoch": 0.52, "learning_rate": 9.739111695296329e-06, "loss": 0.7085, "step": 4805 }, { "epoch": 0.52, "learning_rate": 9.735586994027267e-06, "loss": 0.6501, "step": 4806 }, { "epoch": 0.52, "learning_rate": 9.732062325630286e-06, "loss": 0.7678, "step": 4807 }, { "epoch": 0.52, "learning_rate": 9.728537690543573e-06, "loss": 0.6558, "step": 4808 }, { "epoch": 0.52, "learning_rate": 9.725013089205309e-06, "loss": 0.8179, "step": 4809 }, { "epoch": 0.52, "learning_rate": 9.721488522053682e-06, "loss": 0.677, "step": 4810 }, { "epoch": 0.52, "learning_rate": 9.71796398952687e-06, "loss": 0.6846, "step": 4811 }, { "epoch": 0.52, "learning_rate": 9.71443949206304e-06, "loss": 0.677, "step": 4812 }, { "epoch": 0.52, "learning_rate": 9.710915030100364e-06, "loss": 0.6477, "step": 4813 }, { "epoch": 0.52, "learning_rate": 9.707390604077009e-06, "loss": 0.7231, "step": 4814 }, { "epoch": 0.52, "learning_rate": 9.703866214431133e-06, "loss": 0.7366, "step": 4815 }, { "epoch": 0.52, "learning_rate": 9.700341861600894e-06, "loss": 0.8032, "step": 4816 }, { "epoch": 0.52, "learning_rate": 9.696817546024436e-06, "loss": 0.6575, "step": 4817 }, { "epoch": 0.52, "learning_rate": 9.693293268139914e-06, "loss": 0.751, "step": 4818 }, { "epoch": 0.52, "learning_rate": 9.689769028385463e-06, "loss": 0.6575, "step": 4819 }, { "epoch": 0.52, "learning_rate": 9.686244827199223e-06, "loss": 0.7544, "step": 4820 }, { "epoch": 0.52, "learning_rate": 9.682720665019325e-06, "loss": 0.6855, "step": 4821 }, { "epoch": 0.52, "learning_rate": 9.679196542283894e-06, "loss": 0.7034, "step": 4822 }, { "epoch": 0.53, "learning_rate": 9.67567245943106e-06, "loss": 0.6699, "step": 4823 }, { "epoch": 0.53, "learning_rate": 9.672148416898932e-06, "loss": 0.8564, "step": 4824 }, { "epoch": 0.53, "learning_rate": 9.668624415125625e-06, "loss": 0.658, "step": 4825 }, { "epoch": 0.53, "learning_rate": 9.665100454549249e-06, "loss": 0.7085, "step": 4826 }, { "epoch": 0.53, "learning_rate": 9.661576535607905e-06, "loss": 0.7139, "step": 4827 }, { "epoch": 0.53, "learning_rate": 9.658052658739683e-06, "loss": 0.7161, "step": 4828 }, { "epoch": 0.53, "learning_rate": 9.654528824382685e-06, "loss": 0.7349, "step": 4829 }, { "epoch": 0.53, "learning_rate": 9.651005032974994e-06, "loss": 0.7305, "step": 4830 }, { "epoch": 0.53, "learning_rate": 9.647481284954686e-06, "loss": 0.7258, "step": 4831 }, { "epoch": 0.53, "learning_rate": 9.643957580759841e-06, "loss": 0.5957, "step": 4832 }, { "epoch": 0.53, "learning_rate": 9.64043392082853e-06, "loss": 0.6064, "step": 4833 }, { "epoch": 0.53, "learning_rate": 9.63691030559882e-06, "loss": 0.6633, "step": 4834 }, { "epoch": 0.53, "learning_rate": 9.633386735508766e-06, "loss": 0.7554, "step": 4835 }, { "epoch": 0.53, "learning_rate": 9.62986321099642e-06, "loss": 0.6355, "step": 4836 }, { "epoch": 0.53, "learning_rate": 9.626339732499835e-06, "loss": 0.6328, "step": 4837 }, { "epoch": 0.53, "learning_rate": 9.622816300457051e-06, "loss": 0.7158, "step": 4838 }, { "epoch": 0.53, "learning_rate": 9.619292915306103e-06, "loss": 0.7021, "step": 4839 }, { "epoch": 0.53, "learning_rate": 9.615769577485024e-06, "loss": 0.7983, "step": 4840 }, { "epoch": 0.53, "learning_rate": 9.612246287431832e-06, "loss": 0.7788, "step": 4841 }, { "epoch": 0.53, "learning_rate": 9.608723045584557e-06, "loss": 0.6548, "step": 4842 }, { "epoch": 0.53, "learning_rate": 9.605199852381206e-06, "loss": 0.7651, "step": 4843 }, { "epoch": 0.53, "learning_rate": 9.601676708259785e-06, "loss": 0.7283, "step": 4844 }, { "epoch": 0.53, "learning_rate": 9.598153613658295e-06, "loss": 0.7769, "step": 4845 }, { "epoch": 0.53, "learning_rate": 9.594630569014733e-06, "loss": 0.6357, "step": 4846 }, { "epoch": 0.53, "learning_rate": 9.59110757476708e-06, "loss": 0.7393, "step": 4847 }, { "epoch": 0.53, "learning_rate": 9.58758463135333e-06, "loss": 0.6968, "step": 4848 }, { "epoch": 0.53, "learning_rate": 9.584061739211449e-06, "loss": 0.6428, "step": 4849 }, { "epoch": 0.53, "learning_rate": 9.580538898779406e-06, "loss": 0.7036, "step": 4850 }, { "epoch": 0.53, "learning_rate": 9.57701611049517e-06, "loss": 0.6562, "step": 4851 }, { "epoch": 0.53, "learning_rate": 9.573493374796694e-06, "loss": 0.7048, "step": 4852 }, { "epoch": 0.53, "learning_rate": 9.569970692121929e-06, "loss": 0.6855, "step": 4853 }, { "epoch": 0.53, "learning_rate": 9.566448062908819e-06, "loss": 0.6345, "step": 4854 }, { "epoch": 0.53, "learning_rate": 9.562925487595297e-06, "loss": 0.6846, "step": 4855 }, { "epoch": 0.53, "learning_rate": 9.559402966619296e-06, "loss": 0.708, "step": 4856 }, { "epoch": 0.53, "learning_rate": 9.555880500418739e-06, "loss": 0.657, "step": 4857 }, { "epoch": 0.53, "learning_rate": 9.55235808943154e-06, "loss": 0.738, "step": 4858 }, { "epoch": 0.53, "learning_rate": 9.548835734095613e-06, "loss": 0.7656, "step": 4859 }, { "epoch": 0.53, "learning_rate": 9.545313434848857e-06, "loss": 0.7183, "step": 4860 }, { "epoch": 0.53, "learning_rate": 9.541791192129164e-06, "loss": 0.731, "step": 4861 }, { "epoch": 0.53, "learning_rate": 9.538269006374431e-06, "loss": 0.7419, "step": 4862 }, { "epoch": 0.53, "learning_rate": 9.534746878022533e-06, "loss": 0.6282, "step": 4863 }, { "epoch": 0.53, "learning_rate": 9.53122480751135e-06, "loss": 0.717, "step": 4864 }, { "epoch": 0.53, "learning_rate": 9.527702795278745e-06, "loss": 0.6421, "step": 4865 }, { "epoch": 0.53, "learning_rate": 9.524180841762577e-06, "loss": 0.6685, "step": 4866 }, { "epoch": 0.53, "learning_rate": 9.520658947400704e-06, "loss": 0.6455, "step": 4867 }, { "epoch": 0.53, "learning_rate": 9.517137112630966e-06, "loss": 0.7891, "step": 4868 }, { "epoch": 0.53, "learning_rate": 9.513615337891201e-06, "loss": 0.7109, "step": 4869 }, { "epoch": 0.53, "learning_rate": 9.510093623619242e-06, "loss": 0.7305, "step": 4870 }, { "epoch": 0.53, "learning_rate": 9.50657197025291e-06, "loss": 0.7668, "step": 4871 }, { "epoch": 0.53, "learning_rate": 9.503050378230024e-06, "loss": 0.8081, "step": 4872 }, { "epoch": 0.53, "learning_rate": 9.499528847988388e-06, "loss": 0.7056, "step": 4873 }, { "epoch": 0.53, "learning_rate": 9.496007379965801e-06, "loss": 0.749, "step": 4874 }, { "epoch": 0.53, "learning_rate": 9.49248597460006e-06, "loss": 0.7009, "step": 4875 }, { "epoch": 0.53, "learning_rate": 9.488964632328945e-06, "loss": 0.8169, "step": 4876 }, { "epoch": 0.53, "learning_rate": 9.485443353590233e-06, "loss": 0.7209, "step": 4877 }, { "epoch": 0.53, "learning_rate": 9.481922138821697e-06, "loss": 0.6838, "step": 4878 }, { "epoch": 0.53, "learning_rate": 9.478400988461094e-06, "loss": 0.8076, "step": 4879 }, { "epoch": 0.53, "learning_rate": 9.474879902946174e-06, "loss": 0.7708, "step": 4880 }, { "epoch": 0.53, "learning_rate": 9.471358882714687e-06, "loss": 0.7542, "step": 4881 }, { "epoch": 0.53, "learning_rate": 9.46783792820437e-06, "loss": 0.6982, "step": 4882 }, { "epoch": 0.53, "learning_rate": 9.464317039852948e-06, "loss": 0.7129, "step": 4883 }, { "epoch": 0.53, "learning_rate": 9.460796218098143e-06, "loss": 0.7366, "step": 4884 }, { "epoch": 0.53, "learning_rate": 9.457275463377665e-06, "loss": 0.7188, "step": 4885 }, { "epoch": 0.53, "learning_rate": 9.453754776129219e-06, "loss": 0.7705, "step": 4886 }, { "epoch": 0.53, "learning_rate": 9.450234156790502e-06, "loss": 0.7544, "step": 4887 }, { "epoch": 0.53, "learning_rate": 9.446713605799197e-06, "loss": 0.7263, "step": 4888 }, { "epoch": 0.53, "learning_rate": 9.443193123592983e-06, "loss": 0.7466, "step": 4889 }, { "epoch": 0.53, "learning_rate": 9.439672710609532e-06, "loss": 0.6863, "step": 4890 }, { "epoch": 0.53, "learning_rate": 9.436152367286505e-06, "loss": 0.7346, "step": 4891 }, { "epoch": 0.53, "learning_rate": 9.432632094061555e-06, "loss": 0.7759, "step": 4892 }, { "epoch": 0.53, "learning_rate": 9.42911189137232e-06, "loss": 0.6528, "step": 4893 }, { "epoch": 0.53, "learning_rate": 9.425591759656442e-06, "loss": 0.7603, "step": 4894 }, { "epoch": 0.53, "learning_rate": 9.422071699351545e-06, "loss": 0.7031, "step": 4895 }, { "epoch": 0.53, "learning_rate": 9.418551710895243e-06, "loss": 0.6616, "step": 4896 }, { "epoch": 0.53, "learning_rate": 9.41503179472515e-06, "loss": 0.6721, "step": 4897 }, { "epoch": 0.53, "learning_rate": 9.41151195127886e-06, "loss": 0.6843, "step": 4898 }, { "epoch": 0.53, "learning_rate": 9.407992180993961e-06, "loss": 0.8062, "step": 4899 }, { "epoch": 0.53, "learning_rate": 9.404472484308045e-06, "loss": 0.5854, "step": 4900 }, { "epoch": 0.53, "learning_rate": 9.400952861658674e-06, "loss": 0.7026, "step": 4901 }, { "epoch": 0.53, "learning_rate": 9.397433313483417e-06, "loss": 0.7205, "step": 4902 }, { "epoch": 0.53, "learning_rate": 9.393913840219825e-06, "loss": 0.7119, "step": 4903 }, { "epoch": 0.53, "learning_rate": 9.39039444230544e-06, "loss": 0.6924, "step": 4904 }, { "epoch": 0.53, "learning_rate": 9.386875120177802e-06, "loss": 0.6226, "step": 4905 }, { "epoch": 0.53, "learning_rate": 9.383355874274434e-06, "loss": 0.6562, "step": 4906 }, { "epoch": 0.53, "learning_rate": 9.379836705032849e-06, "loss": 0.7227, "step": 4907 }, { "epoch": 0.53, "learning_rate": 9.376317612890557e-06, "loss": 0.6663, "step": 4908 }, { "epoch": 0.53, "learning_rate": 9.372798598285052e-06, "loss": 0.6909, "step": 4909 }, { "epoch": 0.53, "learning_rate": 9.369279661653826e-06, "loss": 0.7163, "step": 4910 }, { "epoch": 0.53, "learning_rate": 9.365760803434356e-06, "loss": 0.7246, "step": 4911 }, { "epoch": 0.53, "learning_rate": 9.362242024064106e-06, "loss": 0.7886, "step": 4912 }, { "epoch": 0.53, "learning_rate": 9.358723323980535e-06, "loss": 0.6848, "step": 4913 }, { "epoch": 0.53, "learning_rate": 9.355204703621093e-06, "loss": 0.7014, "step": 4914 }, { "epoch": 0.54, "learning_rate": 9.351686163423215e-06, "loss": 0.6636, "step": 4915 }, { "epoch": 0.54, "learning_rate": 9.348167703824334e-06, "loss": 0.6943, "step": 4916 }, { "epoch": 0.54, "learning_rate": 9.344649325261866e-06, "loss": 0.7627, "step": 4917 }, { "epoch": 0.54, "learning_rate": 9.341131028173215e-06, "loss": 0.7183, "step": 4918 }, { "epoch": 0.54, "learning_rate": 9.337612812995787e-06, "loss": 0.71, "step": 4919 }, { "epoch": 0.54, "learning_rate": 9.334094680166962e-06, "loss": 0.8208, "step": 4920 }, { "epoch": 0.54, "learning_rate": 9.330576630124124e-06, "loss": 0.8232, "step": 4921 }, { "epoch": 0.54, "learning_rate": 9.32705866330464e-06, "loss": 0.6013, "step": 4922 }, { "epoch": 0.54, "learning_rate": 9.323540780145858e-06, "loss": 0.7939, "step": 4923 }, { "epoch": 0.54, "learning_rate": 9.320022981085138e-06, "loss": 0.7251, "step": 4924 }, { "epoch": 0.54, "learning_rate": 9.316505266559808e-06, "loss": 0.6201, "step": 4925 }, { "epoch": 0.54, "learning_rate": 9.312987637007191e-06, "loss": 0.731, "step": 4926 }, { "epoch": 0.54, "learning_rate": 9.309470092864609e-06, "loss": 0.7214, "step": 4927 }, { "epoch": 0.54, "learning_rate": 9.305952634569361e-06, "loss": 0.761, "step": 4928 }, { "epoch": 0.54, "learning_rate": 9.302435262558748e-06, "loss": 0.7651, "step": 4929 }, { "epoch": 0.54, "learning_rate": 9.298917977270046e-06, "loss": 0.7383, "step": 4930 }, { "epoch": 0.54, "learning_rate": 9.295400779140528e-06, "loss": 0.7634, "step": 4931 }, { "epoch": 0.54, "learning_rate": 9.291883668607461e-06, "loss": 0.769, "step": 4932 }, { "epoch": 0.54, "learning_rate": 9.28836664610809e-06, "loss": 0.6943, "step": 4933 }, { "epoch": 0.54, "learning_rate": 9.284849712079654e-06, "loss": 0.7188, "step": 4934 }, { "epoch": 0.54, "learning_rate": 9.281332866959387e-06, "loss": 0.7124, "step": 4935 }, { "epoch": 0.54, "learning_rate": 9.277816111184504e-06, "loss": 0.7039, "step": 4936 }, { "epoch": 0.54, "learning_rate": 9.274299445192204e-06, "loss": 0.748, "step": 4937 }, { "epoch": 0.54, "learning_rate": 9.270782869419694e-06, "loss": 0.6045, "step": 4938 }, { "epoch": 0.54, "learning_rate": 9.267266384304153e-06, "loss": 0.6702, "step": 4939 }, { "epoch": 0.54, "learning_rate": 9.263749990282753e-06, "loss": 0.6863, "step": 4940 }, { "epoch": 0.54, "learning_rate": 9.260233687792657e-06, "loss": 0.6748, "step": 4941 }, { "epoch": 0.54, "learning_rate": 9.256717477271015e-06, "loss": 0.7563, "step": 4942 }, { "epoch": 0.54, "learning_rate": 9.253201359154964e-06, "loss": 0.6897, "step": 4943 }, { "epoch": 0.54, "learning_rate": 9.249685333881634e-06, "loss": 0.6643, "step": 4944 }, { "epoch": 0.54, "learning_rate": 9.246169401888136e-06, "loss": 0.6992, "step": 4945 }, { "epoch": 0.54, "learning_rate": 9.24265356361158e-06, "loss": 0.7729, "step": 4946 }, { "epoch": 0.54, "learning_rate": 9.239137819489047e-06, "loss": 0.6125, "step": 4947 }, { "epoch": 0.54, "learning_rate": 9.235622169957634e-06, "loss": 0.7014, "step": 4948 }, { "epoch": 0.54, "learning_rate": 9.232106615454401e-06, "loss": 0.6577, "step": 4949 }, { "epoch": 0.54, "learning_rate": 9.228591156416405e-06, "loss": 0.6755, "step": 4950 }, { "epoch": 0.54, "learning_rate": 9.225075793280693e-06, "loss": 0.6875, "step": 4951 }, { "epoch": 0.54, "learning_rate": 9.221560526484296e-06, "loss": 0.6833, "step": 4952 }, { "epoch": 0.54, "learning_rate": 9.218045356464236e-06, "loss": 0.6895, "step": 4953 }, { "epoch": 0.54, "learning_rate": 9.214530283657524e-06, "loss": 0.6257, "step": 4954 }, { "epoch": 0.54, "learning_rate": 9.211015308501158e-06, "loss": 0.7061, "step": 4955 }, { "epoch": 0.54, "learning_rate": 9.207500431432115e-06, "loss": 0.6733, "step": 4956 }, { "epoch": 0.54, "learning_rate": 9.20398565288738e-06, "loss": 0.6426, "step": 4957 }, { "epoch": 0.54, "learning_rate": 9.200470973303905e-06, "loss": 0.6697, "step": 4958 }, { "epoch": 0.54, "learning_rate": 9.196956393118643e-06, "loss": 0.707, "step": 4959 }, { "epoch": 0.54, "learning_rate": 9.193441912768528e-06, "loss": 0.6992, "step": 4960 }, { "epoch": 0.54, "learning_rate": 9.189927532690481e-06, "loss": 0.7285, "step": 4961 }, { "epoch": 0.54, "learning_rate": 9.18641325332142e-06, "loss": 0.7324, "step": 4962 }, { "epoch": 0.54, "learning_rate": 9.182899075098236e-06, "loss": 0.7407, "step": 4963 }, { "epoch": 0.54, "learning_rate": 9.179384998457818e-06, "loss": 0.7629, "step": 4964 }, { "epoch": 0.54, "learning_rate": 9.175871023837042e-06, "loss": 0.6594, "step": 4965 }, { "epoch": 0.54, "learning_rate": 9.17235715167276e-06, "loss": 0.5859, "step": 4966 }, { "epoch": 0.54, "learning_rate": 9.168843382401832e-06, "loss": 0.7288, "step": 4967 }, { "epoch": 0.54, "learning_rate": 9.165329716461088e-06, "loss": 0.7354, "step": 4968 }, { "epoch": 0.54, "learning_rate": 9.161816154287346e-06, "loss": 0.7102, "step": 4969 }, { "epoch": 0.54, "learning_rate": 9.158302696317421e-06, "loss": 0.7144, "step": 4970 }, { "epoch": 0.54, "learning_rate": 9.154789342988108e-06, "loss": 0.6699, "step": 4971 }, { "epoch": 0.54, "learning_rate": 9.15127609473619e-06, "loss": 0.6958, "step": 4972 }, { "epoch": 0.54, "learning_rate": 9.147762951998436e-06, "loss": 0.6946, "step": 4973 }, { "epoch": 0.54, "learning_rate": 9.144249915211605e-06, "loss": 0.6814, "step": 4974 }, { "epoch": 0.54, "learning_rate": 9.140736984812437e-06, "loss": 0.6709, "step": 4975 }, { "epoch": 0.54, "learning_rate": 9.137224161237672e-06, "loss": 0.7017, "step": 4976 }, { "epoch": 0.54, "learning_rate": 9.133711444924019e-06, "loss": 0.7188, "step": 4977 }, { "epoch": 0.54, "learning_rate": 9.130198836308186e-06, "loss": 0.7612, "step": 4978 }, { "epoch": 0.54, "learning_rate": 9.126686335826865e-06, "loss": 0.7383, "step": 4979 }, { "epoch": 0.54, "learning_rate": 9.123173943916729e-06, "loss": 0.7451, "step": 4980 }, { "epoch": 0.54, "learning_rate": 9.119661661014446e-06, "loss": 0.7166, "step": 4981 }, { "epoch": 0.54, "learning_rate": 9.116149487556665e-06, "loss": 0.729, "step": 4982 }, { "epoch": 0.54, "learning_rate": 9.11263742398002e-06, "loss": 0.7646, "step": 4983 }, { "epoch": 0.54, "learning_rate": 9.109125470721141e-06, "loss": 0.7129, "step": 4984 }, { "epoch": 0.54, "learning_rate": 9.105613628216626e-06, "loss": 0.6946, "step": 4985 }, { "epoch": 0.54, "learning_rate": 9.102101896903084e-06, "loss": 0.6816, "step": 4986 }, { "epoch": 0.54, "learning_rate": 9.09859027721709e-06, "loss": 0.8213, "step": 4987 }, { "epoch": 0.54, "learning_rate": 9.09507876959521e-06, "loss": 0.6985, "step": 4988 }, { "epoch": 0.54, "learning_rate": 9.091567374474002e-06, "loss": 0.6941, "step": 4989 }, { "epoch": 0.54, "learning_rate": 9.088056092290004e-06, "loss": 0.7856, "step": 4990 }, { "epoch": 0.54, "learning_rate": 9.08454492347974e-06, "loss": 0.7874, "step": 4991 }, { "epoch": 0.54, "learning_rate": 9.081033868479727e-06, "loss": 0.72, "step": 4992 }, { "epoch": 0.54, "learning_rate": 9.07752292772646e-06, "loss": 0.8486, "step": 4993 }, { "epoch": 0.54, "learning_rate": 9.074012101656418e-06, "loss": 0.709, "step": 4994 }, { "epoch": 0.54, "learning_rate": 9.07050139070608e-06, "loss": 0.7837, "step": 4995 }, { "epoch": 0.54, "learning_rate": 9.066990795311891e-06, "loss": 0.7466, "step": 4996 }, { "epoch": 0.54, "learning_rate": 9.0634803159103e-06, "loss": 0.6768, "step": 4997 }, { "epoch": 0.54, "learning_rate": 9.059969952937727e-06, "loss": 0.7441, "step": 4998 }, { "epoch": 0.54, "learning_rate": 9.056459706830587e-06, "loss": 0.7397, "step": 4999 }, { "epoch": 0.54, "learning_rate": 9.052949578025275e-06, "loss": 0.595, "step": 5000 }, { "epoch": 0.54, "learning_rate": 9.049439566958176e-06, "loss": 0.7866, "step": 5001 }, { "epoch": 0.54, "learning_rate": 9.045929674065655e-06, "loss": 0.6687, "step": 5002 }, { "epoch": 0.54, "learning_rate": 9.042419899784067e-06, "loss": 0.6426, "step": 5003 }, { "epoch": 0.54, "learning_rate": 9.038910244549748e-06, "loss": 0.7109, "step": 5004 }, { "epoch": 0.54, "learning_rate": 9.035400708799027e-06, "loss": 0.6128, "step": 5005 }, { "epoch": 0.54, "learning_rate": 9.03189129296821e-06, "loss": 0.7266, "step": 5006 }, { "epoch": 0.55, "learning_rate": 9.02838199749359e-06, "loss": 0.7183, "step": 5007 }, { "epoch": 0.55, "learning_rate": 9.024872822811446e-06, "loss": 0.6531, "step": 5008 }, { "epoch": 0.55, "learning_rate": 9.021363769358044e-06, "loss": 0.731, "step": 5009 }, { "epoch": 0.55, "learning_rate": 9.017854837569629e-06, "loss": 0.7891, "step": 5010 }, { "epoch": 0.55, "learning_rate": 9.01434602788244e-06, "loss": 0.7285, "step": 5011 }, { "epoch": 0.55, "learning_rate": 9.010837340732693e-06, "loss": 0.78, "step": 5012 }, { "epoch": 0.55, "learning_rate": 9.007328776556592e-06, "loss": 0.7434, "step": 5013 }, { "epoch": 0.55, "learning_rate": 9.003820335790316e-06, "loss": 0.7124, "step": 5014 }, { "epoch": 0.55, "learning_rate": 9.000312018870051e-06, "loss": 0.7383, "step": 5015 }, { "epoch": 0.55, "learning_rate": 8.99680382623195e-06, "loss": 0.7168, "step": 5016 }, { "epoch": 0.55, "learning_rate": 8.993295758312155e-06, "loss": 0.6714, "step": 5017 }, { "epoch": 0.55, "learning_rate": 8.989787815546789e-06, "loss": 0.6763, "step": 5018 }, { "epoch": 0.55, "learning_rate": 8.986279998371968e-06, "loss": 0.7222, "step": 5019 }, { "epoch": 0.55, "learning_rate": 8.982772307223783e-06, "loss": 0.7075, "step": 5020 }, { "epoch": 0.55, "learning_rate": 8.979264742538313e-06, "loss": 0.7837, "step": 5021 }, { "epoch": 0.55, "learning_rate": 8.975757304751626e-06, "loss": 0.6475, "step": 5022 }, { "epoch": 0.55, "learning_rate": 8.972249994299763e-06, "loss": 0.624, "step": 5023 }, { "epoch": 0.55, "learning_rate": 8.968742811618767e-06, "loss": 0.666, "step": 5024 }, { "epoch": 0.55, "learning_rate": 8.965235757144645e-06, "loss": 0.6187, "step": 5025 }, { "epoch": 0.55, "learning_rate": 8.9617288313134e-06, "loss": 0.7053, "step": 5026 }, { "epoch": 0.55, "learning_rate": 8.958222034561018e-06, "loss": 0.6963, "step": 5027 }, { "epoch": 0.55, "learning_rate": 8.954715367323468e-06, "loss": 0.6641, "step": 5028 }, { "epoch": 0.55, "learning_rate": 8.951208830036696e-06, "loss": 0.7354, "step": 5029 }, { "epoch": 0.55, "learning_rate": 8.947702423136647e-06, "loss": 0.6675, "step": 5030 }, { "epoch": 0.55, "learning_rate": 8.944196147059233e-06, "loss": 0.7041, "step": 5031 }, { "epoch": 0.55, "learning_rate": 8.940690002240365e-06, "loss": 0.7029, "step": 5032 }, { "epoch": 0.55, "learning_rate": 8.937183989115919e-06, "loss": 0.7266, "step": 5033 }, { "epoch": 0.55, "learning_rate": 8.933678108121776e-06, "loss": 0.7341, "step": 5034 }, { "epoch": 0.55, "learning_rate": 8.930172359693788e-06, "loss": 0.728, "step": 5035 }, { "epoch": 0.55, "learning_rate": 8.926666744267794e-06, "loss": 0.6653, "step": 5036 }, { "epoch": 0.55, "learning_rate": 8.923161262279611e-06, "loss": 0.8442, "step": 5037 }, { "epoch": 0.55, "learning_rate": 8.919655914165049e-06, "loss": 0.8311, "step": 5038 }, { "epoch": 0.55, "learning_rate": 8.916150700359896e-06, "loss": 0.7275, "step": 5039 }, { "epoch": 0.55, "learning_rate": 8.912645621299919e-06, "loss": 0.7041, "step": 5040 }, { "epoch": 0.55, "learning_rate": 8.909140677420875e-06, "loss": 0.7766, "step": 5041 }, { "epoch": 0.55, "learning_rate": 8.905635869158499e-06, "loss": 0.7644, "step": 5042 }, { "epoch": 0.55, "learning_rate": 8.902131196948518e-06, "loss": 0.6365, "step": 5043 }, { "epoch": 0.55, "learning_rate": 8.898626661226637e-06, "loss": 0.7754, "step": 5044 }, { "epoch": 0.55, "learning_rate": 8.895122262428536e-06, "loss": 0.7324, "step": 5045 }, { "epoch": 0.55, "learning_rate": 8.89161800098989e-06, "loss": 0.7773, "step": 5046 }, { "epoch": 0.55, "learning_rate": 8.888113877346353e-06, "loss": 0.7026, "step": 5047 }, { "epoch": 0.55, "learning_rate": 8.884609891933557e-06, "loss": 0.7314, "step": 5048 }, { "epoch": 0.55, "learning_rate": 8.881106045187124e-06, "loss": 0.7563, "step": 5049 }, { "epoch": 0.55, "learning_rate": 8.877602337542655e-06, "loss": 0.6919, "step": 5050 }, { "epoch": 0.55, "learning_rate": 8.874098769435734e-06, "loss": 0.7661, "step": 5051 }, { "epoch": 0.55, "learning_rate": 8.870595341301922e-06, "loss": 0.7407, "step": 5052 }, { "epoch": 0.55, "learning_rate": 8.867092053576777e-06, "loss": 0.6748, "step": 5053 }, { "epoch": 0.55, "learning_rate": 8.86358890669583e-06, "loss": 0.7556, "step": 5054 }, { "epoch": 0.55, "learning_rate": 8.860085901094595e-06, "loss": 0.7261, "step": 5055 }, { "epoch": 0.55, "learning_rate": 8.856583037208566e-06, "loss": 0.8086, "step": 5056 }, { "epoch": 0.55, "learning_rate": 8.853080315473225e-06, "loss": 0.7148, "step": 5057 }, { "epoch": 0.55, "learning_rate": 8.849577736324033e-06, "loss": 0.5898, "step": 5058 }, { "epoch": 0.55, "learning_rate": 8.846075300196435e-06, "loss": 0.772, "step": 5059 }, { "epoch": 0.55, "learning_rate": 8.842573007525852e-06, "loss": 0.7744, "step": 5060 }, { "epoch": 0.55, "learning_rate": 8.839070858747697e-06, "loss": 0.6812, "step": 5061 }, { "epoch": 0.55, "learning_rate": 8.835568854297362e-06, "loss": 0.6133, "step": 5062 }, { "epoch": 0.55, "learning_rate": 8.832066994610219e-06, "loss": 0.7073, "step": 5063 }, { "epoch": 0.55, "learning_rate": 8.828565280121619e-06, "loss": 0.6826, "step": 5064 }, { "epoch": 0.55, "learning_rate": 8.825063711266902e-06, "loss": 0.7307, "step": 5065 }, { "epoch": 0.55, "learning_rate": 8.821562288481383e-06, "loss": 0.7134, "step": 5066 }, { "epoch": 0.55, "learning_rate": 8.818061012200364e-06, "loss": 0.6265, "step": 5067 }, { "epoch": 0.55, "learning_rate": 8.814559882859129e-06, "loss": 0.7761, "step": 5068 }, { "epoch": 0.55, "learning_rate": 8.81105890089294e-06, "loss": 0.7739, "step": 5069 }, { "epoch": 0.55, "learning_rate": 8.807558066737042e-06, "loss": 0.7224, "step": 5070 }, { "epoch": 0.55, "learning_rate": 8.804057380826659e-06, "loss": 0.6509, "step": 5071 }, { "epoch": 0.55, "learning_rate": 8.800556843597002e-06, "loss": 0.7002, "step": 5072 }, { "epoch": 0.55, "learning_rate": 8.797056455483267e-06, "loss": 0.6313, "step": 5073 }, { "epoch": 0.55, "learning_rate": 8.79355621692062e-06, "loss": 0.7288, "step": 5074 }, { "epoch": 0.55, "learning_rate": 8.790056128344211e-06, "loss": 0.7256, "step": 5075 }, { "epoch": 0.55, "learning_rate": 8.786556190189183e-06, "loss": 0.6953, "step": 5076 }, { "epoch": 0.55, "learning_rate": 8.783056402890644e-06, "loss": 0.6299, "step": 5077 }, { "epoch": 0.55, "learning_rate": 8.779556766883694e-06, "loss": 0.5984, "step": 5078 }, { "epoch": 0.55, "learning_rate": 8.77605728260341e-06, "loss": 0.6238, "step": 5079 }, { "epoch": 0.55, "learning_rate": 8.772557950484847e-06, "loss": 0.7485, "step": 5080 }, { "epoch": 0.55, "learning_rate": 8.769058770963057e-06, "loss": 0.6812, "step": 5081 }, { "epoch": 0.55, "learning_rate": 8.765559744473054e-06, "loss": 0.801, "step": 5082 }, { "epoch": 0.55, "learning_rate": 8.762060871449838e-06, "loss": 0.6665, "step": 5083 }, { "epoch": 0.55, "learning_rate": 8.758562152328397e-06, "loss": 0.7305, "step": 5084 }, { "epoch": 0.55, "learning_rate": 8.755063587543693e-06, "loss": 0.7651, "step": 5085 }, { "epoch": 0.55, "learning_rate": 8.751565177530669e-06, "loss": 0.7422, "step": 5086 }, { "epoch": 0.55, "learning_rate": 8.748066922724256e-06, "loss": 0.7476, "step": 5087 }, { "epoch": 0.55, "learning_rate": 8.744568823559357e-06, "loss": 0.7861, "step": 5088 }, { "epoch": 0.55, "learning_rate": 8.741070880470857e-06, "loss": 0.8176, "step": 5089 }, { "epoch": 0.55, "learning_rate": 8.737573093893623e-06, "loss": 0.7778, "step": 5090 }, { "epoch": 0.55, "learning_rate": 8.734075464262507e-06, "loss": 0.6533, "step": 5091 }, { "epoch": 0.55, "learning_rate": 8.73057799201234e-06, "loss": 0.7251, "step": 5092 }, { "epoch": 0.55, "learning_rate": 8.727080677577926e-06, "loss": 0.7512, "step": 5093 }, { "epoch": 0.55, "learning_rate": 8.723583521394054e-06, "loss": 0.7009, "step": 5094 }, { "epoch": 0.55, "learning_rate": 8.720086523895499e-06, "loss": 0.7559, "step": 5095 }, { "epoch": 0.55, "learning_rate": 8.716589685517007e-06, "loss": 0.6526, "step": 5096 }, { "epoch": 0.55, "learning_rate": 8.71309300669331e-06, "loss": 0.5361, "step": 5097 }, { "epoch": 0.55, "learning_rate": 8.709596487859115e-06, "loss": 0.6619, "step": 5098 }, { "epoch": 0.56, "learning_rate": 8.706100129449118e-06, "loss": 0.7144, "step": 5099 }, { "epoch": 0.56, "learning_rate": 8.702603931897983e-06, "loss": 0.7539, "step": 5100 }, { "epoch": 0.56, "learning_rate": 8.699107895640367e-06, "loss": 0.7322, "step": 5101 }, { "epoch": 0.56, "learning_rate": 8.695612021110897e-06, "loss": 0.6758, "step": 5102 }, { "epoch": 0.56, "learning_rate": 8.692116308744187e-06, "loss": 0.7827, "step": 5103 }, { "epoch": 0.56, "learning_rate": 8.688620758974823e-06, "loss": 0.8511, "step": 5104 }, { "epoch": 0.56, "learning_rate": 8.685125372237374e-06, "loss": 0.7466, "step": 5105 }, { "epoch": 0.56, "learning_rate": 8.681630148966397e-06, "loss": 0.6941, "step": 5106 }, { "epoch": 0.56, "learning_rate": 8.678135089596418e-06, "loss": 0.7178, "step": 5107 }, { "epoch": 0.56, "learning_rate": 8.674640194561944e-06, "loss": 0.6792, "step": 5108 }, { "epoch": 0.56, "learning_rate": 8.67114546429746e-06, "loss": 0.6523, "step": 5109 }, { "epoch": 0.56, "learning_rate": 8.667650899237443e-06, "loss": 0.7229, "step": 5110 }, { "epoch": 0.56, "learning_rate": 8.664156499816336e-06, "loss": 0.7395, "step": 5111 }, { "epoch": 0.56, "learning_rate": 8.660662266468569e-06, "loss": 0.7622, "step": 5112 }, { "epoch": 0.56, "learning_rate": 8.657168199628544e-06, "loss": 0.7529, "step": 5113 }, { "epoch": 0.56, "learning_rate": 8.65367429973065e-06, "loss": 0.6685, "step": 5114 }, { "epoch": 0.56, "learning_rate": 8.650180567209253e-06, "loss": 0.6975, "step": 5115 }, { "epoch": 0.56, "learning_rate": 8.646687002498692e-06, "loss": 0.7329, "step": 5116 }, { "epoch": 0.56, "learning_rate": 8.643193606033293e-06, "loss": 0.6633, "step": 5117 }, { "epoch": 0.56, "learning_rate": 8.639700378247362e-06, "loss": 0.7056, "step": 5118 }, { "epoch": 0.56, "learning_rate": 8.636207319575171e-06, "loss": 0.7104, "step": 5119 }, { "epoch": 0.56, "learning_rate": 8.632714430450993e-06, "loss": 0.7185, "step": 5120 }, { "epoch": 0.56, "learning_rate": 8.629221711309056e-06, "loss": 0.7446, "step": 5121 }, { "epoch": 0.56, "learning_rate": 8.625729162583587e-06, "loss": 0.7456, "step": 5122 }, { "epoch": 0.56, "learning_rate": 8.622236784708778e-06, "loss": 0.6853, "step": 5123 }, { "epoch": 0.56, "learning_rate": 8.618744578118806e-06, "loss": 0.7837, "step": 5124 }, { "epoch": 0.56, "learning_rate": 8.615252543247826e-06, "loss": 0.6904, "step": 5125 }, { "epoch": 0.56, "learning_rate": 8.61176068052997e-06, "loss": 0.8472, "step": 5126 }, { "epoch": 0.56, "learning_rate": 8.60826899039935e-06, "loss": 0.7241, "step": 5127 }, { "epoch": 0.56, "learning_rate": 8.604777473290052e-06, "loss": 0.7644, "step": 5128 }, { "epoch": 0.56, "learning_rate": 8.60128612963615e-06, "loss": 0.7573, "step": 5129 }, { "epoch": 0.56, "learning_rate": 8.597794959871694e-06, "loss": 0.6362, "step": 5130 }, { "epoch": 0.56, "learning_rate": 8.594303964430706e-06, "loss": 0.7156, "step": 5131 }, { "epoch": 0.56, "learning_rate": 8.590813143747188e-06, "loss": 0.8022, "step": 5132 }, { "epoch": 0.56, "learning_rate": 8.587322498255124e-06, "loss": 0.6318, "step": 5133 }, { "epoch": 0.56, "learning_rate": 8.583832028388475e-06, "loss": 0.7368, "step": 5134 }, { "epoch": 0.56, "learning_rate": 8.580341734581179e-06, "loss": 0.7695, "step": 5135 }, { "epoch": 0.56, "learning_rate": 8.576851617267151e-06, "loss": 0.7993, "step": 5136 }, { "epoch": 0.56, "learning_rate": 8.573361676880288e-06, "loss": 0.6907, "step": 5137 }, { "epoch": 0.56, "learning_rate": 8.569871913854458e-06, "loss": 0.7117, "step": 5138 }, { "epoch": 0.56, "learning_rate": 8.566382328623519e-06, "loss": 0.6772, "step": 5139 }, { "epoch": 0.56, "learning_rate": 8.562892921621295e-06, "loss": 0.7793, "step": 5140 }, { "epoch": 0.56, "learning_rate": 8.559403693281596e-06, "loss": 0.7322, "step": 5141 }, { "epoch": 0.56, "learning_rate": 8.555914644038202e-06, "loss": 0.6899, "step": 5142 }, { "epoch": 0.56, "learning_rate": 8.552425774324875e-06, "loss": 0.7373, "step": 5143 }, { "epoch": 0.56, "learning_rate": 8.548937084575359e-06, "loss": 0.7227, "step": 5144 }, { "epoch": 0.56, "learning_rate": 8.545448575223369e-06, "loss": 0.6914, "step": 5145 }, { "epoch": 0.56, "learning_rate": 8.541960246702597e-06, "loss": 0.7412, "step": 5146 }, { "epoch": 0.56, "learning_rate": 8.538472099446714e-06, "loss": 0.7039, "step": 5147 }, { "epoch": 0.56, "learning_rate": 8.534984133889377e-06, "loss": 0.8398, "step": 5148 }, { "epoch": 0.56, "learning_rate": 8.53149635046421e-06, "loss": 0.731, "step": 5149 }, { "epoch": 0.56, "learning_rate": 8.52800874960482e-06, "loss": 0.7192, "step": 5150 }, { "epoch": 0.56, "learning_rate": 8.52452133174478e-06, "loss": 0.7317, "step": 5151 }, { "epoch": 0.56, "learning_rate": 8.52103409731766e-06, "loss": 0.7466, "step": 5152 }, { "epoch": 0.56, "learning_rate": 8.517547046756989e-06, "loss": 0.7534, "step": 5153 }, { "epoch": 0.56, "learning_rate": 8.514060180496285e-06, "loss": 0.7092, "step": 5154 }, { "epoch": 0.56, "learning_rate": 8.510573498969034e-06, "loss": 0.7441, "step": 5155 }, { "epoch": 0.56, "learning_rate": 8.507087002608707e-06, "loss": 0.7512, "step": 5156 }, { "epoch": 0.56, "learning_rate": 8.503600691848743e-06, "loss": 0.6311, "step": 5157 }, { "epoch": 0.56, "learning_rate": 8.500114567122575e-06, "loss": 0.7126, "step": 5158 }, { "epoch": 0.56, "learning_rate": 8.49662862886359e-06, "loss": 0.6123, "step": 5159 }, { "epoch": 0.56, "learning_rate": 8.49314287750517e-06, "loss": 0.6548, "step": 5160 }, { "epoch": 0.56, "learning_rate": 8.489657313480663e-06, "loss": 0.7544, "step": 5161 }, { "epoch": 0.56, "learning_rate": 8.4861719372234e-06, "loss": 0.7354, "step": 5162 }, { "epoch": 0.56, "learning_rate": 8.482686749166685e-06, "loss": 0.7993, "step": 5163 }, { "epoch": 0.56, "learning_rate": 8.479201749743801e-06, "loss": 0.7744, "step": 5164 }, { "epoch": 0.56, "learning_rate": 8.475716939388007e-06, "loss": 0.6267, "step": 5165 }, { "epoch": 0.56, "learning_rate": 8.472232318532531e-06, "loss": 0.6523, "step": 5166 }, { "epoch": 0.56, "learning_rate": 8.468747887610592e-06, "loss": 0.634, "step": 5167 }, { "epoch": 0.56, "learning_rate": 8.465263647055379e-06, "loss": 0.8057, "step": 5168 }, { "epoch": 0.56, "learning_rate": 8.461779597300053e-06, "loss": 0.6924, "step": 5169 }, { "epoch": 0.56, "learning_rate": 8.45829573877775e-06, "loss": 0.7014, "step": 5170 }, { "epoch": 0.56, "learning_rate": 8.454812071921597e-06, "loss": 0.6064, "step": 5171 }, { "epoch": 0.56, "learning_rate": 8.451328597164679e-06, "loss": 0.647, "step": 5172 }, { "epoch": 0.56, "learning_rate": 8.447845314940066e-06, "loss": 0.6643, "step": 5173 }, { "epoch": 0.56, "learning_rate": 8.444362225680802e-06, "loss": 0.6675, "step": 5174 }, { "epoch": 0.56, "learning_rate": 8.440879329819912e-06, "loss": 0.8472, "step": 5175 }, { "epoch": 0.56, "learning_rate": 8.437396627790384e-06, "loss": 0.7002, "step": 5176 }, { "epoch": 0.56, "learning_rate": 8.433914120025205e-06, "loss": 0.7935, "step": 5177 }, { "epoch": 0.56, "learning_rate": 8.430431806957311e-06, "loss": 0.7075, "step": 5178 }, { "epoch": 0.56, "learning_rate": 8.426949689019635e-06, "loss": 0.7158, "step": 5179 }, { "epoch": 0.56, "learning_rate": 8.423467766645075e-06, "loss": 0.7075, "step": 5180 }, { "epoch": 0.56, "learning_rate": 8.419986040266502e-06, "loss": 0.6692, "step": 5181 }, { "epoch": 0.56, "learning_rate": 8.416504510316774e-06, "loss": 0.8335, "step": 5182 }, { "epoch": 0.56, "learning_rate": 8.413023177228714e-06, "loss": 0.7334, "step": 5183 }, { "epoch": 0.56, "learning_rate": 8.409542041435129e-06, "loss": 0.719, "step": 5184 }, { "epoch": 0.56, "learning_rate": 8.40606110336879e-06, "loss": 0.7346, "step": 5185 }, { "epoch": 0.56, "learning_rate": 8.402580363462451e-06, "loss": 0.6799, "step": 5186 }, { "epoch": 0.56, "learning_rate": 8.39909982214885e-06, "loss": 0.6641, "step": 5187 }, { "epoch": 0.56, "learning_rate": 8.395619479860687e-06, "loss": 0.7061, "step": 5188 }, { "epoch": 0.56, "learning_rate": 8.392139337030638e-06, "loss": 0.6882, "step": 5189 }, { "epoch": 0.56, "learning_rate": 8.388659394091362e-06, "loss": 0.6938, "step": 5190 }, { "epoch": 0.57, "learning_rate": 8.385179651475484e-06, "loss": 0.7073, "step": 5191 }, { "epoch": 0.57, "learning_rate": 8.381700109615614e-06, "loss": 0.7061, "step": 5192 }, { "epoch": 0.57, "learning_rate": 8.378220768944328e-06, "loss": 0.73, "step": 5193 }, { "epoch": 0.57, "learning_rate": 8.374741629894183e-06, "loss": 0.7368, "step": 5194 }, { "epoch": 0.57, "learning_rate": 8.371262692897706e-06, "loss": 0.6265, "step": 5195 }, { "epoch": 0.57, "learning_rate": 8.367783958387407e-06, "loss": 0.6699, "step": 5196 }, { "epoch": 0.57, "learning_rate": 8.364305426795763e-06, "loss": 0.7224, "step": 5197 }, { "epoch": 0.57, "learning_rate": 8.360827098555228e-06, "loss": 0.7593, "step": 5198 }, { "epoch": 0.57, "learning_rate": 8.357348974098232e-06, "loss": 0.5132, "step": 5199 }, { "epoch": 0.57, "learning_rate": 8.353871053857176e-06, "loss": 0.6604, "step": 5200 }, { "epoch": 0.57, "learning_rate": 8.350393338264442e-06, "loss": 0.5674, "step": 5201 }, { "epoch": 0.57, "learning_rate": 8.346915827752383e-06, "loss": 0.793, "step": 5202 }, { "epoch": 0.57, "learning_rate": 8.343438522753322e-06, "loss": 0.7065, "step": 5203 }, { "epoch": 0.57, "learning_rate": 8.339961423699563e-06, "loss": 0.7913, "step": 5204 }, { "epoch": 0.57, "learning_rate": 8.33648453102338e-06, "loss": 0.783, "step": 5205 }, { "epoch": 0.57, "learning_rate": 8.333007845157032e-06, "loss": 0.7773, "step": 5206 }, { "epoch": 0.57, "learning_rate": 8.329531366532737e-06, "loss": 0.7976, "step": 5207 }, { "epoch": 0.57, "learning_rate": 8.326055095582694e-06, "loss": 0.7896, "step": 5208 }, { "epoch": 0.57, "learning_rate": 8.32257903273908e-06, "loss": 0.7803, "step": 5209 }, { "epoch": 0.57, "learning_rate": 8.31910317843404e-06, "loss": 0.6609, "step": 5210 }, { "epoch": 0.57, "learning_rate": 8.315627533099697e-06, "loss": 0.7148, "step": 5211 }, { "epoch": 0.57, "learning_rate": 8.312152097168142e-06, "loss": 0.7368, "step": 5212 }, { "epoch": 0.57, "learning_rate": 8.308676871071451e-06, "loss": 0.7568, "step": 5213 }, { "epoch": 0.57, "learning_rate": 8.30520185524166e-06, "loss": 0.7485, "step": 5214 }, { "epoch": 0.57, "learning_rate": 8.301727050110794e-06, "loss": 0.7319, "step": 5215 }, { "epoch": 0.57, "learning_rate": 8.298252456110839e-06, "loss": 0.8125, "step": 5216 }, { "epoch": 0.57, "learning_rate": 8.294778073673762e-06, "loss": 0.7505, "step": 5217 }, { "epoch": 0.57, "learning_rate": 8.291303903231504e-06, "loss": 0.7102, "step": 5218 }, { "epoch": 0.57, "learning_rate": 8.28782994521597e-06, "loss": 0.792, "step": 5219 }, { "epoch": 0.57, "learning_rate": 8.284356200059051e-06, "loss": 0.7729, "step": 5220 }, { "epoch": 0.57, "learning_rate": 8.280882668192608e-06, "loss": 0.7483, "step": 5221 }, { "epoch": 0.57, "learning_rate": 8.27740935004847e-06, "loss": 0.7397, "step": 5222 }, { "epoch": 0.57, "learning_rate": 8.273936246058442e-06, "loss": 0.645, "step": 5223 }, { "epoch": 0.57, "learning_rate": 8.270463356654305e-06, "loss": 0.7739, "step": 5224 }, { "epoch": 0.57, "learning_rate": 8.266990682267815e-06, "loss": 0.7363, "step": 5225 }, { "epoch": 0.57, "learning_rate": 8.263518223330698e-06, "loss": 0.793, "step": 5226 }, { "epoch": 0.57, "learning_rate": 8.260045980274649e-06, "loss": 0.8228, "step": 5227 }, { "epoch": 0.57, "learning_rate": 8.256573953531344e-06, "loss": 0.6943, "step": 5228 }, { "epoch": 0.57, "learning_rate": 8.253102143532428e-06, "loss": 0.6924, "step": 5229 }, { "epoch": 0.57, "learning_rate": 8.24963055070952e-06, "loss": 0.7803, "step": 5230 }, { "epoch": 0.57, "learning_rate": 8.246159175494209e-06, "loss": 0.6816, "step": 5231 }, { "epoch": 0.57, "learning_rate": 8.242688018318062e-06, "loss": 0.8196, "step": 5232 }, { "epoch": 0.57, "learning_rate": 8.239217079612615e-06, "loss": 0.6504, "step": 5233 }, { "epoch": 0.57, "learning_rate": 8.235746359809383e-06, "loss": 0.7622, "step": 5234 }, { "epoch": 0.57, "learning_rate": 8.232275859339842e-06, "loss": 0.6855, "step": 5235 }, { "epoch": 0.57, "learning_rate": 8.228805578635457e-06, "loss": 0.6995, "step": 5236 }, { "epoch": 0.57, "learning_rate": 8.22533551812765e-06, "loss": 0.6599, "step": 5237 }, { "epoch": 0.57, "learning_rate": 8.221865678247822e-06, "loss": 0.666, "step": 5238 }, { "epoch": 0.57, "learning_rate": 8.21839605942735e-06, "loss": 0.6538, "step": 5239 }, { "epoch": 0.57, "learning_rate": 8.21492666209758e-06, "loss": 0.6438, "step": 5240 }, { "epoch": 0.57, "learning_rate": 8.211457486689829e-06, "loss": 0.6724, "step": 5241 }, { "epoch": 0.57, "learning_rate": 8.207988533635387e-06, "loss": 0.699, "step": 5242 }, { "epoch": 0.57, "learning_rate": 8.204519803365517e-06, "loss": 0.6531, "step": 5243 }, { "epoch": 0.57, "learning_rate": 8.201051296311462e-06, "loss": 0.6204, "step": 5244 }, { "epoch": 0.57, "learning_rate": 8.197583012904424e-06, "loss": 0.7141, "step": 5245 }, { "epoch": 0.57, "learning_rate": 8.194114953575584e-06, "loss": 0.6523, "step": 5246 }, { "epoch": 0.57, "learning_rate": 8.190647118756097e-06, "loss": 0.6975, "step": 5247 }, { "epoch": 0.57, "learning_rate": 8.187179508877086e-06, "loss": 0.5994, "step": 5248 }, { "epoch": 0.57, "learning_rate": 8.183712124369646e-06, "loss": 0.752, "step": 5249 }, { "epoch": 0.57, "learning_rate": 8.180244965664845e-06, "loss": 0.7375, "step": 5250 }, { "epoch": 0.57, "learning_rate": 8.176778033193728e-06, "loss": 0.6367, "step": 5251 }, { "epoch": 0.57, "learning_rate": 8.173311327387304e-06, "loss": 0.7451, "step": 5252 }, { "epoch": 0.57, "learning_rate": 8.169844848676553e-06, "loss": 0.562, "step": 5253 }, { "epoch": 0.57, "learning_rate": 8.16637859749244e-06, "loss": 0.6926, "step": 5254 }, { "epoch": 0.57, "learning_rate": 8.162912574265889e-06, "loss": 0.7739, "step": 5255 }, { "epoch": 0.57, "learning_rate": 8.159446779427798e-06, "loss": 0.5801, "step": 5256 }, { "epoch": 0.57, "learning_rate": 8.155981213409037e-06, "loss": 0.793, "step": 5257 }, { "epoch": 0.57, "learning_rate": 8.152515876640452e-06, "loss": 0.7229, "step": 5258 }, { "epoch": 0.57, "learning_rate": 8.149050769552856e-06, "loss": 0.6638, "step": 5259 }, { "epoch": 0.57, "learning_rate": 8.145585892577032e-06, "loss": 0.7056, "step": 5260 }, { "epoch": 0.57, "learning_rate": 8.142121246143738e-06, "loss": 0.7073, "step": 5261 }, { "epoch": 0.57, "learning_rate": 8.1386568306837e-06, "loss": 0.7661, "step": 5262 }, { "epoch": 0.57, "learning_rate": 8.135192646627623e-06, "loss": 0.6431, "step": 5263 }, { "epoch": 0.57, "learning_rate": 8.131728694406174e-06, "loss": 0.6558, "step": 5264 }, { "epoch": 0.57, "learning_rate": 8.128264974449996e-06, "loss": 0.7222, "step": 5265 }, { "epoch": 0.57, "learning_rate": 8.1248014871897e-06, "loss": 0.6587, "step": 5266 }, { "epoch": 0.57, "learning_rate": 8.121338233055873e-06, "loss": 0.7563, "step": 5267 }, { "epoch": 0.57, "learning_rate": 8.11787521247907e-06, "loss": 0.7234, "step": 5268 }, { "epoch": 0.57, "learning_rate": 8.11441242588981e-06, "loss": 0.698, "step": 5269 }, { "epoch": 0.57, "learning_rate": 8.1109498737186e-06, "loss": 0.7278, "step": 5270 }, { "epoch": 0.57, "learning_rate": 8.107487556395902e-06, "loss": 0.8049, "step": 5271 }, { "epoch": 0.57, "learning_rate": 8.104025474352151e-06, "loss": 0.71, "step": 5272 }, { "epoch": 0.57, "learning_rate": 8.100563628017765e-06, "loss": 0.6252, "step": 5273 }, { "epoch": 0.57, "learning_rate": 8.097102017823121e-06, "loss": 0.7012, "step": 5274 }, { "epoch": 0.57, "learning_rate": 8.093640644198568e-06, "loss": 0.7839, "step": 5275 }, { "epoch": 0.57, "learning_rate": 8.090179507574428e-06, "loss": 0.6575, "step": 5276 }, { "epoch": 0.57, "learning_rate": 8.086718608380993e-06, "loss": 0.7773, "step": 5277 }, { "epoch": 0.57, "learning_rate": 8.083257947048528e-06, "loss": 0.6941, "step": 5278 }, { "epoch": 0.57, "learning_rate": 8.07979752400726e-06, "loss": 0.656, "step": 5279 }, { "epoch": 0.57, "learning_rate": 8.076337339687395e-06, "loss": 0.8418, "step": 5280 }, { "epoch": 0.57, "learning_rate": 8.072877394519103e-06, "loss": 0.7068, "step": 5281 }, { "epoch": 0.58, "learning_rate": 8.069417688932534e-06, "loss": 0.575, "step": 5282 }, { "epoch": 0.58, "learning_rate": 8.065958223357801e-06, "loss": 0.6831, "step": 5283 }, { "epoch": 0.58, "learning_rate": 8.062498998224983e-06, "loss": 0.6685, "step": 5284 }, { "epoch": 0.58, "learning_rate": 8.05904001396414e-06, "loss": 0.7302, "step": 5285 }, { "epoch": 0.58, "learning_rate": 8.055581271005292e-06, "loss": 0.7178, "step": 5286 }, { "epoch": 0.58, "learning_rate": 8.052122769778437e-06, "loss": 0.7988, "step": 5287 }, { "epoch": 0.58, "learning_rate": 8.048664510713533e-06, "loss": 0.7332, "step": 5288 }, { "epoch": 0.58, "learning_rate": 8.04520649424052e-06, "loss": 0.5786, "step": 5289 }, { "epoch": 0.58, "learning_rate": 8.041748720789301e-06, "loss": 0.7244, "step": 5290 }, { "epoch": 0.58, "learning_rate": 8.038291190789742e-06, "loss": 0.7075, "step": 5291 }, { "epoch": 0.58, "learning_rate": 8.034833904671698e-06, "loss": 0.6016, "step": 5292 }, { "epoch": 0.58, "learning_rate": 8.031376862864977e-06, "loss": 0.7705, "step": 5293 }, { "epoch": 0.58, "learning_rate": 8.027920065799362e-06, "loss": 0.6016, "step": 5294 }, { "epoch": 0.58, "learning_rate": 8.024463513904608e-06, "loss": 0.6992, "step": 5295 }, { "epoch": 0.58, "learning_rate": 8.021007207610427e-06, "loss": 0.7195, "step": 5296 }, { "epoch": 0.58, "learning_rate": 8.017551147346523e-06, "loss": 0.6604, "step": 5297 }, { "epoch": 0.58, "learning_rate": 8.014095333542548e-06, "loss": 0.7686, "step": 5298 }, { "epoch": 0.58, "learning_rate": 8.010639766628134e-06, "loss": 0.6167, "step": 5299 }, { "epoch": 0.58, "learning_rate": 8.007184447032881e-06, "loss": 0.7251, "step": 5300 }, { "epoch": 0.58, "learning_rate": 8.00372937518636e-06, "loss": 0.6843, "step": 5301 }, { "epoch": 0.58, "learning_rate": 8.000274551518106e-06, "loss": 0.7622, "step": 5302 }, { "epoch": 0.58, "learning_rate": 7.996819976457626e-06, "loss": 0.5527, "step": 5303 }, { "epoch": 0.58, "learning_rate": 7.993365650434401e-06, "loss": 0.6089, "step": 5304 }, { "epoch": 0.58, "learning_rate": 7.989911573877869e-06, "loss": 0.7319, "step": 5305 }, { "epoch": 0.58, "learning_rate": 7.986457747217448e-06, "loss": 0.676, "step": 5306 }, { "epoch": 0.58, "learning_rate": 7.983004170882518e-06, "loss": 0.7383, "step": 5307 }, { "epoch": 0.58, "learning_rate": 7.979550845302436e-06, "loss": 0.6257, "step": 5308 }, { "epoch": 0.58, "learning_rate": 7.976097770906517e-06, "loss": 0.7139, "step": 5309 }, { "epoch": 0.58, "learning_rate": 7.97264494812405e-06, "loss": 0.73, "step": 5310 }, { "epoch": 0.58, "learning_rate": 7.9691923773843e-06, "loss": 0.7607, "step": 5311 }, { "epoch": 0.58, "learning_rate": 7.965740059116491e-06, "loss": 0.6272, "step": 5312 }, { "epoch": 0.58, "learning_rate": 7.962287993749817e-06, "loss": 0.7676, "step": 5313 }, { "epoch": 0.58, "learning_rate": 7.958836181713445e-06, "loss": 0.7209, "step": 5314 }, { "epoch": 0.58, "learning_rate": 7.955384623436503e-06, "loss": 0.7734, "step": 5315 }, { "epoch": 0.58, "learning_rate": 7.951933319348095e-06, "loss": 0.7131, "step": 5316 }, { "epoch": 0.58, "learning_rate": 7.948482269877292e-06, "loss": 0.6899, "step": 5317 }, { "epoch": 0.58, "learning_rate": 7.945031475453126e-06, "loss": 0.6609, "step": 5318 }, { "epoch": 0.58, "learning_rate": 7.941580936504604e-06, "loss": 0.5698, "step": 5319 }, { "epoch": 0.58, "learning_rate": 7.938130653460708e-06, "loss": 0.6936, "step": 5320 }, { "epoch": 0.58, "learning_rate": 7.934680626750375e-06, "loss": 0.7783, "step": 5321 }, { "epoch": 0.58, "learning_rate": 7.931230856802513e-06, "loss": 0.709, "step": 5322 }, { "epoch": 0.58, "learning_rate": 7.927781344046008e-06, "loss": 0.6802, "step": 5323 }, { "epoch": 0.58, "learning_rate": 7.924332088909702e-06, "loss": 0.6714, "step": 5324 }, { "epoch": 0.58, "learning_rate": 7.92088309182241e-06, "loss": 0.7031, "step": 5325 }, { "epoch": 0.58, "learning_rate": 7.917434353212911e-06, "loss": 0.7361, "step": 5326 }, { "epoch": 0.58, "learning_rate": 7.913985873509964e-06, "loss": 0.7151, "step": 5327 }, { "epoch": 0.58, "learning_rate": 7.91053765314228e-06, "loss": 0.7217, "step": 5328 }, { "epoch": 0.58, "learning_rate": 7.907089692538545e-06, "loss": 0.7126, "step": 5329 }, { "epoch": 0.58, "learning_rate": 7.903641992127417e-06, "loss": 0.6746, "step": 5330 }, { "epoch": 0.58, "learning_rate": 7.900194552337516e-06, "loss": 0.6431, "step": 5331 }, { "epoch": 0.58, "learning_rate": 7.896747373597433e-06, "loss": 0.6736, "step": 5332 }, { "epoch": 0.58, "learning_rate": 7.893300456335722e-06, "loss": 0.6953, "step": 5333 }, { "epoch": 0.58, "learning_rate": 7.889853800980905e-06, "loss": 0.6101, "step": 5334 }, { "epoch": 0.58, "learning_rate": 7.886407407961476e-06, "loss": 0.7349, "step": 5335 }, { "epoch": 0.58, "learning_rate": 7.882961277705897e-06, "loss": 0.6682, "step": 5336 }, { "epoch": 0.58, "learning_rate": 7.879515410642585e-06, "loss": 0.7522, "step": 5337 }, { "epoch": 0.58, "learning_rate": 7.876069807199945e-06, "loss": 0.7954, "step": 5338 }, { "epoch": 0.58, "learning_rate": 7.872624467806324e-06, "loss": 0.7583, "step": 5339 }, { "epoch": 0.58, "learning_rate": 7.869179392890065e-06, "loss": 0.752, "step": 5340 }, { "epoch": 0.58, "learning_rate": 7.865734582879453e-06, "loss": 0.7368, "step": 5341 }, { "epoch": 0.58, "learning_rate": 7.862290038202755e-06, "loss": 0.7717, "step": 5342 }, { "epoch": 0.58, "learning_rate": 7.858845759288198e-06, "loss": 0.8118, "step": 5343 }, { "epoch": 0.58, "learning_rate": 7.855401746563978e-06, "loss": 0.7427, "step": 5344 }, { "epoch": 0.58, "learning_rate": 7.851958000458255e-06, "loss": 0.6572, "step": 5345 }, { "epoch": 0.58, "learning_rate": 7.848514521399167e-06, "loss": 0.7822, "step": 5346 }, { "epoch": 0.58, "learning_rate": 7.845071309814802e-06, "loss": 0.6316, "step": 5347 }, { "epoch": 0.58, "learning_rate": 7.841628366133225e-06, "loss": 0.6465, "step": 5348 }, { "epoch": 0.58, "learning_rate": 7.838185690782468e-06, "loss": 0.7534, "step": 5349 }, { "epoch": 0.58, "learning_rate": 7.83474328419053e-06, "loss": 0.6481, "step": 5350 }, { "epoch": 0.58, "learning_rate": 7.831301146785374e-06, "loss": 0.6887, "step": 5351 }, { "epoch": 0.58, "learning_rate": 7.827859278994924e-06, "loss": 0.7554, "step": 5352 }, { "epoch": 0.58, "learning_rate": 7.82441768124708e-06, "loss": 0.7485, "step": 5353 }, { "epoch": 0.58, "learning_rate": 7.820976353969706e-06, "loss": 0.623, "step": 5354 }, { "epoch": 0.58, "learning_rate": 7.81753529759063e-06, "loss": 0.6685, "step": 5355 }, { "epoch": 0.58, "learning_rate": 7.814094512537645e-06, "loss": 0.7063, "step": 5356 }, { "epoch": 0.58, "learning_rate": 7.810653999238516e-06, "loss": 0.6538, "step": 5357 }, { "epoch": 0.58, "learning_rate": 7.807213758120965e-06, "loss": 0.7439, "step": 5358 }, { "epoch": 0.58, "learning_rate": 7.803773789612698e-06, "loss": 0.7356, "step": 5359 }, { "epoch": 0.58, "learning_rate": 7.800334094141363e-06, "loss": 0.6548, "step": 5360 }, { "epoch": 0.58, "learning_rate": 7.796894672134594e-06, "loss": 0.6484, "step": 5361 }, { "epoch": 0.58, "learning_rate": 7.79345552401998e-06, "loss": 0.6716, "step": 5362 }, { "epoch": 0.58, "learning_rate": 7.790016650225081e-06, "loss": 0.6165, "step": 5363 }, { "epoch": 0.58, "learning_rate": 7.786578051177416e-06, "loss": 0.7102, "step": 5364 }, { "epoch": 0.58, "learning_rate": 7.783139727304481e-06, "loss": 0.6658, "step": 5365 }, { "epoch": 0.58, "learning_rate": 7.779701679033729e-06, "loss": 0.7122, "step": 5366 }, { "epoch": 0.58, "learning_rate": 7.776263906792576e-06, "loss": 0.7188, "step": 5367 }, { "epoch": 0.58, "learning_rate": 7.772826411008418e-06, "loss": 0.6665, "step": 5368 }, { "epoch": 0.58, "learning_rate": 7.769389192108608e-06, "loss": 0.6628, "step": 5369 }, { "epoch": 0.58, "learning_rate": 7.765952250520459e-06, "loss": 0.751, "step": 5370 }, { "epoch": 0.58, "learning_rate": 7.762515586671257e-06, "loss": 0.7004, "step": 5371 }, { "epoch": 0.58, "learning_rate": 7.75907920098825e-06, "loss": 0.71, "step": 5372 }, { "epoch": 0.58, "learning_rate": 7.755643093898654e-06, "loss": 0.7148, "step": 5373 }, { "epoch": 0.59, "learning_rate": 7.75220726582965e-06, "loss": 0.6609, "step": 5374 }, { "epoch": 0.59, "learning_rate": 7.74877171720838e-06, "loss": 0.7583, "step": 5375 }, { "epoch": 0.59, "learning_rate": 7.745336448461958e-06, "loss": 0.6206, "step": 5376 }, { "epoch": 0.59, "learning_rate": 7.741901460017455e-06, "loss": 0.6772, "step": 5377 }, { "epoch": 0.59, "learning_rate": 7.738466752301922e-06, "loss": 0.7729, "step": 5378 }, { "epoch": 0.59, "learning_rate": 7.735032325742355e-06, "loss": 0.6379, "step": 5379 }, { "epoch": 0.59, "learning_rate": 7.731598180765732e-06, "loss": 0.6509, "step": 5380 }, { "epoch": 0.59, "learning_rate": 7.728164317798988e-06, "loss": 0.6936, "step": 5381 }, { "epoch": 0.59, "learning_rate": 7.72473073726902e-06, "loss": 0.7542, "step": 5382 }, { "epoch": 0.59, "learning_rate": 7.721297439602695e-06, "loss": 0.6096, "step": 5383 }, { "epoch": 0.59, "learning_rate": 7.717864425226848e-06, "loss": 0.729, "step": 5384 }, { "epoch": 0.59, "learning_rate": 7.714431694568272e-06, "loss": 0.6284, "step": 5385 }, { "epoch": 0.59, "learning_rate": 7.710999248053722e-06, "loss": 0.7271, "step": 5386 }, { "epoch": 0.59, "learning_rate": 7.707567086109932e-06, "loss": 0.7549, "step": 5387 }, { "epoch": 0.59, "learning_rate": 7.704135209163589e-06, "loss": 0.7773, "step": 5388 }, { "epoch": 0.59, "learning_rate": 7.700703617641347e-06, "loss": 0.595, "step": 5389 }, { "epoch": 0.59, "learning_rate": 7.697272311969824e-06, "loss": 0.7371, "step": 5390 }, { "epoch": 0.59, "learning_rate": 7.6938412925756e-06, "loss": 0.7207, "step": 5391 }, { "epoch": 0.59, "learning_rate": 7.690410559885228e-06, "loss": 0.7534, "step": 5392 }, { "epoch": 0.59, "learning_rate": 7.686980114325217e-06, "loss": 0.6997, "step": 5393 }, { "epoch": 0.59, "learning_rate": 7.683549956322043e-06, "loss": 0.6213, "step": 5394 }, { "epoch": 0.59, "learning_rate": 7.68012008630215e-06, "loss": 0.5801, "step": 5395 }, { "epoch": 0.59, "learning_rate": 7.676690504691935e-06, "loss": 0.7107, "step": 5396 }, { "epoch": 0.59, "learning_rate": 7.673261211917777e-06, "loss": 0.6653, "step": 5397 }, { "epoch": 0.59, "learning_rate": 7.669832208406e-06, "loss": 0.7297, "step": 5398 }, { "epoch": 0.59, "learning_rate": 7.66640349458291e-06, "loss": 0.6145, "step": 5399 }, { "epoch": 0.59, "learning_rate": 7.662975070874761e-06, "loss": 0.6616, "step": 5400 }, { "epoch": 0.59, "learning_rate": 7.65954693770778e-06, "loss": 0.6792, "step": 5401 }, { "epoch": 0.59, "learning_rate": 7.656119095508155e-06, "loss": 0.6624, "step": 5402 }, { "epoch": 0.59, "learning_rate": 7.65269154470204e-06, "loss": 0.6765, "step": 5403 }, { "epoch": 0.59, "learning_rate": 7.649264285715551e-06, "loss": 0.708, "step": 5404 }, { "epoch": 0.59, "learning_rate": 7.645837318974763e-06, "loss": 0.7568, "step": 5405 }, { "epoch": 0.59, "learning_rate": 7.642410644905726e-06, "loss": 0.5994, "step": 5406 }, { "epoch": 0.59, "learning_rate": 7.63898426393445e-06, "loss": 0.6665, "step": 5407 }, { "epoch": 0.59, "learning_rate": 7.635558176486901e-06, "loss": 0.6116, "step": 5408 }, { "epoch": 0.59, "learning_rate": 7.632132382989014e-06, "loss": 0.8115, "step": 5409 }, { "epoch": 0.59, "learning_rate": 7.628706883866686e-06, "loss": 0.6401, "step": 5410 }, { "epoch": 0.59, "learning_rate": 7.6252816795457795e-06, "loss": 0.6394, "step": 5411 }, { "epoch": 0.59, "learning_rate": 7.62185677045212e-06, "loss": 0.7129, "step": 5412 }, { "epoch": 0.59, "learning_rate": 7.618432157011494e-06, "loss": 0.7139, "step": 5413 }, { "epoch": 0.59, "learning_rate": 7.615007839649655e-06, "loss": 0.7231, "step": 5414 }, { "epoch": 0.59, "learning_rate": 7.611583818792311e-06, "loss": 0.7283, "step": 5415 }, { "epoch": 0.59, "learning_rate": 7.608160094865148e-06, "loss": 0.7458, "step": 5416 }, { "epoch": 0.59, "learning_rate": 7.604736668293802e-06, "loss": 0.7664, "step": 5417 }, { "epoch": 0.59, "learning_rate": 7.601313539503878e-06, "loss": 0.791, "step": 5418 }, { "epoch": 0.59, "learning_rate": 7.5978907089209445e-06, "loss": 0.7534, "step": 5419 }, { "epoch": 0.59, "learning_rate": 7.5944681769705274e-06, "loss": 0.7861, "step": 5420 }, { "epoch": 0.59, "learning_rate": 7.591045944078119e-06, "loss": 0.7876, "step": 5421 }, { "epoch": 0.59, "learning_rate": 7.587624010669178e-06, "loss": 0.7783, "step": 5422 }, { "epoch": 0.59, "learning_rate": 7.584202377169121e-06, "loss": 0.6848, "step": 5423 }, { "epoch": 0.59, "learning_rate": 7.580781044003324e-06, "loss": 0.6814, "step": 5424 }, { "epoch": 0.59, "learning_rate": 7.577360011597135e-06, "loss": 0.7769, "step": 5425 }, { "epoch": 0.59, "learning_rate": 7.573939280375864e-06, "loss": 0.7534, "step": 5426 }, { "epoch": 0.59, "learning_rate": 7.5705188507647735e-06, "loss": 0.7305, "step": 5427 }, { "epoch": 0.59, "learning_rate": 7.567098723189097e-06, "loss": 0.6826, "step": 5428 }, { "epoch": 0.59, "learning_rate": 7.563678898074025e-06, "loss": 0.7334, "step": 5429 }, { "epoch": 0.59, "learning_rate": 7.560259375844719e-06, "loss": 0.6042, "step": 5430 }, { "epoch": 0.59, "learning_rate": 7.556840156926293e-06, "loss": 0.8159, "step": 5431 }, { "epoch": 0.59, "learning_rate": 7.553421241743826e-06, "loss": 0.6313, "step": 5432 }, { "epoch": 0.59, "learning_rate": 7.550002630722366e-06, "loss": 0.6226, "step": 5433 }, { "epoch": 0.59, "learning_rate": 7.546584324286911e-06, "loss": 0.6211, "step": 5434 }, { "epoch": 0.59, "learning_rate": 7.543166322862437e-06, "loss": 0.8213, "step": 5435 }, { "epoch": 0.59, "learning_rate": 7.539748626873866e-06, "loss": 0.686, "step": 5436 }, { "epoch": 0.59, "learning_rate": 7.536331236746095e-06, "loss": 0.6572, "step": 5437 }, { "epoch": 0.59, "learning_rate": 7.532914152903973e-06, "loss": 0.73, "step": 5438 }, { "epoch": 0.59, "learning_rate": 7.529497375772317e-06, "loss": 0.6128, "step": 5439 }, { "epoch": 0.59, "learning_rate": 7.5260809057759e-06, "loss": 0.6074, "step": 5440 }, { "epoch": 0.59, "learning_rate": 7.522664743339468e-06, "loss": 0.7148, "step": 5441 }, { "epoch": 0.59, "learning_rate": 7.519248888887715e-06, "loss": 0.6091, "step": 5442 }, { "epoch": 0.59, "learning_rate": 7.515833342845306e-06, "loss": 0.668, "step": 5443 }, { "epoch": 0.59, "learning_rate": 7.5124181056368606e-06, "loss": 0.6996, "step": 5444 }, { "epoch": 0.59, "learning_rate": 7.509003177686975e-06, "loss": 0.7964, "step": 5445 }, { "epoch": 0.59, "learning_rate": 7.505588559420188e-06, "loss": 0.6833, "step": 5446 }, { "epoch": 0.59, "learning_rate": 7.5021742512610105e-06, "loss": 0.7769, "step": 5447 }, { "epoch": 0.59, "learning_rate": 7.49876025363391e-06, "loss": 0.7686, "step": 5448 }, { "epoch": 0.59, "learning_rate": 7.495346566963323e-06, "loss": 0.6401, "step": 5449 }, { "epoch": 0.59, "learning_rate": 7.491933191673639e-06, "loss": 0.6846, "step": 5450 }, { "epoch": 0.59, "learning_rate": 7.488520128189209e-06, "loss": 0.5715, "step": 5451 }, { "epoch": 0.59, "learning_rate": 7.4851073769343555e-06, "loss": 0.6648, "step": 5452 }, { "epoch": 0.59, "learning_rate": 7.4816949383333455e-06, "loss": 0.6428, "step": 5453 }, { "epoch": 0.59, "learning_rate": 7.4782828128104275e-06, "loss": 0.6821, "step": 5454 }, { "epoch": 0.59, "learning_rate": 7.474871000789793e-06, "loss": 0.7256, "step": 5455 }, { "epoch": 0.59, "learning_rate": 7.471459502695606e-06, "loss": 0.7517, "step": 5456 }, { "epoch": 0.59, "learning_rate": 7.468048318951983e-06, "loss": 0.771, "step": 5457 }, { "epoch": 0.59, "learning_rate": 7.46463744998301e-06, "loss": 0.7087, "step": 5458 }, { "epoch": 0.59, "learning_rate": 7.461226896212723e-06, "loss": 0.5427, "step": 5459 }, { "epoch": 0.59, "learning_rate": 7.4578166580651335e-06, "loss": 0.7158, "step": 5460 }, { "epoch": 0.59, "learning_rate": 7.454406735964199e-06, "loss": 0.6658, "step": 5461 }, { "epoch": 0.59, "learning_rate": 7.450997130333846e-06, "loss": 0.6958, "step": 5462 }, { "epoch": 0.59, "learning_rate": 7.4475878415979586e-06, "loss": 0.7422, "step": 5463 }, { "epoch": 0.59, "learning_rate": 7.444178870180387e-06, "loss": 0.644, "step": 5464 }, { "epoch": 0.59, "learning_rate": 7.440770216504938e-06, "loss": 0.8066, "step": 5465 }, { "epoch": 0.6, "learning_rate": 7.4373618809953755e-06, "loss": 0.8184, "step": 5466 }, { "epoch": 0.6, "learning_rate": 7.433953864075425e-06, "loss": 0.6245, "step": 5467 }, { "epoch": 0.6, "learning_rate": 7.430546166168781e-06, "loss": 0.7275, "step": 5468 }, { "epoch": 0.6, "learning_rate": 7.4271387876990866e-06, "loss": 0.6626, "step": 5469 }, { "epoch": 0.6, "learning_rate": 7.423731729089949e-06, "loss": 0.7498, "step": 5470 }, { "epoch": 0.6, "learning_rate": 7.420324990764942e-06, "loss": 0.8022, "step": 5471 }, { "epoch": 0.6, "learning_rate": 7.416918573147589e-06, "loss": 0.7864, "step": 5472 }, { "epoch": 0.6, "learning_rate": 7.413512476661386e-06, "loss": 0.6506, "step": 5473 }, { "epoch": 0.6, "learning_rate": 7.410106701729776e-06, "loss": 0.7856, "step": 5474 }, { "epoch": 0.6, "learning_rate": 7.406701248776174e-06, "loss": 0.74, "step": 5475 }, { "epoch": 0.6, "learning_rate": 7.403296118223944e-06, "loss": 0.6104, "step": 5476 }, { "epoch": 0.6, "learning_rate": 7.3998913104964165e-06, "loss": 0.7944, "step": 5477 }, { "epoch": 0.6, "learning_rate": 7.39648682601688e-06, "loss": 0.7629, "step": 5478 }, { "epoch": 0.6, "learning_rate": 7.393082665208587e-06, "loss": 0.6775, "step": 5479 }, { "epoch": 0.6, "learning_rate": 7.389678828494742e-06, "loss": 0.6997, "step": 5480 }, { "epoch": 0.6, "learning_rate": 7.386275316298513e-06, "loss": 0.7119, "step": 5481 }, { "epoch": 0.6, "learning_rate": 7.382872129043026e-06, "loss": 0.8242, "step": 5482 }, { "epoch": 0.6, "learning_rate": 7.379469267151376e-06, "loss": 0.6948, "step": 5483 }, { "epoch": 0.6, "learning_rate": 7.376066731046606e-06, "loss": 0.7993, "step": 5484 }, { "epoch": 0.6, "learning_rate": 7.372664521151722e-06, "loss": 0.8354, "step": 5485 }, { "epoch": 0.6, "learning_rate": 7.369262637889689e-06, "loss": 0.7253, "step": 5486 }, { "epoch": 0.6, "learning_rate": 7.365861081683434e-06, "loss": 0.6296, "step": 5487 }, { "epoch": 0.6, "learning_rate": 7.3624598529558435e-06, "loss": 0.7673, "step": 5488 }, { "epoch": 0.6, "learning_rate": 7.359058952129756e-06, "loss": 0.6934, "step": 5489 }, { "epoch": 0.6, "learning_rate": 7.355658379627981e-06, "loss": 0.7153, "step": 5490 }, { "epoch": 0.6, "learning_rate": 7.352258135873277e-06, "loss": 0.6387, "step": 5491 }, { "epoch": 0.6, "learning_rate": 7.348858221288362e-06, "loss": 0.6689, "step": 5492 }, { "epoch": 0.6, "learning_rate": 7.345458636295923e-06, "loss": 0.6514, "step": 5493 }, { "epoch": 0.6, "learning_rate": 7.3420593813186025e-06, "loss": 0.6736, "step": 5494 }, { "epoch": 0.6, "learning_rate": 7.338660456778992e-06, "loss": 0.7812, "step": 5495 }, { "epoch": 0.6, "learning_rate": 7.335261863099652e-06, "loss": 0.6975, "step": 5496 }, { "epoch": 0.6, "learning_rate": 7.331863600703096e-06, "loss": 0.6721, "step": 5497 }, { "epoch": 0.6, "learning_rate": 7.328465670011804e-06, "loss": 0.6157, "step": 5498 }, { "epoch": 0.6, "learning_rate": 7.325068071448208e-06, "loss": 0.5867, "step": 5499 }, { "epoch": 0.6, "learning_rate": 7.321670805434698e-06, "loss": 0.6768, "step": 5500 }, { "epoch": 0.6, "learning_rate": 7.3182738723936255e-06, "loss": 0.792, "step": 5501 }, { "epoch": 0.6, "learning_rate": 7.3148772727473064e-06, "loss": 0.7317, "step": 5502 }, { "epoch": 0.6, "learning_rate": 7.311481006918005e-06, "loss": 0.5966, "step": 5503 }, { "epoch": 0.6, "learning_rate": 7.308085075327949e-06, "loss": 0.6987, "step": 5504 }, { "epoch": 0.6, "learning_rate": 7.3046894783993225e-06, "loss": 0.7959, "step": 5505 }, { "epoch": 0.6, "learning_rate": 7.301294216554271e-06, "loss": 0.6365, "step": 5506 }, { "epoch": 0.6, "learning_rate": 7.297899290214896e-06, "loss": 0.6638, "step": 5507 }, { "epoch": 0.6, "learning_rate": 7.294504699803258e-06, "loss": 0.7959, "step": 5508 }, { "epoch": 0.6, "learning_rate": 7.291110445741376e-06, "loss": 0.6912, "step": 5509 }, { "epoch": 0.6, "learning_rate": 7.2877165284512275e-06, "loss": 0.6484, "step": 5510 }, { "epoch": 0.6, "learning_rate": 7.2843229483547405e-06, "loss": 0.6282, "step": 5511 }, { "epoch": 0.6, "learning_rate": 7.280929705873818e-06, "loss": 0.7046, "step": 5512 }, { "epoch": 0.6, "learning_rate": 7.277536801430309e-06, "loss": 0.7158, "step": 5513 }, { "epoch": 0.6, "learning_rate": 7.274144235446024e-06, "loss": 0.731, "step": 5514 }, { "epoch": 0.6, "learning_rate": 7.270752008342723e-06, "loss": 0.7861, "step": 5515 }, { "epoch": 0.6, "learning_rate": 7.267360120542135e-06, "loss": 0.606, "step": 5516 }, { "epoch": 0.6, "learning_rate": 7.2639685724659445e-06, "loss": 0.7192, "step": 5517 }, { "epoch": 0.6, "learning_rate": 7.26057736453579e-06, "loss": 0.7915, "step": 5518 }, { "epoch": 0.6, "learning_rate": 7.2571864971732676e-06, "loss": 0.7312, "step": 5519 }, { "epoch": 0.6, "learning_rate": 7.253795970799935e-06, "loss": 0.6248, "step": 5520 }, { "epoch": 0.6, "learning_rate": 7.250405785837309e-06, "loss": 0.6941, "step": 5521 }, { "epoch": 0.6, "learning_rate": 7.247015942706857e-06, "loss": 0.7563, "step": 5522 }, { "epoch": 0.6, "learning_rate": 7.243626441830009e-06, "loss": 0.7217, "step": 5523 }, { "epoch": 0.6, "learning_rate": 7.240237283628149e-06, "loss": 0.574, "step": 5524 }, { "epoch": 0.6, "learning_rate": 7.2368484685226235e-06, "loss": 0.8008, "step": 5525 }, { "epoch": 0.6, "learning_rate": 7.233459996934731e-06, "loss": 0.6729, "step": 5526 }, { "epoch": 0.6, "learning_rate": 7.230071869285729e-06, "loss": 0.7153, "step": 5527 }, { "epoch": 0.6, "learning_rate": 7.2266840859968345e-06, "loss": 0.6873, "step": 5528 }, { "epoch": 0.6, "learning_rate": 7.223296647489219e-06, "loss": 0.5867, "step": 5529 }, { "epoch": 0.6, "learning_rate": 7.219909554184009e-06, "loss": 0.6411, "step": 5530 }, { "epoch": 0.6, "learning_rate": 7.216522806502295e-06, "loss": 0.6628, "step": 5531 }, { "epoch": 0.6, "learning_rate": 7.213136404865124e-06, "loss": 0.5913, "step": 5532 }, { "epoch": 0.6, "learning_rate": 7.2097503496934915e-06, "loss": 0.7861, "step": 5533 }, { "epoch": 0.6, "learning_rate": 7.206364641408358e-06, "loss": 0.6616, "step": 5534 }, { "epoch": 0.6, "learning_rate": 7.202979280430633e-06, "loss": 0.5913, "step": 5535 }, { "epoch": 0.6, "learning_rate": 7.199594267181193e-06, "loss": 0.7856, "step": 5536 }, { "epoch": 0.6, "learning_rate": 7.196209602080866e-06, "loss": 0.8374, "step": 5537 }, { "epoch": 0.6, "learning_rate": 7.192825285550431e-06, "loss": 0.6904, "step": 5538 }, { "epoch": 0.6, "learning_rate": 7.189441318010632e-06, "loss": 0.7695, "step": 5539 }, { "epoch": 0.6, "learning_rate": 7.186057699882172e-06, "loss": 0.666, "step": 5540 }, { "epoch": 0.6, "learning_rate": 7.182674431585703e-06, "loss": 0.7588, "step": 5541 }, { "epoch": 0.6, "learning_rate": 7.179291513541836e-06, "loss": 0.613, "step": 5542 }, { "epoch": 0.6, "learning_rate": 7.175908946171135e-06, "loss": 0.6511, "step": 5543 }, { "epoch": 0.6, "learning_rate": 7.172526729894129e-06, "loss": 0.6919, "step": 5544 }, { "epoch": 0.6, "learning_rate": 7.169144865131297e-06, "loss": 0.7275, "step": 5545 }, { "epoch": 0.6, "learning_rate": 7.165763352303072e-06, "loss": 0.7754, "step": 5546 }, { "epoch": 0.6, "learning_rate": 7.162382191829853e-06, "loss": 0.7036, "step": 5547 }, { "epoch": 0.6, "learning_rate": 7.159001384131985e-06, "loss": 0.6833, "step": 5548 }, { "epoch": 0.6, "learning_rate": 7.15562092962977e-06, "loss": 0.6108, "step": 5549 }, { "epoch": 0.6, "learning_rate": 7.1522408287434774e-06, "loss": 0.6694, "step": 5550 }, { "epoch": 0.6, "learning_rate": 7.148861081893322e-06, "loss": 0.7454, "step": 5551 }, { "epoch": 0.6, "learning_rate": 7.145481689499474e-06, "loss": 0.6658, "step": 5552 }, { "epoch": 0.6, "learning_rate": 7.142102651982065e-06, "loss": 0.6301, "step": 5553 }, { "epoch": 0.6, "learning_rate": 7.1387239697611785e-06, "loss": 0.6948, "step": 5554 }, { "epoch": 0.6, "learning_rate": 7.135345643256859e-06, "loss": 0.7576, "step": 5555 }, { "epoch": 0.6, "learning_rate": 7.131967672889101e-06, "loss": 0.793, "step": 5556 }, { "epoch": 0.6, "learning_rate": 7.128590059077854e-06, "loss": 0.6169, "step": 5557 }, { "epoch": 0.61, "learning_rate": 7.125212802243027e-06, "loss": 0.7473, "step": 5558 }, { "epoch": 0.61, "learning_rate": 7.12183590280449e-06, "loss": 0.7161, "step": 5559 }, { "epoch": 0.61, "learning_rate": 7.1184593611820595e-06, "loss": 0.6648, "step": 5560 }, { "epoch": 0.61, "learning_rate": 7.115083177795507e-06, "loss": 0.7344, "step": 5561 }, { "epoch": 0.61, "learning_rate": 7.111707353064565e-06, "loss": 0.7466, "step": 5562 }, { "epoch": 0.61, "learning_rate": 7.108331887408922e-06, "loss": 0.6775, "step": 5563 }, { "epoch": 0.61, "learning_rate": 7.104956781248213e-06, "loss": 0.6665, "step": 5564 }, { "epoch": 0.61, "learning_rate": 7.101582035002039e-06, "loss": 0.6799, "step": 5565 }, { "epoch": 0.61, "learning_rate": 7.09820764908995e-06, "loss": 0.7915, "step": 5566 }, { "epoch": 0.61, "learning_rate": 7.094833623931455e-06, "loss": 0.8105, "step": 5567 }, { "epoch": 0.61, "learning_rate": 7.0914599599460095e-06, "loss": 0.7612, "step": 5568 }, { "epoch": 0.61, "learning_rate": 7.088086657553039e-06, "loss": 0.7234, "step": 5569 }, { "epoch": 0.61, "learning_rate": 7.084713717171912e-06, "loss": 0.738, "step": 5570 }, { "epoch": 0.61, "learning_rate": 7.081341139221955e-06, "loss": 0.616, "step": 5571 }, { "epoch": 0.61, "learning_rate": 7.077968924122454e-06, "loss": 0.7983, "step": 5572 }, { "epoch": 0.61, "learning_rate": 7.074597072292639e-06, "loss": 0.665, "step": 5573 }, { "epoch": 0.61, "learning_rate": 7.071225584151708e-06, "loss": 0.5693, "step": 5574 }, { "epoch": 0.61, "learning_rate": 7.067854460118806e-06, "loss": 0.5823, "step": 5575 }, { "epoch": 0.61, "learning_rate": 7.0644837006130295e-06, "loss": 0.6877, "step": 5576 }, { "epoch": 0.61, "learning_rate": 7.061113306053443e-06, "loss": 0.8018, "step": 5577 }, { "epoch": 0.61, "learning_rate": 7.057743276859048e-06, "loss": 0.7075, "step": 5578 }, { "epoch": 0.61, "learning_rate": 7.0543736134488195e-06, "loss": 0.7466, "step": 5579 }, { "epoch": 0.61, "learning_rate": 7.051004316241672e-06, "loss": 0.5796, "step": 5580 }, { "epoch": 0.61, "learning_rate": 7.047635385656477e-06, "loss": 0.8376, "step": 5581 }, { "epoch": 0.61, "learning_rate": 7.044266822112069e-06, "loss": 0.8423, "step": 5582 }, { "epoch": 0.61, "learning_rate": 7.040898626027228e-06, "loss": 0.6836, "step": 5583 }, { "epoch": 0.61, "learning_rate": 7.037530797820691e-06, "loss": 0.6609, "step": 5584 }, { "epoch": 0.61, "learning_rate": 7.0341633379111515e-06, "loss": 0.6477, "step": 5585 }, { "epoch": 0.61, "learning_rate": 7.0307962467172555e-06, "loss": 0.8237, "step": 5586 }, { "epoch": 0.61, "learning_rate": 7.0274295246575955e-06, "loss": 0.7153, "step": 5587 }, { "epoch": 0.61, "learning_rate": 7.024063172150737e-06, "loss": 0.7739, "step": 5588 }, { "epoch": 0.61, "learning_rate": 7.02069718961518e-06, "loss": 0.7578, "step": 5589 }, { "epoch": 0.61, "learning_rate": 7.017331577469392e-06, "loss": 0.6121, "step": 5590 }, { "epoch": 0.61, "learning_rate": 7.0139663361317864e-06, "loss": 0.7148, "step": 5591 }, { "epoch": 0.61, "learning_rate": 7.010601466020732e-06, "loss": 0.6531, "step": 5592 }, { "epoch": 0.61, "learning_rate": 7.007236967554556e-06, "loss": 0.7861, "step": 5593 }, { "epoch": 0.61, "learning_rate": 7.003872841151533e-06, "loss": 0.8198, "step": 5594 }, { "epoch": 0.61, "learning_rate": 7.0005090872298955e-06, "loss": 0.7227, "step": 5595 }, { "epoch": 0.61, "learning_rate": 6.99714570620783e-06, "loss": 0.5596, "step": 5596 }, { "epoch": 0.61, "learning_rate": 6.993782698503469e-06, "loss": 0.6877, "step": 5597 }, { "epoch": 0.61, "learning_rate": 6.990420064534915e-06, "loss": 0.7686, "step": 5598 }, { "epoch": 0.61, "learning_rate": 6.987057804720208e-06, "loss": 0.7961, "step": 5599 }, { "epoch": 0.61, "learning_rate": 6.983695919477346e-06, "loss": 0.7422, "step": 5600 }, { "epoch": 0.61, "learning_rate": 6.9803344092242855e-06, "loss": 0.6265, "step": 5601 }, { "epoch": 0.61, "learning_rate": 6.976973274378931e-06, "loss": 0.7202, "step": 5602 }, { "epoch": 0.61, "learning_rate": 6.9736125153591405e-06, "loss": 0.6562, "step": 5603 }, { "epoch": 0.61, "learning_rate": 6.970252132582729e-06, "loss": 0.6416, "step": 5604 }, { "epoch": 0.61, "learning_rate": 6.966892126467463e-06, "loss": 0.6589, "step": 5605 }, { "epoch": 0.61, "learning_rate": 6.963532497431056e-06, "loss": 0.5569, "step": 5606 }, { "epoch": 0.61, "learning_rate": 6.960173245891187e-06, "loss": 0.6274, "step": 5607 }, { "epoch": 0.61, "learning_rate": 6.956814372265479e-06, "loss": 0.6282, "step": 5608 }, { "epoch": 0.61, "learning_rate": 6.953455876971511e-06, "loss": 0.6648, "step": 5609 }, { "epoch": 0.61, "learning_rate": 6.950097760426814e-06, "loss": 0.7322, "step": 5610 }, { "epoch": 0.61, "learning_rate": 6.94674002304887e-06, "loss": 0.7007, "step": 5611 }, { "epoch": 0.61, "learning_rate": 6.943382665255119e-06, "loss": 0.6445, "step": 5612 }, { "epoch": 0.61, "learning_rate": 6.940025687462952e-06, "loss": 0.6365, "step": 5613 }, { "epoch": 0.61, "learning_rate": 6.936669090089706e-06, "loss": 0.6765, "step": 5614 }, { "epoch": 0.61, "learning_rate": 6.933312873552682e-06, "loss": 0.6846, "step": 5615 }, { "epoch": 0.61, "learning_rate": 6.929957038269123e-06, "loss": 0.7051, "step": 5616 }, { "epoch": 0.61, "learning_rate": 6.926601584656236e-06, "loss": 0.6714, "step": 5617 }, { "epoch": 0.61, "learning_rate": 6.923246513131172e-06, "loss": 0.7974, "step": 5618 }, { "epoch": 0.61, "learning_rate": 6.919891824111032e-06, "loss": 0.6841, "step": 5619 }, { "epoch": 0.61, "learning_rate": 6.9165375180128805e-06, "loss": 0.6934, "step": 5620 }, { "epoch": 0.61, "learning_rate": 6.913183595253725e-06, "loss": 0.6445, "step": 5621 }, { "epoch": 0.61, "learning_rate": 6.909830056250527e-06, "loss": 0.575, "step": 5622 }, { "epoch": 0.61, "learning_rate": 6.906476901420205e-06, "loss": 0.72, "step": 5623 }, { "epoch": 0.61, "learning_rate": 6.903124131179625e-06, "loss": 0.7427, "step": 5624 }, { "epoch": 0.61, "learning_rate": 6.899771745945601e-06, "loss": 0.6829, "step": 5625 }, { "epoch": 0.61, "learning_rate": 6.896419746134915e-06, "loss": 0.7856, "step": 5626 }, { "epoch": 0.61, "learning_rate": 6.893068132164285e-06, "loss": 0.6455, "step": 5627 }, { "epoch": 0.61, "learning_rate": 6.8897169044503875e-06, "loss": 0.7048, "step": 5628 }, { "epoch": 0.61, "learning_rate": 6.886366063409853e-06, "loss": 0.7573, "step": 5629 }, { "epoch": 0.61, "learning_rate": 6.883015609459254e-06, "loss": 0.8379, "step": 5630 }, { "epoch": 0.61, "learning_rate": 6.87966554301513e-06, "loss": 0.6165, "step": 5631 }, { "epoch": 0.61, "learning_rate": 6.876315864493962e-06, "loss": 0.6672, "step": 5632 }, { "epoch": 0.61, "learning_rate": 6.872966574312182e-06, "loss": 0.6742, "step": 5633 }, { "epoch": 0.61, "learning_rate": 6.869617672886182e-06, "loss": 0.7222, "step": 5634 }, { "epoch": 0.61, "learning_rate": 6.866269160632293e-06, "loss": 0.8701, "step": 5635 }, { "epoch": 0.61, "learning_rate": 6.862921037966815e-06, "loss": 0.7197, "step": 5636 }, { "epoch": 0.61, "learning_rate": 6.859573305305987e-06, "loss": 0.7578, "step": 5637 }, { "epoch": 0.61, "learning_rate": 6.856225963065996e-06, "loss": 0.6423, "step": 5638 }, { "epoch": 0.61, "learning_rate": 6.852879011662994e-06, "loss": 0.6418, "step": 5639 }, { "epoch": 0.61, "learning_rate": 6.8495324515130744e-06, "loss": 0.7153, "step": 5640 }, { "epoch": 0.61, "learning_rate": 6.846186283032282e-06, "loss": 0.7778, "step": 5641 }, { "epoch": 0.61, "learning_rate": 6.842840506636621e-06, "loss": 0.8311, "step": 5642 }, { "epoch": 0.61, "learning_rate": 6.83949512274204e-06, "loss": 0.6836, "step": 5643 }, { "epoch": 0.61, "learning_rate": 6.836150131764434e-06, "loss": 0.7065, "step": 5644 }, { "epoch": 0.61, "learning_rate": 6.832805534119666e-06, "loss": 0.6416, "step": 5645 }, { "epoch": 0.61, "learning_rate": 6.8294613302235325e-06, "loss": 0.77, "step": 5646 }, { "epoch": 0.61, "learning_rate": 6.8261175204917905e-06, "loss": 0.7361, "step": 5647 }, { "epoch": 0.61, "learning_rate": 6.822774105340146e-06, "loss": 0.656, "step": 5648 }, { "epoch": 0.61, "learning_rate": 6.819431085184251e-06, "loss": 0.6318, "step": 5649 }, { "epoch": 0.62, "learning_rate": 6.81608846043972e-06, "loss": 0.6357, "step": 5650 }, { "epoch": 0.62, "learning_rate": 6.812746231522109e-06, "loss": 0.6494, "step": 5651 }, { "epoch": 0.62, "learning_rate": 6.809404398846922e-06, "loss": 0.7527, "step": 5652 }, { "epoch": 0.62, "learning_rate": 6.806062962829626e-06, "loss": 0.6248, "step": 5653 }, { "epoch": 0.62, "learning_rate": 6.802721923885624e-06, "loss": 0.6975, "step": 5654 }, { "epoch": 0.62, "learning_rate": 6.799381282430284e-06, "loss": 0.7334, "step": 5655 }, { "epoch": 0.62, "learning_rate": 6.796041038878918e-06, "loss": 0.6714, "step": 5656 }, { "epoch": 0.62, "learning_rate": 6.7927011936467806e-06, "loss": 0.7563, "step": 5657 }, { "epoch": 0.62, "learning_rate": 6.789361747149092e-06, "loss": 0.6421, "step": 5658 }, { "epoch": 0.62, "learning_rate": 6.786022699801014e-06, "loss": 0.6877, "step": 5659 }, { "epoch": 0.62, "learning_rate": 6.782684052017656e-06, "loss": 0.5889, "step": 5660 }, { "epoch": 0.62, "learning_rate": 6.779345804214088e-06, "loss": 0.6946, "step": 5661 }, { "epoch": 0.62, "learning_rate": 6.77600795680532e-06, "loss": 0.6399, "step": 5662 }, { "epoch": 0.62, "learning_rate": 6.772670510206315e-06, "loss": 0.6951, "step": 5663 }, { "epoch": 0.62, "learning_rate": 6.7693334648319905e-06, "loss": 0.6187, "step": 5664 }, { "epoch": 0.62, "learning_rate": 6.765996821097209e-06, "loss": 0.6277, "step": 5665 }, { "epoch": 0.62, "learning_rate": 6.762660579416791e-06, "loss": 0.7817, "step": 5666 }, { "epoch": 0.62, "learning_rate": 6.7593247402054955e-06, "loss": 0.7646, "step": 5667 }, { "epoch": 0.62, "learning_rate": 6.755989303878037e-06, "loss": 0.6311, "step": 5668 }, { "epoch": 0.62, "learning_rate": 6.752654270849084e-06, "loss": 0.6528, "step": 5669 }, { "epoch": 0.62, "learning_rate": 6.74931964153325e-06, "loss": 0.6506, "step": 5670 }, { "epoch": 0.62, "learning_rate": 6.745985416345093e-06, "loss": 0.7021, "step": 5671 }, { "epoch": 0.62, "learning_rate": 6.7426515956991364e-06, "loss": 0.6975, "step": 5672 }, { "epoch": 0.62, "learning_rate": 6.739318180009835e-06, "loss": 0.7305, "step": 5673 }, { "epoch": 0.62, "learning_rate": 6.735985169691612e-06, "loss": 0.7485, "step": 5674 }, { "epoch": 0.62, "learning_rate": 6.7326525651588235e-06, "loss": 0.5791, "step": 5675 }, { "epoch": 0.62, "learning_rate": 6.729320366825785e-06, "loss": 0.6553, "step": 5676 }, { "epoch": 0.62, "learning_rate": 6.725988575106757e-06, "loss": 0.76, "step": 5677 }, { "epoch": 0.62, "learning_rate": 6.722657190415951e-06, "loss": 0.6719, "step": 5678 }, { "epoch": 0.62, "learning_rate": 6.719326213167527e-06, "loss": 0.7393, "step": 5679 }, { "epoch": 0.62, "learning_rate": 6.715995643775601e-06, "loss": 0.616, "step": 5680 }, { "epoch": 0.62, "learning_rate": 6.712665482654226e-06, "loss": 0.7139, "step": 5681 }, { "epoch": 0.62, "learning_rate": 6.709335730217412e-06, "loss": 0.7075, "step": 5682 }, { "epoch": 0.62, "learning_rate": 6.7060063868791185e-06, "loss": 0.6912, "step": 5683 }, { "epoch": 0.62, "learning_rate": 6.70267745305325e-06, "loss": 0.6978, "step": 5684 }, { "epoch": 0.62, "learning_rate": 6.699348929153668e-06, "loss": 0.71, "step": 5685 }, { "epoch": 0.62, "learning_rate": 6.696020815594176e-06, "loss": 0.7432, "step": 5686 }, { "epoch": 0.62, "learning_rate": 6.692693112788524e-06, "loss": 0.7256, "step": 5687 }, { "epoch": 0.62, "learning_rate": 6.689365821150421e-06, "loss": 0.7573, "step": 5688 }, { "epoch": 0.62, "learning_rate": 6.6860389410935155e-06, "loss": 0.634, "step": 5689 }, { "epoch": 0.62, "learning_rate": 6.682712473031407e-06, "loss": 0.613, "step": 5690 }, { "epoch": 0.62, "learning_rate": 6.679386417377649e-06, "loss": 0.7512, "step": 5691 }, { "epoch": 0.62, "learning_rate": 6.676060774545735e-06, "loss": 0.6216, "step": 5692 }, { "epoch": 0.62, "learning_rate": 6.67273554494912e-06, "loss": 0.647, "step": 5693 }, { "epoch": 0.62, "learning_rate": 6.669410729001193e-06, "loss": 0.7852, "step": 5694 }, { "epoch": 0.62, "learning_rate": 6.6660863271152995e-06, "loss": 0.6743, "step": 5695 }, { "epoch": 0.62, "learning_rate": 6.6627623397047355e-06, "loss": 0.5845, "step": 5696 }, { "epoch": 0.62, "learning_rate": 6.65943876718274e-06, "loss": 0.7158, "step": 5697 }, { "epoch": 0.62, "learning_rate": 6.656115609962499e-06, "loss": 0.636, "step": 5698 }, { "epoch": 0.62, "learning_rate": 6.652792868457159e-06, "loss": 0.6841, "step": 5699 }, { "epoch": 0.62, "learning_rate": 6.649470543079799e-06, "loss": 0.7339, "step": 5700 }, { "epoch": 0.62, "learning_rate": 6.646148634243455e-06, "loss": 0.6765, "step": 5701 }, { "epoch": 0.62, "learning_rate": 6.642827142361111e-06, "loss": 0.5571, "step": 5702 }, { "epoch": 0.62, "learning_rate": 6.639506067845698e-06, "loss": 0.6389, "step": 5703 }, { "epoch": 0.62, "learning_rate": 6.636185411110099e-06, "loss": 0.6538, "step": 5704 }, { "epoch": 0.62, "learning_rate": 6.632865172567136e-06, "loss": 0.7607, "step": 5705 }, { "epoch": 0.62, "learning_rate": 6.629545352629583e-06, "loss": 0.645, "step": 5706 }, { "epoch": 0.62, "learning_rate": 6.62622595171017e-06, "loss": 0.7739, "step": 5707 }, { "epoch": 0.62, "learning_rate": 6.622906970221563e-06, "loss": 0.7129, "step": 5708 }, { "epoch": 0.62, "learning_rate": 6.619588408576378e-06, "loss": 0.7544, "step": 5709 }, { "epoch": 0.62, "learning_rate": 6.61627026718719e-06, "loss": 0.7437, "step": 5710 }, { "epoch": 0.62, "learning_rate": 6.6129525464665056e-06, "loss": 0.6685, "step": 5711 }, { "epoch": 0.62, "learning_rate": 6.6096352468267935e-06, "loss": 0.749, "step": 5712 }, { "epoch": 0.62, "learning_rate": 6.606318368680461e-06, "loss": 0.6826, "step": 5713 }, { "epoch": 0.62, "learning_rate": 6.603001912439864e-06, "loss": 0.7183, "step": 5714 }, { "epoch": 0.62, "learning_rate": 6.5996858785173105e-06, "loss": 0.7563, "step": 5715 }, { "epoch": 0.62, "learning_rate": 6.59637026732505e-06, "loss": 0.7725, "step": 5716 }, { "epoch": 0.62, "learning_rate": 6.593055079275281e-06, "loss": 0.5554, "step": 5717 }, { "epoch": 0.62, "learning_rate": 6.589740314780157e-06, "loss": 0.752, "step": 5718 }, { "epoch": 0.62, "learning_rate": 6.58642597425177e-06, "loss": 0.7061, "step": 5719 }, { "epoch": 0.62, "learning_rate": 6.583112058102158e-06, "loss": 0.7651, "step": 5720 }, { "epoch": 0.62, "learning_rate": 6.579798566743314e-06, "loss": 0.6843, "step": 5721 }, { "epoch": 0.62, "learning_rate": 6.576485500587173e-06, "loss": 0.6466, "step": 5722 }, { "epoch": 0.62, "learning_rate": 6.5731728600456214e-06, "loss": 0.7202, "step": 5723 }, { "epoch": 0.62, "learning_rate": 6.569860645530488e-06, "loss": 0.6653, "step": 5724 }, { "epoch": 0.62, "learning_rate": 6.566548857453548e-06, "loss": 0.6235, "step": 5725 }, { "epoch": 0.62, "learning_rate": 6.563237496226531e-06, "loss": 0.79, "step": 5726 }, { "epoch": 0.62, "learning_rate": 6.559926562261106e-06, "loss": 0.6401, "step": 5727 }, { "epoch": 0.62, "learning_rate": 6.5566160559688875e-06, "loss": 0.7007, "step": 5728 }, { "epoch": 0.62, "learning_rate": 6.553305977761448e-06, "loss": 0.7476, "step": 5729 }, { "epoch": 0.62, "learning_rate": 6.549996328050296e-06, "loss": 0.709, "step": 5730 }, { "epoch": 0.62, "learning_rate": 6.5466871072468875e-06, "loss": 0.6531, "step": 5731 }, { "epoch": 0.62, "learning_rate": 6.543378315762634e-06, "loss": 0.6638, "step": 5732 }, { "epoch": 0.62, "learning_rate": 6.540069954008883e-06, "loss": 0.7627, "step": 5733 }, { "epoch": 0.62, "learning_rate": 6.536762022396936e-06, "loss": 0.6394, "step": 5734 }, { "epoch": 0.62, "learning_rate": 6.533454521338039e-06, "loss": 0.6963, "step": 5735 }, { "epoch": 0.62, "learning_rate": 6.530147451243377e-06, "loss": 0.7554, "step": 5736 }, { "epoch": 0.62, "learning_rate": 6.526840812524096e-06, "loss": 0.7178, "step": 5737 }, { "epoch": 0.62, "learning_rate": 6.523534605591278e-06, "loss": 0.6582, "step": 5738 }, { "epoch": 0.62, "learning_rate": 6.52022883085595e-06, "loss": 0.7039, "step": 5739 }, { "epoch": 0.62, "learning_rate": 6.516923488729092e-06, "loss": 0.8008, "step": 5740 }, { "epoch": 0.62, "learning_rate": 6.5136185796216285e-06, "loss": 0.6804, "step": 5741 }, { "epoch": 0.63, "learning_rate": 6.510314103944431e-06, "loss": 0.5327, "step": 5742 }, { "epoch": 0.63, "learning_rate": 6.50701006210831e-06, "loss": 0.79, "step": 5743 }, { "epoch": 0.63, "learning_rate": 6.503706454524027e-06, "loss": 0.6338, "step": 5744 }, { "epoch": 0.63, "learning_rate": 6.500403281602295e-06, "loss": 0.5881, "step": 5745 }, { "epoch": 0.63, "learning_rate": 6.497100543753763e-06, "loss": 0.6436, "step": 5746 }, { "epoch": 0.63, "learning_rate": 6.493798241389031e-06, "loss": 0.7593, "step": 5747 }, { "epoch": 0.63, "learning_rate": 6.490496374918647e-06, "loss": 0.6499, "step": 5748 }, { "epoch": 0.63, "learning_rate": 6.487194944753099e-06, "loss": 0.655, "step": 5749 }, { "epoch": 0.63, "learning_rate": 6.483893951302823e-06, "loss": 0.6367, "step": 5750 }, { "epoch": 0.63, "learning_rate": 6.480593394978208e-06, "loss": 0.5706, "step": 5751 }, { "epoch": 0.63, "learning_rate": 6.477293276189576e-06, "loss": 0.6396, "step": 5752 }, { "epoch": 0.63, "learning_rate": 6.4739935953472055e-06, "loss": 0.7334, "step": 5753 }, { "epoch": 0.63, "learning_rate": 6.4706943528613135e-06, "loss": 0.7466, "step": 5754 }, { "epoch": 0.63, "learning_rate": 6.467395549142063e-06, "loss": 0.7874, "step": 5755 }, { "epoch": 0.63, "learning_rate": 6.4640971845995685e-06, "loss": 0.8105, "step": 5756 }, { "epoch": 0.63, "learning_rate": 6.460799259643884e-06, "loss": 0.7305, "step": 5757 }, { "epoch": 0.63, "learning_rate": 6.4575017746850086e-06, "loss": 0.7432, "step": 5758 }, { "epoch": 0.63, "learning_rate": 6.454204730132891e-06, "loss": 0.8447, "step": 5759 }, { "epoch": 0.63, "learning_rate": 6.450908126397424e-06, "loss": 0.697, "step": 5760 }, { "epoch": 0.63, "learning_rate": 6.447611963888443e-06, "loss": 0.7222, "step": 5761 }, { "epoch": 0.63, "learning_rate": 6.444316243015731e-06, "loss": 0.7144, "step": 5762 }, { "epoch": 0.63, "learning_rate": 6.441020964189013e-06, "loss": 0.6943, "step": 5763 }, { "epoch": 0.63, "learning_rate": 6.437726127817965e-06, "loss": 0.6824, "step": 5764 }, { "epoch": 0.63, "learning_rate": 6.434431734312201e-06, "loss": 0.6758, "step": 5765 }, { "epoch": 0.63, "learning_rate": 6.431137784081283e-06, "loss": 0.54, "step": 5766 }, { "epoch": 0.63, "learning_rate": 6.42784427753472e-06, "loss": 0.6929, "step": 5767 }, { "epoch": 0.63, "learning_rate": 6.424551215081964e-06, "loss": 0.7656, "step": 5768 }, { "epoch": 0.63, "learning_rate": 6.421258597132406e-06, "loss": 0.6365, "step": 5769 }, { "epoch": 0.63, "learning_rate": 6.417966424095397e-06, "loss": 0.7661, "step": 5770 }, { "epoch": 0.63, "learning_rate": 6.414674696380214e-06, "loss": 0.709, "step": 5771 }, { "epoch": 0.63, "learning_rate": 6.411383414396095e-06, "loss": 0.594, "step": 5772 }, { "epoch": 0.63, "learning_rate": 6.408092578552212e-06, "loss": 0.7578, "step": 5773 }, { "epoch": 0.63, "learning_rate": 6.404802189257683e-06, "loss": 0.832, "step": 5774 }, { "epoch": 0.63, "learning_rate": 6.401512246921576e-06, "loss": 0.6433, "step": 5775 }, { "epoch": 0.63, "learning_rate": 6.3982227519528986e-06, "loss": 0.7437, "step": 5776 }, { "epoch": 0.63, "learning_rate": 6.3949337047606015e-06, "loss": 0.6968, "step": 5777 }, { "epoch": 0.63, "learning_rate": 6.3916451057535836e-06, "loss": 0.7661, "step": 5778 }, { "epoch": 0.63, "learning_rate": 6.388356955340688e-06, "loss": 0.7666, "step": 5779 }, { "epoch": 0.63, "learning_rate": 6.3850692539307006e-06, "loss": 0.7102, "step": 5780 }, { "epoch": 0.63, "learning_rate": 6.381782001932352e-06, "loss": 0.6621, "step": 5781 }, { "epoch": 0.63, "learning_rate": 6.378495199754313e-06, "loss": 0.7891, "step": 5782 }, { "epoch": 0.63, "learning_rate": 6.375208847805206e-06, "loss": 0.6699, "step": 5783 }, { "epoch": 0.63, "learning_rate": 6.3719229464935915e-06, "loss": 0.7627, "step": 5784 }, { "epoch": 0.63, "learning_rate": 6.368637496227976e-06, "loss": 0.6821, "step": 5785 }, { "epoch": 0.63, "learning_rate": 6.3653524974168105e-06, "loss": 0.7327, "step": 5786 }, { "epoch": 0.63, "learning_rate": 6.362067950468489e-06, "loss": 0.6089, "step": 5787 }, { "epoch": 0.63, "learning_rate": 6.358783855791344e-06, "loss": 0.7673, "step": 5788 }, { "epoch": 0.63, "learning_rate": 6.355500213793668e-06, "loss": 0.7014, "step": 5789 }, { "epoch": 0.63, "learning_rate": 6.352217024883678e-06, "loss": 0.772, "step": 5790 }, { "epoch": 0.63, "learning_rate": 6.348934289469548e-06, "loss": 0.748, "step": 5791 }, { "epoch": 0.63, "learning_rate": 6.345652007959389e-06, "loss": 0.6099, "step": 5792 }, { "epoch": 0.63, "learning_rate": 6.342370180761256e-06, "loss": 0.7285, "step": 5793 }, { "epoch": 0.63, "learning_rate": 6.339088808283151e-06, "loss": 0.7783, "step": 5794 }, { "epoch": 0.63, "learning_rate": 6.335807890933018e-06, "loss": 0.6538, "step": 5795 }, { "epoch": 0.63, "learning_rate": 6.33252742911874e-06, "loss": 0.6265, "step": 5796 }, { "epoch": 0.63, "learning_rate": 6.3292474232481485e-06, "loss": 0.7256, "step": 5797 }, { "epoch": 0.63, "learning_rate": 6.3259678737290174e-06, "loss": 0.7549, "step": 5798 }, { "epoch": 0.63, "learning_rate": 6.3226887809690675e-06, "loss": 0.6975, "step": 5799 }, { "epoch": 0.63, "learning_rate": 6.319410145375955e-06, "loss": 0.7522, "step": 5800 }, { "epoch": 0.63, "learning_rate": 6.316131967357279e-06, "loss": 0.6423, "step": 5801 }, { "epoch": 0.63, "learning_rate": 6.312854247320594e-06, "loss": 0.6558, "step": 5802 }, { "epoch": 0.63, "learning_rate": 6.309576985673385e-06, "loss": 0.7134, "step": 5803 }, { "epoch": 0.63, "learning_rate": 6.3063001828230815e-06, "loss": 0.7383, "step": 5804 }, { "epoch": 0.63, "learning_rate": 6.303023839177065e-06, "loss": 0.6379, "step": 5805 }, { "epoch": 0.63, "learning_rate": 6.299747955142648e-06, "loss": 0.6785, "step": 5806 }, { "epoch": 0.63, "learning_rate": 6.296472531127092e-06, "loss": 0.7473, "step": 5807 }, { "epoch": 0.63, "learning_rate": 6.293197567537605e-06, "loss": 0.6914, "step": 5808 }, { "epoch": 0.63, "learning_rate": 6.2899230647813315e-06, "loss": 0.6523, "step": 5809 }, { "epoch": 0.63, "learning_rate": 6.2866490232653624e-06, "loss": 0.7153, "step": 5810 }, { "epoch": 0.63, "learning_rate": 6.283375443396726e-06, "loss": 0.7676, "step": 5811 }, { "epoch": 0.63, "learning_rate": 6.280102325582398e-06, "loss": 0.6311, "step": 5812 }, { "epoch": 0.63, "learning_rate": 6.276829670229299e-06, "loss": 0.7354, "step": 5813 }, { "epoch": 0.63, "learning_rate": 6.2735574777442855e-06, "loss": 0.7351, "step": 5814 }, { "epoch": 0.63, "learning_rate": 6.270285748534157e-06, "loss": 0.7617, "step": 5815 }, { "epoch": 0.63, "learning_rate": 6.267014483005664e-06, "loss": 0.6127, "step": 5816 }, { "epoch": 0.63, "learning_rate": 6.263743681565485e-06, "loss": 0.741, "step": 5817 }, { "epoch": 0.63, "learning_rate": 6.260473344620259e-06, "loss": 0.5884, "step": 5818 }, { "epoch": 0.63, "learning_rate": 6.257203472576554e-06, "loss": 0.6833, "step": 5819 }, { "epoch": 0.63, "learning_rate": 6.25393406584088e-06, "loss": 0.8179, "step": 5820 }, { "epoch": 0.63, "learning_rate": 6.250665124819697e-06, "loss": 0.7363, "step": 5821 }, { "epoch": 0.63, "learning_rate": 6.2473966499194014e-06, "loss": 0.7261, "step": 5822 }, { "epoch": 0.63, "learning_rate": 6.244128641546331e-06, "loss": 0.7412, "step": 5823 }, { "epoch": 0.63, "learning_rate": 6.240861100106772e-06, "loss": 0.7432, "step": 5824 }, { "epoch": 0.63, "learning_rate": 6.237594026006944e-06, "loss": 0.6726, "step": 5825 }, { "epoch": 0.63, "learning_rate": 6.234327419653013e-06, "loss": 0.707, "step": 5826 }, { "epoch": 0.63, "learning_rate": 6.231061281451091e-06, "loss": 0.5815, "step": 5827 }, { "epoch": 0.63, "learning_rate": 6.227795611807223e-06, "loss": 0.6841, "step": 5828 }, { "epoch": 0.63, "learning_rate": 6.224530411127403e-06, "loss": 0.8301, "step": 5829 }, { "epoch": 0.63, "learning_rate": 6.221265679817563e-06, "loss": 0.7573, "step": 5830 }, { "epoch": 0.63, "learning_rate": 6.218001418283577e-06, "loss": 0.6489, "step": 5831 }, { "epoch": 0.63, "learning_rate": 6.214737626931261e-06, "loss": 0.6787, "step": 5832 }, { "epoch": 0.63, "learning_rate": 6.211474306166374e-06, "loss": 0.7188, "step": 5833 }, { "epoch": 0.64, "learning_rate": 6.208211456394612e-06, "loss": 0.6597, "step": 5834 }, { "epoch": 0.64, "learning_rate": 6.20494907802162e-06, "loss": 0.71, "step": 5835 }, { "epoch": 0.64, "learning_rate": 6.2016871714529725e-06, "loss": 0.6902, "step": 5836 }, { "epoch": 0.64, "learning_rate": 6.198425737094202e-06, "loss": 0.6118, "step": 5837 }, { "epoch": 0.64, "learning_rate": 6.19516477535077e-06, "loss": 0.8022, "step": 5838 }, { "epoch": 0.64, "learning_rate": 6.191904286628081e-06, "loss": 0.6965, "step": 5839 }, { "epoch": 0.64, "learning_rate": 6.1886442713314835e-06, "loss": 0.7988, "step": 5840 }, { "epoch": 0.64, "learning_rate": 6.185384729866264e-06, "loss": 0.7307, "step": 5841 }, { "epoch": 0.64, "learning_rate": 6.18212566263765e-06, "loss": 0.728, "step": 5842 }, { "epoch": 0.64, "learning_rate": 6.178867070050818e-06, "loss": 0.696, "step": 5843 }, { "epoch": 0.64, "learning_rate": 6.175608952510875e-06, "loss": 0.7505, "step": 5844 }, { "epoch": 0.64, "learning_rate": 6.17235131042287e-06, "loss": 0.6523, "step": 5845 }, { "epoch": 0.64, "learning_rate": 6.169094144191805e-06, "loss": 0.769, "step": 5846 }, { "epoch": 0.64, "learning_rate": 6.165837454222607e-06, "loss": 0.7451, "step": 5847 }, { "epoch": 0.64, "learning_rate": 6.1625812409201546e-06, "loss": 0.6277, "step": 5848 }, { "epoch": 0.64, "learning_rate": 6.159325504689262e-06, "loss": 0.7139, "step": 5849 }, { "epoch": 0.64, "learning_rate": 6.1560702459346845e-06, "loss": 0.7058, "step": 5850 }, { "epoch": 0.64, "learning_rate": 6.15281546506112e-06, "loss": 0.7681, "step": 5851 }, { "epoch": 0.64, "learning_rate": 6.149561162473206e-06, "loss": 0.7495, "step": 5852 }, { "epoch": 0.64, "learning_rate": 6.146307338575519e-06, "loss": 0.7007, "step": 5853 }, { "epoch": 0.64, "learning_rate": 6.1430539937725796e-06, "loss": 0.6931, "step": 5854 }, { "epoch": 0.64, "learning_rate": 6.139801128468843e-06, "loss": 0.7246, "step": 5855 }, { "epoch": 0.64, "learning_rate": 6.136548743068713e-06, "loss": 0.7019, "step": 5856 }, { "epoch": 0.64, "learning_rate": 6.13329683797653e-06, "loss": 0.6765, "step": 5857 }, { "epoch": 0.64, "learning_rate": 6.130045413596568e-06, "loss": 0.6262, "step": 5858 }, { "epoch": 0.64, "learning_rate": 6.126794470333054e-06, "loss": 0.7407, "step": 5859 }, { "epoch": 0.64, "learning_rate": 6.123544008590144e-06, "loss": 0.6548, "step": 5860 }, { "epoch": 0.64, "learning_rate": 6.120294028771938e-06, "loss": 0.666, "step": 5861 }, { "epoch": 0.64, "learning_rate": 6.117044531282481e-06, "loss": 0.6069, "step": 5862 }, { "epoch": 0.64, "learning_rate": 6.113795516525749e-06, "loss": 0.7168, "step": 5863 }, { "epoch": 0.64, "learning_rate": 6.110546984905661e-06, "loss": 0.6863, "step": 5864 }, { "epoch": 0.64, "learning_rate": 6.107298936826086e-06, "loss": 0.7402, "step": 5865 }, { "epoch": 0.64, "learning_rate": 6.1040513726908154e-06, "loss": 0.6858, "step": 5866 }, { "epoch": 0.64, "learning_rate": 6.100804292903597e-06, "loss": 0.7961, "step": 5867 }, { "epoch": 0.64, "learning_rate": 6.097557697868108e-06, "loss": 0.6648, "step": 5868 }, { "epoch": 0.64, "learning_rate": 6.094311587987964e-06, "loss": 0.7234, "step": 5869 }, { "epoch": 0.64, "learning_rate": 6.0910659636667304e-06, "loss": 0.6987, "step": 5870 }, { "epoch": 0.64, "learning_rate": 6.087820825307904e-06, "loss": 0.7139, "step": 5871 }, { "epoch": 0.64, "learning_rate": 6.084576173314921e-06, "loss": 0.7395, "step": 5872 }, { "epoch": 0.64, "learning_rate": 6.081332008091164e-06, "loss": 0.7339, "step": 5873 }, { "epoch": 0.64, "learning_rate": 6.078088330039945e-06, "loss": 0.6333, "step": 5874 }, { "epoch": 0.64, "learning_rate": 6.074845139564529e-06, "loss": 0.6777, "step": 5875 }, { "epoch": 0.64, "learning_rate": 6.071602437068108e-06, "loss": 0.7537, "step": 5876 }, { "epoch": 0.64, "learning_rate": 6.068360222953816e-06, "loss": 0.7075, "step": 5877 }, { "epoch": 0.64, "learning_rate": 6.065118497624734e-06, "loss": 0.7014, "step": 5878 }, { "epoch": 0.64, "learning_rate": 6.061877261483871e-06, "loss": 0.752, "step": 5879 }, { "epoch": 0.64, "learning_rate": 6.058636514934181e-06, "loss": 0.7346, "step": 5880 }, { "epoch": 0.64, "learning_rate": 6.05539625837856e-06, "loss": 0.6611, "step": 5881 }, { "epoch": 0.64, "learning_rate": 6.0521564922198385e-06, "loss": 0.7466, "step": 5882 }, { "epoch": 0.64, "learning_rate": 6.0489172168607816e-06, "loss": 0.6077, "step": 5883 }, { "epoch": 0.64, "learning_rate": 6.045678432704107e-06, "loss": 0.6948, "step": 5884 }, { "epoch": 0.64, "learning_rate": 6.042440140152461e-06, "loss": 0.7998, "step": 5885 }, { "epoch": 0.64, "learning_rate": 6.039202339608432e-06, "loss": 0.7043, "step": 5886 }, { "epoch": 0.64, "learning_rate": 6.035965031474546e-06, "loss": 0.5664, "step": 5887 }, { "epoch": 0.64, "learning_rate": 6.032728216153265e-06, "loss": 0.783, "step": 5888 }, { "epoch": 0.64, "learning_rate": 6.029491894046997e-06, "loss": 0.7002, "step": 5889 }, { "epoch": 0.64, "learning_rate": 6.0262560655580825e-06, "loss": 0.7378, "step": 5890 }, { "epoch": 0.64, "learning_rate": 6.0230207310888035e-06, "loss": 0.668, "step": 5891 }, { "epoch": 0.64, "learning_rate": 6.019785891041381e-06, "loss": 0.6206, "step": 5892 }, { "epoch": 0.64, "learning_rate": 6.016551545817967e-06, "loss": 0.6958, "step": 5893 }, { "epoch": 0.64, "learning_rate": 6.013317695820668e-06, "loss": 0.7388, "step": 5894 }, { "epoch": 0.64, "learning_rate": 6.010084341451516e-06, "loss": 0.8052, "step": 5895 }, { "epoch": 0.64, "learning_rate": 6.00685148311248e-06, "loss": 0.7109, "step": 5896 }, { "epoch": 0.64, "learning_rate": 6.00361912120548e-06, "loss": 0.5974, "step": 5897 }, { "epoch": 0.64, "learning_rate": 6.000387256132359e-06, "loss": 0.6826, "step": 5898 }, { "epoch": 0.64, "learning_rate": 5.997155888294908e-06, "loss": 0.6497, "step": 5899 }, { "epoch": 0.64, "learning_rate": 5.993925018094856e-06, "loss": 0.655, "step": 5900 }, { "epoch": 0.64, "learning_rate": 5.990694645933866e-06, "loss": 0.667, "step": 5901 }, { "epoch": 0.64, "learning_rate": 5.987464772213539e-06, "loss": 0.7056, "step": 5902 }, { "epoch": 0.64, "learning_rate": 5.984235397335418e-06, "loss": 0.7017, "step": 5903 }, { "epoch": 0.64, "learning_rate": 5.981006521700983e-06, "loss": 0.6812, "step": 5904 }, { "epoch": 0.64, "learning_rate": 5.97777814571165e-06, "loss": 0.7134, "step": 5905 }, { "epoch": 0.64, "learning_rate": 5.974550269768775e-06, "loss": 0.6748, "step": 5906 }, { "epoch": 0.64, "learning_rate": 5.971322894273646e-06, "loss": 0.7344, "step": 5907 }, { "epoch": 0.64, "learning_rate": 5.9680960196274995e-06, "loss": 0.7344, "step": 5908 }, { "epoch": 0.64, "learning_rate": 5.964869646231501e-06, "loss": 0.66, "step": 5909 }, { "epoch": 0.64, "learning_rate": 5.961643774486754e-06, "loss": 0.71, "step": 5910 }, { "epoch": 0.64, "learning_rate": 5.958418404794306e-06, "loss": 0.8262, "step": 5911 }, { "epoch": 0.64, "learning_rate": 5.955193537555131e-06, "loss": 0.6453, "step": 5912 }, { "epoch": 0.64, "learning_rate": 5.951969173170158e-06, "loss": 0.702, "step": 5913 }, { "epoch": 0.64, "learning_rate": 5.948745312040237e-06, "loss": 0.7749, "step": 5914 }, { "epoch": 0.64, "learning_rate": 5.94552195456616e-06, "loss": 0.6855, "step": 5915 }, { "epoch": 0.64, "learning_rate": 5.9422991011486635e-06, "loss": 0.7197, "step": 5916 }, { "epoch": 0.64, "learning_rate": 5.939076752188411e-06, "loss": 0.728, "step": 5917 }, { "epoch": 0.64, "learning_rate": 5.935854908086007e-06, "loss": 0.7397, "step": 5918 }, { "epoch": 0.64, "learning_rate": 5.932633569242e-06, "loss": 0.6455, "step": 5919 }, { "epoch": 0.64, "learning_rate": 5.9294127360568655e-06, "loss": 0.7205, "step": 5920 }, { "epoch": 0.64, "learning_rate": 5.926192408931019e-06, "loss": 0.7029, "step": 5921 }, { "epoch": 0.64, "learning_rate": 5.922972588264818e-06, "loss": 0.7012, "step": 5922 }, { "epoch": 0.64, "learning_rate": 5.9197532744585525e-06, "loss": 0.5442, "step": 5923 }, { "epoch": 0.64, "learning_rate": 5.916534467912453e-06, "loss": 0.6643, "step": 5924 }, { "epoch": 0.65, "learning_rate": 5.913316169026683e-06, "loss": 0.7417, "step": 5925 }, { "epoch": 0.65, "learning_rate": 5.910098378201341e-06, "loss": 0.6445, "step": 5926 }, { "epoch": 0.65, "learning_rate": 5.906881095836472e-06, "loss": 0.7056, "step": 5927 }, { "epoch": 0.65, "learning_rate": 5.903664322332048e-06, "loss": 0.6626, "step": 5928 }, { "epoch": 0.65, "learning_rate": 5.9004480580879795e-06, "loss": 0.6277, "step": 5929 }, { "epoch": 0.65, "learning_rate": 5.89723230350412e-06, "loss": 0.75, "step": 5930 }, { "epoch": 0.65, "learning_rate": 5.894017058980249e-06, "loss": 0.6572, "step": 5931 }, { "epoch": 0.65, "learning_rate": 5.8908023249160974e-06, "loss": 0.6528, "step": 5932 }, { "epoch": 0.65, "learning_rate": 5.887588101711319e-06, "loss": 0.7886, "step": 5933 }, { "epoch": 0.65, "learning_rate": 5.884374389765508e-06, "loss": 0.6594, "step": 5934 }, { "epoch": 0.65, "learning_rate": 5.881161189478199e-06, "loss": 0.5798, "step": 5935 }, { "epoch": 0.65, "learning_rate": 5.877948501248858e-06, "loss": 0.7422, "step": 5936 }, { "epoch": 0.65, "learning_rate": 5.87473632547689e-06, "loss": 0.7598, "step": 5937 }, { "epoch": 0.65, "learning_rate": 5.8715246625616365e-06, "loss": 0.6658, "step": 5938 }, { "epoch": 0.65, "learning_rate": 5.868313512902375e-06, "loss": 0.7058, "step": 5939 }, { "epoch": 0.65, "learning_rate": 5.8651028768983155e-06, "loss": 0.658, "step": 5940 }, { "epoch": 0.65, "learning_rate": 5.8618927549486095e-06, "loss": 0.6157, "step": 5941 }, { "epoch": 0.65, "learning_rate": 5.858683147452342e-06, "loss": 0.6841, "step": 5942 }, { "epoch": 0.65, "learning_rate": 5.855474054808536e-06, "loss": 0.6819, "step": 5943 }, { "epoch": 0.65, "learning_rate": 5.8522654774161506e-06, "loss": 0.8066, "step": 5944 }, { "epoch": 0.65, "learning_rate": 5.849057415674072e-06, "loss": 0.6931, "step": 5945 }, { "epoch": 0.65, "learning_rate": 5.845849869981137e-06, "loss": 0.7666, "step": 5946 }, { "epoch": 0.65, "learning_rate": 5.842642840736108e-06, "loss": 0.719, "step": 5947 }, { "epoch": 0.65, "learning_rate": 5.839436328337682e-06, "loss": 0.6948, "step": 5948 }, { "epoch": 0.65, "learning_rate": 5.836230333184505e-06, "loss": 0.6162, "step": 5949 }, { "epoch": 0.65, "learning_rate": 5.833024855675136e-06, "loss": 0.6602, "step": 5950 }, { "epoch": 0.65, "learning_rate": 5.829819896208093e-06, "loss": 0.615, "step": 5951 }, { "epoch": 0.65, "learning_rate": 5.8266154551818225e-06, "loss": 0.6296, "step": 5952 }, { "epoch": 0.65, "learning_rate": 5.823411532994694e-06, "loss": 0.7581, "step": 5953 }, { "epoch": 0.65, "learning_rate": 5.820208130045031e-06, "loss": 0.6765, "step": 5954 }, { "epoch": 0.65, "learning_rate": 5.8170052467310734e-06, "loss": 0.6194, "step": 5955 }, { "epoch": 0.65, "learning_rate": 5.813802883451014e-06, "loss": 0.5886, "step": 5956 }, { "epoch": 0.65, "learning_rate": 5.810601040602977e-06, "loss": 0.7852, "step": 5957 }, { "epoch": 0.65, "learning_rate": 5.80739971858501e-06, "loss": 0.6711, "step": 5958 }, { "epoch": 0.65, "learning_rate": 5.804198917795106e-06, "loss": 0.6536, "step": 5959 }, { "epoch": 0.65, "learning_rate": 5.800998638631196e-06, "loss": 0.7437, "step": 5960 }, { "epoch": 0.65, "learning_rate": 5.797798881491138e-06, "loss": 0.7322, "step": 5961 }, { "epoch": 0.65, "learning_rate": 5.794599646772731e-06, "loss": 0.6401, "step": 5962 }, { "epoch": 0.65, "learning_rate": 5.79140093487371e-06, "loss": 0.6868, "step": 5963 }, { "epoch": 0.65, "learning_rate": 5.788202746191735e-06, "loss": 0.6707, "step": 5964 }, { "epoch": 0.65, "learning_rate": 5.785005081124414e-06, "loss": 0.7261, "step": 5965 }, { "epoch": 0.65, "learning_rate": 5.781807940069277e-06, "loss": 0.6877, "step": 5966 }, { "epoch": 0.65, "learning_rate": 5.778611323423801e-06, "loss": 0.6497, "step": 5967 }, { "epoch": 0.65, "learning_rate": 5.775415231585393e-06, "loss": 0.7241, "step": 5968 }, { "epoch": 0.65, "learning_rate": 5.77221966495139e-06, "loss": 0.6653, "step": 5969 }, { "epoch": 0.65, "learning_rate": 5.769024623919064e-06, "loss": 0.6931, "step": 5970 }, { "epoch": 0.65, "learning_rate": 5.76583010888564e-06, "loss": 0.6821, "step": 5971 }, { "epoch": 0.65, "learning_rate": 5.762636120248252e-06, "loss": 0.6548, "step": 5972 }, { "epoch": 0.65, "learning_rate": 5.759442658403985e-06, "loss": 0.6509, "step": 5973 }, { "epoch": 0.65, "learning_rate": 5.756249723749847e-06, "loss": 0.647, "step": 5974 }, { "epoch": 0.65, "learning_rate": 5.7530573166827905e-06, "loss": 0.5698, "step": 5975 }, { "epoch": 0.65, "learning_rate": 5.749865437599703e-06, "loss": 0.718, "step": 5976 }, { "epoch": 0.65, "learning_rate": 5.746674086897392e-06, "loss": 0.7603, "step": 5977 }, { "epoch": 0.65, "learning_rate": 5.743483264972616e-06, "loss": 0.7212, "step": 5978 }, { "epoch": 0.65, "learning_rate": 5.740292972222059e-06, "loss": 0.7034, "step": 5979 }, { "epoch": 0.65, "learning_rate": 5.737103209042342e-06, "loss": 0.7734, "step": 5980 }, { "epoch": 0.65, "learning_rate": 5.733913975830019e-06, "loss": 0.6792, "step": 5981 }, { "epoch": 0.65, "learning_rate": 5.7307252729815835e-06, "loss": 0.6719, "step": 5982 }, { "epoch": 0.65, "learning_rate": 5.727537100893448e-06, "loss": 0.7141, "step": 5983 }, { "epoch": 0.65, "learning_rate": 5.72434945996198e-06, "loss": 0.7646, "step": 5984 }, { "epoch": 0.65, "learning_rate": 5.72116235058346e-06, "loss": 0.6218, "step": 5985 }, { "epoch": 0.65, "learning_rate": 5.717975773154116e-06, "loss": 0.7256, "step": 5986 }, { "epoch": 0.65, "learning_rate": 5.714789728070111e-06, "loss": 0.8345, "step": 5987 }, { "epoch": 0.65, "learning_rate": 5.711604215727532e-06, "loss": 0.7114, "step": 5988 }, { "epoch": 0.65, "learning_rate": 5.708419236522401e-06, "loss": 0.729, "step": 5989 }, { "epoch": 0.65, "learning_rate": 5.7052347908506915e-06, "loss": 0.6699, "step": 5990 }, { "epoch": 0.65, "learning_rate": 5.702050879108284e-06, "loss": 0.6426, "step": 5991 }, { "epoch": 0.65, "learning_rate": 5.698867501691014e-06, "loss": 0.6345, "step": 5992 }, { "epoch": 0.65, "learning_rate": 5.695684658994634e-06, "loss": 0.7273, "step": 5993 }, { "epoch": 0.65, "learning_rate": 5.692502351414841e-06, "loss": 0.6567, "step": 5994 }, { "epoch": 0.65, "learning_rate": 5.689320579347268e-06, "loss": 0.7141, "step": 5995 }, { "epoch": 0.65, "learning_rate": 5.686139343187468e-06, "loss": 0.7397, "step": 5996 }, { "epoch": 0.65, "learning_rate": 5.682958643330938e-06, "loss": 0.7847, "step": 5997 }, { "epoch": 0.65, "learning_rate": 5.679778480173107e-06, "loss": 0.614, "step": 5998 }, { "epoch": 0.65, "learning_rate": 5.6765988541093345e-06, "loss": 0.6833, "step": 5999 }, { "epoch": 0.65, "learning_rate": 5.673419765534915e-06, "loss": 0.7537, "step": 6000 }, { "epoch": 0.65, "learning_rate": 5.6702412148450815e-06, "loss": 0.7842, "step": 6001 }, { "epoch": 0.65, "learning_rate": 5.667063202434985e-06, "loss": 0.7583, "step": 6002 }, { "epoch": 0.65, "learning_rate": 5.663885728699726e-06, "loss": 0.5737, "step": 6003 }, { "epoch": 0.65, "learning_rate": 5.660708794034325e-06, "loss": 0.7837, "step": 6004 }, { "epoch": 0.65, "learning_rate": 5.657532398833745e-06, "loss": 0.6731, "step": 6005 }, { "epoch": 0.65, "learning_rate": 5.654356543492883e-06, "loss": 0.5564, "step": 6006 }, { "epoch": 0.65, "learning_rate": 5.651181228406554e-06, "loss": 0.6104, "step": 6007 }, { "epoch": 0.65, "learning_rate": 5.6480064539695185e-06, "loss": 0.6646, "step": 6008 }, { "epoch": 0.65, "learning_rate": 5.64483222057648e-06, "loss": 0.6021, "step": 6009 }, { "epoch": 0.65, "learning_rate": 5.6416585286220475e-06, "loss": 0.7471, "step": 6010 }, { "epoch": 0.65, "learning_rate": 5.638485378500787e-06, "loss": 0.6836, "step": 6011 }, { "epoch": 0.65, "learning_rate": 5.63531277060718e-06, "loss": 0.6221, "step": 6012 }, { "epoch": 0.65, "learning_rate": 5.632140705335652e-06, "loss": 0.7578, "step": 6013 }, { "epoch": 0.65, "learning_rate": 5.628969183080559e-06, "loss": 0.6682, "step": 6014 }, { "epoch": 0.65, "learning_rate": 5.6257982042361835e-06, "loss": 0.7324, "step": 6015 }, { "epoch": 0.65, "learning_rate": 5.622627769196746e-06, "loss": 0.6018, "step": 6016 }, { "epoch": 0.66, "learning_rate": 5.619457878356398e-06, "loss": 0.6372, "step": 6017 }, { "epoch": 0.66, "learning_rate": 5.616288532109225e-06, "loss": 0.5645, "step": 6018 }, { "epoch": 0.66, "learning_rate": 5.613119730849241e-06, "loss": 0.6643, "step": 6019 }, { "epoch": 0.66, "learning_rate": 5.609951474970401e-06, "loss": 0.7427, "step": 6020 }, { "epoch": 0.66, "learning_rate": 5.606783764866576e-06, "loss": 0.7068, "step": 6021 }, { "epoch": 0.66, "learning_rate": 5.603616600931585e-06, "loss": 0.707, "step": 6022 }, { "epoch": 0.66, "learning_rate": 5.600449983559168e-06, "loss": 0.7334, "step": 6023 }, { "epoch": 0.66, "learning_rate": 5.597283913143006e-06, "loss": 0.7676, "step": 6024 }, { "epoch": 0.66, "learning_rate": 5.5941183900767085e-06, "loss": 0.6826, "step": 6025 }, { "epoch": 0.66, "learning_rate": 5.59095341475381e-06, "loss": 0.6785, "step": 6026 }, { "epoch": 0.66, "learning_rate": 5.587788987567785e-06, "loss": 0.7236, "step": 6027 }, { "epoch": 0.66, "learning_rate": 5.584625108912048e-06, "loss": 0.7214, "step": 6028 }, { "epoch": 0.66, "learning_rate": 5.581461779179924e-06, "loss": 0.6443, "step": 6029 }, { "epoch": 0.66, "learning_rate": 5.57829899876469e-06, "loss": 0.6418, "step": 6030 }, { "epoch": 0.66, "learning_rate": 5.575136768059537e-06, "loss": 0.7612, "step": 6031 }, { "epoch": 0.66, "learning_rate": 5.5719750874575995e-06, "loss": 0.8022, "step": 6032 }, { "epoch": 0.66, "learning_rate": 5.568813957351946e-06, "loss": 0.6736, "step": 6033 }, { "epoch": 0.66, "learning_rate": 5.565653378135565e-06, "loss": 0.6345, "step": 6034 }, { "epoch": 0.66, "learning_rate": 5.562493350201382e-06, "loss": 0.689, "step": 6035 }, { "epoch": 0.66, "learning_rate": 5.559333873942259e-06, "loss": 0.6321, "step": 6036 }, { "epoch": 0.66, "learning_rate": 5.5561749497509836e-06, "loss": 0.8135, "step": 6037 }, { "epoch": 0.66, "learning_rate": 5.553016578020276e-06, "loss": 0.7483, "step": 6038 }, { "epoch": 0.66, "learning_rate": 5.549858759142792e-06, "loss": 0.738, "step": 6039 }, { "epoch": 0.66, "learning_rate": 5.5467014935111065e-06, "loss": 0.6144, "step": 6040 }, { "epoch": 0.66, "learning_rate": 5.543544781517742e-06, "loss": 0.7327, "step": 6041 }, { "epoch": 0.66, "learning_rate": 5.540388623555137e-06, "loss": 0.7671, "step": 6042 }, { "epoch": 0.66, "learning_rate": 5.537233020015671e-06, "loss": 0.6787, "step": 6043 }, { "epoch": 0.66, "learning_rate": 5.534077971291656e-06, "loss": 0.7573, "step": 6044 }, { "epoch": 0.66, "learning_rate": 5.5309234777753225e-06, "loss": 0.7954, "step": 6045 }, { "epoch": 0.66, "learning_rate": 5.527769539858839e-06, "loss": 0.7344, "step": 6046 }, { "epoch": 0.66, "learning_rate": 5.524616157934319e-06, "loss": 0.7097, "step": 6047 }, { "epoch": 0.66, "learning_rate": 5.521463332393784e-06, "loss": 0.7388, "step": 6048 }, { "epoch": 0.66, "learning_rate": 5.518311063629202e-06, "loss": 0.6628, "step": 6049 }, { "epoch": 0.66, "learning_rate": 5.5151593520324575e-06, "loss": 0.646, "step": 6050 }, { "epoch": 0.66, "learning_rate": 5.512008197995379e-06, "loss": 0.6575, "step": 6051 }, { "epoch": 0.66, "learning_rate": 5.508857601909725e-06, "loss": 0.6646, "step": 6052 }, { "epoch": 0.66, "learning_rate": 5.505707564167173e-06, "loss": 0.7871, "step": 6053 }, { "epoch": 0.66, "learning_rate": 5.502558085159344e-06, "loss": 0.7231, "step": 6054 }, { "epoch": 0.66, "learning_rate": 5.499409165277785e-06, "loss": 0.6545, "step": 6055 }, { "epoch": 0.66, "learning_rate": 5.4962608049139646e-06, "loss": 0.7886, "step": 6056 }, { "epoch": 0.66, "learning_rate": 5.493113004459299e-06, "loss": 0.7197, "step": 6057 }, { "epoch": 0.66, "learning_rate": 5.489965764305125e-06, "loss": 0.6838, "step": 6058 }, { "epoch": 0.66, "learning_rate": 5.486819084842705e-06, "loss": 0.7021, "step": 6059 }, { "epoch": 0.66, "learning_rate": 5.483672966463245e-06, "loss": 0.7222, "step": 6060 }, { "epoch": 0.66, "learning_rate": 5.480527409557863e-06, "loss": 0.7247, "step": 6061 }, { "epoch": 0.66, "learning_rate": 5.477382414517625e-06, "loss": 0.7788, "step": 6062 }, { "epoch": 0.66, "learning_rate": 5.474237981733521e-06, "loss": 0.5459, "step": 6063 }, { "epoch": 0.66, "learning_rate": 5.471094111596464e-06, "loss": 0.7808, "step": 6064 }, { "epoch": 0.66, "learning_rate": 5.467950804497301e-06, "loss": 0.6541, "step": 6065 }, { "epoch": 0.66, "learning_rate": 5.464808060826825e-06, "loss": 0.562, "step": 6066 }, { "epoch": 0.66, "learning_rate": 5.461665880975731e-06, "loss": 0.6846, "step": 6067 }, { "epoch": 0.66, "learning_rate": 5.458524265334666e-06, "loss": 0.6743, "step": 6068 }, { "epoch": 0.66, "learning_rate": 5.455383214294192e-06, "loss": 0.6665, "step": 6069 }, { "epoch": 0.66, "learning_rate": 5.452242728244811e-06, "loss": 0.7563, "step": 6070 }, { "epoch": 0.66, "learning_rate": 5.4491028075769546e-06, "loss": 0.7373, "step": 6071 }, { "epoch": 0.66, "learning_rate": 5.445963452680974e-06, "loss": 0.7251, "step": 6072 }, { "epoch": 0.66, "learning_rate": 5.442824663947157e-06, "loss": 0.8101, "step": 6073 }, { "epoch": 0.66, "learning_rate": 5.4396864417657305e-06, "loss": 0.6123, "step": 6074 }, { "epoch": 0.66, "learning_rate": 5.436548786526825e-06, "loss": 0.7568, "step": 6075 }, { "epoch": 0.66, "learning_rate": 5.43341169862053e-06, "loss": 0.6165, "step": 6076 }, { "epoch": 0.66, "learning_rate": 5.430275178436852e-06, "loss": 0.7417, "step": 6077 }, { "epoch": 0.66, "learning_rate": 5.427139226365718e-06, "loss": 0.6316, "step": 6078 }, { "epoch": 0.66, "learning_rate": 5.424003842797e-06, "loss": 0.613, "step": 6079 }, { "epoch": 0.66, "learning_rate": 5.420869028120484e-06, "loss": 0.6799, "step": 6080 }, { "epoch": 0.66, "learning_rate": 5.417734782725896e-06, "loss": 0.6746, "step": 6081 }, { "epoch": 0.66, "learning_rate": 5.414601107002896e-06, "loss": 0.6697, "step": 6082 }, { "epoch": 0.66, "learning_rate": 5.411468001341054e-06, "loss": 0.6606, "step": 6083 }, { "epoch": 0.66, "learning_rate": 5.4083354661298816e-06, "loss": 0.7815, "step": 6084 }, { "epoch": 0.66, "learning_rate": 5.405203501758831e-06, "loss": 0.7446, "step": 6085 }, { "epoch": 0.66, "learning_rate": 5.402072108617258e-06, "loss": 0.792, "step": 6086 }, { "epoch": 0.66, "learning_rate": 5.39894128709447e-06, "loss": 0.6685, "step": 6087 }, { "epoch": 0.66, "learning_rate": 5.395811037579685e-06, "loss": 0.6833, "step": 6088 }, { "epoch": 0.66, "learning_rate": 5.392681360462062e-06, "loss": 0.6938, "step": 6089 }, { "epoch": 0.66, "learning_rate": 5.38955225613069e-06, "loss": 0.7617, "step": 6090 }, { "epoch": 0.66, "learning_rate": 5.386423724974574e-06, "loss": 0.6726, "step": 6091 }, { "epoch": 0.66, "learning_rate": 5.383295767382662e-06, "loss": 0.7493, "step": 6092 }, { "epoch": 0.66, "learning_rate": 5.3801683837438245e-06, "loss": 0.7234, "step": 6093 }, { "epoch": 0.66, "learning_rate": 5.377041574446852e-06, "loss": 0.6257, "step": 6094 }, { "epoch": 0.66, "learning_rate": 5.373915339880484e-06, "loss": 0.7056, "step": 6095 }, { "epoch": 0.66, "learning_rate": 5.370789680433376e-06, "loss": 0.6987, "step": 6096 }, { "epoch": 0.66, "learning_rate": 5.367664596494106e-06, "loss": 0.7024, "step": 6097 }, { "epoch": 0.66, "learning_rate": 5.364540088451193e-06, "loss": 0.6924, "step": 6098 }, { "epoch": 0.66, "learning_rate": 5.361416156693075e-06, "loss": 0.7075, "step": 6099 }, { "epoch": 0.66, "learning_rate": 5.358292801608123e-06, "loss": 0.7417, "step": 6100 }, { "epoch": 0.66, "learning_rate": 5.35517002358464e-06, "loss": 0.7087, "step": 6101 }, { "epoch": 0.66, "learning_rate": 5.352047823010846e-06, "loss": 0.7561, "step": 6102 }, { "epoch": 0.66, "learning_rate": 5.348926200274894e-06, "loss": 0.6863, "step": 6103 }, { "epoch": 0.66, "learning_rate": 5.345805155764881e-06, "loss": 0.6968, "step": 6104 }, { "epoch": 0.66, "learning_rate": 5.3426846898688054e-06, "loss": 0.6772, "step": 6105 }, { "epoch": 0.66, "learning_rate": 5.339564802974615e-06, "loss": 0.5972, "step": 6106 }, { "epoch": 0.66, "learning_rate": 5.3364454954701675e-06, "loss": 0.635, "step": 6107 }, { "epoch": 0.66, "learning_rate": 5.333326767743263e-06, "loss": 0.7102, "step": 6108 }, { "epoch": 0.67, "learning_rate": 5.33020862018163e-06, "loss": 0.7024, "step": 6109 }, { "epoch": 0.67, "learning_rate": 5.327091053172911e-06, "loss": 0.7188, "step": 6110 }, { "epoch": 0.67, "learning_rate": 5.323974067104687e-06, "loss": 0.6704, "step": 6111 }, { "epoch": 0.67, "learning_rate": 5.320857662364472e-06, "loss": 0.7524, "step": 6112 }, { "epoch": 0.67, "learning_rate": 5.317741839339685e-06, "loss": 0.7168, "step": 6113 }, { "epoch": 0.67, "learning_rate": 5.314626598417707e-06, "loss": 0.7534, "step": 6114 }, { "epoch": 0.67, "learning_rate": 5.311511939985813e-06, "loss": 0.7637, "step": 6115 }, { "epoch": 0.67, "learning_rate": 5.308397864431226e-06, "loss": 0.7734, "step": 6116 }, { "epoch": 0.67, "learning_rate": 5.305284372141095e-06, "loss": 0.6172, "step": 6117 }, { "epoch": 0.67, "learning_rate": 5.302171463502484e-06, "loss": 0.7202, "step": 6118 }, { "epoch": 0.67, "learning_rate": 5.299059138902396e-06, "loss": 0.7217, "step": 6119 }, { "epoch": 0.67, "learning_rate": 5.295947398727763e-06, "loss": 0.7119, "step": 6120 }, { "epoch": 0.67, "learning_rate": 5.292836243365433e-06, "loss": 0.6602, "step": 6121 }, { "epoch": 0.67, "learning_rate": 5.289725673202184e-06, "loss": 0.7065, "step": 6122 }, { "epoch": 0.67, "learning_rate": 5.286615688624739e-06, "loss": 0.6931, "step": 6123 }, { "epoch": 0.67, "learning_rate": 5.283506290019724e-06, "loss": 0.7095, "step": 6124 }, { "epoch": 0.67, "learning_rate": 5.280397477773707e-06, "loss": 0.6069, "step": 6125 }, { "epoch": 0.67, "learning_rate": 5.277289252273175e-06, "loss": 0.7007, "step": 6126 }, { "epoch": 0.67, "learning_rate": 5.274181613904544e-06, "loss": 0.7002, "step": 6127 }, { "epoch": 0.67, "learning_rate": 5.271074563054167e-06, "loss": 0.7009, "step": 6128 }, { "epoch": 0.67, "learning_rate": 5.267968100108306e-06, "loss": 0.6453, "step": 6129 }, { "epoch": 0.67, "learning_rate": 5.2648622254531625e-06, "loss": 0.7207, "step": 6130 }, { "epoch": 0.67, "learning_rate": 5.261756939474867e-06, "loss": 0.7356, "step": 6131 }, { "epoch": 0.67, "learning_rate": 5.258652242559461e-06, "loss": 0.7312, "step": 6132 }, { "epoch": 0.67, "learning_rate": 5.255548135092936e-06, "loss": 0.7002, "step": 6133 }, { "epoch": 0.67, "learning_rate": 5.252444617461188e-06, "loss": 0.7178, "step": 6134 }, { "epoch": 0.67, "learning_rate": 5.249341690050051e-06, "loss": 0.6729, "step": 6135 }, { "epoch": 0.67, "learning_rate": 5.24623935324529e-06, "loss": 0.6909, "step": 6136 }, { "epoch": 0.67, "learning_rate": 5.2431376074325835e-06, "loss": 0.792, "step": 6137 }, { "epoch": 0.67, "learning_rate": 5.240036452997544e-06, "loss": 0.7471, "step": 6138 }, { "epoch": 0.67, "learning_rate": 5.236935890325717e-06, "loss": 0.708, "step": 6139 }, { "epoch": 0.67, "learning_rate": 5.233835919802559e-06, "loss": 0.696, "step": 6140 }, { "epoch": 0.67, "learning_rate": 5.230736541813463e-06, "loss": 0.7227, "step": 6141 }, { "epoch": 0.67, "learning_rate": 5.227637756743749e-06, "loss": 0.7817, "step": 6142 }, { "epoch": 0.67, "learning_rate": 5.2245395649786615e-06, "loss": 0.6501, "step": 6143 }, { "epoch": 0.67, "learning_rate": 5.221441966903371e-06, "loss": 0.7021, "step": 6144 }, { "epoch": 0.67, "learning_rate": 5.218344962902969e-06, "loss": 0.6826, "step": 6145 }, { "epoch": 0.67, "learning_rate": 5.215248553362482e-06, "loss": 0.6621, "step": 6146 }, { "epoch": 0.67, "learning_rate": 5.21215273866686e-06, "loss": 0.6807, "step": 6147 }, { "epoch": 0.67, "learning_rate": 5.2090575192009725e-06, "loss": 0.73, "step": 6148 }, { "epoch": 0.67, "learning_rate": 5.205962895349623e-06, "loss": 0.6821, "step": 6149 }, { "epoch": 0.67, "learning_rate": 5.202868867497542e-06, "loss": 0.707, "step": 6150 }, { "epoch": 0.67, "learning_rate": 5.199775436029371e-06, "loss": 0.6917, "step": 6151 }, { "epoch": 0.67, "learning_rate": 5.196682601329701e-06, "loss": 0.8296, "step": 6152 }, { "epoch": 0.67, "learning_rate": 5.193590363783027e-06, "loss": 0.7686, "step": 6153 }, { "epoch": 0.67, "learning_rate": 5.190498723773784e-06, "loss": 0.6177, "step": 6154 }, { "epoch": 0.67, "learning_rate": 5.18740768168633e-06, "loss": 0.7095, "step": 6155 }, { "epoch": 0.67, "learning_rate": 5.184317237904939e-06, "loss": 0.6838, "step": 6156 }, { "epoch": 0.67, "learning_rate": 5.18122739281382e-06, "loss": 0.7324, "step": 6157 }, { "epoch": 0.67, "learning_rate": 5.178138146797111e-06, "loss": 0.5627, "step": 6158 }, { "epoch": 0.67, "learning_rate": 5.1750495002388624e-06, "loss": 0.7646, "step": 6159 }, { "epoch": 0.67, "learning_rate": 5.171961453523061e-06, "loss": 0.7312, "step": 6160 }, { "epoch": 0.67, "learning_rate": 5.168874007033615e-06, "loss": 0.6523, "step": 6161 }, { "epoch": 0.67, "learning_rate": 5.165787161154361e-06, "loss": 0.6545, "step": 6162 }, { "epoch": 0.67, "learning_rate": 5.162700916269061e-06, "loss": 0.6218, "step": 6163 }, { "epoch": 0.67, "learning_rate": 5.159615272761391e-06, "loss": 0.671, "step": 6164 }, { "epoch": 0.67, "learning_rate": 5.156530231014967e-06, "loss": 0.7485, "step": 6165 }, { "epoch": 0.67, "learning_rate": 5.153445791413327e-06, "loss": 0.6721, "step": 6166 }, { "epoch": 0.67, "learning_rate": 5.150361954339924e-06, "loss": 0.7822, "step": 6167 }, { "epoch": 0.67, "learning_rate": 5.1472787201781485e-06, "loss": 0.7009, "step": 6168 }, { "epoch": 0.67, "learning_rate": 5.144196089311313e-06, "loss": 0.6895, "step": 6169 }, { "epoch": 0.67, "learning_rate": 5.141114062122643e-06, "loss": 0.55, "step": 6170 }, { "epoch": 0.67, "learning_rate": 5.138032638995315e-06, "loss": 0.7122, "step": 6171 }, { "epoch": 0.67, "learning_rate": 5.134951820312402e-06, "loss": 0.6458, "step": 6172 }, { "epoch": 0.67, "learning_rate": 5.131871606456917e-06, "loss": 0.7192, "step": 6173 }, { "epoch": 0.67, "learning_rate": 5.128791997811799e-06, "loss": 0.6318, "step": 6174 }, { "epoch": 0.67, "learning_rate": 5.125712994759904e-06, "loss": 0.688, "step": 6175 }, { "epoch": 0.67, "learning_rate": 5.122634597684016e-06, "loss": 0.6411, "step": 6176 }, { "epoch": 0.67, "learning_rate": 5.119556806966851e-06, "loss": 0.7026, "step": 6177 }, { "epoch": 0.67, "learning_rate": 5.116479622991033e-06, "loss": 0.6821, "step": 6178 }, { "epoch": 0.67, "learning_rate": 5.113403046139127e-06, "loss": 0.6855, "step": 6179 }, { "epoch": 0.67, "learning_rate": 5.110327076793613e-06, "loss": 0.6467, "step": 6180 }, { "epoch": 0.67, "learning_rate": 5.107251715336899e-06, "loss": 0.6101, "step": 6181 }, { "epoch": 0.67, "learning_rate": 5.104176962151323e-06, "loss": 0.6272, "step": 6182 }, { "epoch": 0.67, "learning_rate": 5.101102817619132e-06, "loss": 0.6301, "step": 6183 }, { "epoch": 0.67, "learning_rate": 5.09802928212251e-06, "loss": 0.6179, "step": 6184 }, { "epoch": 0.67, "learning_rate": 5.0949563560435654e-06, "loss": 0.72, "step": 6185 }, { "epoch": 0.67, "learning_rate": 5.091884039764321e-06, "loss": 0.6716, "step": 6186 }, { "epoch": 0.67, "learning_rate": 5.088812333666733e-06, "loss": 0.6631, "step": 6187 }, { "epoch": 0.67, "learning_rate": 5.085741238132683e-06, "loss": 0.771, "step": 6188 }, { "epoch": 0.67, "learning_rate": 5.082670753543961e-06, "loss": 0.5798, "step": 6189 }, { "epoch": 0.67, "learning_rate": 5.079600880282308e-06, "loss": 0.5638, "step": 6190 }, { "epoch": 0.67, "learning_rate": 5.076531618729362e-06, "loss": 0.7031, "step": 6191 }, { "epoch": 0.67, "learning_rate": 5.073462969266701e-06, "loss": 0.6479, "step": 6192 }, { "epoch": 0.67, "learning_rate": 5.070394932275825e-06, "loss": 0.7266, "step": 6193 }, { "epoch": 0.67, "learning_rate": 5.067327508138148e-06, "loss": 0.6968, "step": 6194 }, { "epoch": 0.67, "learning_rate": 5.0642606972350194e-06, "loss": 0.6047, "step": 6195 }, { "epoch": 0.67, "learning_rate": 5.061194499947712e-06, "loss": 0.7122, "step": 6196 }, { "epoch": 0.67, "learning_rate": 5.0581289166574096e-06, "loss": 0.75, "step": 6197 }, { "epoch": 0.67, "learning_rate": 5.055063947745234e-06, "loss": 0.7908, "step": 6198 }, { "epoch": 0.67, "learning_rate": 5.051999593592223e-06, "loss": 0.6494, "step": 6199 }, { "epoch": 0.67, "learning_rate": 5.048935854579341e-06, "loss": 0.6682, "step": 6200 }, { "epoch": 0.68, "learning_rate": 5.045872731087479e-06, "loss": 0.7163, "step": 6201 }, { "epoch": 0.68, "learning_rate": 5.042810223497441e-06, "loss": 0.668, "step": 6202 }, { "epoch": 0.68, "learning_rate": 5.039748332189961e-06, "loss": 0.6777, "step": 6203 }, { "epoch": 0.68, "learning_rate": 5.036687057545704e-06, "loss": 0.7778, "step": 6204 }, { "epoch": 0.68, "learning_rate": 5.033626399945241e-06, "loss": 0.698, "step": 6205 }, { "epoch": 0.68, "learning_rate": 5.03056635976908e-06, "loss": 0.7935, "step": 6206 }, { "epoch": 0.68, "learning_rate": 5.027506937397653e-06, "loss": 0.708, "step": 6207 }, { "epoch": 0.68, "learning_rate": 5.0244481332113e-06, "loss": 0.8052, "step": 6208 }, { "epoch": 0.68, "learning_rate": 5.021389947590301e-06, "loss": 0.6689, "step": 6209 }, { "epoch": 0.68, "learning_rate": 5.01833238091485e-06, "loss": 0.7566, "step": 6210 }, { "epoch": 0.68, "learning_rate": 5.01527543356507e-06, "loss": 0.7871, "step": 6211 }, { "epoch": 0.68, "learning_rate": 5.012219105921004e-06, "loss": 0.6704, "step": 6212 }, { "epoch": 0.68, "learning_rate": 5.009163398362612e-06, "loss": 0.7493, "step": 6213 }, { "epoch": 0.68, "learning_rate": 5.006108311269786e-06, "loss": 0.6768, "step": 6214 }, { "epoch": 0.68, "learning_rate": 5.003053845022341e-06, "loss": 0.7673, "step": 6215 }, { "epoch": 0.68, "learning_rate": 5.000000000000003e-06, "loss": 0.6318, "step": 6216 }, { "epoch": 0.68, "learning_rate": 4.996946776582433e-06, "loss": 0.6638, "step": 6217 }, { "epoch": 0.68, "learning_rate": 4.993894175149211e-06, "loss": 0.7695, "step": 6218 }, { "epoch": 0.68, "learning_rate": 4.990842196079838e-06, "loss": 0.6914, "step": 6219 }, { "epoch": 0.68, "learning_rate": 4.987790839753745e-06, "loss": 0.6926, "step": 6220 }, { "epoch": 0.68, "learning_rate": 4.984740106550271e-06, "loss": 0.6619, "step": 6221 }, { "epoch": 0.68, "learning_rate": 4.9816899968486895e-06, "loss": 0.7666, "step": 6222 }, { "epoch": 0.68, "learning_rate": 4.978640511028198e-06, "loss": 0.6848, "step": 6223 }, { "epoch": 0.68, "learning_rate": 4.975591649467901e-06, "loss": 0.7637, "step": 6224 }, { "epoch": 0.68, "learning_rate": 4.972543412546842e-06, "loss": 0.7339, "step": 6225 }, { "epoch": 0.68, "learning_rate": 4.969495800643985e-06, "loss": 0.7515, "step": 6226 }, { "epoch": 0.68, "learning_rate": 4.9664488141382026e-06, "loss": 0.686, "step": 6227 }, { "epoch": 0.68, "learning_rate": 4.963402453408305e-06, "loss": 0.7217, "step": 6228 }, { "epoch": 0.68, "learning_rate": 4.960356718833016e-06, "loss": 0.6604, "step": 6229 }, { "epoch": 0.68, "learning_rate": 4.957311610790986e-06, "loss": 0.7192, "step": 6230 }, { "epoch": 0.68, "learning_rate": 4.954267129660789e-06, "loss": 0.5938, "step": 6231 }, { "epoch": 0.68, "learning_rate": 4.951223275820911e-06, "loss": 0.6807, "step": 6232 }, { "epoch": 0.68, "learning_rate": 4.94818004964977e-06, "loss": 0.7163, "step": 6233 }, { "epoch": 0.68, "learning_rate": 4.945137451525707e-06, "loss": 0.6793, "step": 6234 }, { "epoch": 0.68, "learning_rate": 4.9420954818269715e-06, "loss": 0.6277, "step": 6235 }, { "epoch": 0.68, "learning_rate": 4.939054140931751e-06, "loss": 0.6982, "step": 6236 }, { "epoch": 0.68, "learning_rate": 4.936013429218144e-06, "loss": 0.667, "step": 6237 }, { "epoch": 0.68, "learning_rate": 4.932973347064177e-06, "loss": 0.6455, "step": 6238 }, { "epoch": 0.68, "learning_rate": 4.929933894847799e-06, "loss": 0.6685, "step": 6239 }, { "epoch": 0.68, "learning_rate": 4.926895072946871e-06, "loss": 0.6357, "step": 6240 }, { "epoch": 0.68, "learning_rate": 4.923856881739186e-06, "loss": 0.7163, "step": 6241 }, { "epoch": 0.68, "learning_rate": 4.920819321602458e-06, "loss": 0.791, "step": 6242 }, { "epoch": 0.68, "learning_rate": 4.917782392914311e-06, "loss": 0.6514, "step": 6243 }, { "epoch": 0.68, "learning_rate": 4.914746096052303e-06, "loss": 0.7393, "step": 6244 }, { "epoch": 0.68, "learning_rate": 4.9117104313939145e-06, "loss": 0.6511, "step": 6245 }, { "epoch": 0.68, "learning_rate": 4.908675399316534e-06, "loss": 0.7246, "step": 6246 }, { "epoch": 0.68, "learning_rate": 4.905641000197483e-06, "loss": 0.7041, "step": 6247 }, { "epoch": 0.68, "learning_rate": 4.902607234413999e-06, "loss": 0.7373, "step": 6248 }, { "epoch": 0.68, "learning_rate": 4.899574102343247e-06, "loss": 0.7812, "step": 6249 }, { "epoch": 0.68, "learning_rate": 4.896541604362309e-06, "loss": 0.5061, "step": 6250 }, { "epoch": 0.68, "learning_rate": 4.893509740848183e-06, "loss": 0.6592, "step": 6251 }, { "epoch": 0.68, "learning_rate": 4.890478512177796e-06, "loss": 0.7524, "step": 6252 }, { "epoch": 0.68, "learning_rate": 4.887447918727995e-06, "loss": 0.7373, "step": 6253 }, { "epoch": 0.68, "learning_rate": 4.884417960875542e-06, "loss": 0.6216, "step": 6254 }, { "epoch": 0.68, "learning_rate": 4.881388638997125e-06, "loss": 0.7954, "step": 6255 }, { "epoch": 0.68, "learning_rate": 4.878359953469354e-06, "loss": 0.6959, "step": 6256 }, { "epoch": 0.68, "learning_rate": 4.875331904668759e-06, "loss": 0.5076, "step": 6257 }, { "epoch": 0.68, "learning_rate": 4.872304492971791e-06, "loss": 0.729, "step": 6258 }, { "epoch": 0.68, "learning_rate": 4.869277718754815e-06, "loss": 0.6675, "step": 6259 }, { "epoch": 0.68, "learning_rate": 4.8662515823941255e-06, "loss": 0.8364, "step": 6260 }, { "epoch": 0.68, "learning_rate": 4.863226084265939e-06, "loss": 0.6892, "step": 6261 }, { "epoch": 0.68, "learning_rate": 4.8602012247463816e-06, "loss": 0.666, "step": 6262 }, { "epoch": 0.68, "learning_rate": 4.857177004211507e-06, "loss": 0.6555, "step": 6263 }, { "epoch": 0.68, "learning_rate": 4.8541534230372976e-06, "loss": 0.6028, "step": 6264 }, { "epoch": 0.68, "learning_rate": 4.8511304815996374e-06, "loss": 0.6619, "step": 6265 }, { "epoch": 0.68, "learning_rate": 4.848108180274345e-06, "loss": 0.6855, "step": 6266 }, { "epoch": 0.68, "learning_rate": 4.845086519437157e-06, "loss": 0.6995, "step": 6267 }, { "epoch": 0.68, "learning_rate": 4.84206549946373e-06, "loss": 0.7327, "step": 6268 }, { "epoch": 0.68, "learning_rate": 4.839045120729642e-06, "loss": 0.7769, "step": 6269 }, { "epoch": 0.68, "learning_rate": 4.836025383610382e-06, "loss": 0.689, "step": 6270 }, { "epoch": 0.68, "learning_rate": 4.8330062884813714e-06, "loss": 0.6687, "step": 6271 }, { "epoch": 0.68, "learning_rate": 4.82998783571795e-06, "loss": 0.6663, "step": 6272 }, { "epoch": 0.68, "learning_rate": 4.826970025695366e-06, "loss": 0.5994, "step": 6273 }, { "epoch": 0.68, "learning_rate": 4.823952858788804e-06, "loss": 0.783, "step": 6274 }, { "epoch": 0.68, "learning_rate": 4.820936335373357e-06, "loss": 0.7324, "step": 6275 }, { "epoch": 0.68, "learning_rate": 4.817920455824045e-06, "loss": 0.6316, "step": 6276 }, { "epoch": 0.68, "learning_rate": 4.814905220515807e-06, "loss": 0.615, "step": 6277 }, { "epoch": 0.68, "learning_rate": 4.811890629823492e-06, "loss": 0.6863, "step": 6278 }, { "epoch": 0.68, "learning_rate": 4.808876684121882e-06, "loss": 0.7373, "step": 6279 }, { "epoch": 0.68, "learning_rate": 4.805863383785676e-06, "loss": 0.6787, "step": 6280 }, { "epoch": 0.68, "learning_rate": 4.802850729189484e-06, "loss": 0.6401, "step": 6281 }, { "epoch": 0.68, "learning_rate": 4.799838720707847e-06, "loss": 0.8184, "step": 6282 }, { "epoch": 0.68, "learning_rate": 4.796827358715222e-06, "loss": 0.6829, "step": 6283 }, { "epoch": 0.68, "learning_rate": 4.793816643585977e-06, "loss": 0.7065, "step": 6284 }, { "epoch": 0.68, "learning_rate": 4.790806575694413e-06, "loss": 0.7393, "step": 6285 }, { "epoch": 0.68, "learning_rate": 4.787797155414742e-06, "loss": 0.7271, "step": 6286 }, { "epoch": 0.68, "learning_rate": 4.7847883831211e-06, "loss": 0.6831, "step": 6287 }, { "epoch": 0.68, "learning_rate": 4.781780259187543e-06, "loss": 0.6248, "step": 6288 }, { "epoch": 0.68, "learning_rate": 4.778772783988037e-06, "loss": 0.542, "step": 6289 }, { "epoch": 0.68, "learning_rate": 4.775765957896477e-06, "loss": 0.6165, "step": 6290 }, { "epoch": 0.68, "learning_rate": 4.772759781286679e-06, "loss": 0.7297, "step": 6291 }, { "epoch": 0.68, "learning_rate": 4.769754254532366e-06, "loss": 0.6885, "step": 6292 }, { "epoch": 0.69, "learning_rate": 4.766749378007193e-06, "loss": 0.7573, "step": 6293 }, { "epoch": 0.69, "learning_rate": 4.76374515208473e-06, "loss": 0.7471, "step": 6294 }, { "epoch": 0.69, "learning_rate": 4.760741577138457e-06, "loss": 0.7419, "step": 6295 }, { "epoch": 0.69, "learning_rate": 4.757738653541795e-06, "loss": 0.5796, "step": 6296 }, { "epoch": 0.69, "learning_rate": 4.754736381668057e-06, "loss": 0.5881, "step": 6297 }, { "epoch": 0.69, "learning_rate": 4.751734761890497e-06, "loss": 0.686, "step": 6298 }, { "epoch": 0.69, "learning_rate": 4.748733794582278e-06, "loss": 0.7551, "step": 6299 }, { "epoch": 0.69, "learning_rate": 4.745733480116478e-06, "loss": 0.604, "step": 6300 }, { "epoch": 0.69, "learning_rate": 4.742733818866102e-06, "loss": 0.8003, "step": 6301 }, { "epoch": 0.69, "learning_rate": 4.7397348112040755e-06, "loss": 0.6016, "step": 6302 }, { "epoch": 0.69, "learning_rate": 4.736736457503229e-06, "loss": 0.77, "step": 6303 }, { "epoch": 0.69, "learning_rate": 4.733738758136327e-06, "loss": 0.7207, "step": 6304 }, { "epoch": 0.69, "learning_rate": 4.730741713476044e-06, "loss": 0.5774, "step": 6305 }, { "epoch": 0.69, "learning_rate": 4.727745323894976e-06, "loss": 0.6418, "step": 6306 }, { "epoch": 0.69, "learning_rate": 4.724749589765641e-06, "loss": 0.6243, "step": 6307 }, { "epoch": 0.69, "learning_rate": 4.7217545114604625e-06, "loss": 0.6179, "step": 6308 }, { "epoch": 0.69, "learning_rate": 4.718760089351798e-06, "loss": 0.7808, "step": 6309 }, { "epoch": 0.69, "learning_rate": 4.715766323811919e-06, "loss": 0.7046, "step": 6310 }, { "epoch": 0.69, "learning_rate": 4.712773215213006e-06, "loss": 0.7495, "step": 6311 }, { "epoch": 0.69, "learning_rate": 4.709780763927169e-06, "loss": 0.6228, "step": 6312 }, { "epoch": 0.69, "learning_rate": 4.7067889703264355e-06, "loss": 0.6711, "step": 6313 }, { "epoch": 0.69, "learning_rate": 4.703797834782738e-06, "loss": 0.636, "step": 6314 }, { "epoch": 0.69, "learning_rate": 4.700807357667953e-06, "loss": 0.6416, "step": 6315 }, { "epoch": 0.69, "learning_rate": 4.697817539353845e-06, "loss": 0.6138, "step": 6316 }, { "epoch": 0.69, "learning_rate": 4.694828380212118e-06, "loss": 0.6394, "step": 6317 }, { "epoch": 0.69, "learning_rate": 4.69183988061439e-06, "loss": 0.7651, "step": 6318 }, { "epoch": 0.69, "learning_rate": 4.688852040932185e-06, "loss": 0.7324, "step": 6319 }, { "epoch": 0.69, "learning_rate": 4.685864861536959e-06, "loss": 0.6467, "step": 6320 }, { "epoch": 0.69, "learning_rate": 4.682878342800087e-06, "loss": 0.7349, "step": 6321 }, { "epoch": 0.69, "learning_rate": 4.679892485092844e-06, "loss": 0.7373, "step": 6322 }, { "epoch": 0.69, "learning_rate": 4.6769072887864415e-06, "loss": 0.7202, "step": 6323 }, { "epoch": 0.69, "learning_rate": 4.673922754252001e-06, "loss": 0.6733, "step": 6324 }, { "epoch": 0.69, "learning_rate": 4.670938881860564e-06, "loss": 0.6548, "step": 6325 }, { "epoch": 0.69, "learning_rate": 4.66795567198309e-06, "loss": 0.6318, "step": 6326 }, { "epoch": 0.69, "learning_rate": 4.664973124990447e-06, "loss": 0.6155, "step": 6327 }, { "epoch": 0.69, "learning_rate": 4.661991241253434e-06, "loss": 0.6787, "step": 6328 }, { "epoch": 0.69, "learning_rate": 4.659010021142764e-06, "loss": 0.79, "step": 6329 }, { "epoch": 0.69, "learning_rate": 4.656029465029057e-06, "loss": 0.5254, "step": 6330 }, { "epoch": 0.69, "learning_rate": 4.653049573282864e-06, "loss": 0.6418, "step": 6331 }, { "epoch": 0.69, "learning_rate": 4.65007034627465e-06, "loss": 0.6768, "step": 6332 }, { "epoch": 0.69, "learning_rate": 4.647091784374786e-06, "loss": 0.7021, "step": 6333 }, { "epoch": 0.69, "learning_rate": 4.6441138879535814e-06, "loss": 0.7681, "step": 6334 }, { "epoch": 0.69, "learning_rate": 4.641136657381244e-06, "loss": 0.6636, "step": 6335 }, { "epoch": 0.69, "learning_rate": 4.638160093027908e-06, "loss": 0.7202, "step": 6336 }, { "epoch": 0.69, "learning_rate": 4.635184195263624e-06, "loss": 0.6594, "step": 6337 }, { "epoch": 0.69, "learning_rate": 4.632208964458356e-06, "loss": 0.7954, "step": 6338 }, { "epoch": 0.69, "learning_rate": 4.629234400981986e-06, "loss": 0.6208, "step": 6339 }, { "epoch": 0.69, "learning_rate": 4.6262605052043216e-06, "loss": 0.6624, "step": 6340 }, { "epoch": 0.69, "learning_rate": 4.623287277495072e-06, "loss": 0.6948, "step": 6341 }, { "epoch": 0.69, "learning_rate": 4.620314718223876e-06, "loss": 0.6973, "step": 6342 }, { "epoch": 0.69, "learning_rate": 4.6173428277602835e-06, "loss": 0.7595, "step": 6343 }, { "epoch": 0.69, "learning_rate": 4.614371606473764e-06, "loss": 0.718, "step": 6344 }, { "epoch": 0.69, "learning_rate": 4.611401054733706e-06, "loss": 0.6648, "step": 6345 }, { "epoch": 0.69, "learning_rate": 4.608431172909405e-06, "loss": 0.7305, "step": 6346 }, { "epoch": 0.69, "learning_rate": 4.605461961370081e-06, "loss": 0.7273, "step": 6347 }, { "epoch": 0.69, "learning_rate": 4.6024934204848745e-06, "loss": 0.7078, "step": 6348 }, { "epoch": 0.69, "learning_rate": 4.599525550622829e-06, "loss": 0.634, "step": 6349 }, { "epoch": 0.69, "learning_rate": 4.596558352152918e-06, "loss": 0.7944, "step": 6350 }, { "epoch": 0.69, "learning_rate": 4.593591825444028e-06, "loss": 0.7271, "step": 6351 }, { "epoch": 0.69, "learning_rate": 4.590625970864952e-06, "loss": 0.7026, "step": 6352 }, { "epoch": 0.69, "learning_rate": 4.587660788784419e-06, "loss": 0.7593, "step": 6353 }, { "epoch": 0.69, "learning_rate": 4.584696279571056e-06, "loss": 0.7185, "step": 6354 }, { "epoch": 0.69, "learning_rate": 4.581732443593417e-06, "loss": 0.7358, "step": 6355 }, { "epoch": 0.69, "learning_rate": 4.578769281219969e-06, "loss": 0.7388, "step": 6356 }, { "epoch": 0.69, "learning_rate": 4.5758067928190906e-06, "loss": 0.688, "step": 6357 }, { "epoch": 0.69, "learning_rate": 4.572844978759085e-06, "loss": 0.752, "step": 6358 }, { "epoch": 0.69, "learning_rate": 4.56988383940817e-06, "loss": 0.6934, "step": 6359 }, { "epoch": 0.69, "learning_rate": 4.5669233751344725e-06, "loss": 0.6719, "step": 6360 }, { "epoch": 0.69, "learning_rate": 4.56396358630604e-06, "loss": 0.6311, "step": 6361 }, { "epoch": 0.69, "learning_rate": 4.56100447329084e-06, "loss": 0.6592, "step": 6362 }, { "epoch": 0.69, "learning_rate": 4.558046036456749e-06, "loss": 0.6746, "step": 6363 }, { "epoch": 0.69, "learning_rate": 4.55508827617157e-06, "loss": 0.6663, "step": 6364 }, { "epoch": 0.69, "learning_rate": 4.552131192803005e-06, "loss": 0.7017, "step": 6365 }, { "epoch": 0.69, "learning_rate": 4.549174786718684e-06, "loss": 0.6682, "step": 6366 }, { "epoch": 0.69, "learning_rate": 4.546219058286156e-06, "loss": 0.6724, "step": 6367 }, { "epoch": 0.69, "learning_rate": 4.5432640078728714e-06, "loss": 0.5991, "step": 6368 }, { "epoch": 0.69, "learning_rate": 4.5403096358462095e-06, "loss": 0.6875, "step": 6369 }, { "epoch": 0.69, "learning_rate": 4.537355942573464e-06, "loss": 0.7837, "step": 6370 }, { "epoch": 0.69, "learning_rate": 4.53440292842183e-06, "loss": 0.8145, "step": 6371 }, { "epoch": 0.69, "learning_rate": 4.531450593758442e-06, "loss": 0.7109, "step": 6372 }, { "epoch": 0.69, "learning_rate": 4.528498938950329e-06, "loss": 0.679, "step": 6373 }, { "epoch": 0.69, "learning_rate": 4.525547964364445e-06, "loss": 0.647, "step": 6374 }, { "epoch": 0.69, "learning_rate": 4.522597670367662e-06, "loss": 0.8032, "step": 6375 }, { "epoch": 0.69, "learning_rate": 4.519648057326757e-06, "loss": 0.5615, "step": 6376 }, { "epoch": 0.69, "learning_rate": 4.516699125608433e-06, "loss": 0.7891, "step": 6377 }, { "epoch": 0.69, "learning_rate": 4.513750875579303e-06, "loss": 0.6562, "step": 6378 }, { "epoch": 0.69, "learning_rate": 4.510803307605896e-06, "loss": 0.7502, "step": 6379 }, { "epoch": 0.69, "learning_rate": 4.507856422054654e-06, "loss": 0.7722, "step": 6380 }, { "epoch": 0.69, "learning_rate": 4.504910219291941e-06, "loss": 0.7173, "step": 6381 }, { "epoch": 0.69, "learning_rate": 4.5019646996840285e-06, "loss": 0.6726, "step": 6382 }, { "epoch": 0.69, "learning_rate": 4.49901986359711e-06, "loss": 0.7593, "step": 6383 }, { "epoch": 0.69, "learning_rate": 4.496075711397286e-06, "loss": 0.7429, "step": 6384 }, { "epoch": 0.7, "learning_rate": 4.493132243450579e-06, "loss": 0.7131, "step": 6385 }, { "epoch": 0.7, "learning_rate": 4.490189460122926e-06, "loss": 0.7153, "step": 6386 }, { "epoch": 0.7, "learning_rate": 4.487247361780169e-06, "loss": 0.6472, "step": 6387 }, { "epoch": 0.7, "learning_rate": 4.484305948788078e-06, "loss": 0.6406, "step": 6388 }, { "epoch": 0.7, "learning_rate": 4.481365221512335e-06, "loss": 0.6399, "step": 6389 }, { "epoch": 0.7, "learning_rate": 4.478425180318523e-06, "loss": 0.6619, "step": 6390 }, { "epoch": 0.7, "learning_rate": 4.475485825572164e-06, "loss": 0.7378, "step": 6391 }, { "epoch": 0.7, "learning_rate": 4.472547157638674e-06, "loss": 0.6379, "step": 6392 }, { "epoch": 0.7, "learning_rate": 4.469609176883392e-06, "loss": 0.5686, "step": 6393 }, { "epoch": 0.7, "learning_rate": 4.466671883671574e-06, "loss": 0.6953, "step": 6394 }, { "epoch": 0.7, "learning_rate": 4.463735278368381e-06, "loss": 0.8193, "step": 6395 }, { "epoch": 0.7, "learning_rate": 4.460799361338898e-06, "loss": 0.6316, "step": 6396 }, { "epoch": 0.7, "learning_rate": 4.457864132948125e-06, "loss": 0.6902, "step": 6397 }, { "epoch": 0.7, "learning_rate": 4.454929593560962e-06, "loss": 0.6621, "step": 6398 }, { "epoch": 0.7, "learning_rate": 4.451995743542242e-06, "loss": 0.5481, "step": 6399 }, { "epoch": 0.7, "learning_rate": 4.449062583256702e-06, "loss": 0.6052, "step": 6400 }, { "epoch": 0.7, "learning_rate": 4.446130113068994e-06, "loss": 0.751, "step": 6401 }, { "epoch": 0.7, "learning_rate": 4.44319833334369e-06, "loss": 0.6606, "step": 6402 }, { "epoch": 0.7, "learning_rate": 4.4402672444452664e-06, "loss": 0.6968, "step": 6403 }, { "epoch": 0.7, "learning_rate": 4.43733684673812e-06, "loss": 0.6685, "step": 6404 }, { "epoch": 0.7, "learning_rate": 4.4344071405865656e-06, "loss": 0.6316, "step": 6405 }, { "epoch": 0.7, "learning_rate": 4.431478126354818e-06, "loss": 0.6653, "step": 6406 }, { "epoch": 0.7, "learning_rate": 4.428549804407022e-06, "loss": 0.6658, "step": 6407 }, { "epoch": 0.7, "learning_rate": 4.425622175107229e-06, "loss": 0.6973, "step": 6408 }, { "epoch": 0.7, "learning_rate": 4.4226952388193976e-06, "loss": 0.6611, "step": 6409 }, { "epoch": 0.7, "learning_rate": 4.419768995907419e-06, "loss": 0.6965, "step": 6410 }, { "epoch": 0.7, "learning_rate": 4.416843446735077e-06, "loss": 0.6746, "step": 6411 }, { "epoch": 0.7, "learning_rate": 4.413918591666082e-06, "loss": 0.5745, "step": 6412 }, { "epoch": 0.7, "learning_rate": 4.410994431064058e-06, "loss": 0.679, "step": 6413 }, { "epoch": 0.7, "learning_rate": 4.408070965292534e-06, "loss": 0.6936, "step": 6414 }, { "epoch": 0.7, "learning_rate": 4.405148194714957e-06, "loss": 0.8008, "step": 6415 }, { "epoch": 0.7, "learning_rate": 4.4022261196946995e-06, "loss": 0.7207, "step": 6416 }, { "epoch": 0.7, "learning_rate": 4.399304740595023e-06, "loss": 0.7913, "step": 6417 }, { "epoch": 0.7, "learning_rate": 4.396384057779123e-06, "loss": 0.6792, "step": 6418 }, { "epoch": 0.7, "learning_rate": 4.393464071610099e-06, "loss": 0.7642, "step": 6419 }, { "epoch": 0.7, "learning_rate": 4.39054478245097e-06, "loss": 0.5957, "step": 6420 }, { "epoch": 0.7, "learning_rate": 4.387626190664666e-06, "loss": 0.6504, "step": 6421 }, { "epoch": 0.7, "learning_rate": 4.384708296614023e-06, "loss": 0.7192, "step": 6422 }, { "epoch": 0.7, "learning_rate": 4.381791100661798e-06, "loss": 0.6638, "step": 6423 }, { "epoch": 0.7, "learning_rate": 4.378874603170666e-06, "loss": 0.7007, "step": 6424 }, { "epoch": 0.7, "learning_rate": 4.375958804503201e-06, "loss": 0.7346, "step": 6425 }, { "epoch": 0.7, "learning_rate": 4.373043705021899e-06, "loss": 0.623, "step": 6426 }, { "epoch": 0.7, "learning_rate": 4.370129305089174e-06, "loss": 0.6519, "step": 6427 }, { "epoch": 0.7, "learning_rate": 4.367215605067335e-06, "loss": 0.8062, "step": 6428 }, { "epoch": 0.7, "learning_rate": 4.364302605318631e-06, "loss": 0.729, "step": 6429 }, { "epoch": 0.7, "learning_rate": 4.361390306205198e-06, "loss": 0.6772, "step": 6430 }, { "epoch": 0.7, "learning_rate": 4.358478708089099e-06, "loss": 0.7197, "step": 6431 }, { "epoch": 0.7, "learning_rate": 4.355567811332311e-06, "loss": 0.7109, "step": 6432 }, { "epoch": 0.7, "learning_rate": 4.352657616296711e-06, "loss": 0.7607, "step": 6433 }, { "epoch": 0.7, "learning_rate": 4.349748123344102e-06, "loss": 0.7256, "step": 6434 }, { "epoch": 0.7, "learning_rate": 4.346839332836198e-06, "loss": 0.6238, "step": 6435 }, { "epoch": 0.7, "learning_rate": 4.343931245134616e-06, "loss": 0.7725, "step": 6436 }, { "epoch": 0.7, "learning_rate": 4.341023860600895e-06, "loss": 0.5452, "step": 6437 }, { "epoch": 0.7, "learning_rate": 4.338117179596485e-06, "loss": 0.7783, "step": 6438 }, { "epoch": 0.7, "learning_rate": 4.3352112024827455e-06, "loss": 0.7197, "step": 6439 }, { "epoch": 0.7, "learning_rate": 4.3323059296209554e-06, "loss": 0.7349, "step": 6440 }, { "epoch": 0.7, "learning_rate": 4.3294013613722944e-06, "loss": 0.6899, "step": 6441 }, { "epoch": 0.7, "learning_rate": 4.326497498097863e-06, "loss": 0.6387, "step": 6442 }, { "epoch": 0.7, "learning_rate": 4.323594340158675e-06, "loss": 0.7466, "step": 6443 }, { "epoch": 0.7, "learning_rate": 4.32069188791565e-06, "loss": 0.5879, "step": 6444 }, { "epoch": 0.7, "learning_rate": 4.317790141729625e-06, "loss": 0.7915, "step": 6445 }, { "epoch": 0.7, "learning_rate": 4.314889101961353e-06, "loss": 0.5811, "step": 6446 }, { "epoch": 0.7, "learning_rate": 4.311988768971484e-06, "loss": 0.7017, "step": 6447 }, { "epoch": 0.7, "learning_rate": 4.309089143120597e-06, "loss": 0.7119, "step": 6448 }, { "epoch": 0.7, "learning_rate": 4.306190224769174e-06, "loss": 0.6677, "step": 6449 }, { "epoch": 0.7, "learning_rate": 4.3032920142776125e-06, "loss": 0.6399, "step": 6450 }, { "epoch": 0.7, "learning_rate": 4.300394512006223e-06, "loss": 0.7039, "step": 6451 }, { "epoch": 0.7, "learning_rate": 4.29749771831522e-06, "loss": 0.5598, "step": 6452 }, { "epoch": 0.7, "learning_rate": 4.294601633564739e-06, "loss": 0.7007, "step": 6453 }, { "epoch": 0.7, "learning_rate": 4.2917062581148276e-06, "loss": 0.8076, "step": 6454 }, { "epoch": 0.7, "learning_rate": 4.2888115923254335e-06, "loss": 0.5933, "step": 6455 }, { "epoch": 0.7, "learning_rate": 4.2859176365564294e-06, "loss": 0.7529, "step": 6456 }, { "epoch": 0.7, "learning_rate": 4.283024391167593e-06, "loss": 0.7246, "step": 6457 }, { "epoch": 0.7, "learning_rate": 4.2801318565186165e-06, "loss": 0.6512, "step": 6458 }, { "epoch": 0.7, "learning_rate": 4.2772400329691055e-06, "loss": 0.6306, "step": 6459 }, { "epoch": 0.7, "learning_rate": 4.2743489208785675e-06, "loss": 0.7256, "step": 6460 }, { "epoch": 0.7, "learning_rate": 4.2714585206064315e-06, "loss": 0.718, "step": 6461 }, { "epoch": 0.7, "learning_rate": 4.26856883251204e-06, "loss": 0.7134, "step": 6462 }, { "epoch": 0.7, "learning_rate": 4.265679856954632e-06, "loss": 0.6504, "step": 6463 }, { "epoch": 0.7, "learning_rate": 4.262791594293374e-06, "loss": 0.7476, "step": 6464 }, { "epoch": 0.7, "learning_rate": 4.2599040448873385e-06, "loss": 0.6558, "step": 6465 }, { "epoch": 0.7, "learning_rate": 4.257017209095503e-06, "loss": 0.7061, "step": 6466 }, { "epoch": 0.7, "learning_rate": 4.254131087276764e-06, "loss": 0.6418, "step": 6467 }, { "epoch": 0.7, "learning_rate": 4.251245679789928e-06, "loss": 0.605, "step": 6468 }, { "epoch": 0.7, "learning_rate": 4.2483609869937115e-06, "loss": 0.8074, "step": 6469 }, { "epoch": 0.7, "learning_rate": 4.245477009246746e-06, "loss": 0.7837, "step": 6470 }, { "epoch": 0.7, "learning_rate": 4.2425937469075626e-06, "loss": 0.6685, "step": 6471 }, { "epoch": 0.7, "learning_rate": 4.2397112003346155e-06, "loss": 0.7251, "step": 6472 }, { "epoch": 0.7, "learning_rate": 4.2368293698862675e-06, "loss": 0.5447, "step": 6473 }, { "epoch": 0.7, "learning_rate": 4.2339482559207854e-06, "loss": 0.6631, "step": 6474 }, { "epoch": 0.7, "learning_rate": 4.231067858796354e-06, "loss": 0.6387, "step": 6475 }, { "epoch": 0.7, "learning_rate": 4.228188178871069e-06, "loss": 0.6443, "step": 6476 }, { "epoch": 0.71, "learning_rate": 4.225309216502933e-06, "loss": 0.6189, "step": 6477 }, { "epoch": 0.71, "learning_rate": 4.222430972049865e-06, "loss": 0.7112, "step": 6478 }, { "epoch": 0.71, "learning_rate": 4.219553445869687e-06, "loss": 0.6758, "step": 6479 }, { "epoch": 0.71, "learning_rate": 4.216676638320135e-06, "loss": 0.7266, "step": 6480 }, { "epoch": 0.71, "learning_rate": 4.213800549758863e-06, "loss": 0.751, "step": 6481 }, { "epoch": 0.71, "learning_rate": 4.21092518054342e-06, "loss": 0.5718, "step": 6482 }, { "epoch": 0.71, "learning_rate": 4.20805053103128e-06, "loss": 0.7578, "step": 6483 }, { "epoch": 0.71, "learning_rate": 4.205176601579825e-06, "loss": 0.5431, "step": 6484 }, { "epoch": 0.71, "learning_rate": 4.202303392546336e-06, "loss": 0.6804, "step": 6485 }, { "epoch": 0.71, "learning_rate": 4.19943090428802e-06, "loss": 0.7351, "step": 6486 }, { "epoch": 0.71, "learning_rate": 4.196559137161984e-06, "loss": 0.689, "step": 6487 }, { "epoch": 0.71, "learning_rate": 4.193688091525252e-06, "loss": 0.6763, "step": 6488 }, { "epoch": 0.71, "learning_rate": 4.1908177677347565e-06, "loss": 0.6165, "step": 6489 }, { "epoch": 0.71, "learning_rate": 4.187948166147332e-06, "loss": 0.6416, "step": 6490 }, { "epoch": 0.71, "learning_rate": 4.185079287119733e-06, "loss": 0.7339, "step": 6491 }, { "epoch": 0.71, "learning_rate": 4.182211131008628e-06, "loss": 0.7065, "step": 6492 }, { "epoch": 0.71, "learning_rate": 4.179343698170578e-06, "loss": 0.7104, "step": 6493 }, { "epoch": 0.71, "learning_rate": 4.1764769889620716e-06, "loss": 0.719, "step": 6494 }, { "epoch": 0.71, "learning_rate": 4.173611003739498e-06, "loss": 0.5869, "step": 6495 }, { "epoch": 0.71, "learning_rate": 4.1707457428591615e-06, "loss": 0.8223, "step": 6496 }, { "epoch": 0.71, "learning_rate": 4.167881206677277e-06, "loss": 0.6885, "step": 6497 }, { "epoch": 0.71, "learning_rate": 4.165017395549959e-06, "loss": 0.6687, "step": 6498 }, { "epoch": 0.71, "learning_rate": 4.1621543098332414e-06, "loss": 0.6965, "step": 6499 }, { "epoch": 0.71, "learning_rate": 4.159291949883072e-06, "loss": 0.7161, "step": 6500 }, { "epoch": 0.71, "learning_rate": 4.1564303160552935e-06, "loss": 0.582, "step": 6501 }, { "epoch": 0.71, "learning_rate": 4.15356940870567e-06, "loss": 0.6736, "step": 6502 }, { "epoch": 0.71, "learning_rate": 4.150709228189878e-06, "loss": 0.7192, "step": 6503 }, { "epoch": 0.71, "learning_rate": 4.147849774863488e-06, "loss": 0.6709, "step": 6504 }, { "epoch": 0.71, "learning_rate": 4.144991049081995e-06, "loss": 0.7412, "step": 6505 }, { "epoch": 0.71, "learning_rate": 4.142133051200799e-06, "loss": 0.7097, "step": 6506 }, { "epoch": 0.71, "learning_rate": 4.139275781575207e-06, "loss": 0.6904, "step": 6507 }, { "epoch": 0.71, "learning_rate": 4.136419240560443e-06, "loss": 0.6565, "step": 6508 }, { "epoch": 0.71, "learning_rate": 4.133563428511628e-06, "loss": 0.7686, "step": 6509 }, { "epoch": 0.71, "learning_rate": 4.1307083457838004e-06, "loss": 0.8105, "step": 6510 }, { "epoch": 0.71, "learning_rate": 4.1278539927319126e-06, "loss": 0.6731, "step": 6511 }, { "epoch": 0.71, "learning_rate": 4.125000369710813e-06, "loss": 0.7427, "step": 6512 }, { "epoch": 0.71, "learning_rate": 4.12214747707527e-06, "loss": 0.7356, "step": 6513 }, { "epoch": 0.71, "learning_rate": 4.119295315179958e-06, "loss": 0.7073, "step": 6514 }, { "epoch": 0.71, "learning_rate": 4.116443884379459e-06, "loss": 0.6582, "step": 6515 }, { "epoch": 0.71, "learning_rate": 4.113593185028273e-06, "loss": 0.8018, "step": 6516 }, { "epoch": 0.71, "learning_rate": 4.11074321748079e-06, "loss": 0.6733, "step": 6517 }, { "epoch": 0.71, "learning_rate": 4.107893982091328e-06, "loss": 0.6616, "step": 6518 }, { "epoch": 0.71, "learning_rate": 4.105045479214108e-06, "loss": 0.6394, "step": 6519 }, { "epoch": 0.71, "learning_rate": 4.102197709203252e-06, "loss": 0.6548, "step": 6520 }, { "epoch": 0.71, "learning_rate": 4.0993506724128005e-06, "loss": 0.7139, "step": 6521 }, { "epoch": 0.71, "learning_rate": 4.0965043691967045e-06, "loss": 0.7075, "step": 6522 }, { "epoch": 0.71, "learning_rate": 4.093658799908812e-06, "loss": 0.6624, "step": 6523 }, { "epoch": 0.71, "learning_rate": 4.090813964902889e-06, "loss": 0.6714, "step": 6524 }, { "epoch": 0.71, "learning_rate": 4.0879698645326105e-06, "loss": 0.5833, "step": 6525 }, { "epoch": 0.71, "learning_rate": 4.085126499151555e-06, "loss": 0.6675, "step": 6526 }, { "epoch": 0.71, "learning_rate": 4.0822838691132175e-06, "loss": 0.7227, "step": 6527 }, { "epoch": 0.71, "learning_rate": 4.079441974770989e-06, "loss": 0.5681, "step": 6528 }, { "epoch": 0.71, "learning_rate": 4.076600816478181e-06, "loss": 0.7056, "step": 6529 }, { "epoch": 0.71, "learning_rate": 4.073760394588011e-06, "loss": 0.6177, "step": 6530 }, { "epoch": 0.71, "learning_rate": 4.070920709453597e-06, "loss": 0.6565, "step": 6531 }, { "epoch": 0.71, "learning_rate": 4.068081761427975e-06, "loss": 0.6633, "step": 6532 }, { "epoch": 0.71, "learning_rate": 4.065243550864088e-06, "loss": 0.6777, "step": 6533 }, { "epoch": 0.71, "learning_rate": 4.062406078114776e-06, "loss": 0.6299, "step": 6534 }, { "epoch": 0.71, "learning_rate": 4.059569343532809e-06, "loss": 0.6611, "step": 6535 }, { "epoch": 0.71, "learning_rate": 4.056733347470842e-06, "loss": 0.5649, "step": 6536 }, { "epoch": 0.71, "learning_rate": 4.053898090281455e-06, "loss": 0.6841, "step": 6537 }, { "epoch": 0.71, "learning_rate": 4.05106357231713e-06, "loss": 0.7607, "step": 6538 }, { "epoch": 0.71, "learning_rate": 4.048229793930252e-06, "loss": 0.6514, "step": 6539 }, { "epoch": 0.71, "learning_rate": 4.045396755473121e-06, "loss": 0.6814, "step": 6540 }, { "epoch": 0.71, "learning_rate": 4.042564457297947e-06, "loss": 0.6121, "step": 6541 }, { "epoch": 0.71, "learning_rate": 4.039732899756839e-06, "loss": 0.7949, "step": 6542 }, { "epoch": 0.71, "learning_rate": 4.0369020832018195e-06, "loss": 0.6492, "step": 6543 }, { "epoch": 0.71, "learning_rate": 4.03407200798482e-06, "loss": 0.6399, "step": 6544 }, { "epoch": 0.71, "learning_rate": 4.031242674457677e-06, "loss": 0.7059, "step": 6545 }, { "epoch": 0.71, "learning_rate": 4.028414082972141e-06, "loss": 0.6472, "step": 6546 }, { "epoch": 0.71, "learning_rate": 4.025586233879857e-06, "loss": 0.6479, "step": 6547 }, { "epoch": 0.71, "learning_rate": 4.022759127532389e-06, "loss": 0.7739, "step": 6548 }, { "epoch": 0.71, "learning_rate": 4.019932764281212e-06, "loss": 0.7705, "step": 6549 }, { "epoch": 0.71, "learning_rate": 4.017107144477691e-06, "loss": 0.6968, "step": 6550 }, { "epoch": 0.71, "learning_rate": 4.0142822684731165e-06, "loss": 0.6252, "step": 6551 }, { "epoch": 0.71, "learning_rate": 4.011458136618681e-06, "loss": 0.6938, "step": 6552 }, { "epoch": 0.71, "learning_rate": 4.008634749265474e-06, "loss": 0.7642, "step": 6553 }, { "epoch": 0.71, "learning_rate": 4.005812106764516e-06, "loss": 0.5977, "step": 6554 }, { "epoch": 0.71, "learning_rate": 4.002990209466709e-06, "loss": 0.7261, "step": 6555 }, { "epoch": 0.71, "learning_rate": 4.000169057722879e-06, "loss": 0.7808, "step": 6556 }, { "epoch": 0.71, "learning_rate": 3.997348651883757e-06, "loss": 0.729, "step": 6557 }, { "epoch": 0.71, "learning_rate": 3.9945289922999705e-06, "loss": 0.7246, "step": 6558 }, { "epoch": 0.71, "learning_rate": 3.991710079322067e-06, "loss": 0.6685, "step": 6559 }, { "epoch": 0.71, "learning_rate": 3.9888919133005e-06, "loss": 0.8018, "step": 6560 }, { "epoch": 0.71, "learning_rate": 3.986074494585619e-06, "loss": 0.634, "step": 6561 }, { "epoch": 0.71, "learning_rate": 3.983257823527692e-06, "loss": 0.7378, "step": 6562 }, { "epoch": 0.71, "learning_rate": 3.9804419004768906e-06, "loss": 0.6401, "step": 6563 }, { "epoch": 0.71, "learning_rate": 3.977626725783291e-06, "loss": 0.6233, "step": 6564 }, { "epoch": 0.71, "learning_rate": 3.974812299796884e-06, "loss": 0.6792, "step": 6565 }, { "epoch": 0.71, "learning_rate": 3.9719986228675546e-06, "loss": 0.6394, "step": 6566 }, { "epoch": 0.71, "learning_rate": 3.9691856953451044e-06, "loss": 0.7529, "step": 6567 }, { "epoch": 0.72, "learning_rate": 3.966373517579244e-06, "loss": 0.6958, "step": 6568 }, { "epoch": 0.72, "learning_rate": 3.963562089919578e-06, "loss": 0.6599, "step": 6569 }, { "epoch": 0.72, "learning_rate": 3.960751412715629e-06, "loss": 0.7056, "step": 6570 }, { "epoch": 0.72, "learning_rate": 3.957941486316827e-06, "loss": 0.7109, "step": 6571 }, { "epoch": 0.72, "learning_rate": 3.955132311072496e-06, "loss": 0.7871, "step": 6572 }, { "epoch": 0.72, "learning_rate": 3.9523238873318855e-06, "loss": 0.6411, "step": 6573 }, { "epoch": 0.72, "learning_rate": 3.949516215444135e-06, "loss": 0.7051, "step": 6574 }, { "epoch": 0.72, "learning_rate": 3.946709295758296e-06, "loss": 0.7217, "step": 6575 }, { "epoch": 0.72, "learning_rate": 3.943903128623336e-06, "loss": 0.7222, "step": 6576 }, { "epoch": 0.72, "learning_rate": 3.941097714388109e-06, "loss": 0.6846, "step": 6577 }, { "epoch": 0.72, "learning_rate": 3.938293053401393e-06, "loss": 0.7263, "step": 6578 }, { "epoch": 0.72, "learning_rate": 3.9354891460118695e-06, "loss": 0.7158, "step": 6579 }, { "epoch": 0.72, "learning_rate": 3.932685992568114e-06, "loss": 0.5786, "step": 6580 }, { "epoch": 0.72, "learning_rate": 3.929883593418622e-06, "loss": 0.6685, "step": 6581 }, { "epoch": 0.72, "learning_rate": 3.9270819489117905e-06, "loss": 0.7861, "step": 6582 }, { "epoch": 0.72, "learning_rate": 3.9242810593959225e-06, "loss": 0.7139, "step": 6583 }, { "epoch": 0.72, "learning_rate": 3.92148092521923e-06, "loss": 0.6729, "step": 6584 }, { "epoch": 0.72, "learning_rate": 3.918681546729822e-06, "loss": 0.6028, "step": 6585 }, { "epoch": 0.72, "learning_rate": 3.915882924275725e-06, "loss": 0.7412, "step": 6586 }, { "epoch": 0.72, "learning_rate": 3.9130850582048664e-06, "loss": 0.6208, "step": 6587 }, { "epoch": 0.72, "learning_rate": 3.910287948865076e-06, "loss": 0.7163, "step": 6588 }, { "epoch": 0.72, "learning_rate": 3.907491596604095e-06, "loss": 0.6528, "step": 6589 }, { "epoch": 0.72, "learning_rate": 3.904696001769571e-06, "loss": 0.7036, "step": 6590 }, { "epoch": 0.72, "learning_rate": 3.9019011647090465e-06, "loss": 0.7769, "step": 6591 }, { "epoch": 0.72, "learning_rate": 3.899107085769992e-06, "loss": 0.6929, "step": 6592 }, { "epoch": 0.72, "learning_rate": 3.896313765299758e-06, "loss": 0.6919, "step": 6593 }, { "epoch": 0.72, "learning_rate": 3.893521203645618e-06, "loss": 0.7524, "step": 6594 }, { "epoch": 0.72, "learning_rate": 3.890729401154749e-06, "loss": 0.6934, "step": 6595 }, { "epoch": 0.72, "learning_rate": 3.887938358174224e-06, "loss": 0.7175, "step": 6596 }, { "epoch": 0.72, "learning_rate": 3.88514807505103e-06, "loss": 0.6167, "step": 6597 }, { "epoch": 0.72, "learning_rate": 3.882358552132062e-06, "loss": 0.687, "step": 6598 }, { "epoch": 0.72, "learning_rate": 3.87956978976411e-06, "loss": 0.6484, "step": 6599 }, { "epoch": 0.72, "learning_rate": 3.876781788293877e-06, "loss": 0.6855, "step": 6600 }, { "epoch": 0.72, "learning_rate": 3.873994548067972e-06, "loss": 0.5664, "step": 6601 }, { "epoch": 0.72, "learning_rate": 3.8712080694329065e-06, "loss": 0.7285, "step": 6602 }, { "epoch": 0.72, "learning_rate": 3.8684223527351025e-06, "loss": 0.6772, "step": 6603 }, { "epoch": 0.72, "learning_rate": 3.865637398320875e-06, "loss": 0.5808, "step": 6604 }, { "epoch": 0.72, "learning_rate": 3.862853206536456e-06, "loss": 0.6772, "step": 6605 }, { "epoch": 0.72, "learning_rate": 3.860069777727983e-06, "loss": 0.627, "step": 6606 }, { "epoch": 0.72, "learning_rate": 3.857287112241487e-06, "loss": 0.6091, "step": 6607 }, { "epoch": 0.72, "learning_rate": 3.854505210422914e-06, "loss": 0.7539, "step": 6608 }, { "epoch": 0.72, "learning_rate": 3.851724072618118e-06, "loss": 0.729, "step": 6609 }, { "epoch": 0.72, "learning_rate": 3.848943699172841e-06, "loss": 0.6504, "step": 6610 }, { "epoch": 0.72, "learning_rate": 3.846164090432757e-06, "loss": 0.7593, "step": 6611 }, { "epoch": 0.72, "learning_rate": 3.8433852467434175e-06, "loss": 0.7671, "step": 6612 }, { "epoch": 0.72, "learning_rate": 3.840607168450295e-06, "loss": 0.6521, "step": 6613 }, { "epoch": 0.72, "learning_rate": 3.837829855898768e-06, "loss": 0.6213, "step": 6614 }, { "epoch": 0.72, "learning_rate": 3.835053309434106e-06, "loss": 0.7837, "step": 6615 }, { "epoch": 0.72, "learning_rate": 3.832277529401494e-06, "loss": 0.6616, "step": 6616 }, { "epoch": 0.72, "learning_rate": 3.8295025161460265e-06, "loss": 0.593, "step": 6617 }, { "epoch": 0.72, "learning_rate": 3.826728270012686e-06, "loss": 0.6687, "step": 6618 }, { "epoch": 0.72, "learning_rate": 3.823954791346375e-06, "loss": 0.6648, "step": 6619 }, { "epoch": 0.72, "learning_rate": 3.821182080491893e-06, "loss": 0.6833, "step": 6620 }, { "epoch": 0.72, "learning_rate": 3.818410137793947e-06, "loss": 0.772, "step": 6621 }, { "epoch": 0.72, "learning_rate": 3.815638963597151e-06, "loss": 0.6987, "step": 6622 }, { "epoch": 0.72, "learning_rate": 3.8128685582460144e-06, "loss": 0.7119, "step": 6623 }, { "epoch": 0.72, "learning_rate": 3.810098922084958e-06, "loss": 0.6626, "step": 6624 }, { "epoch": 0.72, "learning_rate": 3.8073300554583103e-06, "loss": 0.6914, "step": 6625 }, { "epoch": 0.72, "learning_rate": 3.804561958710292e-06, "loss": 0.6489, "step": 6626 }, { "epoch": 0.72, "learning_rate": 3.8017946321850383e-06, "loss": 0.7173, "step": 6627 }, { "epoch": 0.72, "learning_rate": 3.799028076226592e-06, "loss": 0.7041, "step": 6628 }, { "epoch": 0.72, "learning_rate": 3.7962622911788803e-06, "loss": 0.6213, "step": 6629 }, { "epoch": 0.72, "learning_rate": 3.7934972773857637e-06, "loss": 0.6646, "step": 6630 }, { "epoch": 0.72, "learning_rate": 3.790733035190981e-06, "loss": 0.7458, "step": 6631 }, { "epoch": 0.72, "learning_rate": 3.7879695649381886e-06, "loss": 0.7437, "step": 6632 }, { "epoch": 0.72, "learning_rate": 3.7852068669709487e-06, "loss": 0.7158, "step": 6633 }, { "epoch": 0.72, "learning_rate": 3.7824449416327123e-06, "loss": 0.6628, "step": 6634 }, { "epoch": 0.72, "learning_rate": 3.7796837892668513e-06, "loss": 0.7578, "step": 6635 }, { "epoch": 0.72, "learning_rate": 3.7769234102166365e-06, "loss": 0.6792, "step": 6636 }, { "epoch": 0.72, "learning_rate": 3.774163804825234e-06, "loss": 0.6743, "step": 6637 }, { "epoch": 0.72, "learning_rate": 3.771404973435725e-06, "loss": 0.687, "step": 6638 }, { "epoch": 0.72, "learning_rate": 3.768646916391089e-06, "loss": 0.7219, "step": 6639 }, { "epoch": 0.72, "learning_rate": 3.765889634034211e-06, "loss": 0.6777, "step": 6640 }, { "epoch": 0.72, "learning_rate": 3.763133126707882e-06, "loss": 0.6965, "step": 6641 }, { "epoch": 0.72, "learning_rate": 3.7603773947547872e-06, "loss": 0.75, "step": 6642 }, { "epoch": 0.72, "learning_rate": 3.757622438517524e-06, "loss": 0.6045, "step": 6643 }, { "epoch": 0.72, "learning_rate": 3.7548682583385977e-06, "loss": 0.605, "step": 6644 }, { "epoch": 0.72, "learning_rate": 3.7521148545604003e-06, "loss": 0.5981, "step": 6645 }, { "epoch": 0.72, "learning_rate": 3.7493622275252417e-06, "loss": 0.6357, "step": 6646 }, { "epoch": 0.72, "learning_rate": 3.746610377575336e-06, "loss": 0.71, "step": 6647 }, { "epoch": 0.72, "learning_rate": 3.743859305052785e-06, "loss": 0.6868, "step": 6648 }, { "epoch": 0.72, "learning_rate": 3.741109010299617e-06, "loss": 0.7979, "step": 6649 }, { "epoch": 0.72, "learning_rate": 3.7383594936577427e-06, "loss": 0.7275, "step": 6650 }, { "epoch": 0.72, "learning_rate": 3.735610755468988e-06, "loss": 0.5776, "step": 6651 }, { "epoch": 0.72, "learning_rate": 3.7328627960750806e-06, "loss": 0.7332, "step": 6652 }, { "epoch": 0.72, "learning_rate": 3.7301156158176444e-06, "loss": 0.6902, "step": 6653 }, { "epoch": 0.72, "learning_rate": 3.7273692150382134e-06, "loss": 0.582, "step": 6654 }, { "epoch": 0.72, "learning_rate": 3.724623594078227e-06, "loss": 0.6509, "step": 6655 }, { "epoch": 0.72, "learning_rate": 3.7218787532790167e-06, "loss": 0.6719, "step": 6656 }, { "epoch": 0.72, "learning_rate": 3.719134692981826e-06, "loss": 0.7144, "step": 6657 }, { "epoch": 0.72, "learning_rate": 3.7163914135278e-06, "loss": 0.6641, "step": 6658 }, { "epoch": 0.72, "learning_rate": 3.713648915257986e-06, "loss": 0.6973, "step": 6659 }, { "epoch": 0.73, "learning_rate": 3.710907198513337e-06, "loss": 0.8057, "step": 6660 }, { "epoch": 0.73, "learning_rate": 3.708166263634699e-06, "loss": 0.803, "step": 6661 }, { "epoch": 0.73, "learning_rate": 3.705426110962832e-06, "loss": 0.7649, "step": 6662 }, { "epoch": 0.73, "learning_rate": 3.702686740838396e-06, "loss": 0.6455, "step": 6663 }, { "epoch": 0.73, "learning_rate": 3.6999481536019465e-06, "loss": 0.7354, "step": 6664 }, { "epoch": 0.73, "learning_rate": 3.6972103495939506e-06, "loss": 0.7554, "step": 6665 }, { "epoch": 0.73, "learning_rate": 3.6944733291547784e-06, "loss": 0.7437, "step": 6666 }, { "epoch": 0.73, "learning_rate": 3.6917370926246877e-06, "loss": 0.7351, "step": 6667 }, { "epoch": 0.73, "learning_rate": 3.6890016403438642e-06, "loss": 0.7227, "step": 6668 }, { "epoch": 0.73, "learning_rate": 3.6862669726523714e-06, "loss": 0.6768, "step": 6669 }, { "epoch": 0.73, "learning_rate": 3.68353308989019e-06, "loss": 0.7195, "step": 6670 }, { "epoch": 0.73, "learning_rate": 3.6807999923972025e-06, "loss": 0.7725, "step": 6671 }, { "epoch": 0.73, "learning_rate": 3.678067680513182e-06, "loss": 0.7053, "step": 6672 }, { "epoch": 0.73, "learning_rate": 3.6753361545778157e-06, "loss": 0.6516, "step": 6673 }, { "epoch": 0.73, "learning_rate": 3.6726054149306945e-06, "loss": 0.7217, "step": 6674 }, { "epoch": 0.73, "learning_rate": 3.6698754619112974e-06, "loss": 0.7197, "step": 6675 }, { "epoch": 0.73, "learning_rate": 3.667146295859021e-06, "loss": 0.7158, "step": 6676 }, { "epoch": 0.73, "learning_rate": 3.6644179171131557e-06, "loss": 0.7117, "step": 6677 }, { "epoch": 0.73, "learning_rate": 3.661690326012897e-06, "loss": 0.6379, "step": 6678 }, { "epoch": 0.73, "learning_rate": 3.6589635228973442e-06, "loss": 0.6252, "step": 6679 }, { "epoch": 0.73, "learning_rate": 3.656237508105489e-06, "loss": 0.5676, "step": 6680 }, { "epoch": 0.73, "learning_rate": 3.653512281976238e-06, "loss": 0.6235, "step": 6681 }, { "epoch": 0.73, "learning_rate": 3.6507878448483948e-06, "loss": 0.6101, "step": 6682 }, { "epoch": 0.73, "learning_rate": 3.648064197060659e-06, "loss": 0.6479, "step": 6683 }, { "epoch": 0.73, "learning_rate": 3.645341338951639e-06, "loss": 0.6868, "step": 6684 }, { "epoch": 0.73, "learning_rate": 3.642619270859847e-06, "loss": 0.676, "step": 6685 }, { "epoch": 0.73, "learning_rate": 3.6398979931236866e-06, "loss": 0.7295, "step": 6686 }, { "epoch": 0.73, "learning_rate": 3.6371775060814727e-06, "loss": 0.6248, "step": 6687 }, { "epoch": 0.73, "learning_rate": 3.634457810071419e-06, "loss": 0.6772, "step": 6688 }, { "epoch": 0.73, "learning_rate": 3.631738905431641e-06, "loss": 0.6987, "step": 6689 }, { "epoch": 0.73, "learning_rate": 3.6290207925001585e-06, "loss": 0.5618, "step": 6690 }, { "epoch": 0.73, "learning_rate": 3.6263034716148836e-06, "loss": 0.6987, "step": 6691 }, { "epoch": 0.73, "learning_rate": 3.6235869431136393e-06, "loss": 0.6152, "step": 6692 }, { "epoch": 0.73, "learning_rate": 3.62087120733415e-06, "loss": 0.7288, "step": 6693 }, { "epoch": 0.73, "learning_rate": 3.618156264614032e-06, "loss": 0.7939, "step": 6694 }, { "epoch": 0.73, "learning_rate": 3.6154421152908137e-06, "loss": 0.6904, "step": 6695 }, { "epoch": 0.73, "learning_rate": 3.612728759701919e-06, "loss": 0.6997, "step": 6696 }, { "epoch": 0.73, "learning_rate": 3.610016198184677e-06, "loss": 0.7041, "step": 6697 }, { "epoch": 0.73, "learning_rate": 3.6073044310763184e-06, "loss": 0.748, "step": 6698 }, { "epoch": 0.73, "learning_rate": 3.6045934587139653e-06, "loss": 0.7866, "step": 6699 }, { "epoch": 0.73, "learning_rate": 3.6018832814346516e-06, "loss": 0.6033, "step": 6700 }, { "epoch": 0.73, "learning_rate": 3.5991738995753146e-06, "loss": 0.6003, "step": 6701 }, { "epoch": 0.73, "learning_rate": 3.596465313472778e-06, "loss": 0.6484, "step": 6702 }, { "epoch": 0.73, "learning_rate": 3.59375752346378e-06, "loss": 0.6228, "step": 6703 }, { "epoch": 0.73, "learning_rate": 3.5910505298849608e-06, "loss": 0.719, "step": 6704 }, { "epoch": 0.73, "learning_rate": 3.5883443330728463e-06, "loss": 0.6335, "step": 6705 }, { "epoch": 0.73, "learning_rate": 3.5856389333638795e-06, "loss": 0.7139, "step": 6706 }, { "epoch": 0.73, "learning_rate": 3.5829343310943977e-06, "loss": 0.697, "step": 6707 }, { "epoch": 0.73, "learning_rate": 3.5802305266006387e-06, "loss": 0.6797, "step": 6708 }, { "epoch": 0.73, "learning_rate": 3.5775275202187475e-06, "loss": 0.7642, "step": 6709 }, { "epoch": 0.73, "learning_rate": 3.5748253122847542e-06, "loss": 0.7346, "step": 6710 }, { "epoch": 0.73, "learning_rate": 3.5721239031346067e-06, "loss": 0.7627, "step": 6711 }, { "epoch": 0.73, "learning_rate": 3.5694232931041484e-06, "loss": 0.6294, "step": 6712 }, { "epoch": 0.73, "learning_rate": 3.566723482529115e-06, "loss": 0.6772, "step": 6713 }, { "epoch": 0.73, "learning_rate": 3.5640244717451544e-06, "loss": 0.707, "step": 6714 }, { "epoch": 0.73, "learning_rate": 3.5613262610878076e-06, "loss": 0.6926, "step": 6715 }, { "epoch": 0.73, "learning_rate": 3.5586288508925203e-06, "loss": 0.6484, "step": 6716 }, { "epoch": 0.73, "learning_rate": 3.555932241494642e-06, "loss": 0.615, "step": 6717 }, { "epoch": 0.73, "learning_rate": 3.553236433229408e-06, "loss": 0.7002, "step": 6718 }, { "epoch": 0.73, "learning_rate": 3.550541426431968e-06, "loss": 0.7886, "step": 6719 }, { "epoch": 0.73, "learning_rate": 3.5478472214373716e-06, "loss": 0.6672, "step": 6720 }, { "epoch": 0.73, "learning_rate": 3.545153818580559e-06, "loss": 0.6504, "step": 6721 }, { "epoch": 0.73, "learning_rate": 3.542461218196379e-06, "loss": 0.7087, "step": 6722 }, { "epoch": 0.73, "learning_rate": 3.539769420619582e-06, "loss": 0.7241, "step": 6723 }, { "epoch": 0.73, "learning_rate": 3.537078426184808e-06, "loss": 0.6875, "step": 6724 }, { "epoch": 0.73, "learning_rate": 3.534388235226607e-06, "loss": 0.769, "step": 6725 }, { "epoch": 0.73, "learning_rate": 3.5316988480794255e-06, "loss": 0.6394, "step": 6726 }, { "epoch": 0.73, "learning_rate": 3.5290102650776127e-06, "loss": 0.7998, "step": 6727 }, { "epoch": 0.73, "learning_rate": 3.5263224865554178e-06, "loss": 0.7988, "step": 6728 }, { "epoch": 0.73, "learning_rate": 3.5236355128469814e-06, "loss": 0.6372, "step": 6729 }, { "epoch": 0.73, "learning_rate": 3.520949344286354e-06, "loss": 0.7461, "step": 6730 }, { "epoch": 0.73, "learning_rate": 3.5182639812074857e-06, "loss": 0.6338, "step": 6731 }, { "epoch": 0.73, "learning_rate": 3.515579423944219e-06, "loss": 0.6675, "step": 6732 }, { "epoch": 0.73, "learning_rate": 3.5128956728303e-06, "loss": 0.6382, "step": 6733 }, { "epoch": 0.73, "learning_rate": 3.510212728199378e-06, "loss": 0.6089, "step": 6734 }, { "epoch": 0.73, "learning_rate": 3.5075305903849986e-06, "loss": 0.6799, "step": 6735 }, { "epoch": 0.73, "learning_rate": 3.5048492597206107e-06, "loss": 0.7046, "step": 6736 }, { "epoch": 0.73, "learning_rate": 3.502168736539553e-06, "loss": 0.7593, "step": 6737 }, { "epoch": 0.73, "learning_rate": 3.4994890211750754e-06, "loss": 0.6968, "step": 6738 }, { "epoch": 0.73, "learning_rate": 3.496810113960325e-06, "loss": 0.7974, "step": 6739 }, { "epoch": 0.73, "learning_rate": 3.494132015228339e-06, "loss": 0.7534, "step": 6740 }, { "epoch": 0.73, "learning_rate": 3.4914547253120655e-06, "loss": 0.7822, "step": 6741 }, { "epoch": 0.73, "learning_rate": 3.4887782445443498e-06, "loss": 0.6819, "step": 6742 }, { "epoch": 0.73, "learning_rate": 3.4861025732579303e-06, "loss": 0.6216, "step": 6743 }, { "epoch": 0.73, "learning_rate": 3.483427711785449e-06, "loss": 0.593, "step": 6744 }, { "epoch": 0.73, "learning_rate": 3.4807536604594495e-06, "loss": 0.6848, "step": 6745 }, { "epoch": 0.73, "learning_rate": 3.478080419612372e-06, "loss": 0.5632, "step": 6746 }, { "epoch": 0.73, "learning_rate": 3.4754079895765604e-06, "loss": 0.6814, "step": 6747 }, { "epoch": 0.73, "learning_rate": 3.4727363706842453e-06, "loss": 0.6868, "step": 6748 }, { "epoch": 0.73, "learning_rate": 3.4700655632675694e-06, "loss": 0.6252, "step": 6749 }, { "epoch": 0.73, "learning_rate": 3.4673955676585734e-06, "loss": 0.5464, "step": 6750 }, { "epoch": 0.73, "learning_rate": 3.4647263841891865e-06, "loss": 0.6536, "step": 6751 }, { "epoch": 0.74, "learning_rate": 3.4620580131912472e-06, "loss": 0.6543, "step": 6752 }, { "epoch": 0.74, "learning_rate": 3.4593904549964917e-06, "loss": 0.6816, "step": 6753 }, { "epoch": 0.74, "learning_rate": 3.4567237099365514e-06, "loss": 0.6062, "step": 6754 }, { "epoch": 0.74, "learning_rate": 3.454057778342963e-06, "loss": 0.6951, "step": 6755 }, { "epoch": 0.74, "learning_rate": 3.4513926605471504e-06, "loss": 0.6968, "step": 6756 }, { "epoch": 0.74, "learning_rate": 3.4487283568804463e-06, "loss": 0.7319, "step": 6757 }, { "epoch": 0.74, "learning_rate": 3.446064867674085e-06, "loss": 0.6536, "step": 6758 }, { "epoch": 0.74, "learning_rate": 3.4434021932591855e-06, "loss": 0.7075, "step": 6759 }, { "epoch": 0.74, "learning_rate": 3.440740333966779e-06, "loss": 0.7361, "step": 6760 }, { "epoch": 0.74, "learning_rate": 3.4380792901277917e-06, "loss": 0.6152, "step": 6761 }, { "epoch": 0.74, "learning_rate": 3.435419062073041e-06, "loss": 0.7861, "step": 6762 }, { "epoch": 0.74, "learning_rate": 3.4327596501332526e-06, "loss": 0.6426, "step": 6763 }, { "epoch": 0.74, "learning_rate": 3.430101054639048e-06, "loss": 0.7617, "step": 6764 }, { "epoch": 0.74, "learning_rate": 3.4274432759209454e-06, "loss": 0.7576, "step": 6765 }, { "epoch": 0.74, "learning_rate": 3.424786314309365e-06, "loss": 0.7002, "step": 6766 }, { "epoch": 0.74, "learning_rate": 3.422130170134618e-06, "loss": 0.7554, "step": 6767 }, { "epoch": 0.74, "learning_rate": 3.419474843726921e-06, "loss": 0.6819, "step": 6768 }, { "epoch": 0.74, "learning_rate": 3.4168203354163898e-06, "loss": 0.6375, "step": 6769 }, { "epoch": 0.74, "learning_rate": 3.4141666455330292e-06, "loss": 0.6064, "step": 6770 }, { "epoch": 0.74, "learning_rate": 3.4115137744067516e-06, "loss": 0.5605, "step": 6771 }, { "epoch": 0.74, "learning_rate": 3.4088617223673683e-06, "loss": 0.6553, "step": 6772 }, { "epoch": 0.74, "learning_rate": 3.4062104897445737e-06, "loss": 0.5522, "step": 6773 }, { "epoch": 0.74, "learning_rate": 3.4035600768679855e-06, "loss": 0.5967, "step": 6774 }, { "epoch": 0.74, "learning_rate": 3.400910484067097e-06, "loss": 0.6465, "step": 6775 }, { "epoch": 0.74, "learning_rate": 3.398261711671309e-06, "loss": 0.6694, "step": 6776 }, { "epoch": 0.74, "learning_rate": 3.3956137600099248e-06, "loss": 0.5972, "step": 6777 }, { "epoch": 0.74, "learning_rate": 3.3929666294121323e-06, "loss": 0.6638, "step": 6778 }, { "epoch": 0.74, "learning_rate": 3.39032032020703e-06, "loss": 0.7026, "step": 6779 }, { "epoch": 0.74, "learning_rate": 3.387674832723611e-06, "loss": 0.7598, "step": 6780 }, { "epoch": 0.74, "learning_rate": 3.3850301672907594e-06, "loss": 0.7681, "step": 6781 }, { "epoch": 0.74, "learning_rate": 3.3823863242372657e-06, "loss": 0.6899, "step": 6782 }, { "epoch": 0.74, "learning_rate": 3.379743303891815e-06, "loss": 0.718, "step": 6783 }, { "epoch": 0.74, "learning_rate": 3.3771011065829906e-06, "loss": 0.7017, "step": 6784 }, { "epoch": 0.74, "learning_rate": 3.374459732639275e-06, "loss": 0.6694, "step": 6785 }, { "epoch": 0.74, "learning_rate": 3.37181918238904e-06, "loss": 0.6064, "step": 6786 }, { "epoch": 0.74, "learning_rate": 3.369179456160566e-06, "loss": 0.7554, "step": 6787 }, { "epoch": 0.74, "learning_rate": 3.3665405542820283e-06, "loss": 0.6663, "step": 6788 }, { "epoch": 0.74, "learning_rate": 3.363902477081491e-06, "loss": 0.6687, "step": 6789 }, { "epoch": 0.74, "learning_rate": 3.361265224886927e-06, "loss": 0.6907, "step": 6790 }, { "epoch": 0.74, "learning_rate": 3.3586287980262034e-06, "loss": 0.6357, "step": 6791 }, { "epoch": 0.74, "learning_rate": 3.355993196827075e-06, "loss": 0.6221, "step": 6792 }, { "epoch": 0.74, "learning_rate": 3.3533584216172153e-06, "loss": 0.6687, "step": 6793 }, { "epoch": 0.74, "learning_rate": 3.350724472724172e-06, "loss": 0.7224, "step": 6794 }, { "epoch": 0.74, "learning_rate": 3.348091350475402e-06, "loss": 0.7212, "step": 6795 }, { "epoch": 0.74, "learning_rate": 3.3454590551982623e-06, "loss": 0.6943, "step": 6796 }, { "epoch": 0.74, "learning_rate": 3.3428275872199967e-06, "loss": 0.6907, "step": 6797 }, { "epoch": 0.74, "learning_rate": 3.340196946867753e-06, "loss": 0.6094, "step": 6798 }, { "epoch": 0.74, "learning_rate": 3.337567134468579e-06, "loss": 0.6821, "step": 6799 }, { "epoch": 0.74, "learning_rate": 3.3349381503494093e-06, "loss": 0.6138, "step": 6800 }, { "epoch": 0.74, "learning_rate": 3.3323099948370853e-06, "loss": 0.7524, "step": 6801 }, { "epoch": 0.74, "learning_rate": 3.3296826682583407e-06, "loss": 0.7305, "step": 6802 }, { "epoch": 0.74, "learning_rate": 3.3270561709398075e-06, "loss": 0.7012, "step": 6803 }, { "epoch": 0.74, "learning_rate": 3.3244305032080183e-06, "loss": 0.7087, "step": 6804 }, { "epoch": 0.74, "learning_rate": 3.3218056653893914e-06, "loss": 0.7417, "step": 6805 }, { "epoch": 0.74, "learning_rate": 3.3191816578102533e-06, "loss": 0.7236, "step": 6806 }, { "epoch": 0.74, "learning_rate": 3.3165584807968254e-06, "loss": 0.7158, "step": 6807 }, { "epoch": 0.74, "learning_rate": 3.3139361346752175e-06, "loss": 0.6343, "step": 6808 }, { "epoch": 0.74, "learning_rate": 3.311314619771445e-06, "loss": 0.7268, "step": 6809 }, { "epoch": 0.74, "learning_rate": 3.308693936411421e-06, "loss": 0.6238, "step": 6810 }, { "epoch": 0.74, "learning_rate": 3.3060740849209417e-06, "loss": 0.6179, "step": 6811 }, { "epoch": 0.74, "learning_rate": 3.303455065625721e-06, "loss": 0.6458, "step": 6812 }, { "epoch": 0.74, "learning_rate": 3.300836878851351e-06, "loss": 0.709, "step": 6813 }, { "epoch": 0.74, "learning_rate": 3.2982195249233275e-06, "loss": 0.6885, "step": 6814 }, { "epoch": 0.74, "learning_rate": 3.2956030041670473e-06, "loss": 0.6394, "step": 6815 }, { "epoch": 0.74, "learning_rate": 3.292987316907792e-06, "loss": 0.7778, "step": 6816 }, { "epoch": 0.74, "learning_rate": 3.29037246347075e-06, "loss": 0.7451, "step": 6817 }, { "epoch": 0.74, "learning_rate": 3.287758444181004e-06, "loss": 0.7573, "step": 6818 }, { "epoch": 0.74, "learning_rate": 3.2851452593635267e-06, "loss": 0.7896, "step": 6819 }, { "epoch": 0.74, "learning_rate": 3.2825329093431946e-06, "loss": 0.5969, "step": 6820 }, { "epoch": 0.74, "learning_rate": 3.279921394444776e-06, "loss": 0.7427, "step": 6821 }, { "epoch": 0.74, "learning_rate": 3.2773107149929382e-06, "loss": 0.6855, "step": 6822 }, { "epoch": 0.74, "learning_rate": 3.2747008713122473e-06, "loss": 0.6943, "step": 6823 }, { "epoch": 0.74, "learning_rate": 3.2720918637271547e-06, "loss": 0.6687, "step": 6824 }, { "epoch": 0.74, "learning_rate": 3.2694836925620164e-06, "loss": 0.7329, "step": 6825 }, { "epoch": 0.74, "learning_rate": 3.2668763581410877e-06, "loss": 0.627, "step": 6826 }, { "epoch": 0.74, "learning_rate": 3.264269860788507e-06, "loss": 0.6802, "step": 6827 }, { "epoch": 0.74, "learning_rate": 3.2616642008283218e-06, "loss": 0.582, "step": 6828 }, { "epoch": 0.74, "learning_rate": 3.2590593785844715e-06, "loss": 0.7427, "step": 6829 }, { "epoch": 0.74, "learning_rate": 3.256455394380782e-06, "loss": 0.6875, "step": 6830 }, { "epoch": 0.74, "learning_rate": 3.253852248540994e-06, "loss": 0.7201, "step": 6831 }, { "epoch": 0.74, "learning_rate": 3.2512499413887255e-06, "loss": 0.7891, "step": 6832 }, { "epoch": 0.74, "learning_rate": 3.2486484732474997e-06, "loss": 0.7305, "step": 6833 }, { "epoch": 0.74, "learning_rate": 3.2460478444407373e-06, "loss": 0.6899, "step": 6834 }, { "epoch": 0.74, "learning_rate": 3.2434480552917445e-06, "loss": 0.7129, "step": 6835 }, { "epoch": 0.74, "learning_rate": 3.2408491061237325e-06, "loss": 0.5708, "step": 6836 }, { "epoch": 0.74, "learning_rate": 3.2382509972598087e-06, "loss": 0.5823, "step": 6837 }, { "epoch": 0.74, "learning_rate": 3.235653729022965e-06, "loss": 0.7617, "step": 6838 }, { "epoch": 0.74, "learning_rate": 3.233057301736102e-06, "loss": 0.6274, "step": 6839 }, { "epoch": 0.74, "learning_rate": 3.2304617157220075e-06, "loss": 0.6423, "step": 6840 }, { "epoch": 0.74, "learning_rate": 3.2278669713033684e-06, "loss": 0.7849, "step": 6841 }, { "epoch": 0.74, "learning_rate": 3.225273068802768e-06, "loss": 0.6553, "step": 6842 }, { "epoch": 0.74, "learning_rate": 3.222680008542678e-06, "loss": 0.8608, "step": 6843 }, { "epoch": 0.75, "learning_rate": 3.220087790845472e-06, "loss": 0.6321, "step": 6844 }, { "epoch": 0.75, "learning_rate": 3.217496416033421e-06, "loss": 0.5789, "step": 6845 }, { "epoch": 0.75, "learning_rate": 3.2149058844286796e-06, "loss": 0.7427, "step": 6846 }, { "epoch": 0.75, "learning_rate": 3.21231619635331e-06, "loss": 0.7073, "step": 6847 }, { "epoch": 0.75, "learning_rate": 3.209727352129266e-06, "loss": 0.6587, "step": 6848 }, { "epoch": 0.75, "learning_rate": 3.2071393520783867e-06, "loss": 0.7944, "step": 6849 }, { "epoch": 0.75, "learning_rate": 3.204552196522428e-06, "loss": 0.7427, "step": 6850 }, { "epoch": 0.75, "learning_rate": 3.201965885783017e-06, "loss": 0.6572, "step": 6851 }, { "epoch": 0.75, "learning_rate": 3.19938042018169e-06, "loss": 0.6169, "step": 6852 }, { "epoch": 0.75, "learning_rate": 3.196795800039878e-06, "loss": 0.7876, "step": 6853 }, { "epoch": 0.75, "learning_rate": 3.1942120256788966e-06, "loss": 0.5269, "step": 6854 }, { "epoch": 0.75, "learning_rate": 3.1916290974199658e-06, "loss": 0.7131, "step": 6855 }, { "epoch": 0.75, "learning_rate": 3.1890470155842023e-06, "loss": 0.6914, "step": 6856 }, { "epoch": 0.75, "learning_rate": 3.1864657804926046e-06, "loss": 0.7041, "step": 6857 }, { "epoch": 0.75, "learning_rate": 3.1838853924660795e-06, "loss": 0.5742, "step": 6858 }, { "epoch": 0.75, "learning_rate": 3.1813058518254227e-06, "loss": 0.6045, "step": 6859 }, { "epoch": 0.75, "learning_rate": 3.178727158891325e-06, "loss": 0.7095, "step": 6860 }, { "epoch": 0.75, "learning_rate": 3.1761493139843734e-06, "loss": 0.7163, "step": 6861 }, { "epoch": 0.75, "learning_rate": 3.1735723174250456e-06, "loss": 0.7065, "step": 6862 }, { "epoch": 0.75, "learning_rate": 3.1709961695337157e-06, "loss": 0.6174, "step": 6863 }, { "epoch": 0.75, "learning_rate": 3.1684208706306572e-06, "loss": 0.7524, "step": 6864 }, { "epoch": 0.75, "learning_rate": 3.1658464210360285e-06, "loss": 0.698, "step": 6865 }, { "epoch": 0.75, "learning_rate": 3.1632728210698902e-06, "loss": 0.6992, "step": 6866 }, { "epoch": 0.75, "learning_rate": 3.160700071052197e-06, "loss": 0.7603, "step": 6867 }, { "epoch": 0.75, "learning_rate": 3.1581281713027877e-06, "loss": 0.7617, "step": 6868 }, { "epoch": 0.75, "learning_rate": 3.155557122141414e-06, "loss": 0.7048, "step": 6869 }, { "epoch": 0.75, "learning_rate": 3.152986923887703e-06, "loss": 0.6858, "step": 6870 }, { "epoch": 0.75, "learning_rate": 3.150417576861188e-06, "loss": 0.7285, "step": 6871 }, { "epoch": 0.75, "learning_rate": 3.1478490813812946e-06, "loss": 0.6172, "step": 6872 }, { "epoch": 0.75, "learning_rate": 3.1452814377673344e-06, "loss": 0.6965, "step": 6873 }, { "epoch": 0.75, "learning_rate": 3.1427146463385226e-06, "loss": 0.7095, "step": 6874 }, { "epoch": 0.75, "learning_rate": 3.140148707413969e-06, "loss": 0.7915, "step": 6875 }, { "epoch": 0.75, "learning_rate": 3.1375836213126653e-06, "loss": 0.7446, "step": 6876 }, { "epoch": 0.75, "learning_rate": 3.135019388353512e-06, "loss": 0.752, "step": 6877 }, { "epoch": 0.75, "learning_rate": 3.1324560088552934e-06, "loss": 0.5859, "step": 6878 }, { "epoch": 0.75, "learning_rate": 3.1298934831366934e-06, "loss": 0.7568, "step": 6879 }, { "epoch": 0.75, "learning_rate": 3.127331811516291e-06, "loss": 0.7156, "step": 6880 }, { "epoch": 0.75, "learning_rate": 3.124770994312547e-06, "loss": 0.6565, "step": 6881 }, { "epoch": 0.75, "learning_rate": 3.12221103184383e-06, "loss": 0.7068, "step": 6882 }, { "epoch": 0.75, "learning_rate": 3.1196519244284005e-06, "loss": 0.6753, "step": 6883 }, { "epoch": 0.75, "learning_rate": 3.1170936723844014e-06, "loss": 0.6614, "step": 6884 }, { "epoch": 0.75, "learning_rate": 3.1145362760298802e-06, "loss": 0.6399, "step": 6885 }, { "epoch": 0.75, "learning_rate": 3.1119797356827796e-06, "loss": 0.719, "step": 6886 }, { "epoch": 0.75, "learning_rate": 3.10942405166092e-06, "loss": 0.6938, "step": 6887 }, { "epoch": 0.75, "learning_rate": 3.1068692242820387e-06, "loss": 0.707, "step": 6888 }, { "epoch": 0.75, "learning_rate": 3.104315253863747e-06, "loss": 0.6521, "step": 6889 }, { "epoch": 0.75, "learning_rate": 3.101762140723559e-06, "loss": 0.687, "step": 6890 }, { "epoch": 0.75, "learning_rate": 3.099209885178882e-06, "loss": 0.6733, "step": 6891 }, { "epoch": 0.75, "learning_rate": 3.0966584875470107e-06, "loss": 0.6165, "step": 6892 }, { "epoch": 0.75, "learning_rate": 3.0941079481451384e-06, "loss": 0.772, "step": 6893 }, { "epoch": 0.75, "learning_rate": 3.0915582672903554e-06, "loss": 0.6091, "step": 6894 }, { "epoch": 0.75, "learning_rate": 3.0890094452996344e-06, "loss": 0.7095, "step": 6895 }, { "epoch": 0.75, "learning_rate": 3.0864614824898487e-06, "loss": 0.7026, "step": 6896 }, { "epoch": 0.75, "learning_rate": 3.0839143791777647e-06, "loss": 0.5728, "step": 6897 }, { "epoch": 0.75, "learning_rate": 3.081368135680041e-06, "loss": 0.647, "step": 6898 }, { "epoch": 0.75, "learning_rate": 3.0788227523132307e-06, "loss": 0.7524, "step": 6899 }, { "epoch": 0.75, "learning_rate": 3.076278229393773e-06, "loss": 0.7356, "step": 6900 }, { "epoch": 0.75, "learning_rate": 3.073734567238009e-06, "loss": 0.73, "step": 6901 }, { "epoch": 0.75, "learning_rate": 3.0711917661621716e-06, "loss": 0.6897, "step": 6902 }, { "epoch": 0.75, "learning_rate": 3.0686498264823783e-06, "loss": 0.7275, "step": 6903 }, { "epoch": 0.75, "learning_rate": 3.066108748514648e-06, "loss": 0.7871, "step": 6904 }, { "epoch": 0.75, "learning_rate": 3.0635685325748944e-06, "loss": 0.759, "step": 6905 }, { "epoch": 0.75, "learning_rate": 3.0610291789789094e-06, "loss": 0.6301, "step": 6906 }, { "epoch": 0.75, "learning_rate": 3.058490688042399e-06, "loss": 0.6035, "step": 6907 }, { "epoch": 0.75, "learning_rate": 3.0559530600809438e-06, "loss": 0.697, "step": 6908 }, { "epoch": 0.75, "learning_rate": 3.0534162954100264e-06, "loss": 0.8071, "step": 6909 }, { "epoch": 0.75, "learning_rate": 3.050880394345023e-06, "loss": 0.655, "step": 6910 }, { "epoch": 0.75, "learning_rate": 3.048345357201192e-06, "loss": 0.8062, "step": 6911 }, { "epoch": 0.75, "learning_rate": 3.0458111842936956e-06, "loss": 0.6152, "step": 6912 }, { "epoch": 0.75, "learning_rate": 3.043277875937588e-06, "loss": 0.6096, "step": 6913 }, { "epoch": 0.75, "learning_rate": 3.040745432447806e-06, "loss": 0.7773, "step": 6914 }, { "epoch": 0.75, "learning_rate": 3.038213854139187e-06, "loss": 0.7573, "step": 6915 }, { "epoch": 0.75, "learning_rate": 3.035683141326462e-06, "loss": 0.6367, "step": 6916 }, { "epoch": 0.75, "learning_rate": 3.033153294324249e-06, "loss": 0.7153, "step": 6917 }, { "epoch": 0.75, "learning_rate": 3.0306243134470668e-06, "loss": 0.7109, "step": 6918 }, { "epoch": 0.75, "learning_rate": 3.028096199009313e-06, "loss": 0.7744, "step": 6919 }, { "epoch": 0.75, "learning_rate": 3.0255689513252873e-06, "loss": 0.6106, "step": 6920 }, { "epoch": 0.75, "learning_rate": 3.023042570709185e-06, "loss": 0.7891, "step": 6921 }, { "epoch": 0.75, "learning_rate": 3.020517057475079e-06, "loss": 0.6838, "step": 6922 }, { "epoch": 0.75, "learning_rate": 3.0179924119369496e-06, "loss": 0.6033, "step": 6923 }, { "epoch": 0.75, "learning_rate": 3.015468634408664e-06, "loss": 0.6338, "step": 6924 }, { "epoch": 0.75, "learning_rate": 3.0129457252039763e-06, "loss": 0.658, "step": 6925 }, { "epoch": 0.75, "learning_rate": 3.0104236846365376e-06, "loss": 0.728, "step": 6926 }, { "epoch": 0.75, "learning_rate": 3.0079025130198936e-06, "loss": 0.6943, "step": 6927 }, { "epoch": 0.75, "learning_rate": 3.0053822106674756e-06, "loss": 0.6917, "step": 6928 }, { "epoch": 0.75, "learning_rate": 3.0028627778926157e-06, "loss": 0.6953, "step": 6929 }, { "epoch": 0.75, "learning_rate": 3.000344215008524e-06, "loss": 0.6497, "step": 6930 }, { "epoch": 0.75, "learning_rate": 2.9978265223283152e-06, "loss": 0.6899, "step": 6931 }, { "epoch": 0.75, "learning_rate": 2.9953097001649935e-06, "loss": 0.7202, "step": 6932 }, { "epoch": 0.75, "learning_rate": 2.9927937488314464e-06, "loss": 0.7368, "step": 6933 }, { "epoch": 0.75, "learning_rate": 2.990278668640463e-06, "loss": 0.7627, "step": 6934 }, { "epoch": 0.75, "learning_rate": 2.9877644599047196e-06, "loss": 0.7607, "step": 6935 }, { "epoch": 0.76, "learning_rate": 2.9852511229367862e-06, "loss": 0.6892, "step": 6936 }, { "epoch": 0.76, "learning_rate": 2.982738658049126e-06, "loss": 0.6475, "step": 6937 }, { "epoch": 0.76, "learning_rate": 2.980227065554084e-06, "loss": 0.5698, "step": 6938 }, { "epoch": 0.76, "learning_rate": 2.977716345763908e-06, "loss": 0.6833, "step": 6939 }, { "epoch": 0.76, "learning_rate": 2.975206498990736e-06, "loss": 0.6892, "step": 6940 }, { "epoch": 0.76, "learning_rate": 2.972697525546587e-06, "loss": 0.7263, "step": 6941 }, { "epoch": 0.76, "learning_rate": 2.970189425743383e-06, "loss": 0.6311, "step": 6942 }, { "epoch": 0.76, "learning_rate": 2.9676821998929374e-06, "loss": 0.6172, "step": 6943 }, { "epoch": 0.76, "learning_rate": 2.9651758483069436e-06, "loss": 0.7039, "step": 6944 }, { "epoch": 0.76, "learning_rate": 2.9626703712969962e-06, "loss": 0.7212, "step": 6945 }, { "epoch": 0.76, "learning_rate": 2.96016576917458e-06, "loss": 0.7974, "step": 6946 }, { "epoch": 0.76, "learning_rate": 2.9576620422510684e-06, "loss": 0.7544, "step": 6947 }, { "epoch": 0.76, "learning_rate": 2.955159190837731e-06, "loss": 0.6963, "step": 6948 }, { "epoch": 0.76, "learning_rate": 2.952657215245718e-06, "loss": 0.6357, "step": 6949 }, { "epoch": 0.76, "learning_rate": 2.9501561157860803e-06, "loss": 0.8008, "step": 6950 }, { "epoch": 0.76, "learning_rate": 2.9476558927697605e-06, "loss": 0.6182, "step": 6951 }, { "epoch": 0.76, "learning_rate": 2.9451565465075827e-06, "loss": 0.7085, "step": 6952 }, { "epoch": 0.76, "learning_rate": 2.94265807731027e-06, "loss": 0.7485, "step": 6953 }, { "epoch": 0.76, "learning_rate": 2.940160485488436e-06, "loss": 0.5901, "step": 6954 }, { "epoch": 0.76, "learning_rate": 2.9376637713525824e-06, "loss": 0.6846, "step": 6955 }, { "epoch": 0.76, "learning_rate": 2.935167935213107e-06, "loss": 0.5706, "step": 6956 }, { "epoch": 0.76, "learning_rate": 2.9326729773802877e-06, "loss": 0.7168, "step": 6957 }, { "epoch": 0.76, "learning_rate": 2.930178898164303e-06, "loss": 0.7158, "step": 6958 }, { "epoch": 0.76, "learning_rate": 2.927685697875223e-06, "loss": 0.6709, "step": 6959 }, { "epoch": 0.76, "learning_rate": 2.925193376822999e-06, "loss": 0.7021, "step": 6960 }, { "epoch": 0.76, "learning_rate": 2.9227019353174814e-06, "loss": 0.6902, "step": 6961 }, { "epoch": 0.76, "learning_rate": 2.9202113736684103e-06, "loss": 0.6428, "step": 6962 }, { "epoch": 0.76, "learning_rate": 2.91772169218541e-06, "loss": 0.6992, "step": 6963 }, { "epoch": 0.76, "learning_rate": 2.9152328911780027e-06, "loss": 0.6292, "step": 6964 }, { "epoch": 0.76, "learning_rate": 2.912744970955599e-06, "loss": 0.6208, "step": 6965 }, { "epoch": 0.76, "learning_rate": 2.9102579318274994e-06, "loss": 0.6816, "step": 6966 }, { "epoch": 0.76, "learning_rate": 2.9077717741028965e-06, "loss": 0.6412, "step": 6967 }, { "epoch": 0.76, "learning_rate": 2.905286498090868e-06, "loss": 0.6531, "step": 6968 }, { "epoch": 0.76, "learning_rate": 2.9028021041003874e-06, "loss": 0.6985, "step": 6969 }, { "epoch": 0.76, "learning_rate": 2.900318592440321e-06, "loss": 0.645, "step": 6970 }, { "epoch": 0.76, "learning_rate": 2.897835963419414e-06, "loss": 0.7134, "step": 6971 }, { "epoch": 0.76, "learning_rate": 2.8953542173463133e-06, "loss": 0.7109, "step": 6972 }, { "epoch": 0.76, "learning_rate": 2.8928733545295506e-06, "loss": 0.6597, "step": 6973 }, { "epoch": 0.76, "learning_rate": 2.8903933752775504e-06, "loss": 0.7092, "step": 6974 }, { "epoch": 0.76, "learning_rate": 2.8879142798986293e-06, "loss": 0.658, "step": 6975 }, { "epoch": 0.76, "learning_rate": 2.885436068700984e-06, "loss": 0.6506, "step": 6976 }, { "epoch": 0.76, "learning_rate": 2.8829587419927107e-06, "loss": 0.7012, "step": 6977 }, { "epoch": 0.76, "learning_rate": 2.880482300081797e-06, "loss": 0.5889, "step": 6978 }, { "epoch": 0.76, "learning_rate": 2.8780067432761105e-06, "loss": 0.7368, "step": 6979 }, { "epoch": 0.76, "learning_rate": 2.8755320718834166e-06, "loss": 0.7568, "step": 6980 }, { "epoch": 0.76, "learning_rate": 2.8730582862113743e-06, "loss": 0.6565, "step": 6981 }, { "epoch": 0.76, "learning_rate": 2.8705853865675182e-06, "loss": 0.6672, "step": 6982 }, { "epoch": 0.76, "learning_rate": 2.8681133732592847e-06, "loss": 0.6367, "step": 6983 }, { "epoch": 0.76, "learning_rate": 2.865642246593999e-06, "loss": 0.6892, "step": 6984 }, { "epoch": 0.76, "learning_rate": 2.8631720068788728e-06, "loss": 0.7898, "step": 6985 }, { "epoch": 0.76, "learning_rate": 2.8607026544210115e-06, "loss": 0.7207, "step": 6986 }, { "epoch": 0.76, "learning_rate": 2.858234189527401e-06, "loss": 0.6074, "step": 6987 }, { "epoch": 0.76, "learning_rate": 2.8557666125049268e-06, "loss": 0.5923, "step": 6988 }, { "epoch": 0.76, "learning_rate": 2.853299923660363e-06, "loss": 0.6079, "step": 6989 }, { "epoch": 0.76, "learning_rate": 2.8508341233003656e-06, "loss": 0.6252, "step": 6990 }, { "epoch": 0.76, "learning_rate": 2.8483692117314874e-06, "loss": 0.6243, "step": 6991 }, { "epoch": 0.76, "learning_rate": 2.8459051892601685e-06, "loss": 0.7158, "step": 6992 }, { "epoch": 0.76, "learning_rate": 2.84344205619274e-06, "loss": 0.6882, "step": 6993 }, { "epoch": 0.76, "learning_rate": 2.8409798128354214e-06, "loss": 0.7363, "step": 6994 }, { "epoch": 0.76, "learning_rate": 2.838518459494317e-06, "loss": 0.6252, "step": 6995 }, { "epoch": 0.76, "learning_rate": 2.8360579964754277e-06, "loss": 0.7891, "step": 6996 }, { "epoch": 0.76, "learning_rate": 2.8335984240846424e-06, "loss": 0.6335, "step": 6997 }, { "epoch": 0.76, "learning_rate": 2.831139742627732e-06, "loss": 0.6753, "step": 6998 }, { "epoch": 0.76, "learning_rate": 2.8286819524103657e-06, "loss": 0.7065, "step": 6999 }, { "epoch": 0.76, "learning_rate": 2.826225053738101e-06, "loss": 0.6221, "step": 7000 }, { "epoch": 0.76, "learning_rate": 2.8237690469163746e-06, "loss": 0.6101, "step": 7001 }, { "epoch": 0.76, "learning_rate": 2.8213139322505245e-06, "loss": 0.6609, "step": 7002 }, { "epoch": 0.76, "learning_rate": 2.818859710045773e-06, "loss": 0.6211, "step": 7003 }, { "epoch": 0.76, "learning_rate": 2.8164063806072283e-06, "loss": 0.6145, "step": 7004 }, { "epoch": 0.76, "learning_rate": 2.813953944239898e-06, "loss": 0.5801, "step": 7005 }, { "epoch": 0.76, "learning_rate": 2.8115024012486624e-06, "loss": 0.5476, "step": 7006 }, { "epoch": 0.76, "learning_rate": 2.809051751938303e-06, "loss": 0.6367, "step": 7007 }, { "epoch": 0.76, "learning_rate": 2.8066019966134907e-06, "loss": 0.7244, "step": 7008 }, { "epoch": 0.76, "learning_rate": 2.8041531355787756e-06, "loss": 0.719, "step": 7009 }, { "epoch": 0.76, "learning_rate": 2.8017051691386045e-06, "loss": 0.6094, "step": 7010 }, { "epoch": 0.76, "learning_rate": 2.7992580975973136e-06, "loss": 0.6433, "step": 7011 }, { "epoch": 0.76, "learning_rate": 2.796811921259117e-06, "loss": 0.7764, "step": 7012 }, { "epoch": 0.76, "learning_rate": 2.794366640428138e-06, "loss": 0.6611, "step": 7013 }, { "epoch": 0.76, "learning_rate": 2.7919222554083667e-06, "loss": 0.7053, "step": 7014 }, { "epoch": 0.76, "learning_rate": 2.7894787665036936e-06, "loss": 0.6868, "step": 7015 }, { "epoch": 0.76, "learning_rate": 2.7870361740179007e-06, "loss": 0.6426, "step": 7016 }, { "epoch": 0.76, "learning_rate": 2.7845944782546453e-06, "loss": 0.6292, "step": 7017 }, { "epoch": 0.76, "learning_rate": 2.7821536795174855e-06, "loss": 0.6873, "step": 7018 }, { "epoch": 0.76, "learning_rate": 2.779713778109867e-06, "loss": 0.7148, "step": 7019 }, { "epoch": 0.76, "learning_rate": 2.7772747743351136e-06, "loss": 0.6843, "step": 7020 }, { "epoch": 0.76, "learning_rate": 2.774836668496448e-06, "loss": 0.551, "step": 7021 }, { "epoch": 0.76, "learning_rate": 2.7723994608969775e-06, "loss": 0.7124, "step": 7022 }, { "epoch": 0.76, "learning_rate": 2.7699631518396985e-06, "loss": 0.7065, "step": 7023 }, { "epoch": 0.76, "learning_rate": 2.7675277416274993e-06, "loss": 0.6826, "step": 7024 }, { "epoch": 0.76, "learning_rate": 2.765093230563144e-06, "loss": 0.574, "step": 7025 }, { "epoch": 0.76, "learning_rate": 2.7626596189492983e-06, "loss": 0.6646, "step": 7026 }, { "epoch": 0.76, "learning_rate": 2.7602269070885134e-06, "loss": 0.7283, "step": 7027 }, { "epoch": 0.77, "learning_rate": 2.757795095283221e-06, "loss": 0.7083, "step": 7028 }, { "epoch": 0.77, "learning_rate": 2.755364183835748e-06, "loss": 0.7212, "step": 7029 }, { "epoch": 0.77, "learning_rate": 2.7529341730483115e-06, "loss": 0.7178, "step": 7030 }, { "epoch": 0.77, "learning_rate": 2.7505050632230047e-06, "loss": 0.7617, "step": 7031 }, { "epoch": 0.77, "learning_rate": 2.7480768546618263e-06, "loss": 0.6763, "step": 7032 }, { "epoch": 0.77, "learning_rate": 2.7456495476666466e-06, "loss": 0.6519, "step": 7033 }, { "epoch": 0.77, "learning_rate": 2.743223142539233e-06, "loss": 0.6914, "step": 7034 }, { "epoch": 0.77, "learning_rate": 2.7407976395812417e-06, "loss": 0.6992, "step": 7035 }, { "epoch": 0.77, "learning_rate": 2.7383730390942075e-06, "loss": 0.7266, "step": 7036 }, { "epoch": 0.77, "learning_rate": 2.7359493413795623e-06, "loss": 0.7393, "step": 7037 }, { "epoch": 0.77, "learning_rate": 2.733526546738624e-06, "loss": 0.71, "step": 7038 }, { "epoch": 0.77, "learning_rate": 2.7311046554725928e-06, "loss": 0.6968, "step": 7039 }, { "epoch": 0.77, "learning_rate": 2.728683667882562e-06, "loss": 0.6665, "step": 7040 }, { "epoch": 0.77, "learning_rate": 2.726263584269513e-06, "loss": 0.6299, "step": 7041 }, { "epoch": 0.77, "learning_rate": 2.7238444049343114e-06, "loss": 0.7256, "step": 7042 }, { "epoch": 0.77, "learning_rate": 2.7214261301777143e-06, "loss": 0.5925, "step": 7043 }, { "epoch": 0.77, "learning_rate": 2.719008760300359e-06, "loss": 0.7859, "step": 7044 }, { "epoch": 0.77, "learning_rate": 2.716592295602778e-06, "loss": 0.6836, "step": 7045 }, { "epoch": 0.77, "learning_rate": 2.714176736385392e-06, "loss": 0.7319, "step": 7046 }, { "epoch": 0.77, "learning_rate": 2.7117620829484994e-06, "loss": 0.6497, "step": 7047 }, { "epoch": 0.77, "learning_rate": 2.7093483355922934e-06, "loss": 0.6438, "step": 7048 }, { "epoch": 0.77, "learning_rate": 2.706935494616859e-06, "loss": 0.6729, "step": 7049 }, { "epoch": 0.77, "learning_rate": 2.7045235603221533e-06, "loss": 0.7166, "step": 7050 }, { "epoch": 0.77, "learning_rate": 2.70211253300804e-06, "loss": 0.6758, "step": 7051 }, { "epoch": 0.77, "learning_rate": 2.6997024129742544e-06, "loss": 0.7622, "step": 7052 }, { "epoch": 0.77, "learning_rate": 2.6972932005204267e-06, "loss": 0.7617, "step": 7053 }, { "epoch": 0.77, "learning_rate": 2.694884895946075e-06, "loss": 0.7173, "step": 7054 }, { "epoch": 0.77, "learning_rate": 2.6924774995505963e-06, "loss": 0.7102, "step": 7055 }, { "epoch": 0.77, "learning_rate": 2.690071011633284e-06, "loss": 0.7617, "step": 7056 }, { "epoch": 0.77, "learning_rate": 2.687665432493317e-06, "loss": 0.6101, "step": 7057 }, { "epoch": 0.77, "learning_rate": 2.6852607624297533e-06, "loss": 0.6152, "step": 7058 }, { "epoch": 0.77, "learning_rate": 2.6828570017415477e-06, "loss": 0.7544, "step": 7059 }, { "epoch": 0.77, "learning_rate": 2.6804541507275373e-06, "loss": 0.7068, "step": 7060 }, { "epoch": 0.77, "learning_rate": 2.678052209686448e-06, "loss": 0.5723, "step": 7061 }, { "epoch": 0.77, "learning_rate": 2.6756511789168926e-06, "loss": 0.7085, "step": 7062 }, { "epoch": 0.77, "learning_rate": 2.6732510587173645e-06, "loss": 0.7102, "step": 7063 }, { "epoch": 0.77, "learning_rate": 2.670851849386251e-06, "loss": 0.7402, "step": 7064 }, { "epoch": 0.77, "learning_rate": 2.668453551221829e-06, "loss": 0.7844, "step": 7065 }, { "epoch": 0.77, "learning_rate": 2.666056164522249e-06, "loss": 0.7471, "step": 7066 }, { "epoch": 0.77, "learning_rate": 2.6636596895855617e-06, "loss": 0.6372, "step": 7067 }, { "epoch": 0.77, "learning_rate": 2.6612641267097005e-06, "loss": 0.6611, "step": 7068 }, { "epoch": 0.77, "learning_rate": 2.658869476192475e-06, "loss": 0.6448, "step": 7069 }, { "epoch": 0.77, "learning_rate": 2.656475738331603e-06, "loss": 0.6536, "step": 7070 }, { "epoch": 0.77, "learning_rate": 2.6540829134246683e-06, "loss": 0.6492, "step": 7071 }, { "epoch": 0.77, "learning_rate": 2.6516910017691498e-06, "loss": 0.6641, "step": 7072 }, { "epoch": 0.77, "learning_rate": 2.6493000036624173e-06, "loss": 0.6306, "step": 7073 }, { "epoch": 0.77, "learning_rate": 2.6469099194017144e-06, "loss": 0.6533, "step": 7074 }, { "epoch": 0.77, "learning_rate": 2.644520749284183e-06, "loss": 0.676, "step": 7075 }, { "epoch": 0.77, "learning_rate": 2.6421324936068492e-06, "loss": 0.6807, "step": 7076 }, { "epoch": 0.77, "learning_rate": 2.6397451526666185e-06, "loss": 0.7332, "step": 7077 }, { "epoch": 0.77, "learning_rate": 2.6373587267602887e-06, "loss": 0.7361, "step": 7078 }, { "epoch": 0.77, "learning_rate": 2.6349732161845422e-06, "loss": 0.6431, "step": 7079 }, { "epoch": 0.77, "learning_rate": 2.6325886212359496e-06, "loss": 0.708, "step": 7080 }, { "epoch": 0.77, "learning_rate": 2.630204942210969e-06, "loss": 0.7009, "step": 7081 }, { "epoch": 0.77, "learning_rate": 2.6278221794059343e-06, "loss": 0.6621, "step": 7082 }, { "epoch": 0.77, "learning_rate": 2.6254403331170773e-06, "loss": 0.6831, "step": 7083 }, { "epoch": 0.77, "learning_rate": 2.6230594036405133e-06, "loss": 0.6611, "step": 7084 }, { "epoch": 0.77, "learning_rate": 2.620679391272236e-06, "loss": 0.7446, "step": 7085 }, { "epoch": 0.77, "learning_rate": 2.618300296308135e-06, "loss": 0.656, "step": 7086 }, { "epoch": 0.77, "learning_rate": 2.615922119043982e-06, "loss": 0.7874, "step": 7087 }, { "epoch": 0.77, "learning_rate": 2.6135448597754276e-06, "loss": 0.6086, "step": 7088 }, { "epoch": 0.77, "learning_rate": 2.611168518798026e-06, "loss": 0.6621, "step": 7089 }, { "epoch": 0.77, "learning_rate": 2.6087930964071974e-06, "loss": 0.6448, "step": 7090 }, { "epoch": 0.77, "learning_rate": 2.60641859289826e-06, "loss": 0.7886, "step": 7091 }, { "epoch": 0.77, "learning_rate": 2.6040450085664158e-06, "loss": 0.7114, "step": 7092 }, { "epoch": 0.77, "learning_rate": 2.601672343706747e-06, "loss": 0.8662, "step": 7093 }, { "epoch": 0.77, "learning_rate": 2.5993005986142273e-06, "loss": 0.7217, "step": 7094 }, { "epoch": 0.77, "learning_rate": 2.5969297735837175e-06, "loss": 0.6836, "step": 7095 }, { "epoch": 0.77, "learning_rate": 2.594559868909956e-06, "loss": 0.6414, "step": 7096 }, { "epoch": 0.77, "learning_rate": 2.592190884887573e-06, "loss": 0.634, "step": 7097 }, { "epoch": 0.77, "learning_rate": 2.5898228218110834e-06, "loss": 0.6753, "step": 7098 }, { "epoch": 0.77, "learning_rate": 2.5874556799748875e-06, "loss": 0.6748, "step": 7099 }, { "epoch": 0.77, "learning_rate": 2.585089459673272e-06, "loss": 0.6865, "step": 7100 }, { "epoch": 0.77, "learning_rate": 2.582724161200405e-06, "loss": 0.7339, "step": 7101 }, { "epoch": 0.77, "learning_rate": 2.5803597848503424e-06, "loss": 0.6863, "step": 7102 }, { "epoch": 0.77, "learning_rate": 2.57799633091703e-06, "loss": 0.6384, "step": 7103 }, { "epoch": 0.77, "learning_rate": 2.5756337996942895e-06, "loss": 0.6995, "step": 7104 }, { "epoch": 0.77, "learning_rate": 2.573272191475834e-06, "loss": 0.6782, "step": 7105 }, { "epoch": 0.77, "learning_rate": 2.5709115065552647e-06, "loss": 0.6387, "step": 7106 }, { "epoch": 0.77, "learning_rate": 2.5685517452260566e-06, "loss": 0.6694, "step": 7107 }, { "epoch": 0.77, "learning_rate": 2.5661929077815885e-06, "loss": 0.6656, "step": 7108 }, { "epoch": 0.77, "learning_rate": 2.563834994515103e-06, "loss": 0.6875, "step": 7109 }, { "epoch": 0.77, "learning_rate": 2.561478005719743e-06, "loss": 0.6333, "step": 7110 }, { "epoch": 0.77, "learning_rate": 2.5591219416885337e-06, "loss": 0.6177, "step": 7111 }, { "epoch": 0.77, "learning_rate": 2.5567668027143777e-06, "loss": 0.5962, "step": 7112 }, { "epoch": 0.77, "learning_rate": 2.554412589090071e-06, "loss": 0.6289, "step": 7113 }, { "epoch": 0.77, "learning_rate": 2.5520593011082937e-06, "loss": 0.7236, "step": 7114 }, { "epoch": 0.77, "learning_rate": 2.549706939061605e-06, "loss": 0.7129, "step": 7115 }, { "epoch": 0.77, "learning_rate": 2.5473555032424534e-06, "loss": 0.6279, "step": 7116 }, { "epoch": 0.77, "learning_rate": 2.5450049939431733e-06, "loss": 0.6697, "step": 7117 }, { "epoch": 0.77, "learning_rate": 2.542655411455982e-06, "loss": 0.7344, "step": 7118 }, { "epoch": 0.77, "learning_rate": 2.5403067560729833e-06, "loss": 0.6526, "step": 7119 }, { "epoch": 0.78, "learning_rate": 2.53795902808616e-06, "loss": 0.656, "step": 7120 }, { "epoch": 0.78, "learning_rate": 2.5356122277873873e-06, "loss": 0.7104, "step": 7121 }, { "epoch": 0.78, "learning_rate": 2.5332663554684223e-06, "loss": 0.5994, "step": 7122 }, { "epoch": 0.78, "learning_rate": 2.5309214114209026e-06, "loss": 0.6902, "step": 7123 }, { "epoch": 0.78, "learning_rate": 2.5285773959363548e-06, "loss": 0.6028, "step": 7124 }, { "epoch": 0.78, "learning_rate": 2.526234309306194e-06, "loss": 0.5896, "step": 7125 }, { "epoch": 0.78, "learning_rate": 2.5238921518217042e-06, "loss": 0.6396, "step": 7126 }, { "epoch": 0.78, "learning_rate": 2.5215509237740777e-06, "loss": 0.6875, "step": 7127 }, { "epoch": 0.78, "learning_rate": 2.519210625454369e-06, "loss": 0.6333, "step": 7128 }, { "epoch": 0.78, "learning_rate": 2.5168712571535305e-06, "loss": 0.6636, "step": 7129 }, { "epoch": 0.78, "learning_rate": 2.5145328191623952e-06, "loss": 0.6235, "step": 7130 }, { "epoch": 0.78, "learning_rate": 2.5121953117716744e-06, "loss": 0.616, "step": 7131 }, { "epoch": 0.78, "learning_rate": 2.509858735271975e-06, "loss": 0.6826, "step": 7132 }, { "epoch": 0.78, "learning_rate": 2.507523089953782e-06, "loss": 0.7363, "step": 7133 }, { "epoch": 0.78, "learning_rate": 2.5051883761074613e-06, "loss": 0.6484, "step": 7134 }, { "epoch": 0.78, "learning_rate": 2.5028545940232685e-06, "loss": 0.729, "step": 7135 }, { "epoch": 0.78, "learning_rate": 2.500521743991342e-06, "loss": 0.7617, "step": 7136 }, { "epoch": 0.78, "learning_rate": 2.4981898263017045e-06, "loss": 0.6377, "step": 7137 }, { "epoch": 0.78, "learning_rate": 2.495858841244264e-06, "loss": 0.6877, "step": 7138 }, { "epoch": 0.78, "learning_rate": 2.4935287891088065e-06, "loss": 0.7349, "step": 7139 }, { "epoch": 0.78, "learning_rate": 2.4911996701850083e-06, "loss": 0.7258, "step": 7140 }, { "epoch": 0.78, "learning_rate": 2.4888714847624295e-06, "loss": 0.5854, "step": 7141 }, { "epoch": 0.78, "learning_rate": 2.486544233130509e-06, "loss": 0.7057, "step": 7142 }, { "epoch": 0.78, "learning_rate": 2.484217915578574e-06, "loss": 0.7168, "step": 7143 }, { "epoch": 0.78, "learning_rate": 2.4818925323958375e-06, "loss": 0.6519, "step": 7144 }, { "epoch": 0.78, "learning_rate": 2.4795680838713855e-06, "loss": 0.8345, "step": 7145 }, { "epoch": 0.78, "learning_rate": 2.477244570294206e-06, "loss": 0.6685, "step": 7146 }, { "epoch": 0.78, "learning_rate": 2.474921991953153e-06, "loss": 0.6252, "step": 7147 }, { "epoch": 0.78, "learning_rate": 2.4726003491369743e-06, "loss": 0.7058, "step": 7148 }, { "epoch": 0.78, "learning_rate": 2.4702796421343012e-06, "loss": 0.5811, "step": 7149 }, { "epoch": 0.78, "learning_rate": 2.4679598712336415e-06, "loss": 0.6802, "step": 7150 }, { "epoch": 0.78, "learning_rate": 2.4656410367233928e-06, "loss": 0.6904, "step": 7151 }, { "epoch": 0.78, "learning_rate": 2.4633231388918377e-06, "loss": 0.646, "step": 7152 }, { "epoch": 0.78, "learning_rate": 2.4610061780271355e-06, "loss": 0.8267, "step": 7153 }, { "epoch": 0.78, "learning_rate": 2.4586901544173335e-06, "loss": 0.6194, "step": 7154 }, { "epoch": 0.78, "learning_rate": 2.456375068350364e-06, "loss": 0.6135, "step": 7155 }, { "epoch": 0.78, "learning_rate": 2.4540609201140386e-06, "loss": 0.6509, "step": 7156 }, { "epoch": 0.78, "learning_rate": 2.4517477099960594e-06, "loss": 0.7283, "step": 7157 }, { "epoch": 0.78, "learning_rate": 2.449435438284e-06, "loss": 0.6851, "step": 7158 }, { "epoch": 0.78, "learning_rate": 2.4471241052653283e-06, "loss": 0.571, "step": 7159 }, { "epoch": 0.78, "learning_rate": 2.444813711227393e-06, "loss": 0.6807, "step": 7160 }, { "epoch": 0.78, "learning_rate": 2.4425042564574186e-06, "loss": 0.7029, "step": 7161 }, { "epoch": 0.78, "learning_rate": 2.4401957412425213e-06, "loss": 0.6052, "step": 7162 }, { "epoch": 0.78, "learning_rate": 2.437888165869703e-06, "loss": 0.6367, "step": 7163 }, { "epoch": 0.78, "learning_rate": 2.4355815306258355e-06, "loss": 0.6384, "step": 7164 }, { "epoch": 0.78, "learning_rate": 2.433275835797687e-06, "loss": 0.7117, "step": 7165 }, { "epoch": 0.78, "learning_rate": 2.4309710816719014e-06, "loss": 0.6973, "step": 7166 }, { "epoch": 0.78, "learning_rate": 2.428667268535009e-06, "loss": 0.833, "step": 7167 }, { "epoch": 0.78, "learning_rate": 2.4263643966734253e-06, "loss": 0.6384, "step": 7168 }, { "epoch": 0.78, "learning_rate": 2.4240624663734393e-06, "loss": 0.6125, "step": 7169 }, { "epoch": 0.78, "learning_rate": 2.421761477921232e-06, "loss": 0.7295, "step": 7170 }, { "epoch": 0.78, "learning_rate": 2.4194614316028675e-06, "loss": 0.7021, "step": 7171 }, { "epoch": 0.78, "learning_rate": 2.4171623277042843e-06, "loss": 0.7456, "step": 7172 }, { "epoch": 0.78, "learning_rate": 2.4148641665113116e-06, "loss": 0.7231, "step": 7173 }, { "epoch": 0.78, "learning_rate": 2.4125669483096583e-06, "loss": 0.6052, "step": 7174 }, { "epoch": 0.78, "learning_rate": 2.410270673384918e-06, "loss": 0.6809, "step": 7175 }, { "epoch": 0.78, "learning_rate": 2.4079753420225694e-06, "loss": 0.6982, "step": 7176 }, { "epoch": 0.78, "learning_rate": 2.4056809545079617e-06, "loss": 0.7319, "step": 7177 }, { "epoch": 0.78, "learning_rate": 2.4033875111263403e-06, "loss": 0.8154, "step": 7178 }, { "epoch": 0.78, "learning_rate": 2.401095012162832e-06, "loss": 0.7114, "step": 7179 }, { "epoch": 0.78, "learning_rate": 2.3988034579024344e-06, "loss": 0.4749, "step": 7180 }, { "epoch": 0.78, "learning_rate": 2.3965128486300395e-06, "loss": 0.6816, "step": 7181 }, { "epoch": 0.78, "learning_rate": 2.394223184630422e-06, "loss": 0.6841, "step": 7182 }, { "epoch": 0.78, "learning_rate": 2.391934466188227e-06, "loss": 0.7158, "step": 7183 }, { "epoch": 0.78, "learning_rate": 2.3896466935879957e-06, "loss": 0.6633, "step": 7184 }, { "epoch": 0.78, "learning_rate": 2.387359867114144e-06, "loss": 0.7148, "step": 7185 }, { "epoch": 0.78, "learning_rate": 2.3850739870509745e-06, "loss": 0.6851, "step": 7186 }, { "epoch": 0.78, "learning_rate": 2.3827890536826703e-06, "loss": 0.6934, "step": 7187 }, { "epoch": 0.78, "learning_rate": 2.380505067293293e-06, "loss": 0.7812, "step": 7188 }, { "epoch": 0.78, "learning_rate": 2.378222028166791e-06, "loss": 0.5713, "step": 7189 }, { "epoch": 0.78, "learning_rate": 2.3759399365869985e-06, "loss": 0.6633, "step": 7190 }, { "epoch": 0.78, "learning_rate": 2.3736587928376197e-06, "loss": 0.8184, "step": 7191 }, { "epoch": 0.78, "learning_rate": 2.371378597202254e-06, "loss": 0.6797, "step": 7192 }, { "epoch": 0.78, "learning_rate": 2.3690993499643745e-06, "loss": 0.6213, "step": 7193 }, { "epoch": 0.78, "learning_rate": 2.366821051407342e-06, "loss": 0.6807, "step": 7194 }, { "epoch": 0.78, "learning_rate": 2.364543701814398e-06, "loss": 0.7471, "step": 7195 }, { "epoch": 0.78, "learning_rate": 2.362267301468659e-06, "loss": 0.7004, "step": 7196 }, { "epoch": 0.78, "learning_rate": 2.3599918506531337e-06, "loss": 0.769, "step": 7197 }, { "epoch": 0.78, "learning_rate": 2.357717349650709e-06, "loss": 0.7014, "step": 7198 }, { "epoch": 0.78, "learning_rate": 2.355443798744149e-06, "loss": 0.7827, "step": 7199 }, { "epoch": 0.78, "learning_rate": 2.3531711982161066e-06, "loss": 0.5833, "step": 7200 }, { "epoch": 0.78, "learning_rate": 2.3508995483491147e-06, "loss": 0.6694, "step": 7201 }, { "epoch": 0.78, "learning_rate": 2.348628849425584e-06, "loss": 0.6208, "step": 7202 }, { "epoch": 0.78, "learning_rate": 2.34635910172781e-06, "loss": 0.6743, "step": 7203 }, { "epoch": 0.78, "learning_rate": 2.3440903055379714e-06, "loss": 0.7109, "step": 7204 }, { "epoch": 0.78, "learning_rate": 2.341822461138128e-06, "loss": 0.7673, "step": 7205 }, { "epoch": 0.78, "learning_rate": 2.339555568810221e-06, "loss": 0.6792, "step": 7206 }, { "epoch": 0.78, "learning_rate": 2.3372896288360682e-06, "loss": 0.7244, "step": 7207 }, { "epoch": 0.78, "learning_rate": 2.3350246414973765e-06, "loss": 0.7358, "step": 7208 }, { "epoch": 0.78, "learning_rate": 2.3327606070757335e-06, "loss": 0.6287, "step": 7209 }, { "epoch": 0.78, "learning_rate": 2.3304975258526007e-06, "loss": 0.6726, "step": 7210 }, { "epoch": 0.78, "learning_rate": 2.32823539810933e-06, "loss": 0.7642, "step": 7211 }, { "epoch": 0.79, "learning_rate": 2.3259742241271497e-06, "loss": 0.6851, "step": 7212 }, { "epoch": 0.79, "learning_rate": 2.323714004187173e-06, "loss": 0.7654, "step": 7213 }, { "epoch": 0.79, "learning_rate": 2.3214547385703933e-06, "loss": 0.6299, "step": 7214 }, { "epoch": 0.79, "learning_rate": 2.3191964275576806e-06, "loss": 0.6252, "step": 7215 }, { "epoch": 0.79, "learning_rate": 2.3169390714297936e-06, "loss": 0.6841, "step": 7216 }, { "epoch": 0.79, "learning_rate": 2.3146826704673696e-06, "loss": 0.7419, "step": 7217 }, { "epoch": 0.79, "learning_rate": 2.3124272249509225e-06, "loss": 0.6245, "step": 7218 }, { "epoch": 0.79, "learning_rate": 2.310172735160854e-06, "loss": 0.6887, "step": 7219 }, { "epoch": 0.79, "learning_rate": 2.3079192013774477e-06, "loss": 0.7275, "step": 7220 }, { "epoch": 0.79, "learning_rate": 2.305666623880858e-06, "loss": 0.7708, "step": 7221 }, { "epoch": 0.79, "learning_rate": 2.3034150029511314e-06, "loss": 0.6865, "step": 7222 }, { "epoch": 0.79, "learning_rate": 2.3011643388681915e-06, "loss": 0.6763, "step": 7223 }, { "epoch": 0.79, "learning_rate": 2.2989146319118428e-06, "loss": 0.6565, "step": 7224 }, { "epoch": 0.79, "learning_rate": 2.2966658823617738e-06, "loss": 0.6687, "step": 7225 }, { "epoch": 0.79, "learning_rate": 2.2944180904975457e-06, "loss": 0.6538, "step": 7226 }, { "epoch": 0.79, "learning_rate": 2.2921712565986085e-06, "loss": 0.6853, "step": 7227 }, { "epoch": 0.79, "learning_rate": 2.2899253809442944e-06, "loss": 0.6938, "step": 7228 }, { "epoch": 0.79, "learning_rate": 2.287680463813806e-06, "loss": 0.6459, "step": 7229 }, { "epoch": 0.79, "learning_rate": 2.2854365054862383e-06, "loss": 0.5366, "step": 7230 }, { "epoch": 0.79, "learning_rate": 2.28319350624056e-06, "loss": 0.6711, "step": 7231 }, { "epoch": 0.79, "learning_rate": 2.2809514663556244e-06, "loss": 0.5759, "step": 7232 }, { "epoch": 0.79, "learning_rate": 2.2787103861101656e-06, "loss": 0.6565, "step": 7233 }, { "epoch": 0.79, "learning_rate": 2.276470265782793e-06, "loss": 0.6897, "step": 7234 }, { "epoch": 0.79, "learning_rate": 2.2742311056520017e-06, "loss": 0.7007, "step": 7235 }, { "epoch": 0.79, "learning_rate": 2.27199290599617e-06, "loss": 0.7266, "step": 7236 }, { "epoch": 0.79, "learning_rate": 2.2697556670935472e-06, "loss": 0.6985, "step": 7237 }, { "epoch": 0.79, "learning_rate": 2.2675193892222714e-06, "loss": 0.7449, "step": 7238 }, { "epoch": 0.79, "learning_rate": 2.265284072660362e-06, "loss": 0.7332, "step": 7239 }, { "epoch": 0.79, "learning_rate": 2.2630497176857105e-06, "loss": 0.6614, "step": 7240 }, { "epoch": 0.79, "learning_rate": 2.260816324576095e-06, "loss": 0.6063, "step": 7241 }, { "epoch": 0.79, "learning_rate": 2.2585838936091753e-06, "loss": 0.6257, "step": 7242 }, { "epoch": 0.79, "learning_rate": 2.256352425062488e-06, "loss": 0.6553, "step": 7243 }, { "epoch": 0.79, "learning_rate": 2.2541219192134554e-06, "loss": 0.6792, "step": 7244 }, { "epoch": 0.79, "learning_rate": 2.2518923763393687e-06, "loss": 0.6545, "step": 7245 }, { "epoch": 0.79, "learning_rate": 2.2496637967174104e-06, "loss": 0.686, "step": 7246 }, { "epoch": 0.79, "learning_rate": 2.247436180624644e-06, "loss": 0.6672, "step": 7247 }, { "epoch": 0.79, "learning_rate": 2.2452095283380004e-06, "loss": 0.7727, "step": 7248 }, { "epoch": 0.79, "learning_rate": 2.2429838401343053e-06, "loss": 0.7512, "step": 7249 }, { "epoch": 0.79, "learning_rate": 2.2407591162902576e-06, "loss": 0.7793, "step": 7250 }, { "epoch": 0.79, "learning_rate": 2.2385353570824308e-06, "loss": 0.7065, "step": 7251 }, { "epoch": 0.79, "learning_rate": 2.236312562787296e-06, "loss": 0.7175, "step": 7252 }, { "epoch": 0.79, "learning_rate": 2.2340907336811836e-06, "loss": 0.7151, "step": 7253 }, { "epoch": 0.79, "learning_rate": 2.2318698700403174e-06, "loss": 0.6396, "step": 7254 }, { "epoch": 0.79, "learning_rate": 2.2296499721407995e-06, "loss": 0.6741, "step": 7255 }, { "epoch": 0.79, "learning_rate": 2.2274310402586042e-06, "loss": 0.678, "step": 7256 }, { "epoch": 0.79, "learning_rate": 2.2252130746695945e-06, "loss": 0.6858, "step": 7257 }, { "epoch": 0.79, "learning_rate": 2.222996075649513e-06, "loss": 0.7485, "step": 7258 }, { "epoch": 0.79, "learning_rate": 2.2207800434739722e-06, "loss": 0.6631, "step": 7259 }, { "epoch": 0.79, "learning_rate": 2.218564978418475e-06, "loss": 0.6494, "step": 7260 }, { "epoch": 0.79, "learning_rate": 2.2163508807584e-06, "loss": 0.7188, "step": 7261 }, { "epoch": 0.79, "learning_rate": 2.2141377507690064e-06, "loss": 0.6091, "step": 7262 }, { "epoch": 0.79, "learning_rate": 2.2119255887254355e-06, "loss": 0.6631, "step": 7263 }, { "epoch": 0.79, "learning_rate": 2.209714394902699e-06, "loss": 0.7466, "step": 7264 }, { "epoch": 0.79, "learning_rate": 2.207504169575698e-06, "loss": 0.7034, "step": 7265 }, { "epoch": 0.79, "learning_rate": 2.2052949130192136e-06, "loss": 0.6975, "step": 7266 }, { "epoch": 0.79, "learning_rate": 2.203086625507895e-06, "loss": 0.6987, "step": 7267 }, { "epoch": 0.79, "learning_rate": 2.2008793073162825e-06, "loss": 0.6748, "step": 7268 }, { "epoch": 0.79, "learning_rate": 2.198672958718796e-06, "loss": 0.5989, "step": 7269 }, { "epoch": 0.79, "learning_rate": 2.1964675799897206e-06, "loss": 0.77, "step": 7270 }, { "epoch": 0.79, "learning_rate": 2.1942631714032426e-06, "loss": 0.6626, "step": 7271 }, { "epoch": 0.79, "learning_rate": 2.192059733233408e-06, "loss": 0.7666, "step": 7272 }, { "epoch": 0.79, "learning_rate": 2.189857265754154e-06, "loss": 0.771, "step": 7273 }, { "epoch": 0.79, "learning_rate": 2.1876557692392942e-06, "loss": 0.7793, "step": 7274 }, { "epoch": 0.79, "learning_rate": 2.1854552439625175e-06, "loss": 0.5938, "step": 7275 }, { "epoch": 0.79, "learning_rate": 2.1832556901973967e-06, "loss": 0.7749, "step": 7276 }, { "epoch": 0.79, "learning_rate": 2.181057108217386e-06, "loss": 0.8071, "step": 7277 }, { "epoch": 0.79, "learning_rate": 2.1788594982958087e-06, "loss": 0.647, "step": 7278 }, { "epoch": 0.79, "learning_rate": 2.1766628607058772e-06, "loss": 0.6328, "step": 7279 }, { "epoch": 0.79, "learning_rate": 2.1744671957206796e-06, "loss": 0.6216, "step": 7280 }, { "epoch": 0.79, "learning_rate": 2.172272503613183e-06, "loss": 0.6038, "step": 7281 }, { "epoch": 0.79, "learning_rate": 2.1700787846562353e-06, "loss": 0.7319, "step": 7282 }, { "epoch": 0.79, "learning_rate": 2.1678860391225588e-06, "loss": 0.7041, "step": 7283 }, { "epoch": 0.79, "learning_rate": 2.165694267284757e-06, "loss": 0.7549, "step": 7284 }, { "epoch": 0.79, "learning_rate": 2.1635034694153188e-06, "loss": 0.7549, "step": 7285 }, { "epoch": 0.79, "learning_rate": 2.161313645786599e-06, "loss": 0.7412, "step": 7286 }, { "epoch": 0.79, "learning_rate": 2.159124796670843e-06, "loss": 0.7524, "step": 7287 }, { "epoch": 0.79, "learning_rate": 2.1569369223401713e-06, "loss": 0.7585, "step": 7288 }, { "epoch": 0.79, "learning_rate": 2.154750023066576e-06, "loss": 0.7402, "step": 7289 }, { "epoch": 0.79, "learning_rate": 2.152564099121944e-06, "loss": 0.7085, "step": 7290 }, { "epoch": 0.79, "learning_rate": 2.150379150778025e-06, "loss": 0.6599, "step": 7291 }, { "epoch": 0.79, "learning_rate": 2.148195178306455e-06, "loss": 0.6736, "step": 7292 }, { "epoch": 0.79, "learning_rate": 2.1460121819787516e-06, "loss": 0.6367, "step": 7293 }, { "epoch": 0.79, "learning_rate": 2.1438301620662994e-06, "loss": 0.7026, "step": 7294 }, { "epoch": 0.79, "learning_rate": 2.1416491188403745e-06, "loss": 0.6531, "step": 7295 }, { "epoch": 0.79, "learning_rate": 2.1394690525721275e-06, "loss": 0.7339, "step": 7296 }, { "epoch": 0.79, "learning_rate": 2.1372899635325804e-06, "loss": 0.5303, "step": 7297 }, { "epoch": 0.79, "learning_rate": 2.135111851992645e-06, "loss": 0.6675, "step": 7298 }, { "epoch": 0.79, "learning_rate": 2.132934718223103e-06, "loss": 0.7219, "step": 7299 }, { "epoch": 0.79, "learning_rate": 2.130758562494619e-06, "loss": 0.707, "step": 7300 }, { "epoch": 0.79, "learning_rate": 2.128583385077738e-06, "loss": 0.6658, "step": 7301 }, { "epoch": 0.79, "learning_rate": 2.1264091862428737e-06, "loss": 0.7375, "step": 7302 }, { "epoch": 0.8, "learning_rate": 2.1242359662603285e-06, "loss": 0.7114, "step": 7303 }, { "epoch": 0.8, "learning_rate": 2.122063725400282e-06, "loss": 0.7793, "step": 7304 }, { "epoch": 0.8, "learning_rate": 2.119892463932781e-06, "loss": 0.5977, "step": 7305 }, { "epoch": 0.8, "learning_rate": 2.117722182127765e-06, "loss": 0.7363, "step": 7306 }, { "epoch": 0.8, "learning_rate": 2.1155528802550474e-06, "loss": 0.6987, "step": 7307 }, { "epoch": 0.8, "learning_rate": 2.113384558584307e-06, "loss": 0.8081, "step": 7308 }, { "epoch": 0.8, "learning_rate": 2.1112172173851263e-06, "loss": 0.7004, "step": 7309 }, { "epoch": 0.8, "learning_rate": 2.1090508569269406e-06, "loss": 0.7036, "step": 7310 }, { "epoch": 0.8, "learning_rate": 2.1068854774790783e-06, "loss": 0.6887, "step": 7311 }, { "epoch": 0.8, "learning_rate": 2.104721079310743e-06, "loss": 0.7524, "step": 7312 }, { "epoch": 0.8, "learning_rate": 2.1025576626910094e-06, "loss": 0.5928, "step": 7313 }, { "epoch": 0.8, "learning_rate": 2.1003952278888382e-06, "loss": 0.6335, "step": 7314 }, { "epoch": 0.8, "learning_rate": 2.0982337751730686e-06, "loss": 0.6345, "step": 7315 }, { "epoch": 0.8, "learning_rate": 2.0960733048124082e-06, "loss": 0.6365, "step": 7316 }, { "epoch": 0.8, "learning_rate": 2.0939138170754524e-06, "loss": 0.5896, "step": 7317 }, { "epoch": 0.8, "learning_rate": 2.09175531223067e-06, "loss": 0.6797, "step": 7318 }, { "epoch": 0.8, "learning_rate": 2.089597790546409e-06, "loss": 0.7002, "step": 7319 }, { "epoch": 0.8, "learning_rate": 2.087441252290897e-06, "loss": 0.7144, "step": 7320 }, { "epoch": 0.8, "learning_rate": 2.0852856977322323e-06, "loss": 0.7114, "step": 7321 }, { "epoch": 0.8, "learning_rate": 2.083131127138396e-06, "loss": 0.7605, "step": 7322 }, { "epoch": 0.8, "learning_rate": 2.0809775407772505e-06, "loss": 0.8213, "step": 7323 }, { "epoch": 0.8, "learning_rate": 2.0788249389165273e-06, "loss": 0.6448, "step": 7324 }, { "epoch": 0.8, "learning_rate": 2.0766733218238412e-06, "loss": 0.71, "step": 7325 }, { "epoch": 0.8, "learning_rate": 2.0745226897666858e-06, "loss": 0.688, "step": 7326 }, { "epoch": 0.8, "learning_rate": 2.072373043012422e-06, "loss": 0.7788, "step": 7327 }, { "epoch": 0.8, "learning_rate": 2.0702243818283075e-06, "loss": 0.7295, "step": 7328 }, { "epoch": 0.8, "learning_rate": 2.0680767064814566e-06, "loss": 0.5825, "step": 7329 }, { "epoch": 0.8, "learning_rate": 2.0659300172388742e-06, "loss": 0.6113, "step": 7330 }, { "epoch": 0.8, "learning_rate": 2.063784314367441e-06, "loss": 0.7622, "step": 7331 }, { "epoch": 0.8, "learning_rate": 2.0616395981339076e-06, "loss": 0.5894, "step": 7332 }, { "epoch": 0.8, "learning_rate": 2.0594958688049093e-06, "loss": 0.623, "step": 7333 }, { "epoch": 0.8, "learning_rate": 2.057353126646959e-06, "loss": 0.6221, "step": 7334 }, { "epoch": 0.8, "learning_rate": 2.05521137192644e-06, "loss": 0.7412, "step": 7335 }, { "epoch": 0.8, "learning_rate": 2.0530706049096206e-06, "loss": 0.749, "step": 7336 }, { "epoch": 0.8, "learning_rate": 2.0509308258626404e-06, "loss": 0.6973, "step": 7337 }, { "epoch": 0.8, "learning_rate": 2.048792035051521e-06, "loss": 0.6296, "step": 7338 }, { "epoch": 0.8, "learning_rate": 2.046654232742161e-06, "loss": 0.644, "step": 7339 }, { "epoch": 0.8, "learning_rate": 2.044517419200329e-06, "loss": 0.6665, "step": 7340 }, { "epoch": 0.8, "learning_rate": 2.0423815946916783e-06, "loss": 0.5837, "step": 7341 }, { "epoch": 0.8, "learning_rate": 2.040246759481739e-06, "loss": 0.7986, "step": 7342 }, { "epoch": 0.8, "learning_rate": 2.0381129138359103e-06, "loss": 0.7112, "step": 7343 }, { "epoch": 0.8, "learning_rate": 2.0359800580194766e-06, "loss": 0.6423, "step": 7344 }, { "epoch": 0.8, "learning_rate": 2.0338481922975993e-06, "loss": 0.5486, "step": 7345 }, { "epoch": 0.8, "learning_rate": 2.0317173169353066e-06, "loss": 0.709, "step": 7346 }, { "epoch": 0.8, "learning_rate": 2.0295874321975206e-06, "loss": 0.7971, "step": 7347 }, { "epoch": 0.8, "learning_rate": 2.027458538349024e-06, "loss": 0.7068, "step": 7348 }, { "epoch": 0.8, "learning_rate": 2.0253306356544843e-06, "loss": 0.7681, "step": 7349 }, { "epoch": 0.8, "learning_rate": 2.0232037243784475e-06, "loss": 0.7383, "step": 7350 }, { "epoch": 0.8, "learning_rate": 2.0210778047853287e-06, "loss": 0.645, "step": 7351 }, { "epoch": 0.8, "learning_rate": 2.018952877139425e-06, "loss": 0.7446, "step": 7352 }, { "epoch": 0.8, "learning_rate": 2.0168289417049137e-06, "loss": 0.5852, "step": 7353 }, { "epoch": 0.8, "learning_rate": 2.0147059987458382e-06, "loss": 0.7749, "step": 7354 }, { "epoch": 0.8, "learning_rate": 2.0125840485261283e-06, "loss": 0.6052, "step": 7355 }, { "epoch": 0.8, "learning_rate": 2.010463091309587e-06, "loss": 0.6296, "step": 7356 }, { "epoch": 0.8, "learning_rate": 2.008343127359893e-06, "loss": 0.6633, "step": 7357 }, { "epoch": 0.8, "learning_rate": 2.006224156940605e-06, "loss": 0.7449, "step": 7358 }, { "epoch": 0.8, "learning_rate": 2.004106180315151e-06, "loss": 0.71, "step": 7359 }, { "epoch": 0.8, "learning_rate": 2.001989197746841e-06, "loss": 0.6365, "step": 7360 }, { "epoch": 0.8, "learning_rate": 1.9998732094988637e-06, "loss": 0.6802, "step": 7361 }, { "epoch": 0.8, "learning_rate": 1.9977582158342757e-06, "loss": 0.678, "step": 7362 }, { "epoch": 0.8, "learning_rate": 1.995644217016017e-06, "loss": 0.7319, "step": 7363 }, { "epoch": 0.8, "learning_rate": 1.993531213306905e-06, "loss": 0.7644, "step": 7364 }, { "epoch": 0.8, "learning_rate": 1.9914192049696235e-06, "loss": 0.7388, "step": 7365 }, { "epoch": 0.8, "learning_rate": 1.989308192266748e-06, "loss": 0.6482, "step": 7366 }, { "epoch": 0.8, "learning_rate": 1.987198175460715e-06, "loss": 0.7185, "step": 7367 }, { "epoch": 0.8, "learning_rate": 1.9850891548138463e-06, "loss": 0.7139, "step": 7368 }, { "epoch": 0.8, "learning_rate": 1.9829811305883396e-06, "loss": 0.6069, "step": 7369 }, { "epoch": 0.8, "learning_rate": 1.980874103046262e-06, "loss": 0.7671, "step": 7370 }, { "epoch": 0.8, "learning_rate": 1.9787680724495617e-06, "loss": 0.7266, "step": 7371 }, { "epoch": 0.8, "learning_rate": 1.976663039060068e-06, "loss": 0.7056, "step": 7372 }, { "epoch": 0.8, "learning_rate": 1.9745590031394735e-06, "loss": 0.6782, "step": 7373 }, { "epoch": 0.8, "learning_rate": 1.9724559649493567e-06, "loss": 0.5947, "step": 7374 }, { "epoch": 0.8, "learning_rate": 1.9703539247511695e-06, "loss": 0.7051, "step": 7375 }, { "epoch": 0.8, "learning_rate": 1.9682528828062397e-06, "loss": 0.6655, "step": 7376 }, { "epoch": 0.8, "learning_rate": 1.9661528393757744e-06, "loss": 0.6069, "step": 7377 }, { "epoch": 0.8, "learning_rate": 1.964053794720846e-06, "loss": 0.5981, "step": 7378 }, { "epoch": 0.8, "learning_rate": 1.9619557491024134e-06, "loss": 0.6453, "step": 7379 }, { "epoch": 0.8, "learning_rate": 1.95985870278131e-06, "loss": 0.6562, "step": 7380 }, { "epoch": 0.8, "learning_rate": 1.9577626560182372e-06, "loss": 0.7417, "step": 7381 }, { "epoch": 0.8, "learning_rate": 1.9556676090737803e-06, "loss": 0.6724, "step": 7382 }, { "epoch": 0.8, "learning_rate": 1.9535735622083996e-06, "loss": 0.7603, "step": 7383 }, { "epoch": 0.8, "learning_rate": 1.9514805156824223e-06, "loss": 0.6262, "step": 7384 }, { "epoch": 0.8, "learning_rate": 1.9493884697560683e-06, "loss": 0.678, "step": 7385 }, { "epoch": 0.8, "learning_rate": 1.947297424689414e-06, "loss": 0.6372, "step": 7386 }, { "epoch": 0.8, "learning_rate": 1.9452073807424232e-06, "loss": 0.6277, "step": 7387 }, { "epoch": 0.8, "learning_rate": 1.943118338174935e-06, "loss": 0.551, "step": 7388 }, { "epoch": 0.8, "learning_rate": 1.9410302972466554e-06, "loss": 0.7065, "step": 7389 }, { "epoch": 0.8, "learning_rate": 1.938943258217174e-06, "loss": 0.7004, "step": 7390 }, { "epoch": 0.8, "learning_rate": 1.936857221345957e-06, "loss": 0.6707, "step": 7391 }, { "epoch": 0.8, "learning_rate": 1.9347721868923376e-06, "loss": 0.53, "step": 7392 }, { "epoch": 0.8, "learning_rate": 1.9326881551155307e-06, "loss": 0.5178, "step": 7393 }, { "epoch": 0.8, "learning_rate": 1.930605126274625e-06, "loss": 0.614, "step": 7394 }, { "epoch": 0.81, "learning_rate": 1.9285231006285855e-06, "loss": 0.6262, "step": 7395 }, { "epoch": 0.81, "learning_rate": 1.926442078436255e-06, "loss": 0.6841, "step": 7396 }, { "epoch": 0.81, "learning_rate": 1.9243620599563407e-06, "loss": 0.7698, "step": 7397 }, { "epoch": 0.81, "learning_rate": 1.9222830454474363e-06, "loss": 0.6658, "step": 7398 }, { "epoch": 0.81, "learning_rate": 1.920205035168009e-06, "loss": 0.7227, "step": 7399 }, { "epoch": 0.81, "learning_rate": 1.918128029376396e-06, "loss": 0.7578, "step": 7400 }, { "epoch": 0.81, "learning_rate": 1.9160520283308115e-06, "loss": 0.6316, "step": 7401 }, { "epoch": 0.81, "learning_rate": 1.9139770322893523e-06, "loss": 0.7295, "step": 7402 }, { "epoch": 0.81, "learning_rate": 1.911903041509976e-06, "loss": 0.6711, "step": 7403 }, { "epoch": 0.81, "learning_rate": 1.9098300562505266e-06, "loss": 0.7524, "step": 7404 }, { "epoch": 0.81, "learning_rate": 1.90775807676872e-06, "loss": 0.6807, "step": 7405 }, { "epoch": 0.81, "learning_rate": 1.9056871033221458e-06, "loss": 0.6885, "step": 7406 }, { "epoch": 0.81, "learning_rate": 1.9036171361682732e-06, "loss": 0.6238, "step": 7407 }, { "epoch": 0.81, "learning_rate": 1.9015481755644362e-06, "loss": 0.7896, "step": 7408 }, { "epoch": 0.81, "learning_rate": 1.899480221767852e-06, "loss": 0.6414, "step": 7409 }, { "epoch": 0.81, "learning_rate": 1.8974132750356156e-06, "loss": 0.6782, "step": 7410 }, { "epoch": 0.81, "learning_rate": 1.8953473356246842e-06, "loss": 0.6238, "step": 7411 }, { "epoch": 0.81, "learning_rate": 1.8932824037919006e-06, "loss": 0.7026, "step": 7412 }, { "epoch": 0.81, "learning_rate": 1.8912184797939803e-06, "loss": 0.6785, "step": 7413 }, { "epoch": 0.81, "learning_rate": 1.8891555638875115e-06, "loss": 0.7104, "step": 7414 }, { "epoch": 0.81, "learning_rate": 1.8870936563289598e-06, "loss": 0.6323, "step": 7415 }, { "epoch": 0.81, "learning_rate": 1.8850327573746584e-06, "loss": 0.6819, "step": 7416 }, { "epoch": 0.81, "learning_rate": 1.8829728672808246e-06, "loss": 0.6982, "step": 7417 }, { "epoch": 0.81, "learning_rate": 1.8809139863035452e-06, "loss": 0.6697, "step": 7418 }, { "epoch": 0.81, "learning_rate": 1.8788561146987805e-06, "loss": 0.6978, "step": 7419 }, { "epoch": 0.81, "learning_rate": 1.8767992527223677e-06, "loss": 0.7151, "step": 7420 }, { "epoch": 0.81, "learning_rate": 1.8747434006300213e-06, "loss": 0.6516, "step": 7421 }, { "epoch": 0.81, "learning_rate": 1.8726885586773213e-06, "loss": 0.7896, "step": 7422 }, { "epoch": 0.81, "learning_rate": 1.87063472711973e-06, "loss": 0.7356, "step": 7423 }, { "epoch": 0.81, "learning_rate": 1.868581906212581e-06, "loss": 0.6777, "step": 7424 }, { "epoch": 0.81, "learning_rate": 1.8665300962110844e-06, "loss": 0.7603, "step": 7425 }, { "epoch": 0.81, "learning_rate": 1.8644792973703252e-06, "loss": 0.6663, "step": 7426 }, { "epoch": 0.81, "learning_rate": 1.8624295099452561e-06, "loss": 0.7441, "step": 7427 }, { "epoch": 0.81, "learning_rate": 1.8603807341907099e-06, "loss": 0.5784, "step": 7428 }, { "epoch": 0.81, "learning_rate": 1.858332970361395e-06, "loss": 0.7168, "step": 7429 }, { "epoch": 0.81, "learning_rate": 1.8562862187118879e-06, "loss": 0.6331, "step": 7430 }, { "epoch": 0.81, "learning_rate": 1.854240479496643e-06, "loss": 0.6609, "step": 7431 }, { "epoch": 0.81, "learning_rate": 1.8521957529699909e-06, "loss": 0.7664, "step": 7432 }, { "epoch": 0.81, "learning_rate": 1.8501520393861317e-06, "loss": 0.6445, "step": 7433 }, { "epoch": 0.81, "learning_rate": 1.8481093389991466e-06, "loss": 0.6516, "step": 7434 }, { "epoch": 0.81, "learning_rate": 1.8460676520629794e-06, "loss": 0.6277, "step": 7435 }, { "epoch": 0.81, "learning_rate": 1.844026978831457e-06, "loss": 0.687, "step": 7436 }, { "epoch": 0.81, "learning_rate": 1.8419873195582815e-06, "loss": 0.5825, "step": 7437 }, { "epoch": 0.81, "learning_rate": 1.8399486744970185e-06, "loss": 0.8027, "step": 7438 }, { "epoch": 0.81, "learning_rate": 1.8379110439011193e-06, "loss": 0.79, "step": 7439 }, { "epoch": 0.81, "learning_rate": 1.8358744280239048e-06, "loss": 0.7651, "step": 7440 }, { "epoch": 0.81, "learning_rate": 1.8338388271185648e-06, "loss": 0.7319, "step": 7441 }, { "epoch": 0.81, "learning_rate": 1.8318042414381687e-06, "loss": 0.6802, "step": 7442 }, { "epoch": 0.81, "learning_rate": 1.8297706712356588e-06, "loss": 0.7246, "step": 7443 }, { "epoch": 0.81, "learning_rate": 1.8277381167638508e-06, "loss": 0.72, "step": 7444 }, { "epoch": 0.81, "learning_rate": 1.8257065782754357e-06, "loss": 0.7166, "step": 7445 }, { "epoch": 0.81, "learning_rate": 1.8236760560229715e-06, "loss": 0.7114, "step": 7446 }, { "epoch": 0.81, "learning_rate": 1.8216465502588964e-06, "loss": 0.6711, "step": 7447 }, { "epoch": 0.81, "learning_rate": 1.8196180612355252e-06, "loss": 0.5999, "step": 7448 }, { "epoch": 0.81, "learning_rate": 1.817590589205035e-06, "loss": 0.752, "step": 7449 }, { "epoch": 0.81, "learning_rate": 1.8155641344194852e-06, "loss": 0.7363, "step": 7450 }, { "epoch": 0.81, "learning_rate": 1.8135386971308066e-06, "loss": 0.7324, "step": 7451 }, { "epoch": 0.81, "learning_rate": 1.8115142775908046e-06, "loss": 0.6611, "step": 7452 }, { "epoch": 0.81, "learning_rate": 1.8094908760511599e-06, "loss": 0.7808, "step": 7453 }, { "epoch": 0.81, "learning_rate": 1.8074684927634167e-06, "loss": 0.6716, "step": 7454 }, { "epoch": 0.81, "learning_rate": 1.805447127979003e-06, "loss": 0.7236, "step": 7455 }, { "epoch": 0.81, "learning_rate": 1.803426781949219e-06, "loss": 0.6704, "step": 7456 }, { "epoch": 0.81, "learning_rate": 1.8014074549252325e-06, "loss": 0.668, "step": 7457 }, { "epoch": 0.81, "learning_rate": 1.7993891471580894e-06, "loss": 0.7424, "step": 7458 }, { "epoch": 0.81, "learning_rate": 1.79737185889871e-06, "loss": 0.7783, "step": 7459 }, { "epoch": 0.81, "learning_rate": 1.7953555903978815e-06, "loss": 0.6433, "step": 7460 }, { "epoch": 0.81, "learning_rate": 1.7933403419062689e-06, "loss": 0.6516, "step": 7461 }, { "epoch": 0.81, "learning_rate": 1.791326113674412e-06, "loss": 0.6641, "step": 7462 }, { "epoch": 0.81, "learning_rate": 1.7893129059527214e-06, "loss": 0.6648, "step": 7463 }, { "epoch": 0.81, "learning_rate": 1.7873007189914816e-06, "loss": 0.6951, "step": 7464 }, { "epoch": 0.81, "learning_rate": 1.7852895530408465e-06, "loss": 0.5789, "step": 7465 }, { "epoch": 0.81, "learning_rate": 1.7832794083508476e-06, "loss": 0.6912, "step": 7466 }, { "epoch": 0.81, "learning_rate": 1.7812702851713904e-06, "loss": 0.6831, "step": 7467 }, { "epoch": 0.81, "learning_rate": 1.7792621837522472e-06, "loss": 0.7134, "step": 7468 }, { "epoch": 0.81, "learning_rate": 1.7772551043430686e-06, "loss": 0.7144, "step": 7469 }, { "epoch": 0.81, "learning_rate": 1.7752490471933769e-06, "loss": 0.5933, "step": 7470 }, { "epoch": 0.81, "learning_rate": 1.7732440125525675e-06, "loss": 0.7219, "step": 7471 }, { "epoch": 0.81, "learning_rate": 1.7712400006699094e-06, "loss": 0.626, "step": 7472 }, { "epoch": 0.81, "learning_rate": 1.76923701179454e-06, "loss": 0.7915, "step": 7473 }, { "epoch": 0.81, "learning_rate": 1.767235046175474e-06, "loss": 0.7192, "step": 7474 }, { "epoch": 0.81, "learning_rate": 1.7652341040616006e-06, "loss": 0.6038, "step": 7475 }, { "epoch": 0.81, "learning_rate": 1.7632341857016733e-06, "loss": 0.709, "step": 7476 }, { "epoch": 0.81, "learning_rate": 1.7612352913443265e-06, "loss": 0.575, "step": 7477 }, { "epoch": 0.81, "learning_rate": 1.7592374212380691e-06, "loss": 0.7954, "step": 7478 }, { "epoch": 0.81, "learning_rate": 1.7572405756312706e-06, "loss": 0.7021, "step": 7479 }, { "epoch": 0.81, "learning_rate": 1.7552447547721841e-06, "loss": 0.5762, "step": 7480 }, { "epoch": 0.81, "learning_rate": 1.7532499589089324e-06, "loss": 0.6528, "step": 7481 }, { "epoch": 0.81, "learning_rate": 1.7512561882895107e-06, "loss": 0.5688, "step": 7482 }, { "epoch": 0.81, "learning_rate": 1.7492634431617873e-06, "loss": 0.6743, "step": 7483 }, { "epoch": 0.81, "learning_rate": 1.7472717237734993e-06, "loss": 0.7515, "step": 7484 }, { "epoch": 0.81, "learning_rate": 1.74528103037226e-06, "loss": 0.6824, "step": 7485 }, { "epoch": 0.81, "learning_rate": 1.7432913632055582e-06, "loss": 0.584, "step": 7486 }, { "epoch": 0.82, "learning_rate": 1.7413027225207445e-06, "loss": 0.6567, "step": 7487 }, { "epoch": 0.82, "learning_rate": 1.739315108565053e-06, "loss": 0.6653, "step": 7488 }, { "epoch": 0.82, "learning_rate": 1.7373285215855862e-06, "loss": 0.8042, "step": 7489 }, { "epoch": 0.82, "learning_rate": 1.7353429618293139e-06, "loss": 0.6523, "step": 7490 }, { "epoch": 0.82, "learning_rate": 1.7333584295430894e-06, "loss": 0.5132, "step": 7491 }, { "epoch": 0.82, "learning_rate": 1.7313749249736266e-06, "loss": 0.7134, "step": 7492 }, { "epoch": 0.82, "learning_rate": 1.7293924483675173e-06, "loss": 0.6733, "step": 7493 }, { "epoch": 0.82, "learning_rate": 1.7274109999712295e-06, "loss": 0.7581, "step": 7494 }, { "epoch": 0.82, "learning_rate": 1.7254305800310922e-06, "loss": 0.7043, "step": 7495 }, { "epoch": 0.82, "learning_rate": 1.7234511887933159e-06, "loss": 0.6899, "step": 7496 }, { "epoch": 0.82, "learning_rate": 1.7214728265039838e-06, "loss": 0.707, "step": 7497 }, { "epoch": 0.82, "learning_rate": 1.7194954934090414e-06, "loss": 0.6997, "step": 7498 }, { "epoch": 0.82, "learning_rate": 1.7175191897543164e-06, "loss": 0.6736, "step": 7499 }, { "epoch": 0.82, "learning_rate": 1.7155439157855037e-06, "loss": 0.6423, "step": 7500 }, { "epoch": 0.82, "learning_rate": 1.7135696717481708e-06, "loss": 0.6924, "step": 7501 }, { "epoch": 0.82, "learning_rate": 1.711596457887762e-06, "loss": 0.6514, "step": 7502 }, { "epoch": 0.82, "learning_rate": 1.709624274449584e-06, "loss": 0.7256, "step": 7503 }, { "epoch": 0.82, "learning_rate": 1.7076531216788205e-06, "loss": 0.6885, "step": 7504 }, { "epoch": 0.82, "learning_rate": 1.7056829998205326e-06, "loss": 0.6216, "step": 7505 }, { "epoch": 0.82, "learning_rate": 1.7037139091196396e-06, "loss": 0.7368, "step": 7506 }, { "epoch": 0.82, "learning_rate": 1.7017458498209472e-06, "loss": 0.7349, "step": 7507 }, { "epoch": 0.82, "learning_rate": 1.6997788221691248e-06, "loss": 0.7234, "step": 7508 }, { "epoch": 0.82, "learning_rate": 1.6978128264087101e-06, "loss": 0.7458, "step": 7509 }, { "epoch": 0.82, "learning_rate": 1.695847862784128e-06, "loss": 0.6013, "step": 7510 }, { "epoch": 0.82, "learning_rate": 1.693883931539655e-06, "loss": 0.6838, "step": 7511 }, { "epoch": 0.82, "learning_rate": 1.6919210329194535e-06, "loss": 0.8501, "step": 7512 }, { "epoch": 0.82, "learning_rate": 1.689959167167554e-06, "loss": 0.6675, "step": 7513 }, { "epoch": 0.82, "learning_rate": 1.6879983345278528e-06, "loss": 0.6545, "step": 7514 }, { "epoch": 0.82, "learning_rate": 1.6860385352441254e-06, "loss": 0.7681, "step": 7515 }, { "epoch": 0.82, "learning_rate": 1.6840797695600187e-06, "loss": 0.7009, "step": 7516 }, { "epoch": 0.82, "learning_rate": 1.6821220377190428e-06, "loss": 0.6218, "step": 7517 }, { "epoch": 0.82, "learning_rate": 1.6801653399645867e-06, "loss": 0.6528, "step": 7518 }, { "epoch": 0.82, "learning_rate": 1.6782096765399103e-06, "loss": 0.8262, "step": 7519 }, { "epoch": 0.82, "learning_rate": 1.6762550476881423e-06, "loss": 0.5015, "step": 7520 }, { "epoch": 0.82, "learning_rate": 1.6743014536522872e-06, "loss": 0.5002, "step": 7521 }, { "epoch": 0.82, "learning_rate": 1.6723488946752131e-06, "loss": 0.7954, "step": 7522 }, { "epoch": 0.82, "learning_rate": 1.6703973709996646e-06, "loss": 0.6389, "step": 7523 }, { "epoch": 0.82, "learning_rate": 1.6684468828682621e-06, "loss": 0.6194, "step": 7524 }, { "epoch": 0.82, "learning_rate": 1.6664974305234848e-06, "loss": 0.7197, "step": 7525 }, { "epoch": 0.82, "learning_rate": 1.6645490142076948e-06, "loss": 0.6655, "step": 7526 }, { "epoch": 0.82, "learning_rate": 1.6626016341631224e-06, "loss": 0.5969, "step": 7527 }, { "epoch": 0.82, "learning_rate": 1.6606552906318608e-06, "loss": 0.5952, "step": 7528 }, { "epoch": 0.82, "learning_rate": 1.6587099838558906e-06, "loss": 0.6902, "step": 7529 }, { "epoch": 0.82, "learning_rate": 1.6567657140770477e-06, "loss": 0.5776, "step": 7530 }, { "epoch": 0.82, "learning_rate": 1.6548224815370485e-06, "loss": 0.6655, "step": 7531 }, { "epoch": 0.82, "learning_rate": 1.6528802864774773e-06, "loss": 0.6577, "step": 7532 }, { "epoch": 0.82, "learning_rate": 1.650939129139787e-06, "loss": 0.6357, "step": 7533 }, { "epoch": 0.82, "learning_rate": 1.6489990097653065e-06, "loss": 0.7166, "step": 7534 }, { "epoch": 0.82, "learning_rate": 1.6470599285952348e-06, "loss": 0.5659, "step": 7535 }, { "epoch": 0.82, "learning_rate": 1.6451218858706374e-06, "loss": 0.7427, "step": 7536 }, { "epoch": 0.82, "learning_rate": 1.6431848818324524e-06, "loss": 0.7178, "step": 7537 }, { "epoch": 0.82, "learning_rate": 1.641248916721494e-06, "loss": 0.7417, "step": 7538 }, { "epoch": 0.82, "learning_rate": 1.6393139907784405e-06, "loss": 0.7524, "step": 7539 }, { "epoch": 0.82, "learning_rate": 1.6373801042438475e-06, "loss": 0.7031, "step": 7540 }, { "epoch": 0.82, "learning_rate": 1.6354472573581326e-06, "loss": 0.584, "step": 7541 }, { "epoch": 0.82, "learning_rate": 1.6335154503615902e-06, "loss": 0.7451, "step": 7542 }, { "epoch": 0.82, "learning_rate": 1.6315846834943894e-06, "loss": 0.6431, "step": 7543 }, { "epoch": 0.82, "learning_rate": 1.629654956996558e-06, "loss": 0.7419, "step": 7544 }, { "epoch": 0.82, "learning_rate": 1.6277262711080043e-06, "loss": 0.6687, "step": 7545 }, { "epoch": 0.82, "learning_rate": 1.6257986260685077e-06, "loss": 0.7769, "step": 7546 }, { "epoch": 0.82, "learning_rate": 1.6238720221177062e-06, "loss": 0.6506, "step": 7547 }, { "epoch": 0.82, "learning_rate": 1.6219464594951273e-06, "loss": 0.6702, "step": 7548 }, { "epoch": 0.82, "learning_rate": 1.6200219384401527e-06, "loss": 0.5562, "step": 7549 }, { "epoch": 0.82, "learning_rate": 1.6180984591920413e-06, "loss": 0.6179, "step": 7550 }, { "epoch": 0.82, "learning_rate": 1.616176021989926e-06, "loss": 0.6768, "step": 7551 }, { "epoch": 0.82, "learning_rate": 1.6142546270727989e-06, "loss": 0.679, "step": 7552 }, { "epoch": 0.82, "learning_rate": 1.6123342746795345e-06, "loss": 0.6738, "step": 7553 }, { "epoch": 0.82, "learning_rate": 1.6104149650488743e-06, "loss": 0.7366, "step": 7554 }, { "epoch": 0.82, "learning_rate": 1.6084966984194228e-06, "loss": 0.6289, "step": 7555 }, { "epoch": 0.82, "learning_rate": 1.6065794750296648e-06, "loss": 0.7146, "step": 7556 }, { "epoch": 0.82, "learning_rate": 1.6046632951179508e-06, "loss": 0.7412, "step": 7557 }, { "epoch": 0.82, "learning_rate": 1.6027481589225024e-06, "loss": 0.6738, "step": 7558 }, { "epoch": 0.82, "learning_rate": 1.6008340666814127e-06, "loss": 0.6436, "step": 7559 }, { "epoch": 0.82, "learning_rate": 1.5989210186326388e-06, "loss": 0.7446, "step": 7560 }, { "epoch": 0.82, "learning_rate": 1.597009015014016e-06, "loss": 0.6824, "step": 7561 }, { "epoch": 0.82, "learning_rate": 1.5950980560632479e-06, "loss": 0.7048, "step": 7562 }, { "epoch": 0.82, "learning_rate": 1.5931881420179019e-06, "loss": 0.7153, "step": 7563 }, { "epoch": 0.82, "learning_rate": 1.5912792731154237e-06, "loss": 0.7034, "step": 7564 }, { "epoch": 0.82, "learning_rate": 1.5893714495931266e-06, "loss": 0.7075, "step": 7565 }, { "epoch": 0.82, "learning_rate": 1.587464671688187e-06, "loss": 0.6819, "step": 7566 }, { "epoch": 0.82, "learning_rate": 1.5855589396376669e-06, "loss": 0.5862, "step": 7567 }, { "epoch": 0.82, "learning_rate": 1.5836542536784816e-06, "loss": 0.7576, "step": 7568 }, { "epoch": 0.82, "learning_rate": 1.5817506140474248e-06, "loss": 0.6292, "step": 7569 }, { "epoch": 0.82, "learning_rate": 1.5798480209811628e-06, "loss": 0.6619, "step": 7570 }, { "epoch": 0.82, "learning_rate": 1.577946474716222e-06, "loss": 0.6064, "step": 7571 }, { "epoch": 0.82, "learning_rate": 1.5760459754890068e-06, "loss": 0.6512, "step": 7572 }, { "epoch": 0.82, "learning_rate": 1.574146523535791e-06, "loss": 0.6943, "step": 7573 }, { "epoch": 0.82, "learning_rate": 1.572248119092713e-06, "loss": 0.7261, "step": 7574 }, { "epoch": 0.82, "learning_rate": 1.5703507623957848e-06, "loss": 0.5564, "step": 7575 }, { "epoch": 0.82, "learning_rate": 1.56845445368089e-06, "loss": 0.7441, "step": 7576 }, { "epoch": 0.82, "learning_rate": 1.5665591931837766e-06, "loss": 0.7334, "step": 7577 }, { "epoch": 0.82, "learning_rate": 1.5646649811400704e-06, "loss": 0.6841, "step": 7578 }, { "epoch": 0.83, "learning_rate": 1.5627718177852546e-06, "loss": 0.6528, "step": 7579 }, { "epoch": 0.83, "learning_rate": 1.560879703354693e-06, "loss": 0.6084, "step": 7580 }, { "epoch": 0.83, "learning_rate": 1.558988638083616e-06, "loss": 0.6609, "step": 7581 }, { "epoch": 0.83, "learning_rate": 1.5570986222071194e-06, "loss": 0.6733, "step": 7582 }, { "epoch": 0.83, "learning_rate": 1.5552096559601736e-06, "loss": 0.6326, "step": 7583 }, { "epoch": 0.83, "learning_rate": 1.553321739577619e-06, "loss": 0.6614, "step": 7584 }, { "epoch": 0.83, "learning_rate": 1.5514348732941553e-06, "loss": 0.8008, "step": 7585 }, { "epoch": 0.83, "learning_rate": 1.5495490573443705e-06, "loss": 0.6755, "step": 7586 }, { "epoch": 0.83, "learning_rate": 1.5476642919627027e-06, "loss": 0.689, "step": 7587 }, { "epoch": 0.83, "learning_rate": 1.5457805773834711e-06, "loss": 0.7163, "step": 7588 }, { "epoch": 0.83, "learning_rate": 1.5438979138408616e-06, "loss": 0.7891, "step": 7589 }, { "epoch": 0.83, "learning_rate": 1.542016301568926e-06, "loss": 0.6562, "step": 7590 }, { "epoch": 0.83, "learning_rate": 1.5401357408015893e-06, "loss": 0.7766, "step": 7591 }, { "epoch": 0.83, "learning_rate": 1.5382562317726468e-06, "loss": 0.6768, "step": 7592 }, { "epoch": 0.83, "learning_rate": 1.536377774715757e-06, "loss": 0.7048, "step": 7593 }, { "epoch": 0.83, "learning_rate": 1.5345003698644533e-06, "loss": 0.6656, "step": 7594 }, { "epoch": 0.83, "learning_rate": 1.5326240174521368e-06, "loss": 0.7275, "step": 7595 }, { "epoch": 0.83, "learning_rate": 1.5307487177120773e-06, "loss": 0.606, "step": 7596 }, { "epoch": 0.83, "learning_rate": 1.528874470877416e-06, "loss": 0.6111, "step": 7597 }, { "epoch": 0.83, "learning_rate": 1.527001277181156e-06, "loss": 0.686, "step": 7598 }, { "epoch": 0.83, "learning_rate": 1.5251291368561771e-06, "loss": 0.6677, "step": 7599 }, { "epoch": 0.83, "learning_rate": 1.523258050135229e-06, "loss": 0.7627, "step": 7600 }, { "epoch": 0.83, "learning_rate": 1.521388017250921e-06, "loss": 0.6531, "step": 7601 }, { "epoch": 0.83, "learning_rate": 1.5195190384357405e-06, "loss": 0.6934, "step": 7602 }, { "epoch": 0.83, "learning_rate": 1.517651113922043e-06, "loss": 0.6353, "step": 7603 }, { "epoch": 0.83, "learning_rate": 1.5157842439420422e-06, "loss": 0.6858, "step": 7604 }, { "epoch": 0.83, "learning_rate": 1.5139184287278397e-06, "loss": 0.5671, "step": 7605 }, { "epoch": 0.83, "learning_rate": 1.5120536685113895e-06, "loss": 0.6951, "step": 7606 }, { "epoch": 0.83, "learning_rate": 1.510189963524521e-06, "loss": 0.5581, "step": 7607 }, { "epoch": 0.83, "learning_rate": 1.508327313998935e-06, "loss": 0.6938, "step": 7608 }, { "epoch": 0.83, "learning_rate": 1.5064657201661926e-06, "loss": 0.6572, "step": 7609 }, { "epoch": 0.83, "learning_rate": 1.5046051822577313e-06, "loss": 0.7036, "step": 7610 }, { "epoch": 0.83, "learning_rate": 1.5027457005048573e-06, "loss": 0.5903, "step": 7611 }, { "epoch": 0.83, "learning_rate": 1.5008872751387393e-06, "loss": 0.7529, "step": 7612 }, { "epoch": 0.83, "learning_rate": 1.4990299063904202e-06, "loss": 0.6228, "step": 7613 }, { "epoch": 0.83, "learning_rate": 1.4971735944908107e-06, "loss": 0.7437, "step": 7614 }, { "epoch": 0.83, "learning_rate": 1.495318339670687e-06, "loss": 0.6382, "step": 7615 }, { "epoch": 0.83, "learning_rate": 1.493464142160701e-06, "loss": 0.7043, "step": 7616 }, { "epoch": 0.83, "learning_rate": 1.491611002191362e-06, "loss": 0.6206, "step": 7617 }, { "epoch": 0.83, "learning_rate": 1.4897589199930573e-06, "loss": 0.7769, "step": 7618 }, { "epoch": 0.83, "learning_rate": 1.4879078957960413e-06, "loss": 0.5129, "step": 7619 }, { "epoch": 0.83, "learning_rate": 1.4860579298304311e-06, "loss": 0.6465, "step": 7620 }, { "epoch": 0.83, "learning_rate": 1.4842090223262185e-06, "loss": 0.6667, "step": 7621 }, { "epoch": 0.83, "learning_rate": 1.4823611735132637e-06, "loss": 0.7278, "step": 7622 }, { "epoch": 0.83, "learning_rate": 1.4805143836212854e-06, "loss": 0.6675, "step": 7623 }, { "epoch": 0.83, "learning_rate": 1.4786686528798878e-06, "loss": 0.6895, "step": 7624 }, { "epoch": 0.83, "learning_rate": 1.476823981518527e-06, "loss": 0.7927, "step": 7625 }, { "epoch": 0.83, "learning_rate": 1.4749803697665366e-06, "loss": 0.7107, "step": 7626 }, { "epoch": 0.83, "learning_rate": 1.4731378178531197e-06, "loss": 0.6401, "step": 7627 }, { "epoch": 0.83, "learning_rate": 1.4712963260073376e-06, "loss": 0.5964, "step": 7628 }, { "epoch": 0.83, "learning_rate": 1.4694558944581294e-06, "loss": 0.7122, "step": 7629 }, { "epoch": 0.83, "learning_rate": 1.467616523434302e-06, "loss": 0.6553, "step": 7630 }, { "epoch": 0.83, "learning_rate": 1.4657782131645227e-06, "loss": 0.6086, "step": 7631 }, { "epoch": 0.83, "learning_rate": 1.463940963877335e-06, "loss": 0.7168, "step": 7632 }, { "epoch": 0.83, "learning_rate": 1.4621047758011464e-06, "loss": 0.5781, "step": 7633 }, { "epoch": 0.83, "learning_rate": 1.4602696491642343e-06, "loss": 0.7329, "step": 7634 }, { "epoch": 0.83, "learning_rate": 1.4584355841947452e-06, "loss": 0.7341, "step": 7635 }, { "epoch": 0.83, "learning_rate": 1.4566025811206875e-06, "loss": 0.647, "step": 7636 }, { "epoch": 0.83, "learning_rate": 1.4547706401699434e-06, "loss": 0.7163, "step": 7637 }, { "epoch": 0.83, "learning_rate": 1.4529397615702656e-06, "loss": 0.6455, "step": 7638 }, { "epoch": 0.83, "learning_rate": 1.451109945549265e-06, "loss": 0.6902, "step": 7639 }, { "epoch": 0.83, "learning_rate": 1.4492811923344285e-06, "loss": 0.7075, "step": 7640 }, { "epoch": 0.83, "learning_rate": 1.4474535021531099e-06, "loss": 0.5579, "step": 7641 }, { "epoch": 0.83, "learning_rate": 1.4456268752325264e-06, "loss": 0.8062, "step": 7642 }, { "epoch": 0.83, "learning_rate": 1.4438013117997673e-06, "loss": 0.6072, "step": 7643 }, { "epoch": 0.83, "learning_rate": 1.441976812081789e-06, "loss": 0.6548, "step": 7644 }, { "epoch": 0.83, "learning_rate": 1.4401533763054132e-06, "loss": 0.7192, "step": 7645 }, { "epoch": 0.83, "learning_rate": 1.4383310046973365e-06, "loss": 0.6011, "step": 7646 }, { "epoch": 0.83, "learning_rate": 1.436509697484111e-06, "loss": 0.6758, "step": 7647 }, { "epoch": 0.83, "learning_rate": 1.4346894548921663e-06, "loss": 0.655, "step": 7648 }, { "epoch": 0.83, "learning_rate": 1.4328702771477987e-06, "loss": 0.7061, "step": 7649 }, { "epoch": 0.83, "learning_rate": 1.4310521644771657e-06, "loss": 0.5442, "step": 7650 }, { "epoch": 0.83, "learning_rate": 1.4292351171063001e-06, "loss": 0.71, "step": 7651 }, { "epoch": 0.83, "learning_rate": 1.4274191352610966e-06, "loss": 0.696, "step": 7652 }, { "epoch": 0.83, "learning_rate": 1.4256042191673226e-06, "loss": 0.759, "step": 7653 }, { "epoch": 0.83, "learning_rate": 1.4237903690506106e-06, "loss": 0.6125, "step": 7654 }, { "epoch": 0.83, "learning_rate": 1.421977585136457e-06, "loss": 0.5476, "step": 7655 }, { "epoch": 0.83, "learning_rate": 1.4201658676502294e-06, "loss": 0.5283, "step": 7656 }, { "epoch": 0.83, "learning_rate": 1.4183552168171655e-06, "loss": 0.6719, "step": 7657 }, { "epoch": 0.83, "learning_rate": 1.4165456328623628e-06, "loss": 0.7119, "step": 7658 }, { "epoch": 0.83, "learning_rate": 1.4147371160107914e-06, "loss": 0.6523, "step": 7659 }, { "epoch": 0.83, "learning_rate": 1.4129296664872926e-06, "loss": 0.7832, "step": 7660 }, { "epoch": 0.83, "learning_rate": 1.4111232845165634e-06, "loss": 0.772, "step": 7661 }, { "epoch": 0.83, "learning_rate": 1.4093179703231786e-06, "loss": 0.6204, "step": 7662 }, { "epoch": 0.83, "learning_rate": 1.407513724131576e-06, "loss": 0.655, "step": 7663 }, { "epoch": 0.83, "learning_rate": 1.4057105461660613e-06, "loss": 0.6873, "step": 7664 }, { "epoch": 0.83, "learning_rate": 1.4039084366508094e-06, "loss": 0.6533, "step": 7665 }, { "epoch": 0.83, "learning_rate": 1.4021073958098553e-06, "loss": 0.7222, "step": 7666 }, { "epoch": 0.83, "learning_rate": 1.4003074238671098e-06, "loss": 0.7483, "step": 7667 }, { "epoch": 0.83, "learning_rate": 1.3985085210463479e-06, "loss": 0.7222, "step": 7668 }, { "epoch": 0.83, "learning_rate": 1.3967106875712077e-06, "loss": 0.7773, "step": 7669 }, { "epoch": 0.83, "learning_rate": 1.3949139236651987e-06, "loss": 0.6807, "step": 7670 }, { "epoch": 0.84, "learning_rate": 1.3931182295516965e-06, "loss": 0.6575, "step": 7671 }, { "epoch": 0.84, "learning_rate": 1.3913236054539448e-06, "loss": 0.7104, "step": 7672 }, { "epoch": 0.84, "learning_rate": 1.3895300515950528e-06, "loss": 0.6919, "step": 7673 }, { "epoch": 0.84, "learning_rate": 1.3877375681979944e-06, "loss": 0.6541, "step": 7674 }, { "epoch": 0.84, "learning_rate": 1.3859461554856145e-06, "loss": 0.6309, "step": 7675 }, { "epoch": 0.84, "learning_rate": 1.3841558136806254e-06, "loss": 0.687, "step": 7676 }, { "epoch": 0.84, "learning_rate": 1.3823665430056e-06, "loss": 0.6973, "step": 7677 }, { "epoch": 0.84, "learning_rate": 1.3805783436829833e-06, "loss": 0.6619, "step": 7678 }, { "epoch": 0.84, "learning_rate": 1.3787912159350903e-06, "loss": 0.5811, "step": 7679 }, { "epoch": 0.84, "learning_rate": 1.3770051599840906e-06, "loss": 0.7832, "step": 7680 }, { "epoch": 0.84, "learning_rate": 1.3752201760520333e-06, "loss": 0.6724, "step": 7681 }, { "epoch": 0.84, "learning_rate": 1.373436264360829e-06, "loss": 0.7334, "step": 7682 }, { "epoch": 0.84, "learning_rate": 1.3716534251322543e-06, "loss": 0.7078, "step": 7683 }, { "epoch": 0.84, "learning_rate": 1.3698716585879568e-06, "loss": 0.6765, "step": 7684 }, { "epoch": 0.84, "learning_rate": 1.3680909649494423e-06, "loss": 0.6084, "step": 7685 }, { "epoch": 0.84, "learning_rate": 1.3663113444380905e-06, "loss": 0.7822, "step": 7686 }, { "epoch": 0.84, "learning_rate": 1.3645327972751477e-06, "loss": 0.7158, "step": 7687 }, { "epoch": 0.84, "learning_rate": 1.3627553236817215e-06, "loss": 0.7104, "step": 7688 }, { "epoch": 0.84, "learning_rate": 1.3609789238787885e-06, "loss": 0.7158, "step": 7689 }, { "epoch": 0.84, "learning_rate": 1.3592035980871954e-06, "loss": 0.6255, "step": 7690 }, { "epoch": 0.84, "learning_rate": 1.35742934652765e-06, "loss": 0.6611, "step": 7691 }, { "epoch": 0.84, "learning_rate": 1.3556561694207337e-06, "loss": 0.6104, "step": 7692 }, { "epoch": 0.84, "learning_rate": 1.3538840669868824e-06, "loss": 0.6504, "step": 7693 }, { "epoch": 0.84, "learning_rate": 1.35211303944641e-06, "loss": 0.6516, "step": 7694 }, { "epoch": 0.84, "learning_rate": 1.3503430870194933e-06, "loss": 0.6641, "step": 7695 }, { "epoch": 0.84, "learning_rate": 1.34857420992617e-06, "loss": 0.5892, "step": 7696 }, { "epoch": 0.84, "learning_rate": 1.346806408386352e-06, "loss": 0.6899, "step": 7697 }, { "epoch": 0.84, "learning_rate": 1.3450396826198142e-06, "loss": 0.6804, "step": 7698 }, { "epoch": 0.84, "learning_rate": 1.3432740328461958e-06, "loss": 0.71, "step": 7699 }, { "epoch": 0.84, "learning_rate": 1.3415094592850042e-06, "loss": 0.7031, "step": 7700 }, { "epoch": 0.84, "learning_rate": 1.339745962155613e-06, "loss": 0.6577, "step": 7701 }, { "epoch": 0.84, "learning_rate": 1.3379835416772635e-06, "loss": 0.6904, "step": 7702 }, { "epoch": 0.84, "learning_rate": 1.3362221980690627e-06, "loss": 0.8809, "step": 7703 }, { "epoch": 0.84, "learning_rate": 1.3344619315499774e-06, "loss": 0.6455, "step": 7704 }, { "epoch": 0.84, "learning_rate": 1.3327027423388493e-06, "loss": 0.6724, "step": 7705 }, { "epoch": 0.84, "learning_rate": 1.3309446306543827e-06, "loss": 0.6584, "step": 7706 }, { "epoch": 0.84, "learning_rate": 1.3291875967151457e-06, "loss": 0.7065, "step": 7707 }, { "epoch": 0.84, "learning_rate": 1.327431640739575e-06, "loss": 0.7197, "step": 7708 }, { "epoch": 0.84, "learning_rate": 1.3256767629459732e-06, "loss": 0.5781, "step": 7709 }, { "epoch": 0.84, "learning_rate": 1.3239229635525074e-06, "loss": 0.7222, "step": 7710 }, { "epoch": 0.84, "learning_rate": 1.3221702427772155e-06, "loss": 0.6865, "step": 7711 }, { "epoch": 0.84, "learning_rate": 1.3204186008379926e-06, "loss": 0.6577, "step": 7712 }, { "epoch": 0.84, "learning_rate": 1.3186680379526062e-06, "loss": 0.6143, "step": 7713 }, { "epoch": 0.84, "learning_rate": 1.3169185543386897e-06, "loss": 0.7217, "step": 7714 }, { "epoch": 0.84, "learning_rate": 1.315170150213737e-06, "loss": 0.6611, "step": 7715 }, { "epoch": 0.84, "learning_rate": 1.3134228257951142e-06, "loss": 0.6365, "step": 7716 }, { "epoch": 0.84, "learning_rate": 1.311676581300051e-06, "loss": 0.6252, "step": 7717 }, { "epoch": 0.84, "learning_rate": 1.309931416945638e-06, "loss": 0.7378, "step": 7718 }, { "epoch": 0.84, "learning_rate": 1.3081873329488393e-06, "loss": 0.5421, "step": 7719 }, { "epoch": 0.84, "learning_rate": 1.3064443295264795e-06, "loss": 0.7593, "step": 7720 }, { "epoch": 0.84, "learning_rate": 1.3047024068952507e-06, "loss": 0.5232, "step": 7721 }, { "epoch": 0.84, "learning_rate": 1.3029615652717132e-06, "loss": 0.8315, "step": 7722 }, { "epoch": 0.84, "learning_rate": 1.3012218048722858e-06, "loss": 0.6182, "step": 7723 }, { "epoch": 0.84, "learning_rate": 1.299483125913259e-06, "loss": 0.71, "step": 7724 }, { "epoch": 0.84, "learning_rate": 1.2977455286107898e-06, "loss": 0.75, "step": 7725 }, { "epoch": 0.84, "learning_rate": 1.2960090131808923e-06, "loss": 0.6611, "step": 7726 }, { "epoch": 0.84, "learning_rate": 1.2942735798394546e-06, "loss": 0.6594, "step": 7727 }, { "epoch": 0.84, "learning_rate": 1.2925392288022299e-06, "loss": 0.7534, "step": 7728 }, { "epoch": 0.84, "learning_rate": 1.2908059602848278e-06, "loss": 0.7466, "step": 7729 }, { "epoch": 0.84, "learning_rate": 1.2890737745027382e-06, "loss": 0.6095, "step": 7730 }, { "epoch": 0.84, "learning_rate": 1.2873426716713012e-06, "loss": 0.6492, "step": 7731 }, { "epoch": 0.84, "learning_rate": 1.2856126520057333e-06, "loss": 0.7041, "step": 7732 }, { "epoch": 0.84, "learning_rate": 1.2838837157211116e-06, "loss": 0.6643, "step": 7733 }, { "epoch": 0.84, "learning_rate": 1.282155863032377e-06, "loss": 0.6121, "step": 7734 }, { "epoch": 0.84, "learning_rate": 1.2804290941543384e-06, "loss": 0.6274, "step": 7735 }, { "epoch": 0.84, "learning_rate": 1.2787034093016726e-06, "loss": 0.7246, "step": 7736 }, { "epoch": 0.84, "learning_rate": 1.2769788086889135e-06, "loss": 0.7627, "step": 7737 }, { "epoch": 0.84, "learning_rate": 1.2752552925304685e-06, "loss": 0.6228, "step": 7738 }, { "epoch": 0.84, "learning_rate": 1.2735328610406038e-06, "loss": 0.6968, "step": 7739 }, { "epoch": 0.84, "learning_rate": 1.2718115144334576e-06, "loss": 0.7427, "step": 7740 }, { "epoch": 0.84, "learning_rate": 1.270091252923028e-06, "loss": 0.7532, "step": 7741 }, { "epoch": 0.84, "learning_rate": 1.2683720767231778e-06, "loss": 0.6456, "step": 7742 }, { "epoch": 0.84, "learning_rate": 1.2666539860476367e-06, "loss": 0.7036, "step": 7743 }, { "epoch": 0.84, "learning_rate": 1.2649369811100033e-06, "loss": 0.6169, "step": 7744 }, { "epoch": 0.84, "learning_rate": 1.2632210621237329e-06, "loss": 0.7471, "step": 7745 }, { "epoch": 0.84, "learning_rate": 1.2615062293021508e-06, "loss": 0.6335, "step": 7746 }, { "epoch": 0.84, "learning_rate": 1.2597924828584495e-06, "loss": 0.6416, "step": 7747 }, { "epoch": 0.84, "learning_rate": 1.258079823005678e-06, "loss": 0.5996, "step": 7748 }, { "epoch": 0.84, "learning_rate": 1.2563682499567632e-06, "loss": 0.6406, "step": 7749 }, { "epoch": 0.84, "learning_rate": 1.254657763924484e-06, "loss": 0.7646, "step": 7750 }, { "epoch": 0.84, "learning_rate": 1.2529483651214913e-06, "loss": 0.6917, "step": 7751 }, { "epoch": 0.84, "learning_rate": 1.251240053760302e-06, "loss": 0.6699, "step": 7752 }, { "epoch": 0.84, "learning_rate": 1.2495328300532893e-06, "loss": 0.699, "step": 7753 }, { "epoch": 0.84, "learning_rate": 1.2478266942127003e-06, "loss": 0.7512, "step": 7754 }, { "epoch": 0.84, "learning_rate": 1.2461216464506454e-06, "loss": 0.7217, "step": 7755 }, { "epoch": 0.84, "learning_rate": 1.2444176869790925e-06, "loss": 0.6997, "step": 7756 }, { "epoch": 0.84, "learning_rate": 1.2427148160098823e-06, "loss": 0.5203, "step": 7757 }, { "epoch": 0.84, "learning_rate": 1.2410130337547178e-06, "loss": 0.6545, "step": 7758 }, { "epoch": 0.84, "learning_rate": 1.239312340425166e-06, "loss": 0.6279, "step": 7759 }, { "epoch": 0.84, "learning_rate": 1.2376127362326607e-06, "loss": 0.6035, "step": 7760 }, { "epoch": 0.84, "learning_rate": 1.2359142213884933e-06, "loss": 0.709, "step": 7761 }, { "epoch": 0.84, "learning_rate": 1.2342167961038275e-06, "loss": 0.7559, "step": 7762 }, { "epoch": 0.85, "learning_rate": 1.2325204605896924e-06, "loss": 0.6721, "step": 7763 }, { "epoch": 0.85, "learning_rate": 1.230825215056971e-06, "loss": 0.7529, "step": 7764 }, { "epoch": 0.85, "learning_rate": 1.2291310597164219e-06, "loss": 0.6855, "step": 7765 }, { "epoch": 0.85, "learning_rate": 1.2274379947786662e-06, "loss": 0.6558, "step": 7766 }, { "epoch": 0.85, "learning_rate": 1.2257460204541793e-06, "loss": 0.7087, "step": 7767 }, { "epoch": 0.85, "learning_rate": 1.2240551369533205e-06, "loss": 0.6047, "step": 7768 }, { "epoch": 0.85, "learning_rate": 1.2223653444862926e-06, "loss": 0.6885, "step": 7769 }, { "epoch": 0.85, "learning_rate": 1.2206766432631766e-06, "loss": 0.6322, "step": 7770 }, { "epoch": 0.85, "learning_rate": 1.2189890334939136e-06, "loss": 0.708, "step": 7771 }, { "epoch": 0.85, "learning_rate": 1.2173025153883067e-06, "loss": 0.5942, "step": 7772 }, { "epoch": 0.85, "learning_rate": 1.215617089156026e-06, "loss": 0.6743, "step": 7773 }, { "epoch": 0.85, "learning_rate": 1.2139327550066082e-06, "loss": 0.6597, "step": 7774 }, { "epoch": 0.85, "learning_rate": 1.212249513149446e-06, "loss": 0.6714, "step": 7775 }, { "epoch": 0.85, "learning_rate": 1.2105673637938054e-06, "loss": 0.6606, "step": 7776 }, { "epoch": 0.85, "learning_rate": 1.2088863071488122e-06, "loss": 0.6855, "step": 7777 }, { "epoch": 0.85, "learning_rate": 1.207206343423456e-06, "loss": 0.71, "step": 7778 }, { "epoch": 0.85, "learning_rate": 1.2055274728265943e-06, "loss": 0.7058, "step": 7779 }, { "epoch": 0.85, "learning_rate": 1.203849695566942e-06, "loss": 0.6367, "step": 7780 }, { "epoch": 0.85, "learning_rate": 1.202173011853085e-06, "loss": 0.6238, "step": 7781 }, { "epoch": 0.85, "learning_rate": 1.2004974218934695e-06, "loss": 0.6667, "step": 7782 }, { "epoch": 0.85, "learning_rate": 1.1988229258964045e-06, "loss": 0.615, "step": 7783 }, { "epoch": 0.85, "learning_rate": 1.197149524070067e-06, "loss": 0.7061, "step": 7784 }, { "epoch": 0.85, "learning_rate": 1.195477216622496e-06, "loss": 0.7048, "step": 7785 }, { "epoch": 0.85, "learning_rate": 1.1938060037615906e-06, "loss": 0.696, "step": 7786 }, { "epoch": 0.85, "learning_rate": 1.1921358856951248e-06, "loss": 0.6902, "step": 7787 }, { "epoch": 0.85, "learning_rate": 1.1904668626307225e-06, "loss": 0.6704, "step": 7788 }, { "epoch": 0.85, "learning_rate": 1.188798934775881e-06, "loss": 0.6677, "step": 7789 }, { "epoch": 0.85, "learning_rate": 1.187132102337961e-06, "loss": 0.6973, "step": 7790 }, { "epoch": 0.85, "learning_rate": 1.1854663655241804e-06, "loss": 0.6528, "step": 7791 }, { "epoch": 0.85, "learning_rate": 1.1838017245416266e-06, "loss": 0.7417, "step": 7792 }, { "epoch": 0.85, "learning_rate": 1.182138179597252e-06, "loss": 0.7092, "step": 7793 }, { "epoch": 0.85, "learning_rate": 1.1804757308978653e-06, "loss": 0.751, "step": 7794 }, { "epoch": 0.85, "learning_rate": 1.1788143786501494e-06, "loss": 0.6294, "step": 7795 }, { "epoch": 0.85, "learning_rate": 1.1771541230606364e-06, "loss": 0.6523, "step": 7796 }, { "epoch": 0.85, "learning_rate": 1.1754949643357395e-06, "loss": 0.7036, "step": 7797 }, { "epoch": 0.85, "learning_rate": 1.1738369026817265e-06, "loss": 0.7363, "step": 7798 }, { "epoch": 0.85, "learning_rate": 1.172179938304724e-06, "loss": 0.75, "step": 7799 }, { "epoch": 0.85, "learning_rate": 1.1705240714107301e-06, "loss": 0.5637, "step": 7800 }, { "epoch": 0.85, "learning_rate": 1.1688693022056064e-06, "loss": 0.5713, "step": 7801 }, { "epoch": 0.85, "learning_rate": 1.1672156308950698e-06, "loss": 0.6582, "step": 7802 }, { "epoch": 0.85, "learning_rate": 1.1655630576847089e-06, "loss": 0.7056, "step": 7803 }, { "epoch": 0.85, "learning_rate": 1.1639115827799764e-06, "loss": 0.6616, "step": 7804 }, { "epoch": 0.85, "learning_rate": 1.1622612063861782e-06, "loss": 0.5989, "step": 7805 }, { "epoch": 0.85, "learning_rate": 1.1606119287084982e-06, "loss": 0.6848, "step": 7806 }, { "epoch": 0.85, "learning_rate": 1.15896374995197e-06, "loss": 0.6333, "step": 7807 }, { "epoch": 0.85, "learning_rate": 1.1573166703215011e-06, "loss": 0.75, "step": 7808 }, { "epoch": 0.85, "learning_rate": 1.1556706900218572e-06, "loss": 0.6155, "step": 7809 }, { "epoch": 0.85, "learning_rate": 1.1540258092576662e-06, "loss": 0.6387, "step": 7810 }, { "epoch": 0.85, "learning_rate": 1.152382028233422e-06, "loss": 0.6958, "step": 7811 }, { "epoch": 0.85, "learning_rate": 1.1507393471534834e-06, "loss": 0.6038, "step": 7812 }, { "epoch": 0.85, "learning_rate": 1.1490977662220659e-06, "loss": 0.6733, "step": 7813 }, { "epoch": 0.85, "learning_rate": 1.1474572856432576e-06, "loss": 0.55, "step": 7814 }, { "epoch": 0.85, "learning_rate": 1.1458179056209962e-06, "loss": 0.592, "step": 7815 }, { "epoch": 0.85, "learning_rate": 1.1441796263590988e-06, "loss": 0.6638, "step": 7816 }, { "epoch": 0.85, "learning_rate": 1.1425424480612378e-06, "loss": 0.6941, "step": 7817 }, { "epoch": 0.85, "learning_rate": 1.1409063709309442e-06, "loss": 0.7119, "step": 7818 }, { "epoch": 0.85, "learning_rate": 1.1392713951716183e-06, "loss": 0.6025, "step": 7819 }, { "epoch": 0.85, "learning_rate": 1.1376375209865254e-06, "loss": 0.6736, "step": 7820 }, { "epoch": 0.85, "learning_rate": 1.136004748578785e-06, "loss": 0.6362, "step": 7821 }, { "epoch": 0.85, "learning_rate": 1.1343730781513896e-06, "loss": 0.6016, "step": 7822 }, { "epoch": 0.85, "learning_rate": 1.1327425099071843e-06, "loss": 0.8008, "step": 7823 }, { "epoch": 0.85, "learning_rate": 1.131113044048885e-06, "loss": 0.6599, "step": 7824 }, { "epoch": 0.85, "learning_rate": 1.1294846807790739e-06, "loss": 0.7046, "step": 7825 }, { "epoch": 0.85, "learning_rate": 1.1278574203001846e-06, "loss": 0.666, "step": 7826 }, { "epoch": 0.85, "learning_rate": 1.126231262814521e-06, "loss": 0.7449, "step": 7827 }, { "epoch": 0.85, "learning_rate": 1.1246062085242514e-06, "loss": 0.5374, "step": 7828 }, { "epoch": 0.85, "learning_rate": 1.1229822576313997e-06, "loss": 0.7478, "step": 7829 }, { "epoch": 0.85, "learning_rate": 1.121359410337859e-06, "loss": 0.5874, "step": 7830 }, { "epoch": 0.85, "learning_rate": 1.1197376668453851e-06, "loss": 0.6292, "step": 7831 }, { "epoch": 0.85, "learning_rate": 1.1181170273555918e-06, "loss": 0.7236, "step": 7832 }, { "epoch": 0.85, "learning_rate": 1.1164974920699611e-06, "loss": 0.707, "step": 7833 }, { "epoch": 0.85, "learning_rate": 1.1148790611898297e-06, "loss": 0.7251, "step": 7834 }, { "epoch": 0.85, "learning_rate": 1.1132617349164089e-06, "loss": 0.6553, "step": 7835 }, { "epoch": 0.85, "learning_rate": 1.1116455134507665e-06, "loss": 0.7014, "step": 7836 }, { "epoch": 0.85, "learning_rate": 1.1100303969938264e-06, "loss": 0.6604, "step": 7837 }, { "epoch": 0.85, "learning_rate": 1.1084163857463858e-06, "loss": 0.6443, "step": 7838 }, { "epoch": 0.85, "learning_rate": 1.106803479909102e-06, "loss": 0.7373, "step": 7839 }, { "epoch": 0.85, "learning_rate": 1.105191679682488e-06, "loss": 0.7053, "step": 7840 }, { "epoch": 0.85, "learning_rate": 1.1035809852669287e-06, "loss": 0.6677, "step": 7841 }, { "epoch": 0.85, "learning_rate": 1.1019713968626632e-06, "loss": 0.6165, "step": 7842 }, { "epoch": 0.85, "learning_rate": 1.100362914669797e-06, "loss": 0.7505, "step": 7843 }, { "epoch": 0.85, "learning_rate": 1.0987555388883042e-06, "loss": 0.6729, "step": 7844 }, { "epoch": 0.85, "learning_rate": 1.0971492697180097e-06, "loss": 0.7151, "step": 7845 }, { "epoch": 0.85, "learning_rate": 1.095544107358607e-06, "loss": 0.7817, "step": 7846 }, { "epoch": 0.85, "learning_rate": 1.0939400520096554e-06, "loss": 0.7329, "step": 7847 }, { "epoch": 0.85, "learning_rate": 1.0923371038705677e-06, "loss": 0.646, "step": 7848 }, { "epoch": 0.85, "learning_rate": 1.0907352631406254e-06, "loss": 0.7686, "step": 7849 }, { "epoch": 0.85, "learning_rate": 1.0891345300189727e-06, "loss": 0.6809, "step": 7850 }, { "epoch": 0.85, "learning_rate": 1.0875349047046113e-06, "loss": 0.6604, "step": 7851 }, { "epoch": 0.85, "learning_rate": 1.0859363873964123e-06, "loss": 0.6201, "step": 7852 }, { "epoch": 0.85, "learning_rate": 1.084338978293098e-06, "loss": 0.6328, "step": 7853 }, { "epoch": 0.85, "learning_rate": 1.0827426775932658e-06, "loss": 0.6274, "step": 7854 }, { "epoch": 0.86, "learning_rate": 1.0811474854953708e-06, "loss": 0.4943, "step": 7855 }, { "epoch": 0.86, "learning_rate": 1.0795534021977229e-06, "loss": 0.5159, "step": 7856 }, { "epoch": 0.86, "learning_rate": 1.0779604278985033e-06, "loss": 0.6211, "step": 7857 }, { "epoch": 0.86, "learning_rate": 1.0763685627957532e-06, "loss": 0.7163, "step": 7858 }, { "epoch": 0.86, "learning_rate": 1.0747778070873705e-06, "loss": 0.6089, "step": 7859 }, { "epoch": 0.86, "learning_rate": 1.0731881609711247e-06, "loss": 0.5769, "step": 7860 }, { "epoch": 0.86, "learning_rate": 1.071599624644638e-06, "loss": 0.6648, "step": 7861 }, { "epoch": 0.86, "learning_rate": 1.0700121983053991e-06, "loss": 0.6973, "step": 7862 }, { "epoch": 0.86, "learning_rate": 1.068425882150762e-06, "loss": 0.5869, "step": 7863 }, { "epoch": 0.86, "learning_rate": 1.066840676377935e-06, "loss": 0.7031, "step": 7864 }, { "epoch": 0.86, "learning_rate": 1.0652565811839943e-06, "loss": 0.6958, "step": 7865 }, { "epoch": 0.86, "learning_rate": 1.0636735967658785e-06, "loss": 0.7744, "step": 7866 }, { "epoch": 0.86, "learning_rate": 1.062091723320381e-06, "loss": 0.7305, "step": 7867 }, { "epoch": 0.86, "learning_rate": 1.0605109610441633e-06, "loss": 0.7476, "step": 7868 }, { "epoch": 0.86, "learning_rate": 1.0589313101337495e-06, "loss": 0.6309, "step": 7869 }, { "epoch": 0.86, "learning_rate": 1.0573527707855202e-06, "loss": 0.668, "step": 7870 }, { "epoch": 0.86, "learning_rate": 1.055775343195724e-06, "loss": 0.6318, "step": 7871 }, { "epoch": 0.86, "learning_rate": 1.054199027560463e-06, "loss": 0.6726, "step": 7872 }, { "epoch": 0.86, "learning_rate": 1.0526238240757126e-06, "loss": 0.6545, "step": 7873 }, { "epoch": 0.86, "learning_rate": 1.0510497329373014e-06, "loss": 0.6948, "step": 7874 }, { "epoch": 0.86, "learning_rate": 1.0494767543409202e-06, "loss": 0.6978, "step": 7875 }, { "epoch": 0.86, "learning_rate": 1.0479048884821253e-06, "loss": 0.6519, "step": 7876 }, { "epoch": 0.86, "learning_rate": 1.0463341355563318e-06, "loss": 0.6609, "step": 7877 }, { "epoch": 0.86, "learning_rate": 1.0447644957588166e-06, "loss": 0.7139, "step": 7878 }, { "epoch": 0.86, "learning_rate": 1.0431959692847205e-06, "loss": 0.5945, "step": 7879 }, { "epoch": 0.86, "learning_rate": 1.0416285563290407e-06, "loss": 0.6816, "step": 7880 }, { "epoch": 0.86, "learning_rate": 1.0400622570866426e-06, "loss": 0.6689, "step": 7881 }, { "epoch": 0.86, "learning_rate": 1.038497071752248e-06, "loss": 0.6807, "step": 7882 }, { "epoch": 0.86, "learning_rate": 1.0369330005204448e-06, "loss": 0.6616, "step": 7883 }, { "epoch": 0.86, "learning_rate": 1.0353700435856773e-06, "loss": 0.7817, "step": 7884 }, { "epoch": 0.86, "learning_rate": 1.0338082011422568e-06, "loss": 0.6489, "step": 7885 }, { "epoch": 0.86, "learning_rate": 1.03224747338435e-06, "loss": 0.7505, "step": 7886 }, { "epoch": 0.86, "learning_rate": 1.0306878605059888e-06, "loss": 0.7598, "step": 7887 }, { "epoch": 0.86, "learning_rate": 1.0291293627010678e-06, "loss": 0.7629, "step": 7888 }, { "epoch": 0.86, "learning_rate": 1.0275719801633388e-06, "loss": 0.6118, "step": 7889 }, { "epoch": 0.86, "learning_rate": 1.0260157130864178e-06, "loss": 0.6904, "step": 7890 }, { "epoch": 0.86, "learning_rate": 1.024460561663778e-06, "loss": 0.6816, "step": 7891 }, { "epoch": 0.86, "learning_rate": 1.0229065260887626e-06, "loss": 0.749, "step": 7892 }, { "epoch": 0.86, "learning_rate": 1.0213536065545704e-06, "loss": 0.6772, "step": 7893 }, { "epoch": 0.86, "learning_rate": 1.019801803254259e-06, "loss": 0.7314, "step": 7894 }, { "epoch": 0.86, "learning_rate": 1.0182511163807506e-06, "loss": 0.6882, "step": 7895 }, { "epoch": 0.86, "learning_rate": 1.0167015461268303e-06, "loss": 0.6951, "step": 7896 }, { "epoch": 0.86, "learning_rate": 1.0151530926851395e-06, "loss": 0.6145, "step": 7897 }, { "epoch": 0.86, "learning_rate": 1.013605756248185e-06, "loss": 0.717, "step": 7898 }, { "epoch": 0.86, "learning_rate": 1.012059537008332e-06, "loss": 0.7156, "step": 7899 }, { "epoch": 0.86, "learning_rate": 1.0105144351578078e-06, "loss": 0.7407, "step": 7900 }, { "epoch": 0.86, "learning_rate": 1.008970450888701e-06, "loss": 0.6411, "step": 7901 }, { "epoch": 0.86, "learning_rate": 1.0074275843929627e-06, "loss": 0.655, "step": 7902 }, { "epoch": 0.86, "learning_rate": 1.0058858358624023e-06, "loss": 0.7031, "step": 7903 }, { "epoch": 0.86, "learning_rate": 1.0043452054886949e-06, "loss": 0.7285, "step": 7904 }, { "epoch": 0.86, "learning_rate": 1.0028056934633668e-06, "loss": 0.6094, "step": 7905 }, { "epoch": 0.86, "learning_rate": 1.001267299977815e-06, "loss": 0.707, "step": 7906 }, { "epoch": 0.86, "learning_rate": 9.997300252232966e-07, "loss": 0.7188, "step": 7907 }, { "epoch": 0.86, "learning_rate": 9.981938693909221e-07, "loss": 0.7427, "step": 7908 }, { "epoch": 0.86, "learning_rate": 9.96658832671672e-07, "loss": 0.7139, "step": 7909 }, { "epoch": 0.86, "learning_rate": 9.95124915256378e-07, "loss": 0.8203, "step": 7910 }, { "epoch": 0.86, "learning_rate": 9.935921173357444e-07, "loss": 0.6428, "step": 7911 }, { "epoch": 0.86, "learning_rate": 9.920604391003285e-07, "loss": 0.7056, "step": 7912 }, { "epoch": 0.86, "learning_rate": 9.905298807405472e-07, "loss": 0.752, "step": 7913 }, { "epoch": 0.86, "learning_rate": 9.890004424466825e-07, "loss": 0.6514, "step": 7914 }, { "epoch": 0.86, "learning_rate": 9.874721244088793e-07, "loss": 0.6312, "step": 7915 }, { "epoch": 0.86, "learning_rate": 9.859449268171328e-07, "loss": 0.6294, "step": 7916 }, { "epoch": 0.86, "learning_rate": 9.844188498613117e-07, "loss": 0.7236, "step": 7917 }, { "epoch": 0.86, "learning_rate": 9.82893893731135e-07, "loss": 0.6545, "step": 7918 }, { "epoch": 0.86, "learning_rate": 9.81370058616188e-07, "loss": 0.6431, "step": 7919 }, { "epoch": 0.86, "learning_rate": 9.798473447059153e-07, "loss": 0.7183, "step": 7920 }, { "epoch": 0.86, "learning_rate": 9.783257521896228e-07, "loss": 0.79, "step": 7921 }, { "epoch": 0.86, "learning_rate": 9.768052812564766e-07, "loss": 0.8225, "step": 7922 }, { "epoch": 0.86, "learning_rate": 9.752859320955045e-07, "loss": 0.6868, "step": 7923 }, { "epoch": 0.86, "learning_rate": 9.737677048955896e-07, "loss": 0.7024, "step": 7924 }, { "epoch": 0.86, "learning_rate": 9.722505998454812e-07, "loss": 0.6709, "step": 7925 }, { "epoch": 0.86, "learning_rate": 9.707346171337895e-07, "loss": 0.6309, "step": 7926 }, { "epoch": 0.86, "learning_rate": 9.69219756948978e-07, "loss": 0.719, "step": 7927 }, { "epoch": 0.86, "learning_rate": 9.677060194793808e-07, "loss": 0.5967, "step": 7928 }, { "epoch": 0.86, "learning_rate": 9.661934049131815e-07, "loss": 0.7075, "step": 7929 }, { "epoch": 0.86, "learning_rate": 9.646819134384344e-07, "loss": 0.6292, "step": 7930 }, { "epoch": 0.86, "learning_rate": 9.631715452430501e-07, "loss": 0.6621, "step": 7931 }, { "epoch": 0.86, "learning_rate": 9.616623005147952e-07, "loss": 0.6335, "step": 7932 }, { "epoch": 0.86, "learning_rate": 9.601541794413017e-07, "loss": 0.6699, "step": 7933 }, { "epoch": 0.86, "learning_rate": 9.58647182210064e-07, "loss": 0.7305, "step": 7934 }, { "epoch": 0.86, "learning_rate": 9.571413090084281e-07, "loss": 0.558, "step": 7935 }, { "epoch": 0.86, "learning_rate": 9.556365600236107e-07, "loss": 0.6196, "step": 7936 }, { "epoch": 0.86, "learning_rate": 9.541329354426787e-07, "loss": 0.6335, "step": 7937 }, { "epoch": 0.86, "learning_rate": 9.526304354525672e-07, "loss": 0.7329, "step": 7938 }, { "epoch": 0.86, "learning_rate": 9.51129060240068e-07, "loss": 0.6748, "step": 7939 }, { "epoch": 0.86, "learning_rate": 9.496288099918327e-07, "loss": 0.687, "step": 7940 }, { "epoch": 0.86, "learning_rate": 9.481296848943744e-07, "loss": 0.6667, "step": 7941 }, { "epoch": 0.86, "learning_rate": 9.466316851340684e-07, "loss": 0.6257, "step": 7942 }, { "epoch": 0.86, "learning_rate": 9.451348108971425e-07, "loss": 0.6763, "step": 7943 }, { "epoch": 0.86, "learning_rate": 9.436390623696911e-07, "loss": 0.7405, "step": 7944 }, { "epoch": 0.86, "learning_rate": 9.421444397376711e-07, "loss": 0.5449, "step": 7945 }, { "epoch": 0.87, "learning_rate": 9.406509431868893e-07, "loss": 0.6221, "step": 7946 }, { "epoch": 0.87, "learning_rate": 9.39158572903024e-07, "loss": 0.7754, "step": 7947 }, { "epoch": 0.87, "learning_rate": 9.37667329071602e-07, "loss": 0.6125, "step": 7948 }, { "epoch": 0.87, "learning_rate": 9.361772118780211e-07, "loss": 0.665, "step": 7949 }, { "epoch": 0.87, "learning_rate": 9.346882215075348e-07, "loss": 0.5747, "step": 7950 }, { "epoch": 0.87, "learning_rate": 9.33200358145252e-07, "loss": 0.6841, "step": 7951 }, { "epoch": 0.87, "learning_rate": 9.317136219761469e-07, "loss": 0.6768, "step": 7952 }, { "epoch": 0.87, "learning_rate": 9.302280131850538e-07, "loss": 0.6296, "step": 7953 }, { "epoch": 0.87, "learning_rate": 9.287435319566618e-07, "loss": 0.7515, "step": 7954 }, { "epoch": 0.87, "learning_rate": 9.272601784755264e-07, "loss": 0.8115, "step": 7955 }, { "epoch": 0.87, "learning_rate": 9.257779529260558e-07, "loss": 0.6008, "step": 7956 }, { "epoch": 0.87, "learning_rate": 9.242968554925225e-07, "loss": 0.6768, "step": 7957 }, { "epoch": 0.87, "learning_rate": 9.228168863590603e-07, "loss": 0.7002, "step": 7958 }, { "epoch": 0.87, "learning_rate": 9.213380457096588e-07, "loss": 0.6768, "step": 7959 }, { "epoch": 0.87, "learning_rate": 9.198603337281687e-07, "loss": 0.6248, "step": 7960 }, { "epoch": 0.87, "learning_rate": 9.183837505983029e-07, "loss": 0.7756, "step": 7961 }, { "epoch": 0.87, "learning_rate": 9.16908296503628e-07, "loss": 0.6741, "step": 7962 }, { "epoch": 0.87, "learning_rate": 9.154339716275762e-07, "loss": 0.6226, "step": 7963 }, { "epoch": 0.87, "learning_rate": 9.139607761534374e-07, "loss": 0.6509, "step": 7964 }, { "epoch": 0.87, "learning_rate": 9.124887102643576e-07, "loss": 0.637, "step": 7965 }, { "epoch": 0.87, "learning_rate": 9.110177741433501e-07, "loss": 0.5364, "step": 7966 }, { "epoch": 0.87, "learning_rate": 9.095479679732788e-07, "loss": 0.7317, "step": 7967 }, { "epoch": 0.87, "learning_rate": 9.080792919368697e-07, "loss": 0.7585, "step": 7968 }, { "epoch": 0.87, "learning_rate": 9.06611746216719e-07, "loss": 0.6318, "step": 7969 }, { "epoch": 0.87, "learning_rate": 9.051453309952641e-07, "loss": 0.6921, "step": 7970 }, { "epoch": 0.87, "learning_rate": 9.036800464548157e-07, "loss": 0.603, "step": 7971 }, { "epoch": 0.87, "learning_rate": 9.022158927775404e-07, "loss": 0.7246, "step": 7972 }, { "epoch": 0.87, "learning_rate": 9.007528701454593e-07, "loss": 0.6023, "step": 7973 }, { "epoch": 0.87, "learning_rate": 8.992909787404602e-07, "loss": 0.7454, "step": 7974 }, { "epoch": 0.87, "learning_rate": 8.978302187442833e-07, "loss": 0.7593, "step": 7975 }, { "epoch": 0.87, "learning_rate": 8.963705903385344e-07, "loss": 0.6597, "step": 7976 }, { "epoch": 0.87, "learning_rate": 8.949120937046751e-07, "loss": 0.6091, "step": 7977 }, { "epoch": 0.87, "learning_rate": 8.934547290240269e-07, "loss": 0.6482, "step": 7978 }, { "epoch": 0.87, "learning_rate": 8.919984964777706e-07, "loss": 0.7056, "step": 7979 }, { "epoch": 0.87, "learning_rate": 8.905433962469489e-07, "loss": 0.7241, "step": 7980 }, { "epoch": 0.87, "learning_rate": 8.890894285124585e-07, "loss": 0.5358, "step": 7981 }, { "epoch": 0.87, "learning_rate": 8.876365934550579e-07, "loss": 0.7573, "step": 7982 }, { "epoch": 0.87, "learning_rate": 8.861848912553672e-07, "loss": 0.7559, "step": 7983 }, { "epoch": 0.87, "learning_rate": 8.847343220938608e-07, "loss": 0.6963, "step": 7984 }, { "epoch": 0.87, "learning_rate": 8.832848861508781e-07, "loss": 0.7393, "step": 7985 }, { "epoch": 0.87, "learning_rate": 8.818365836066101e-07, "loss": 0.6819, "step": 7986 }, { "epoch": 0.87, "learning_rate": 8.803894146411118e-07, "loss": 0.6614, "step": 7987 }, { "epoch": 0.87, "learning_rate": 8.789433794343016e-07, "loss": 0.7234, "step": 7988 }, { "epoch": 0.87, "learning_rate": 8.774984781659468e-07, "loss": 0.6738, "step": 7989 }, { "epoch": 0.87, "learning_rate": 8.760547110156803e-07, "loss": 0.6697, "step": 7990 }, { "epoch": 0.87, "learning_rate": 8.746120781629952e-07, "loss": 0.5862, "step": 7991 }, { "epoch": 0.87, "learning_rate": 8.731705797872369e-07, "loss": 0.7769, "step": 7992 }, { "epoch": 0.87, "learning_rate": 8.717302160676178e-07, "loss": 0.5564, "step": 7993 }, { "epoch": 0.87, "learning_rate": 8.702909871832022e-07, "loss": 0.7261, "step": 7994 }, { "epoch": 0.87, "learning_rate": 8.688528933129158e-07, "loss": 0.6787, "step": 7995 }, { "epoch": 0.87, "learning_rate": 8.67415934635546e-07, "loss": 0.6702, "step": 7996 }, { "epoch": 0.87, "learning_rate": 8.659801113297372e-07, "loss": 0.7158, "step": 7997 }, { "epoch": 0.87, "learning_rate": 8.645454235739903e-07, "loss": 0.6948, "step": 7998 }, { "epoch": 0.87, "learning_rate": 8.631118715466702e-07, "loss": 0.7134, "step": 7999 }, { "epoch": 0.87, "learning_rate": 8.616794554259944e-07, "loss": 0.6978, "step": 8000 }, { "epoch": 0.87, "learning_rate": 8.602481753900427e-07, "loss": 0.6709, "step": 8001 }, { "epoch": 0.87, "learning_rate": 8.588180316167549e-07, "loss": 0.6807, "step": 8002 }, { "epoch": 0.87, "learning_rate": 8.573890242839256e-07, "loss": 0.6855, "step": 8003 }, { "epoch": 0.87, "learning_rate": 8.559611535692136e-07, "loss": 0.6941, "step": 8004 }, { "epoch": 0.87, "learning_rate": 8.545344196501293e-07, "loss": 0.6904, "step": 8005 }, { "epoch": 0.87, "learning_rate": 8.53108822704044e-07, "loss": 0.6907, "step": 8006 }, { "epoch": 0.87, "learning_rate": 8.516843629081983e-07, "loss": 0.6963, "step": 8007 }, { "epoch": 0.87, "learning_rate": 8.502610404396738e-07, "loss": 0.7239, "step": 8008 }, { "epoch": 0.87, "learning_rate": 8.488388554754223e-07, "loss": 0.592, "step": 8009 }, { "epoch": 0.87, "learning_rate": 8.474178081922524e-07, "loss": 0.6719, "step": 8010 }, { "epoch": 0.87, "learning_rate": 8.459978987668271e-07, "loss": 0.7065, "step": 8011 }, { "epoch": 0.87, "learning_rate": 8.445791273756753e-07, "loss": 0.7273, "step": 8012 }, { "epoch": 0.87, "learning_rate": 8.431614941951749e-07, "loss": 0.7437, "step": 8013 }, { "epoch": 0.87, "learning_rate": 8.417449994015703e-07, "loss": 0.6377, "step": 8014 }, { "epoch": 0.87, "learning_rate": 8.403296431709595e-07, "loss": 0.6765, "step": 8015 }, { "epoch": 0.87, "learning_rate": 8.389154256793042e-07, "loss": 0.6479, "step": 8016 }, { "epoch": 0.87, "learning_rate": 8.37502347102418e-07, "loss": 0.5925, "step": 8017 }, { "epoch": 0.87, "learning_rate": 8.360904076159804e-07, "loss": 0.6436, "step": 8018 }, { "epoch": 0.87, "learning_rate": 8.346796073955199e-07, "loss": 0.7136, "step": 8019 }, { "epoch": 0.87, "learning_rate": 8.332699466164307e-07, "loss": 0.7397, "step": 8020 }, { "epoch": 0.87, "learning_rate": 8.318614254539659e-07, "loss": 0.6543, "step": 8021 }, { "epoch": 0.87, "learning_rate": 8.304540440832299e-07, "loss": 0.7563, "step": 8022 }, { "epoch": 0.87, "learning_rate": 8.290478026791926e-07, "loss": 0.7043, "step": 8023 }, { "epoch": 0.87, "learning_rate": 8.276427014166766e-07, "loss": 0.5828, "step": 8024 }, { "epoch": 0.87, "learning_rate": 8.262387404703654e-07, "loss": 0.678, "step": 8025 }, { "epoch": 0.87, "learning_rate": 8.248359200148059e-07, "loss": 0.7075, "step": 8026 }, { "epoch": 0.87, "learning_rate": 8.234342402243934e-07, "loss": 0.6743, "step": 8027 }, { "epoch": 0.87, "learning_rate": 8.22033701273387e-07, "loss": 0.6641, "step": 8028 }, { "epoch": 0.87, "learning_rate": 8.206343033359043e-07, "loss": 0.6161, "step": 8029 }, { "epoch": 0.87, "learning_rate": 8.192360465859173e-07, "loss": 0.6111, "step": 8030 }, { "epoch": 0.87, "learning_rate": 8.178389311972612e-07, "loss": 0.7197, "step": 8031 }, { "epoch": 0.87, "learning_rate": 8.16442957343625e-07, "loss": 0.7114, "step": 8032 }, { "epoch": 0.87, "learning_rate": 8.150481251985565e-07, "loss": 0.6169, "step": 8033 }, { "epoch": 0.87, "learning_rate": 8.136544349354669e-07, "loss": 0.6577, "step": 8034 }, { "epoch": 0.87, "learning_rate": 8.122618867276156e-07, "loss": 0.6943, "step": 8035 }, { "epoch": 0.87, "learning_rate": 8.108704807481282e-07, "loss": 0.6616, "step": 8036 }, { "epoch": 0.87, "learning_rate": 8.094802171699889e-07, "loss": 0.6392, "step": 8037 }, { "epoch": 0.88, "learning_rate": 8.080910961660305e-07, "loss": 0.6179, "step": 8038 }, { "epoch": 0.88, "learning_rate": 8.067031179089535e-07, "loss": 0.6604, "step": 8039 }, { "epoch": 0.88, "learning_rate": 8.053162825713135e-07, "loss": 0.7925, "step": 8040 }, { "epoch": 0.88, "learning_rate": 8.03930590325519e-07, "loss": 0.6919, "step": 8041 }, { "epoch": 0.88, "learning_rate": 8.025460413438457e-07, "loss": 0.6924, "step": 8042 }, { "epoch": 0.88, "learning_rate": 8.011626357984182e-07, "loss": 0.728, "step": 8043 }, { "epoch": 0.88, "learning_rate": 7.997803738612209e-07, "loss": 0.6902, "step": 8044 }, { "epoch": 0.88, "learning_rate": 7.983992557041053e-07, "loss": 0.6587, "step": 8045 }, { "epoch": 0.88, "learning_rate": 7.970192814987676e-07, "loss": 0.6841, "step": 8046 }, { "epoch": 0.88, "learning_rate": 7.956404514167693e-07, "loss": 0.6855, "step": 8047 }, { "epoch": 0.88, "learning_rate": 7.942627656295299e-07, "loss": 0.6887, "step": 8048 }, { "epoch": 0.88, "learning_rate": 7.928862243083191e-07, "loss": 0.5811, "step": 8049 }, { "epoch": 0.88, "learning_rate": 7.915108276242755e-07, "loss": 0.6946, "step": 8050 }, { "epoch": 0.88, "learning_rate": 7.901365757483859e-07, "loss": 0.6667, "step": 8051 }, { "epoch": 0.88, "learning_rate": 7.887634688515e-07, "loss": 0.6897, "step": 8052 }, { "epoch": 0.88, "learning_rate": 7.873915071043248e-07, "loss": 0.708, "step": 8053 }, { "epoch": 0.88, "learning_rate": 7.860206906774192e-07, "loss": 0.6638, "step": 8054 }, { "epoch": 0.88, "learning_rate": 7.846510197412105e-07, "loss": 0.6018, "step": 8055 }, { "epoch": 0.88, "learning_rate": 7.832824944659768e-07, "loss": 0.6055, "step": 8056 }, { "epoch": 0.88, "learning_rate": 7.819151150218507e-07, "loss": 0.6465, "step": 8057 }, { "epoch": 0.88, "learning_rate": 7.805488815788287e-07, "loss": 0.7466, "step": 8058 }, { "epoch": 0.88, "learning_rate": 7.791837943067626e-07, "loss": 0.6567, "step": 8059 }, { "epoch": 0.88, "learning_rate": 7.77819853375359e-07, "loss": 0.7444, "step": 8060 }, { "epoch": 0.88, "learning_rate": 7.764570589541876e-07, "loss": 0.6687, "step": 8061 }, { "epoch": 0.88, "learning_rate": 7.750954112126686e-07, "loss": 0.6938, "step": 8062 }, { "epoch": 0.88, "learning_rate": 7.737349103200842e-07, "loss": 0.5852, "step": 8063 }, { "epoch": 0.88, "learning_rate": 7.723755564455771e-07, "loss": 0.6689, "step": 8064 }, { "epoch": 0.88, "learning_rate": 7.710173497581386e-07, "loss": 0.7339, "step": 8065 }, { "epoch": 0.88, "learning_rate": 7.696602904266237e-07, "loss": 0.7312, "step": 8066 }, { "epoch": 0.88, "learning_rate": 7.683043786197464e-07, "loss": 0.6313, "step": 8067 }, { "epoch": 0.88, "learning_rate": 7.669496145060706e-07, "loss": 0.6797, "step": 8068 }, { "epoch": 0.88, "learning_rate": 7.655959982540251e-07, "loss": 0.8105, "step": 8069 }, { "epoch": 0.88, "learning_rate": 7.642435300318906e-07, "loss": 0.6887, "step": 8070 }, { "epoch": 0.88, "learning_rate": 7.628922100078062e-07, "loss": 0.6084, "step": 8071 }, { "epoch": 0.88, "learning_rate": 7.615420383497741e-07, "loss": 0.7593, "step": 8072 }, { "epoch": 0.88, "learning_rate": 7.601930152256421e-07, "loss": 0.6816, "step": 8073 }, { "epoch": 0.88, "learning_rate": 7.588451408031272e-07, "loss": 0.739, "step": 8074 }, { "epoch": 0.88, "learning_rate": 7.574984152497988e-07, "loss": 0.6665, "step": 8075 }, { "epoch": 0.88, "learning_rate": 7.561528387330797e-07, "loss": 0.7412, "step": 8076 }, { "epoch": 0.88, "learning_rate": 7.54808411420257e-07, "loss": 0.7456, "step": 8077 }, { "epoch": 0.88, "learning_rate": 7.534651334784671e-07, "loss": 0.6587, "step": 8078 }, { "epoch": 0.88, "learning_rate": 7.521230050747086e-07, "loss": 0.7119, "step": 8079 }, { "epoch": 0.88, "learning_rate": 7.507820263758403e-07, "loss": 0.677, "step": 8080 }, { "epoch": 0.88, "learning_rate": 7.494421975485689e-07, "loss": 0.6689, "step": 8081 }, { "epoch": 0.88, "learning_rate": 7.481035187594621e-07, "loss": 0.7092, "step": 8082 }, { "epoch": 0.88, "learning_rate": 7.467659901749536e-07, "loss": 0.6958, "step": 8083 }, { "epoch": 0.88, "learning_rate": 7.454296119613191e-07, "loss": 0.7556, "step": 8084 }, { "epoch": 0.88, "learning_rate": 7.440943842847003e-07, "loss": 0.7085, "step": 8085 }, { "epoch": 0.88, "learning_rate": 7.427603073110967e-07, "loss": 0.6294, "step": 8086 }, { "epoch": 0.88, "learning_rate": 7.414273812063577e-07, "loss": 0.6885, "step": 8087 }, { "epoch": 0.88, "learning_rate": 7.400956061361975e-07, "loss": 0.626, "step": 8088 }, { "epoch": 0.88, "learning_rate": 7.387649822661802e-07, "loss": 0.6992, "step": 8089 }, { "epoch": 0.88, "learning_rate": 7.374355097617325e-07, "loss": 0.6379, "step": 8090 }, { "epoch": 0.88, "learning_rate": 7.361071887881376e-07, "loss": 0.6656, "step": 8091 }, { "epoch": 0.88, "learning_rate": 7.347800195105271e-07, "loss": 0.6821, "step": 8092 }, { "epoch": 0.88, "learning_rate": 7.334540020939018e-07, "loss": 0.5752, "step": 8093 }, { "epoch": 0.88, "learning_rate": 7.321291367031135e-07, "loss": 0.5929, "step": 8094 }, { "epoch": 0.88, "learning_rate": 7.308054235028672e-07, "loss": 0.792, "step": 8095 }, { "epoch": 0.88, "learning_rate": 7.294828626577321e-07, "loss": 0.6577, "step": 8096 }, { "epoch": 0.88, "learning_rate": 7.281614543321269e-07, "loss": 0.6697, "step": 8097 }, { "epoch": 0.88, "learning_rate": 7.268411986903312e-07, "loss": 0.6196, "step": 8098 }, { "epoch": 0.88, "learning_rate": 7.255220958964826e-07, "loss": 0.6868, "step": 8099 }, { "epoch": 0.88, "learning_rate": 7.242041461145688e-07, "loss": 0.5989, "step": 8100 }, { "epoch": 0.88, "learning_rate": 7.22887349508441e-07, "loss": 0.623, "step": 8101 }, { "epoch": 0.88, "learning_rate": 7.21571706241807e-07, "loss": 0.6189, "step": 8102 }, { "epoch": 0.88, "learning_rate": 7.202572164782263e-07, "loss": 0.7463, "step": 8103 }, { "epoch": 0.88, "learning_rate": 7.189438803811166e-07, "loss": 0.6528, "step": 8104 }, { "epoch": 0.88, "learning_rate": 7.176316981137565e-07, "loss": 0.6016, "step": 8105 }, { "epoch": 0.88, "learning_rate": 7.163206698392744e-07, "loss": 0.6755, "step": 8106 }, { "epoch": 0.88, "learning_rate": 7.150107957206609e-07, "loss": 0.5713, "step": 8107 }, { "epoch": 0.88, "learning_rate": 7.13702075920758e-07, "loss": 0.6157, "step": 8108 }, { "epoch": 0.88, "learning_rate": 7.12394510602269e-07, "loss": 0.6562, "step": 8109 }, { "epoch": 0.88, "learning_rate": 7.110880999277536e-07, "loss": 0.6453, "step": 8110 }, { "epoch": 0.88, "learning_rate": 7.0978284405962e-07, "loss": 0.7212, "step": 8111 }, { "epoch": 0.88, "learning_rate": 7.084787431601437e-07, "loss": 0.6943, "step": 8112 }, { "epoch": 0.88, "learning_rate": 7.071757973914528e-07, "loss": 0.6946, "step": 8113 }, { "epoch": 0.88, "learning_rate": 7.058740069155268e-07, "loss": 0.769, "step": 8114 }, { "epoch": 0.88, "learning_rate": 7.045733718942094e-07, "loss": 0.6577, "step": 8115 }, { "epoch": 0.88, "learning_rate": 7.032738924891936e-07, "loss": 0.5854, "step": 8116 }, { "epoch": 0.88, "learning_rate": 7.019755688620322e-07, "loss": 0.658, "step": 8117 }, { "epoch": 0.88, "learning_rate": 7.006784011741374e-07, "loss": 0.5435, "step": 8118 }, { "epoch": 0.88, "learning_rate": 6.99382389586769e-07, "loss": 0.8149, "step": 8119 }, { "epoch": 0.88, "learning_rate": 6.980875342610527e-07, "loss": 0.5908, "step": 8120 }, { "epoch": 0.88, "learning_rate": 6.96793835357964e-07, "loss": 0.644, "step": 8121 }, { "epoch": 0.88, "learning_rate": 6.955012930383375e-07, "loss": 0.6812, "step": 8122 }, { "epoch": 0.88, "learning_rate": 6.942099074628639e-07, "loss": 0.6572, "step": 8123 }, { "epoch": 0.88, "learning_rate": 6.9291967879209e-07, "loss": 0.7192, "step": 8124 }, { "epoch": 0.88, "learning_rate": 6.916306071864154e-07, "loss": 0.7095, "step": 8125 }, { "epoch": 0.88, "learning_rate": 6.903426928061019e-07, "loss": 0.7837, "step": 8126 }, { "epoch": 0.88, "learning_rate": 6.890559358112614e-07, "loss": 0.6882, "step": 8127 }, { "epoch": 0.88, "learning_rate": 6.877703363618671e-07, "loss": 0.7378, "step": 8128 }, { "epoch": 0.88, "learning_rate": 6.864858946177456e-07, "loss": 0.5969, "step": 8129 }, { "epoch": 0.89, "learning_rate": 6.852026107385756e-07, "loss": 0.6042, "step": 8130 }, { "epoch": 0.89, "learning_rate": 6.839204848839031e-07, "loss": 0.7141, "step": 8131 }, { "epoch": 0.89, "learning_rate": 6.826395172131206e-07, "loss": 0.6802, "step": 8132 }, { "epoch": 0.89, "learning_rate": 6.813597078854772e-07, "loss": 0.6086, "step": 8133 }, { "epoch": 0.89, "learning_rate": 6.800810570600824e-07, "loss": 0.6177, "step": 8134 }, { "epoch": 0.89, "learning_rate": 6.788035648958979e-07, "loss": 0.7209, "step": 8135 }, { "epoch": 0.89, "learning_rate": 6.775272315517423e-07, "loss": 0.7739, "step": 8136 }, { "epoch": 0.89, "learning_rate": 6.76252057186293e-07, "loss": 0.6621, "step": 8137 }, { "epoch": 0.89, "learning_rate": 6.749780419580787e-07, "loss": 0.7749, "step": 8138 }, { "epoch": 0.89, "learning_rate": 6.737051860254861e-07, "loss": 0.6533, "step": 8139 }, { "epoch": 0.89, "learning_rate": 6.724334895467588e-07, "loss": 0.6985, "step": 8140 }, { "epoch": 0.89, "learning_rate": 6.711629526799946e-07, "loss": 0.6567, "step": 8141 }, { "epoch": 0.89, "learning_rate": 6.698935755831493e-07, "loss": 0.6545, "step": 8142 }, { "epoch": 0.89, "learning_rate": 6.686253584140334e-07, "loss": 0.6147, "step": 8143 }, { "epoch": 0.89, "learning_rate": 6.673583013303098e-07, "loss": 0.6277, "step": 8144 }, { "epoch": 0.89, "learning_rate": 6.660924044895035e-07, "loss": 0.7954, "step": 8145 }, { "epoch": 0.89, "learning_rate": 6.648276680489896e-07, "loss": 0.7073, "step": 8146 }, { "epoch": 0.89, "learning_rate": 6.635640921660014e-07, "loss": 0.77, "step": 8147 }, { "epoch": 0.89, "learning_rate": 6.623016769976309e-07, "loss": 0.6414, "step": 8148 }, { "epoch": 0.89, "learning_rate": 6.610404227008182e-07, "loss": 0.6965, "step": 8149 }, { "epoch": 0.89, "learning_rate": 6.597803294323668e-07, "loss": 0.7698, "step": 8150 }, { "epoch": 0.89, "learning_rate": 6.585213973489335e-07, "loss": 0.7004, "step": 8151 }, { "epoch": 0.89, "learning_rate": 6.572636266070265e-07, "loss": 0.7068, "step": 8152 }, { "epoch": 0.89, "learning_rate": 6.560070173630173e-07, "loss": 0.6299, "step": 8153 }, { "epoch": 0.89, "learning_rate": 6.547515697731244e-07, "loss": 0.7305, "step": 8154 }, { "epoch": 0.89, "learning_rate": 6.534972839934284e-07, "loss": 0.5735, "step": 8155 }, { "epoch": 0.89, "learning_rate": 6.522441601798646e-07, "loss": 0.7124, "step": 8156 }, { "epoch": 0.89, "learning_rate": 6.509921984882195e-07, "loss": 0.6787, "step": 8157 }, { "epoch": 0.89, "learning_rate": 6.497413990741397e-07, "loss": 0.8345, "step": 8158 }, { "epoch": 0.89, "learning_rate": 6.484917620931264e-07, "loss": 0.6545, "step": 8159 }, { "epoch": 0.89, "learning_rate": 6.472432877005341e-07, "loss": 0.7368, "step": 8160 }, { "epoch": 0.89, "learning_rate": 6.459959760515766e-07, "loss": 0.7261, "step": 8161 }, { "epoch": 0.89, "learning_rate": 6.447498273013208e-07, "loss": 0.7451, "step": 8162 }, { "epoch": 0.89, "learning_rate": 6.435048416046863e-07, "loss": 0.6572, "step": 8163 }, { "epoch": 0.89, "learning_rate": 6.422610191164535e-07, "loss": 0.6001, "step": 8164 }, { "epoch": 0.89, "learning_rate": 6.410183599912534e-07, "loss": 0.6768, "step": 8165 }, { "epoch": 0.89, "learning_rate": 6.397768643835755e-07, "loss": 0.707, "step": 8166 }, { "epoch": 0.89, "learning_rate": 6.385365324477666e-07, "loss": 0.667, "step": 8167 }, { "epoch": 0.89, "learning_rate": 6.372973643380187e-07, "loss": 0.6995, "step": 8168 }, { "epoch": 0.89, "learning_rate": 6.360593602083942e-07, "loss": 0.6619, "step": 8169 }, { "epoch": 0.89, "learning_rate": 6.348225202128e-07, "loss": 0.6675, "step": 8170 }, { "epoch": 0.89, "learning_rate": 6.335868445049998e-07, "loss": 0.7117, "step": 8171 }, { "epoch": 0.89, "learning_rate": 6.323523332386172e-07, "loss": 0.4932, "step": 8172 }, { "epoch": 0.89, "learning_rate": 6.311189865671242e-07, "loss": 0.5437, "step": 8173 }, { "epoch": 0.89, "learning_rate": 6.298868046438533e-07, "loss": 0.572, "step": 8174 }, { "epoch": 0.89, "learning_rate": 6.286557876219912e-07, "loss": 0.7471, "step": 8175 }, { "epoch": 0.89, "learning_rate": 6.274259356545775e-07, "loss": 0.6108, "step": 8176 }, { "epoch": 0.89, "learning_rate": 6.261972488945089e-07, "loss": 0.7097, "step": 8177 }, { "epoch": 0.89, "learning_rate": 6.249697274945377e-07, "loss": 0.7017, "step": 8178 }, { "epoch": 0.89, "learning_rate": 6.237433716072705e-07, "loss": 0.6521, "step": 8179 }, { "epoch": 0.89, "learning_rate": 6.225181813851688e-07, "loss": 0.6218, "step": 8180 }, { "epoch": 0.89, "learning_rate": 6.212941569805508e-07, "loss": 0.7087, "step": 8181 }, { "epoch": 0.89, "learning_rate": 6.200712985455858e-07, "loss": 0.8149, "step": 8182 }, { "epoch": 0.89, "learning_rate": 6.188496062323035e-07, "loss": 0.6931, "step": 8183 }, { "epoch": 0.89, "learning_rate": 6.176290801925822e-07, "loss": 0.7363, "step": 8184 }, { "epoch": 0.89, "learning_rate": 6.164097205781616e-07, "loss": 0.6602, "step": 8185 }, { "epoch": 0.89, "learning_rate": 6.151915275406339e-07, "loss": 0.5723, "step": 8186 }, { "epoch": 0.89, "learning_rate": 6.139745012314424e-07, "loss": 0.7111, "step": 8187 }, { "epoch": 0.89, "learning_rate": 6.127586418018938e-07, "loss": 0.6353, "step": 8188 }, { "epoch": 0.89, "learning_rate": 6.115439494031428e-07, "loss": 0.6436, "step": 8189 }, { "epoch": 0.89, "learning_rate": 6.103304241862006e-07, "loss": 0.5991, "step": 8190 }, { "epoch": 0.89, "learning_rate": 6.091180663019358e-07, "loss": 0.751, "step": 8191 }, { "epoch": 0.89, "learning_rate": 6.079068759010676e-07, "loss": 0.6311, "step": 8192 }, { "epoch": 0.89, "learning_rate": 6.066968531341721e-07, "loss": 0.6719, "step": 8193 }, { "epoch": 0.89, "learning_rate": 6.054879981516836e-07, "loss": 0.7783, "step": 8194 }, { "epoch": 0.89, "learning_rate": 6.042803111038842e-07, "loss": 0.5327, "step": 8195 }, { "epoch": 0.89, "learning_rate": 6.030737921409169e-07, "loss": 0.8005, "step": 8196 }, { "epoch": 0.89, "learning_rate": 6.018684414127762e-07, "loss": 0.646, "step": 8197 }, { "epoch": 0.89, "learning_rate": 6.006642590693146e-07, "loss": 0.6216, "step": 8198 }, { "epoch": 0.89, "learning_rate": 5.994612452602344e-07, "loss": 0.6658, "step": 8199 }, { "epoch": 0.89, "learning_rate": 5.982594001350994e-07, "loss": 0.6614, "step": 8200 }, { "epoch": 0.89, "learning_rate": 5.97058723843319e-07, "loss": 0.7817, "step": 8201 }, { "epoch": 0.89, "learning_rate": 5.95859216534167e-07, "loss": 0.6897, "step": 8202 }, { "epoch": 0.89, "learning_rate": 5.946608783567642e-07, "loss": 0.7251, "step": 8203 }, { "epoch": 0.89, "learning_rate": 5.934637094600892e-07, "loss": 0.6938, "step": 8204 }, { "epoch": 0.89, "learning_rate": 5.922677099929785e-07, "loss": 0.6794, "step": 8205 }, { "epoch": 0.89, "learning_rate": 5.910728801041166e-07, "loss": 0.7158, "step": 8206 }, { "epoch": 0.89, "learning_rate": 5.898792199420445e-07, "loss": 0.6096, "step": 8207 }, { "epoch": 0.89, "learning_rate": 5.886867296551646e-07, "loss": 0.6113, "step": 8208 }, { "epoch": 0.89, "learning_rate": 5.87495409391724e-07, "loss": 0.5903, "step": 8209 }, { "epoch": 0.89, "learning_rate": 5.863052592998308e-07, "loss": 0.5969, "step": 8210 }, { "epoch": 0.89, "learning_rate": 5.851162795274445e-07, "loss": 0.6409, "step": 8211 }, { "epoch": 0.89, "learning_rate": 5.839284702223802e-07, "loss": 0.6802, "step": 8212 }, { "epoch": 0.89, "learning_rate": 5.827418315323097e-07, "loss": 0.6077, "step": 8213 }, { "epoch": 0.89, "learning_rate": 5.815563636047539e-07, "loss": 0.7041, "step": 8214 }, { "epoch": 0.89, "learning_rate": 5.803720665870927e-07, "loss": 0.6677, "step": 8215 }, { "epoch": 0.89, "learning_rate": 5.791889406265583e-07, "loss": 0.6919, "step": 8216 }, { "epoch": 0.89, "learning_rate": 5.780069858702397e-07, "loss": 0.6113, "step": 8217 }, { "epoch": 0.89, "learning_rate": 5.768262024650773e-07, "loss": 0.7085, "step": 8218 }, { "epoch": 0.89, "learning_rate": 5.75646590557869e-07, "loss": 0.7224, "step": 8219 }, { "epoch": 0.89, "learning_rate": 5.744681502952621e-07, "loss": 0.7683, "step": 8220 }, { "epoch": 0.89, "learning_rate": 5.732908818237659e-07, "loss": 0.6357, "step": 8221 }, { "epoch": 0.9, "learning_rate": 5.721147852897347e-07, "loss": 0.6404, "step": 8222 }, { "epoch": 0.9, "learning_rate": 5.709398608393835e-07, "loss": 0.6125, "step": 8223 }, { "epoch": 0.9, "learning_rate": 5.697661086187823e-07, "loss": 0.8262, "step": 8224 }, { "epoch": 0.9, "learning_rate": 5.685935287738509e-07, "loss": 0.7451, "step": 8225 }, { "epoch": 0.9, "learning_rate": 5.674221214503639e-07, "loss": 0.7012, "step": 8226 }, { "epoch": 0.9, "learning_rate": 5.662518867939571e-07, "loss": 0.8213, "step": 8227 }, { "epoch": 0.9, "learning_rate": 5.650828249501106e-07, "loss": 0.6177, "step": 8228 }, { "epoch": 0.9, "learning_rate": 5.63914936064165e-07, "loss": 0.7417, "step": 8229 }, { "epoch": 0.9, "learning_rate": 5.627482202813128e-07, "loss": 0.6462, "step": 8230 }, { "epoch": 0.9, "learning_rate": 5.615826777466016e-07, "loss": 0.676, "step": 8231 }, { "epoch": 0.9, "learning_rate": 5.604183086049342e-07, "loss": 0.7856, "step": 8232 }, { "epoch": 0.9, "learning_rate": 5.592551130010626e-07, "loss": 0.7183, "step": 8233 }, { "epoch": 0.9, "learning_rate": 5.580930910795978e-07, "loss": 0.7231, "step": 8234 }, { "epoch": 0.9, "learning_rate": 5.569322429850055e-07, "loss": 0.7029, "step": 8235 }, { "epoch": 0.9, "learning_rate": 5.557725688616001e-07, "loss": 0.6443, "step": 8236 }, { "epoch": 0.9, "learning_rate": 5.546140688535562e-07, "loss": 0.6594, "step": 8237 }, { "epoch": 0.9, "learning_rate": 5.53456743104901e-07, "loss": 0.6951, "step": 8238 }, { "epoch": 0.9, "learning_rate": 5.523005917595093e-07, "loss": 0.7261, "step": 8239 }, { "epoch": 0.9, "learning_rate": 5.511456149611194e-07, "loss": 0.7217, "step": 8240 }, { "epoch": 0.9, "learning_rate": 5.499918128533155e-07, "loss": 0.603, "step": 8241 }, { "epoch": 0.9, "learning_rate": 5.488391855795416e-07, "loss": 0.6943, "step": 8242 }, { "epoch": 0.9, "learning_rate": 5.476877332830954e-07, "loss": 0.689, "step": 8243 }, { "epoch": 0.9, "learning_rate": 5.465374561071213e-07, "loss": 0.6902, "step": 8244 }, { "epoch": 0.9, "learning_rate": 5.453883541946248e-07, "loss": 0.6731, "step": 8245 }, { "epoch": 0.9, "learning_rate": 5.442404276884683e-07, "loss": 0.6392, "step": 8246 }, { "epoch": 0.9, "learning_rate": 5.430936767313566e-07, "loss": 0.729, "step": 8247 }, { "epoch": 0.9, "learning_rate": 5.41948101465859e-07, "loss": 0.5669, "step": 8248 }, { "epoch": 0.9, "learning_rate": 5.408037020343915e-07, "loss": 0.6997, "step": 8249 }, { "epoch": 0.9, "learning_rate": 5.396604785792281e-07, "loss": 0.6345, "step": 8250 }, { "epoch": 0.9, "learning_rate": 5.385184312424973e-07, "loss": 0.7261, "step": 8251 }, { "epoch": 0.9, "learning_rate": 5.373775601661757e-07, "loss": 0.7764, "step": 8252 }, { "epoch": 0.9, "learning_rate": 5.362378654921008e-07, "loss": 0.6582, "step": 8253 }, { "epoch": 0.9, "learning_rate": 5.350993473619592e-07, "loss": 0.7671, "step": 8254 }, { "epoch": 0.9, "learning_rate": 5.339620059172923e-07, "loss": 0.7856, "step": 8255 }, { "epoch": 0.9, "learning_rate": 5.328258412994958e-07, "loss": 0.6284, "step": 8256 }, { "epoch": 0.9, "learning_rate": 5.316908536498211e-07, "loss": 0.6597, "step": 8257 }, { "epoch": 0.9, "learning_rate": 5.305570431093665e-07, "loss": 0.7329, "step": 8258 }, { "epoch": 0.9, "learning_rate": 5.294244098190926e-07, "loss": 0.6677, "step": 8259 }, { "epoch": 0.9, "learning_rate": 5.282929539198056e-07, "loss": 0.6191, "step": 8260 }, { "epoch": 0.9, "learning_rate": 5.271626755521719e-07, "loss": 0.6426, "step": 8261 }, { "epoch": 0.9, "learning_rate": 5.26033574856708e-07, "loss": 0.688, "step": 8262 }, { "epoch": 0.9, "learning_rate": 5.24905651973785e-07, "loss": 0.6172, "step": 8263 }, { "epoch": 0.9, "learning_rate": 5.237789070436239e-07, "loss": 0.5352, "step": 8264 }, { "epoch": 0.9, "learning_rate": 5.226533402063094e-07, "loss": 0.7869, "step": 8265 }, { "epoch": 0.9, "learning_rate": 5.215289516017685e-07, "loss": 0.6553, "step": 8266 }, { "epoch": 0.9, "learning_rate": 5.204057413697883e-07, "loss": 0.6963, "step": 8267 }, { "epoch": 0.9, "learning_rate": 5.192837096500058e-07, "loss": 0.6372, "step": 8268 }, { "epoch": 0.9, "learning_rate": 5.18162856581913e-07, "loss": 0.6062, "step": 8269 }, { "epoch": 0.9, "learning_rate": 5.170431823048571e-07, "loss": 0.5835, "step": 8270 }, { "epoch": 0.9, "learning_rate": 5.159246869580348e-07, "loss": 0.6775, "step": 8271 }, { "epoch": 0.9, "learning_rate": 5.148073706805001e-07, "loss": 0.6951, "step": 8272 }, { "epoch": 0.9, "learning_rate": 5.136912336111599e-07, "loss": 0.7222, "step": 8273 }, { "epoch": 0.9, "learning_rate": 5.125762758887687e-07, "loss": 0.7144, "step": 8274 }, { "epoch": 0.9, "learning_rate": 5.114624976519434e-07, "loss": 0.7588, "step": 8275 }, { "epoch": 0.9, "learning_rate": 5.103498990391509e-07, "loss": 0.5883, "step": 8276 }, { "epoch": 0.9, "learning_rate": 5.092384801887074e-07, "loss": 0.7075, "step": 8277 }, { "epoch": 0.9, "learning_rate": 5.081282412387878e-07, "loss": 0.6206, "step": 8278 }, { "epoch": 0.9, "learning_rate": 5.070191823274151e-07, "loss": 0.7297, "step": 8279 }, { "epoch": 0.9, "learning_rate": 5.059113035924712e-07, "loss": 0.7112, "step": 8280 }, { "epoch": 0.9, "learning_rate": 5.048046051716892e-07, "loss": 0.572, "step": 8281 }, { "epoch": 0.9, "learning_rate": 5.036990872026515e-07, "loss": 0.7195, "step": 8282 }, { "epoch": 0.9, "learning_rate": 5.025947498227979e-07, "loss": 0.7983, "step": 8283 }, { "epoch": 0.9, "learning_rate": 5.014915931694253e-07, "loss": 0.707, "step": 8284 }, { "epoch": 0.9, "learning_rate": 5.003896173796751e-07, "loss": 0.6292, "step": 8285 }, { "epoch": 0.9, "learning_rate": 4.992888225905467e-07, "loss": 0.6853, "step": 8286 }, { "epoch": 0.9, "learning_rate": 4.981892089388917e-07, "loss": 0.6343, "step": 8287 }, { "epoch": 0.9, "learning_rate": 4.970907765614152e-07, "loss": 0.6897, "step": 8288 }, { "epoch": 0.9, "learning_rate": 4.959935255946769e-07, "loss": 0.6416, "step": 8289 }, { "epoch": 0.9, "learning_rate": 4.948974561750852e-07, "loss": 0.7334, "step": 8290 }, { "epoch": 0.9, "learning_rate": 4.93802568438907e-07, "loss": 0.668, "step": 8291 }, { "epoch": 0.9, "learning_rate": 4.927088625222598e-07, "loss": 0.6719, "step": 8292 }, { "epoch": 0.9, "learning_rate": 4.916163385611094e-07, "loss": 0.6016, "step": 8293 }, { "epoch": 0.9, "learning_rate": 4.905249966912862e-07, "loss": 0.6455, "step": 8294 }, { "epoch": 0.9, "learning_rate": 4.894348370484648e-07, "loss": 0.6467, "step": 8295 }, { "epoch": 0.9, "learning_rate": 4.883458597681722e-07, "loss": 0.7043, "step": 8296 }, { "epoch": 0.9, "learning_rate": 4.872580649857949e-07, "loss": 0.5969, "step": 8297 }, { "epoch": 0.9, "learning_rate": 4.861714528365647e-07, "loss": 0.717, "step": 8298 }, { "epoch": 0.9, "learning_rate": 4.85086023455572e-07, "loss": 0.6064, "step": 8299 }, { "epoch": 0.9, "learning_rate": 4.840017769777605e-07, "loss": 0.6453, "step": 8300 }, { "epoch": 0.9, "learning_rate": 4.829187135379221e-07, "loss": 0.6992, "step": 8301 }, { "epoch": 0.9, "learning_rate": 4.818368332707024e-07, "loss": 0.6664, "step": 8302 }, { "epoch": 0.9, "learning_rate": 4.807561363106072e-07, "loss": 0.5979, "step": 8303 }, { "epoch": 0.9, "learning_rate": 4.796766227919858e-07, "loss": 0.6687, "step": 8304 }, { "epoch": 0.9, "learning_rate": 4.785982928490473e-07, "loss": 0.7578, "step": 8305 }, { "epoch": 0.9, "learning_rate": 4.775211466158469e-07, "loss": 0.6892, "step": 8306 }, { "epoch": 0.9, "learning_rate": 4.764451842262996e-07, "loss": 0.7246, "step": 8307 }, { "epoch": 0.9, "learning_rate": 4.753704058141695e-07, "loss": 0.7261, "step": 8308 }, { "epoch": 0.9, "learning_rate": 4.742968115130719e-07, "loss": 0.6428, "step": 8309 }, { "epoch": 0.9, "learning_rate": 4.7322440145647905e-07, "loss": 0.7349, "step": 8310 }, { "epoch": 0.9, "learning_rate": 4.7215317577771424e-07, "loss": 0.7021, "step": 8311 }, { "epoch": 0.9, "learning_rate": 4.710831346099509e-07, "loss": 0.7358, "step": 8312 }, { "epoch": 0.9, "learning_rate": 4.7001427808622045e-07, "loss": 0.6602, "step": 8313 }, { "epoch": 0.91, "learning_rate": 4.6894660633940435e-07, "loss": 0.6484, "step": 8314 }, { "epoch": 0.91, "learning_rate": 4.678801195022342e-07, "loss": 0.7053, "step": 8315 }, { "epoch": 0.91, "learning_rate": 4.6681481770729844e-07, "loss": 0.72, "step": 8316 }, { "epoch": 0.91, "learning_rate": 4.6575070108703433e-07, "loss": 0.6897, "step": 8317 }, { "epoch": 0.91, "learning_rate": 4.646877697737362e-07, "loss": 0.6841, "step": 8318 }, { "epoch": 0.91, "learning_rate": 4.6362602389954825e-07, "loss": 0.696, "step": 8319 }, { "epoch": 0.91, "learning_rate": 4.6256546359646604e-07, "loss": 0.6689, "step": 8320 }, { "epoch": 0.91, "learning_rate": 4.6150608899633855e-07, "loss": 0.7314, "step": 8321 }, { "epoch": 0.91, "learning_rate": 4.6044790023087373e-07, "loss": 0.6521, "step": 8322 }, { "epoch": 0.91, "learning_rate": 4.593908974316208e-07, "loss": 0.7444, "step": 8323 }, { "epoch": 0.91, "learning_rate": 4.5833508072999243e-07, "loss": 0.6462, "step": 8324 }, { "epoch": 0.91, "learning_rate": 4.5728045025724366e-07, "loss": 0.5735, "step": 8325 }, { "epoch": 0.91, "learning_rate": 4.562270061444907e-07, "loss": 0.7661, "step": 8326 }, { "epoch": 0.91, "learning_rate": 4.551747485226976e-07, "loss": 0.6736, "step": 8327 }, { "epoch": 0.91, "learning_rate": 4.5412367752268094e-07, "loss": 0.6313, "step": 8328 }, { "epoch": 0.91, "learning_rate": 4.530737932751128e-07, "loss": 0.5452, "step": 8329 }, { "epoch": 0.91, "learning_rate": 4.5202509591051547e-07, "loss": 0.6785, "step": 8330 }, { "epoch": 0.91, "learning_rate": 4.509775855592613e-07, "loss": 0.6917, "step": 8331 }, { "epoch": 0.91, "learning_rate": 4.499312623515806e-07, "loss": 0.6069, "step": 8332 }, { "epoch": 0.91, "learning_rate": 4.488861264175537e-07, "loss": 0.6553, "step": 8333 }, { "epoch": 0.91, "learning_rate": 4.4784217788711113e-07, "loss": 0.7944, "step": 8334 }, { "epoch": 0.91, "learning_rate": 4.4679941689003914e-07, "loss": 0.5405, "step": 8335 }, { "epoch": 0.91, "learning_rate": 4.4575784355597284e-07, "loss": 0.75, "step": 8336 }, { "epoch": 0.91, "learning_rate": 4.447174580144031e-07, "loss": 0.7808, "step": 8337 }, { "epoch": 0.91, "learning_rate": 4.436782603946721e-07, "loss": 0.6653, "step": 8338 }, { "epoch": 0.91, "learning_rate": 4.4264025082597084e-07, "loss": 0.6206, "step": 8339 }, { "epoch": 0.91, "learning_rate": 4.4160342943734723e-07, "loss": 0.6206, "step": 8340 }, { "epoch": 0.91, "learning_rate": 4.4056779635770374e-07, "loss": 0.6473, "step": 8341 }, { "epoch": 0.91, "learning_rate": 4.3953335171578514e-07, "loss": 0.7258, "step": 8342 }, { "epoch": 0.91, "learning_rate": 4.3850009564019967e-07, "loss": 0.5996, "step": 8343 }, { "epoch": 0.91, "learning_rate": 4.3746802825939903e-07, "loss": 0.6748, "step": 8344 }, { "epoch": 0.91, "learning_rate": 4.364371497016917e-07, "loss": 0.668, "step": 8345 }, { "epoch": 0.91, "learning_rate": 4.354074600952407e-07, "loss": 0.6616, "step": 8346 }, { "epoch": 0.91, "learning_rate": 4.343789595680525e-07, "loss": 0.6772, "step": 8347 }, { "epoch": 0.91, "learning_rate": 4.3335164824799494e-07, "loss": 0.6021, "step": 8348 }, { "epoch": 0.91, "learning_rate": 4.323255262627846e-07, "loss": 0.7156, "step": 8349 }, { "epoch": 0.91, "learning_rate": 4.313005937399861e-07, "loss": 0.7522, "step": 8350 }, { "epoch": 0.91, "learning_rate": 4.3027685080702543e-07, "loss": 0.6118, "step": 8351 }, { "epoch": 0.91, "learning_rate": 4.2925429759117175e-07, "loss": 0.646, "step": 8352 }, { "epoch": 0.91, "learning_rate": 4.2823293421955017e-07, "loss": 0.7048, "step": 8353 }, { "epoch": 0.91, "learning_rate": 4.272127608191401e-07, "loss": 0.6768, "step": 8354 }, { "epoch": 0.91, "learning_rate": 4.261937775167657e-07, "loss": 0.6521, "step": 8355 }, { "epoch": 0.91, "learning_rate": 4.2517598443911235e-07, "loss": 0.6343, "step": 8356 }, { "epoch": 0.91, "learning_rate": 4.241593817127121e-07, "loss": 0.6494, "step": 8357 }, { "epoch": 0.91, "learning_rate": 4.2314396946394833e-07, "loss": 0.6438, "step": 8358 }, { "epoch": 0.91, "learning_rate": 4.221297478190589e-07, "loss": 0.7019, "step": 8359 }, { "epoch": 0.91, "learning_rate": 4.2111671690413303e-07, "loss": 0.7437, "step": 8360 }, { "epoch": 0.91, "learning_rate": 4.2010487684511105e-07, "loss": 0.6904, "step": 8361 }, { "epoch": 0.91, "learning_rate": 4.1909422776778784e-07, "loss": 0.6904, "step": 8362 }, { "epoch": 0.91, "learning_rate": 4.1808476979780634e-07, "loss": 0.6677, "step": 8363 }, { "epoch": 0.91, "learning_rate": 4.170765030606638e-07, "loss": 0.689, "step": 8364 }, { "epoch": 0.91, "learning_rate": 4.16069427681709e-07, "loss": 0.6033, "step": 8365 }, { "epoch": 0.91, "learning_rate": 4.1506354378614277e-07, "loss": 0.7114, "step": 8366 }, { "epoch": 0.91, "learning_rate": 4.1405885149901623e-07, "loss": 0.5845, "step": 8367 }, { "epoch": 0.91, "learning_rate": 4.130553509452362e-07, "loss": 0.7949, "step": 8368 }, { "epoch": 0.91, "learning_rate": 4.1205304224955503e-07, "loss": 0.6614, "step": 8369 }, { "epoch": 0.91, "learning_rate": 4.110519255365852e-07, "loss": 0.6355, "step": 8370 }, { "epoch": 0.91, "learning_rate": 4.10052000930784e-07, "loss": 0.6238, "step": 8371 }, { "epoch": 0.91, "learning_rate": 4.0905326855646186e-07, "loss": 0.6106, "step": 8372 }, { "epoch": 0.91, "learning_rate": 4.0805572853778617e-07, "loss": 0.7273, "step": 8373 }, { "epoch": 0.91, "learning_rate": 4.0705938099876664e-07, "loss": 0.7021, "step": 8374 }, { "epoch": 0.91, "learning_rate": 4.060642260632741e-07, "loss": 0.6643, "step": 8375 }, { "epoch": 0.91, "learning_rate": 4.0507026385502747e-07, "loss": 0.5779, "step": 8376 }, { "epoch": 0.91, "learning_rate": 4.040774944975934e-07, "loss": 0.6052, "step": 8377 }, { "epoch": 0.91, "learning_rate": 4.030859181143976e-07, "loss": 0.6038, "step": 8378 }, { "epoch": 0.91, "learning_rate": 4.0209553482871145e-07, "loss": 0.6321, "step": 8379 }, { "epoch": 0.91, "learning_rate": 4.0110634476366097e-07, "loss": 0.6477, "step": 8380 }, { "epoch": 0.91, "learning_rate": 4.001183480422255e-07, "loss": 0.5986, "step": 8381 }, { "epoch": 0.91, "learning_rate": 3.9913154478723014e-07, "loss": 0.6855, "step": 8382 }, { "epoch": 0.91, "learning_rate": 3.981459351213568e-07, "loss": 0.6348, "step": 8383 }, { "epoch": 0.91, "learning_rate": 3.971615191671385e-07, "loss": 0.7017, "step": 8384 }, { "epoch": 0.91, "learning_rate": 3.9617829704695634e-07, "loss": 0.7358, "step": 8385 }, { "epoch": 0.91, "learning_rate": 3.9519626888304684e-07, "loss": 0.6616, "step": 8386 }, { "epoch": 0.91, "learning_rate": 3.9421543479749804e-07, "loss": 0.6412, "step": 8387 }, { "epoch": 0.91, "learning_rate": 3.932357949122445e-07, "loss": 0.7146, "step": 8388 }, { "epoch": 0.91, "learning_rate": 3.9225734934907997e-07, "loss": 0.6982, "step": 8389 }, { "epoch": 0.91, "learning_rate": 3.9128009822964385e-07, "loss": 0.7183, "step": 8390 }, { "epoch": 0.91, "learning_rate": 3.9030404167542777e-07, "loss": 0.6646, "step": 8391 }, { "epoch": 0.91, "learning_rate": 3.8932917980777916e-07, "loss": 0.5667, "step": 8392 }, { "epoch": 0.91, "learning_rate": 3.8835551274789107e-07, "loss": 0.7034, "step": 8393 }, { "epoch": 0.91, "learning_rate": 3.8738304061681107e-07, "loss": 0.6711, "step": 8394 }, { "epoch": 0.91, "learning_rate": 3.864117635354403e-07, "loss": 0.7095, "step": 8395 }, { "epoch": 0.91, "learning_rate": 3.8544168162452544e-07, "loss": 0.6338, "step": 8396 }, { "epoch": 0.91, "learning_rate": 3.8447279500466893e-07, "loss": 0.7114, "step": 8397 }, { "epoch": 0.91, "learning_rate": 3.835051037963244e-07, "loss": 0.6508, "step": 8398 }, { "epoch": 0.91, "learning_rate": 3.8253860811979573e-07, "loss": 0.5825, "step": 8399 }, { "epoch": 0.91, "learning_rate": 3.8157330809524105e-07, "loss": 0.7517, "step": 8400 }, { "epoch": 0.91, "learning_rate": 3.806092038426623e-07, "loss": 0.6226, "step": 8401 }, { "epoch": 0.91, "learning_rate": 3.7964629548192135e-07, "loss": 0.6743, "step": 8402 }, { "epoch": 0.91, "learning_rate": 3.7868458313272906e-07, "loss": 0.6738, "step": 8403 }, { "epoch": 0.91, "learning_rate": 3.777240669146431e-07, "loss": 0.7114, "step": 8404 }, { "epoch": 0.91, "learning_rate": 3.7676474694707697e-07, "loss": 0.6323, "step": 8405 }, { "epoch": 0.92, "learning_rate": 3.7580662334929517e-07, "loss": 0.6897, "step": 8406 }, { "epoch": 0.92, "learning_rate": 3.7484969624041025e-07, "loss": 0.6047, "step": 8407 }, { "epoch": 0.92, "learning_rate": 3.7389396573939253e-07, "loss": 0.7378, "step": 8408 }, { "epoch": 0.92, "learning_rate": 3.7293943196505476e-07, "loss": 0.7219, "step": 8409 }, { "epoch": 0.92, "learning_rate": 3.719860950360676e-07, "loss": 0.6782, "step": 8410 }, { "epoch": 0.92, "learning_rate": 3.710339550709519e-07, "loss": 0.6897, "step": 8411 }, { "epoch": 0.92, "learning_rate": 3.7008301218807716e-07, "loss": 0.6912, "step": 8412 }, { "epoch": 0.92, "learning_rate": 3.691332665056646e-07, "loss": 0.7749, "step": 8413 }, { "epoch": 0.92, "learning_rate": 3.681847181417897e-07, "loss": 0.6199, "step": 8414 }, { "epoch": 0.92, "learning_rate": 3.6723736721437475e-07, "loss": 0.793, "step": 8415 }, { "epoch": 0.92, "learning_rate": 3.662912138411967e-07, "loss": 0.7202, "step": 8416 }, { "epoch": 0.92, "learning_rate": 3.6534625813988257e-07, "loss": 0.6848, "step": 8417 }, { "epoch": 0.92, "learning_rate": 3.6440250022790837e-07, "loss": 0.7124, "step": 8418 }, { "epoch": 0.92, "learning_rate": 3.6345994022260576e-07, "loss": 0.71, "step": 8419 }, { "epoch": 0.92, "learning_rate": 3.625185782411522e-07, "loss": 0.6211, "step": 8420 }, { "epoch": 0.92, "learning_rate": 3.615784144005796e-07, "loss": 0.6555, "step": 8421 }, { "epoch": 0.92, "learning_rate": 3.606394488177711e-07, "loss": 0.7463, "step": 8422 }, { "epoch": 0.92, "learning_rate": 3.5970168160945676e-07, "loss": 0.6211, "step": 8423 }, { "epoch": 0.92, "learning_rate": 3.5876511289222314e-07, "loss": 0.7241, "step": 8424 }, { "epoch": 0.92, "learning_rate": 3.578297427825062e-07, "loss": 0.7666, "step": 8425 }, { "epoch": 0.92, "learning_rate": 3.5689557139658824e-07, "loss": 0.6174, "step": 8426 }, { "epoch": 0.92, "learning_rate": 3.55962598850611e-07, "loss": 0.6052, "step": 8427 }, { "epoch": 0.92, "learning_rate": 3.5503082526055946e-07, "loss": 0.6489, "step": 8428 }, { "epoch": 0.92, "learning_rate": 3.5410025074227306e-07, "loss": 0.635, "step": 8429 }, { "epoch": 0.92, "learning_rate": 3.531708754114438e-07, "loss": 0.5925, "step": 8430 }, { "epoch": 0.92, "learning_rate": 3.5224269938360924e-07, "loss": 0.6584, "step": 8431 }, { "epoch": 0.92, "learning_rate": 3.513157227741626e-07, "loss": 0.6458, "step": 8432 }, { "epoch": 0.92, "learning_rate": 3.503899456983484e-07, "loss": 0.6045, "step": 8433 }, { "epoch": 0.92, "learning_rate": 3.4946536827125674e-07, "loss": 0.7192, "step": 8434 }, { "epoch": 0.92, "learning_rate": 3.4854199060783247e-07, "loss": 0.5361, "step": 8435 }, { "epoch": 0.92, "learning_rate": 3.476198128228736e-07, "loss": 0.7175, "step": 8436 }, { "epoch": 0.92, "learning_rate": 3.4669883503102296e-07, "loss": 0.6436, "step": 8437 }, { "epoch": 0.92, "learning_rate": 3.457790573467812e-07, "loss": 0.7136, "step": 8438 }, { "epoch": 0.92, "learning_rate": 3.448604798844912e-07, "loss": 0.6724, "step": 8439 }, { "epoch": 0.92, "learning_rate": 3.439431027583551e-07, "loss": 0.6694, "step": 8440 }, { "epoch": 0.92, "learning_rate": 3.4302692608242037e-07, "loss": 0.6694, "step": 8441 }, { "epoch": 0.92, "learning_rate": 3.4211194997058717e-07, "loss": 0.7188, "step": 8442 }, { "epoch": 0.92, "learning_rate": 3.4119817453660665e-07, "loss": 0.7083, "step": 8443 }, { "epoch": 0.92, "learning_rate": 3.402855998940813e-07, "loss": 0.7183, "step": 8444 }, { "epoch": 0.92, "learning_rate": 3.393742261564603e-07, "loss": 0.5735, "step": 8445 }, { "epoch": 0.92, "learning_rate": 3.3846405343704757e-07, "loss": 0.6235, "step": 8446 }, { "epoch": 0.92, "learning_rate": 3.3755508184899813e-07, "loss": 0.615, "step": 8447 }, { "epoch": 0.92, "learning_rate": 3.3664731150531484e-07, "loss": 0.7686, "step": 8448 }, { "epoch": 0.92, "learning_rate": 3.357407425188541e-07, "loss": 0.7661, "step": 8449 }, { "epoch": 0.92, "learning_rate": 3.3483537500232034e-07, "loss": 0.6462, "step": 8450 }, { "epoch": 0.92, "learning_rate": 3.339312090682689e-07, "loss": 0.6418, "step": 8451 }, { "epoch": 0.92, "learning_rate": 3.3302824482910777e-07, "loss": 0.7505, "step": 8452 }, { "epoch": 0.92, "learning_rate": 3.3212648239709375e-07, "loss": 0.6133, "step": 8453 }, { "epoch": 0.92, "learning_rate": 3.31225921884335e-07, "loss": 0.7207, "step": 8454 }, { "epoch": 0.92, "learning_rate": 3.303265634027897e-07, "loss": 0.6121, "step": 8455 }, { "epoch": 0.92, "learning_rate": 3.2942840706426725e-07, "loss": 0.6538, "step": 8456 }, { "epoch": 0.92, "learning_rate": 3.2853145298042954e-07, "loss": 0.6843, "step": 8457 }, { "epoch": 0.92, "learning_rate": 3.276357012627829e-07, "loss": 0.6393, "step": 8458 }, { "epoch": 0.92, "learning_rate": 3.267411520226893e-07, "loss": 0.6533, "step": 8459 }, { "epoch": 0.92, "learning_rate": 3.2584780537136206e-07, "loss": 0.7195, "step": 8460 }, { "epoch": 0.92, "learning_rate": 3.24955661419859e-07, "loss": 0.8252, "step": 8461 }, { "epoch": 0.92, "learning_rate": 3.2406472027909585e-07, "loss": 0.679, "step": 8462 }, { "epoch": 0.92, "learning_rate": 3.23174982059834e-07, "loss": 0.8147, "step": 8463 }, { "epoch": 0.92, "learning_rate": 3.2228644687268606e-07, "loss": 0.6807, "step": 8464 }, { "epoch": 0.92, "learning_rate": 3.213991148281159e-07, "loss": 0.6436, "step": 8465 }, { "epoch": 0.92, "learning_rate": 3.2051298603643754e-07, "loss": 0.7368, "step": 8466 }, { "epoch": 0.92, "learning_rate": 3.1962806060781503e-07, "loss": 0.7097, "step": 8467 }, { "epoch": 0.92, "learning_rate": 3.1874433865226484e-07, "loss": 0.5032, "step": 8468 }, { "epoch": 0.92, "learning_rate": 3.178618202796502e-07, "loss": 0.6831, "step": 8469 }, { "epoch": 0.92, "learning_rate": 3.169805055996866e-07, "loss": 0.6306, "step": 8470 }, { "epoch": 0.92, "learning_rate": 3.161003947219421e-07, "loss": 0.7971, "step": 8471 }, { "epoch": 0.92, "learning_rate": 3.152214877558302e-07, "loss": 0.675, "step": 8472 }, { "epoch": 0.92, "learning_rate": 3.14343784810619e-07, "loss": 0.7495, "step": 8473 }, { "epoch": 0.92, "learning_rate": 3.1346728599542355e-07, "loss": 0.7441, "step": 8474 }, { "epoch": 0.92, "learning_rate": 3.125919914192144e-07, "loss": 0.6331, "step": 8475 }, { "epoch": 0.92, "learning_rate": 3.117179011908067e-07, "loss": 0.6816, "step": 8476 }, { "epoch": 0.92, "learning_rate": 3.1084501541886804e-07, "loss": 0.5156, "step": 8477 }, { "epoch": 0.92, "learning_rate": 3.099733342119171e-07, "loss": 0.6567, "step": 8478 }, { "epoch": 0.92, "learning_rate": 3.091028576783228e-07, "loss": 0.6484, "step": 8479 }, { "epoch": 0.92, "learning_rate": 3.082335859263019e-07, "loss": 0.6917, "step": 8480 }, { "epoch": 0.92, "learning_rate": 3.0736551906392354e-07, "loss": 0.6814, "step": 8481 }, { "epoch": 0.92, "learning_rate": 3.06498657199108e-07, "loss": 0.7073, "step": 8482 }, { "epoch": 0.92, "learning_rate": 3.0563300043962243e-07, "loss": 0.5776, "step": 8483 }, { "epoch": 0.92, "learning_rate": 3.0476854889308737e-07, "loss": 0.688, "step": 8484 }, { "epoch": 0.92, "learning_rate": 3.039053026669725e-07, "loss": 0.6948, "step": 8485 }, { "epoch": 0.92, "learning_rate": 3.0304326186859525e-07, "loss": 0.6472, "step": 8486 }, { "epoch": 0.92, "learning_rate": 3.0218242660512985e-07, "loss": 0.7485, "step": 8487 }, { "epoch": 0.92, "learning_rate": 3.013227969835908e-07, "loss": 0.7161, "step": 8488 }, { "epoch": 0.92, "learning_rate": 3.004643731108514e-07, "loss": 0.5813, "step": 8489 }, { "epoch": 0.92, "learning_rate": 2.996071550936319e-07, "loss": 0.6892, "step": 8490 }, { "epoch": 0.92, "learning_rate": 2.987511430385004e-07, "loss": 0.696, "step": 8491 }, { "epoch": 0.92, "learning_rate": 2.978963370518784e-07, "loss": 0.5498, "step": 8492 }, { "epoch": 0.92, "learning_rate": 2.970427372400353e-07, "loss": 0.7319, "step": 8493 }, { "epoch": 0.92, "learning_rate": 2.961903437090929e-07, "loss": 0.5847, "step": 8494 }, { "epoch": 0.92, "learning_rate": 2.95339156565021e-07, "loss": 0.7407, "step": 8495 }, { "epoch": 0.92, "learning_rate": 2.9448917591363923e-07, "loss": 0.7253, "step": 8496 }, { "epoch": 0.92, "learning_rate": 2.936404018606187e-07, "loss": 0.6292, "step": 8497 }, { "epoch": 0.93, "learning_rate": 2.9279283451148055e-07, "loss": 0.6172, "step": 8498 }, { "epoch": 0.93, "learning_rate": 2.9194647397159383e-07, "loss": 0.6494, "step": 8499 }, { "epoch": 0.93, "learning_rate": 2.911013203461788e-07, "loss": 0.6655, "step": 8500 }, { "epoch": 0.93, "learning_rate": 2.9025737374030696e-07, "loss": 0.6826, "step": 8501 }, { "epoch": 0.93, "learning_rate": 2.894146342588977e-07, "loss": 0.7183, "step": 8502 }, { "epoch": 0.93, "learning_rate": 2.885731020067206e-07, "loss": 0.6216, "step": 8503 }, { "epoch": 0.93, "learning_rate": 2.877327770883964e-07, "loss": 0.8076, "step": 8504 }, { "epoch": 0.93, "learning_rate": 2.86893659608396e-07, "loss": 0.6799, "step": 8505 }, { "epoch": 0.93, "learning_rate": 2.8605574967103924e-07, "loss": 0.7256, "step": 8506 }, { "epoch": 0.93, "learning_rate": 2.85219047380495e-07, "loss": 0.6826, "step": 8507 }, { "epoch": 0.93, "learning_rate": 2.8438355284078235e-07, "loss": 0.7441, "step": 8508 }, { "epoch": 0.93, "learning_rate": 2.835492661557726e-07, "loss": 0.7476, "step": 8509 }, { "epoch": 0.93, "learning_rate": 2.827161874291828e-07, "loss": 0.6475, "step": 8510 }, { "epoch": 0.93, "learning_rate": 2.818843167645835e-07, "loss": 0.7563, "step": 8511 }, { "epoch": 0.93, "learning_rate": 2.810536542653941e-07, "loss": 0.6145, "step": 8512 }, { "epoch": 0.93, "learning_rate": 2.802242000348809e-07, "loss": 0.6255, "step": 8513 }, { "epoch": 0.93, "learning_rate": 2.7939595417616593e-07, "loss": 0.5813, "step": 8514 }, { "epoch": 0.93, "learning_rate": 2.7856891679221565e-07, "loss": 0.7593, "step": 8515 }, { "epoch": 0.93, "learning_rate": 2.777430879858478e-07, "loss": 0.6206, "step": 8516 }, { "epoch": 0.93, "learning_rate": 2.769184678597314e-07, "loss": 0.7087, "step": 8517 }, { "epoch": 0.93, "learning_rate": 2.7609505651638226e-07, "loss": 0.6047, "step": 8518 }, { "epoch": 0.93, "learning_rate": 2.752728540581695e-07, "loss": 0.8198, "step": 8519 }, { "epoch": 0.93, "learning_rate": 2.744518605873092e-07, "loss": 0.7212, "step": 8520 }, { "epoch": 0.93, "learning_rate": 2.736320762058675e-07, "loss": 0.7295, "step": 8521 }, { "epoch": 0.93, "learning_rate": 2.7281350101576176e-07, "loss": 0.6636, "step": 8522 }, { "epoch": 0.93, "learning_rate": 2.719961351187583e-07, "loss": 0.6416, "step": 8523 }, { "epoch": 0.93, "learning_rate": 2.711799786164715e-07, "loss": 0.752, "step": 8524 }, { "epoch": 0.93, "learning_rate": 2.7036503161036784e-07, "loss": 0.748, "step": 8525 }, { "epoch": 0.93, "learning_rate": 2.6955129420176193e-07, "loss": 0.6575, "step": 8526 }, { "epoch": 0.93, "learning_rate": 2.687387664918184e-07, "loss": 0.6736, "step": 8527 }, { "epoch": 0.93, "learning_rate": 2.6792744858155196e-07, "loss": 0.8452, "step": 8528 }, { "epoch": 0.93, "learning_rate": 2.6711734057182417e-07, "loss": 0.7319, "step": 8529 }, { "epoch": 0.93, "learning_rate": 2.663084425633511e-07, "loss": 0.7505, "step": 8530 }, { "epoch": 0.93, "learning_rate": 2.6550075465669567e-07, "loss": 0.6919, "step": 8531 }, { "epoch": 0.93, "learning_rate": 2.6469427695226755e-07, "loss": 0.7805, "step": 8532 }, { "epoch": 0.93, "learning_rate": 2.6388900955033326e-07, "loss": 0.769, "step": 8533 }, { "epoch": 0.93, "learning_rate": 2.630849525510004e-07, "loss": 0.595, "step": 8534 }, { "epoch": 0.93, "learning_rate": 2.6228210605423134e-07, "loss": 0.7629, "step": 8535 }, { "epoch": 0.93, "learning_rate": 2.6148047015983834e-07, "loss": 0.6667, "step": 8536 }, { "epoch": 0.93, "learning_rate": 2.606800449674796e-07, "loss": 0.543, "step": 8537 }, { "epoch": 0.93, "learning_rate": 2.5988083057666534e-07, "loss": 0.5645, "step": 8538 }, { "epoch": 0.93, "learning_rate": 2.590828270867551e-07, "loss": 0.8032, "step": 8539 }, { "epoch": 0.93, "learning_rate": 2.5828603459695624e-07, "loss": 0.6846, "step": 8540 }, { "epoch": 0.93, "learning_rate": 2.5749045320632824e-07, "loss": 0.6628, "step": 8541 }, { "epoch": 0.93, "learning_rate": 2.5669608301377656e-07, "loss": 0.5664, "step": 8542 }, { "epoch": 0.93, "learning_rate": 2.5590292411805996e-07, "loss": 0.6611, "step": 8543 }, { "epoch": 0.93, "learning_rate": 2.551109766177851e-07, "loss": 0.7104, "step": 8544 }, { "epoch": 0.93, "learning_rate": 2.543202406114065e-07, "loss": 0.7676, "step": 8545 }, { "epoch": 0.93, "learning_rate": 2.535307161972278e-07, "loss": 0.646, "step": 8546 }, { "epoch": 0.93, "learning_rate": 2.527424034734072e-07, "loss": 0.6741, "step": 8547 }, { "epoch": 0.93, "learning_rate": 2.51955302537944e-07, "loss": 0.6772, "step": 8548 }, { "epoch": 0.93, "learning_rate": 2.5116941348869437e-07, "loss": 0.6628, "step": 8549 }, { "epoch": 0.93, "learning_rate": 2.503847364233614e-07, "loss": 0.645, "step": 8550 }, { "epoch": 0.93, "learning_rate": 2.4960127143949354e-07, "loss": 0.6866, "step": 8551 }, { "epoch": 0.93, "learning_rate": 2.488190186344952e-07, "loss": 0.6047, "step": 8552 }, { "epoch": 0.93, "learning_rate": 2.4803797810561523e-07, "loss": 0.6572, "step": 8553 }, { "epoch": 0.93, "learning_rate": 2.4725814994995265e-07, "loss": 0.6816, "step": 8554 }, { "epoch": 0.93, "learning_rate": 2.464795342644588e-07, "loss": 0.6587, "step": 8555 }, { "epoch": 0.93, "learning_rate": 2.4570213114592957e-07, "loss": 0.6565, "step": 8556 }, { "epoch": 0.93, "learning_rate": 2.449259406910143e-07, "loss": 0.575, "step": 8557 }, { "epoch": 0.93, "learning_rate": 2.44150962996208e-07, "loss": 0.6526, "step": 8558 }, { "epoch": 0.93, "learning_rate": 2.433771981578581e-07, "loss": 0.7358, "step": 8559 }, { "epoch": 0.93, "learning_rate": 2.4260464627215765e-07, "loss": 0.6169, "step": 8560 }, { "epoch": 0.93, "learning_rate": 2.418333074351531e-07, "loss": 0.6108, "step": 8561 }, { "epoch": 0.93, "learning_rate": 2.410631817427378e-07, "loss": 0.6057, "step": 8562 }, { "epoch": 0.93, "learning_rate": 2.4029426929065514e-07, "loss": 0.6172, "step": 8563 }, { "epoch": 0.93, "learning_rate": 2.395265701744953e-07, "loss": 0.6672, "step": 8564 }, { "epoch": 0.93, "learning_rate": 2.387600844896998e-07, "loss": 0.6663, "step": 8565 }, { "epoch": 0.93, "learning_rate": 2.3799481233156008e-07, "loss": 0.7388, "step": 8566 }, { "epoch": 0.93, "learning_rate": 2.3723075379521342e-07, "loss": 0.7612, "step": 8567 }, { "epoch": 0.93, "learning_rate": 2.3646790897564943e-07, "loss": 0.6968, "step": 8568 }, { "epoch": 0.93, "learning_rate": 2.3570627796770772e-07, "loss": 0.7163, "step": 8569 }, { "epoch": 0.93, "learning_rate": 2.349458608660704e-07, "loss": 0.6533, "step": 8570 }, { "epoch": 0.93, "learning_rate": 2.3418665776527738e-07, "loss": 0.728, "step": 8571 }, { "epoch": 0.93, "learning_rate": 2.3342866875971203e-07, "loss": 0.7295, "step": 8572 }, { "epoch": 0.93, "learning_rate": 2.326718939436079e-07, "loss": 0.749, "step": 8573 }, { "epoch": 0.93, "learning_rate": 2.3191633341104859e-07, "loss": 0.8066, "step": 8574 }, { "epoch": 0.93, "learning_rate": 2.3116198725596562e-07, "loss": 0.6299, "step": 8575 }, { "epoch": 0.93, "learning_rate": 2.3040885557214065e-07, "loss": 0.7368, "step": 8576 }, { "epoch": 0.93, "learning_rate": 2.2965693845320325e-07, "loss": 0.6946, "step": 8577 }, { "epoch": 0.93, "learning_rate": 2.2890623599263196e-07, "loss": 0.6292, "step": 8578 }, { "epoch": 0.93, "learning_rate": 2.2815674828375655e-07, "loss": 0.7437, "step": 8579 }, { "epoch": 0.93, "learning_rate": 2.274084754197514e-07, "loss": 0.6548, "step": 8580 }, { "epoch": 0.93, "learning_rate": 2.2666141749364434e-07, "loss": 0.7395, "step": 8581 }, { "epoch": 0.93, "learning_rate": 2.2591557459831103e-07, "loss": 0.6067, "step": 8582 }, { "epoch": 0.93, "learning_rate": 2.25170946826474e-07, "loss": 0.7666, "step": 8583 }, { "epoch": 0.93, "learning_rate": 2.2442753427070586e-07, "loss": 0.5693, "step": 8584 }, { "epoch": 0.93, "learning_rate": 2.2368533702343043e-07, "loss": 0.6333, "step": 8585 }, { "epoch": 0.93, "learning_rate": 2.2294435517691504e-07, "loss": 0.6755, "step": 8586 }, { "epoch": 0.93, "learning_rate": 2.2220458882328155e-07, "loss": 0.6592, "step": 8587 }, { "epoch": 0.93, "learning_rate": 2.2146603805449861e-07, "loss": 0.6851, "step": 8588 }, { "epoch": 0.94, "learning_rate": 2.207287029623817e-07, "loss": 0.6855, "step": 8589 }, { "epoch": 0.94, "learning_rate": 2.1999258363859966e-07, "loss": 0.6775, "step": 8590 }, { "epoch": 0.94, "learning_rate": 2.1925768017466597e-07, "loss": 0.688, "step": 8591 }, { "epoch": 0.94, "learning_rate": 2.1852399266194312e-07, "loss": 0.6416, "step": 8592 }, { "epoch": 0.94, "learning_rate": 2.1779152119164814e-07, "loss": 0.6401, "step": 8593 }, { "epoch": 0.94, "learning_rate": 2.1706026585483708e-07, "loss": 0.5916, "step": 8594 }, { "epoch": 0.94, "learning_rate": 2.16330226742425e-07, "loss": 0.675, "step": 8595 }, { "epoch": 0.94, "learning_rate": 2.1560140394516815e-07, "loss": 0.6641, "step": 8596 }, { "epoch": 0.94, "learning_rate": 2.1487379755367632e-07, "loss": 0.6399, "step": 8597 }, { "epoch": 0.94, "learning_rate": 2.141474076584038e-07, "loss": 0.6189, "step": 8598 }, { "epoch": 0.94, "learning_rate": 2.1342223434965837e-07, "loss": 0.5784, "step": 8599 }, { "epoch": 0.94, "learning_rate": 2.1269827771759344e-07, "loss": 0.7832, "step": 8600 }, { "epoch": 0.94, "learning_rate": 2.119755378522137e-07, "loss": 0.637, "step": 8601 }, { "epoch": 0.94, "learning_rate": 2.1125401484336727e-07, "loss": 0.7485, "step": 8602 }, { "epoch": 0.94, "learning_rate": 2.1053370878075685e-07, "loss": 0.6838, "step": 8603 }, { "epoch": 0.94, "learning_rate": 2.0981461975393193e-07, "loss": 0.6721, "step": 8604 }, { "epoch": 0.94, "learning_rate": 2.0909674785228984e-07, "loss": 0.7202, "step": 8605 }, { "epoch": 0.94, "learning_rate": 2.083800931650759e-07, "loss": 0.6719, "step": 8606 }, { "epoch": 0.94, "learning_rate": 2.0766465578138773e-07, "loss": 0.6675, "step": 8607 }, { "epoch": 0.94, "learning_rate": 2.0695043579016638e-07, "loss": 0.634, "step": 8608 }, { "epoch": 0.94, "learning_rate": 2.062374332802064e-07, "loss": 0.6392, "step": 8609 }, { "epoch": 0.94, "learning_rate": 2.0552564834014797e-07, "loss": 0.7129, "step": 8610 }, { "epoch": 0.94, "learning_rate": 2.0481508105848146e-07, "loss": 0.6875, "step": 8611 }, { "epoch": 0.94, "learning_rate": 2.0410573152354619e-07, "loss": 0.6992, "step": 8612 }, { "epoch": 0.94, "learning_rate": 2.0339759982352713e-07, "loss": 0.6523, "step": 8613 }, { "epoch": 0.94, "learning_rate": 2.0269068604646058e-07, "loss": 0.6709, "step": 8614 }, { "epoch": 0.94, "learning_rate": 2.0198499028023178e-07, "loss": 0.7341, "step": 8615 }, { "epoch": 0.94, "learning_rate": 2.0128051261257165e-07, "loss": 0.5635, "step": 8616 }, { "epoch": 0.94, "learning_rate": 2.0057725313106236e-07, "loss": 0.8052, "step": 8617 }, { "epoch": 0.94, "learning_rate": 1.9987521192313397e-07, "loss": 0.6885, "step": 8618 }, { "epoch": 0.94, "learning_rate": 1.9917438907606556e-07, "loss": 0.6277, "step": 8619 }, { "epoch": 0.94, "learning_rate": 1.9847478467698411e-07, "loss": 0.708, "step": 8620 }, { "epoch": 0.94, "learning_rate": 1.9777639881286337e-07, "loss": 0.7263, "step": 8621 }, { "epoch": 0.94, "learning_rate": 1.9707923157052834e-07, "loss": 0.6973, "step": 8622 }, { "epoch": 0.94, "learning_rate": 1.9638328303665298e-07, "loss": 0.5513, "step": 8623 }, { "epoch": 0.94, "learning_rate": 1.9568855329775592e-07, "loss": 0.6611, "step": 8624 }, { "epoch": 0.94, "learning_rate": 1.9499504244020694e-07, "loss": 0.6829, "step": 8625 }, { "epoch": 0.94, "learning_rate": 1.9430275055022597e-07, "loss": 0.6414, "step": 8626 }, { "epoch": 0.94, "learning_rate": 1.9361167771387634e-07, "loss": 0.676, "step": 8627 }, { "epoch": 0.94, "learning_rate": 1.9292182401707603e-07, "loss": 0.748, "step": 8628 }, { "epoch": 0.94, "learning_rate": 1.9223318954558646e-07, "loss": 0.562, "step": 8629 }, { "epoch": 0.94, "learning_rate": 1.915457743850202e-07, "loss": 0.6223, "step": 8630 }, { "epoch": 0.94, "learning_rate": 1.908595786208367e-07, "loss": 0.6196, "step": 8631 }, { "epoch": 0.94, "learning_rate": 1.901746023383444e-07, "loss": 0.7559, "step": 8632 }, { "epoch": 0.94, "learning_rate": 1.8949084562269959e-07, "loss": 0.7031, "step": 8633 }, { "epoch": 0.94, "learning_rate": 1.8880830855891097e-07, "loss": 0.5984, "step": 8634 }, { "epoch": 0.94, "learning_rate": 1.8812699123182733e-07, "loss": 0.6624, "step": 8635 }, { "epoch": 0.94, "learning_rate": 1.874468937261531e-07, "loss": 0.7192, "step": 8636 }, { "epoch": 0.94, "learning_rate": 1.8676801612643957e-07, "loss": 0.6404, "step": 8637 }, { "epoch": 0.94, "learning_rate": 1.8609035851708367e-07, "loss": 0.646, "step": 8638 }, { "epoch": 0.94, "learning_rate": 1.8541392098233468e-07, "loss": 0.6841, "step": 8639 }, { "epoch": 0.94, "learning_rate": 1.8473870360628533e-07, "loss": 0.594, "step": 8640 }, { "epoch": 0.94, "learning_rate": 1.8406470647288067e-07, "loss": 0.5728, "step": 8641 }, { "epoch": 0.94, "learning_rate": 1.8339192966591257e-07, "loss": 0.6367, "step": 8642 }, { "epoch": 0.94, "learning_rate": 1.827203732690208e-07, "loss": 0.5381, "step": 8643 }, { "epoch": 0.94, "learning_rate": 1.8205003736569416e-07, "loss": 0.6431, "step": 8644 }, { "epoch": 0.94, "learning_rate": 1.813809220392704e-07, "loss": 0.7139, "step": 8645 }, { "epoch": 0.94, "learning_rate": 1.8071302737293294e-07, "loss": 0.666, "step": 8646 }, { "epoch": 0.94, "learning_rate": 1.8004635344971656e-07, "loss": 0.6807, "step": 8647 }, { "epoch": 0.94, "learning_rate": 1.7938090035250154e-07, "loss": 0.7578, "step": 8648 }, { "epoch": 0.94, "learning_rate": 1.7871666816401844e-07, "loss": 0.6953, "step": 8649 }, { "epoch": 0.94, "learning_rate": 1.7805365696684564e-07, "loss": 0.6897, "step": 8650 }, { "epoch": 0.94, "learning_rate": 1.7739186684340825e-07, "loss": 0.5603, "step": 8651 }, { "epoch": 0.94, "learning_rate": 1.7673129787598052e-07, "loss": 0.7021, "step": 8652 }, { "epoch": 0.94, "learning_rate": 1.7607195014668678e-07, "loss": 0.6099, "step": 8653 }, { "epoch": 0.94, "learning_rate": 1.7541382373749582e-07, "loss": 0.6877, "step": 8654 }, { "epoch": 0.94, "learning_rate": 1.747569187302267e-07, "loss": 0.7466, "step": 8655 }, { "epoch": 0.94, "learning_rate": 1.7410123520654743e-07, "loss": 0.7393, "step": 8656 }, { "epoch": 0.94, "learning_rate": 1.7344677324797276e-07, "loss": 0.6445, "step": 8657 }, { "epoch": 0.94, "learning_rate": 1.7279353293586765e-07, "loss": 0.6982, "step": 8658 }, { "epoch": 0.94, "learning_rate": 1.7214151435144045e-07, "loss": 0.6802, "step": 8659 }, { "epoch": 0.94, "learning_rate": 1.7149071757575298e-07, "loss": 0.7429, "step": 8660 }, { "epoch": 0.94, "learning_rate": 1.7084114268971275e-07, "loss": 0.705, "step": 8661 }, { "epoch": 0.94, "learning_rate": 1.7019278977407405e-07, "loss": 0.7151, "step": 8662 }, { "epoch": 0.94, "learning_rate": 1.695456589094413e-07, "loss": 0.6626, "step": 8663 }, { "epoch": 0.94, "learning_rate": 1.6889975017626902e-07, "loss": 0.7441, "step": 8664 }, { "epoch": 0.94, "learning_rate": 1.682550636548519e-07, "loss": 0.625, "step": 8665 }, { "epoch": 0.94, "learning_rate": 1.6761159942534356e-07, "loss": 0.6292, "step": 8666 }, { "epoch": 0.94, "learning_rate": 1.6696935756773669e-07, "loss": 0.6475, "step": 8667 }, { "epoch": 0.94, "learning_rate": 1.6632833816187632e-07, "loss": 0.6129, "step": 8668 }, { "epoch": 0.94, "learning_rate": 1.6568854128745537e-07, "loss": 0.6035, "step": 8669 }, { "epoch": 0.94, "learning_rate": 1.6504996702401243e-07, "loss": 0.8267, "step": 8670 }, { "epoch": 0.94, "learning_rate": 1.6441261545093624e-07, "loss": 0.6841, "step": 8671 }, { "epoch": 0.94, "learning_rate": 1.6377648664746448e-07, "loss": 0.7144, "step": 8672 }, { "epoch": 0.94, "learning_rate": 1.631415806926795e-07, "loss": 0.6777, "step": 8673 }, { "epoch": 0.94, "learning_rate": 1.6250789766551367e-07, "loss": 0.6118, "step": 8674 }, { "epoch": 0.94, "learning_rate": 1.6187543764474733e-07, "loss": 0.6265, "step": 8675 }, { "epoch": 0.94, "learning_rate": 1.612442007090076e-07, "loss": 0.7231, "step": 8676 }, { "epoch": 0.94, "learning_rate": 1.6061418693677278e-07, "loss": 0.6127, "step": 8677 }, { "epoch": 0.94, "learning_rate": 1.599853964063658e-07, "loss": 0.7649, "step": 8678 }, { "epoch": 0.94, "learning_rate": 1.5935782919595634e-07, "loss": 0.7373, "step": 8679 }, { "epoch": 0.94, "learning_rate": 1.5873148538356752e-07, "loss": 0.7068, "step": 8680 }, { "epoch": 0.95, "learning_rate": 1.5810636504706377e-07, "loss": 0.7095, "step": 8681 }, { "epoch": 0.95, "learning_rate": 1.574824682641629e-07, "loss": 0.6685, "step": 8682 }, { "epoch": 0.95, "learning_rate": 1.5685979511242844e-07, "loss": 0.7178, "step": 8683 }, { "epoch": 0.95, "learning_rate": 1.5623834566927065e-07, "loss": 0.7351, "step": 8684 }, { "epoch": 0.95, "learning_rate": 1.5561812001194888e-07, "loss": 0.5474, "step": 8685 }, { "epoch": 0.95, "learning_rate": 1.5499911821756918e-07, "loss": 0.7271, "step": 8686 }, { "epoch": 0.95, "learning_rate": 1.5438134036308893e-07, "loss": 0.7437, "step": 8687 }, { "epoch": 0.95, "learning_rate": 1.5376478652530891e-07, "loss": 0.6753, "step": 8688 }, { "epoch": 0.95, "learning_rate": 1.531494567808811e-07, "loss": 0.6796, "step": 8689 }, { "epoch": 0.95, "learning_rate": 1.5253535120630214e-07, "loss": 0.6936, "step": 8690 }, { "epoch": 0.95, "learning_rate": 1.519224698779198e-07, "loss": 0.7207, "step": 8691 }, { "epoch": 0.95, "learning_rate": 1.5131081287192762e-07, "loss": 0.6897, "step": 8692 }, { "epoch": 0.95, "learning_rate": 1.5070038026436583e-07, "loss": 0.6838, "step": 8693 }, { "epoch": 0.95, "learning_rate": 1.50091172131126e-07, "loss": 0.6143, "step": 8694 }, { "epoch": 0.95, "learning_rate": 1.494831885479453e-07, "loss": 0.6514, "step": 8695 }, { "epoch": 0.95, "learning_rate": 1.4887642959040881e-07, "loss": 0.6956, "step": 8696 }, { "epoch": 0.95, "learning_rate": 1.4827089533394735e-07, "loss": 0.678, "step": 8697 }, { "epoch": 0.95, "learning_rate": 1.4766658585384396e-07, "loss": 0.6272, "step": 8698 }, { "epoch": 0.95, "learning_rate": 1.470635012252264e-07, "loss": 0.5713, "step": 8699 }, { "epoch": 0.95, "learning_rate": 1.464616415230702e-07, "loss": 0.7158, "step": 8700 }, { "epoch": 0.95, "learning_rate": 1.4586100682219885e-07, "loss": 0.6936, "step": 8701 }, { "epoch": 0.95, "learning_rate": 1.4526159719728595e-07, "loss": 0.6975, "step": 8702 }, { "epoch": 0.95, "learning_rate": 1.4466341272284745e-07, "loss": 0.6887, "step": 8703 }, { "epoch": 0.95, "learning_rate": 1.4406645347325164e-07, "loss": 0.6172, "step": 8704 }, { "epoch": 0.95, "learning_rate": 1.4347071952271363e-07, "loss": 0.6819, "step": 8705 }, { "epoch": 0.95, "learning_rate": 1.4287621094529524e-07, "loss": 0.6794, "step": 8706 }, { "epoch": 0.95, "learning_rate": 1.4228292781490737e-07, "loss": 0.6992, "step": 8707 }, { "epoch": 0.95, "learning_rate": 1.4169087020530549e-07, "loss": 0.6558, "step": 8708 }, { "epoch": 0.95, "learning_rate": 1.411000381900951e-07, "loss": 0.5754, "step": 8709 }, { "epoch": 0.95, "learning_rate": 1.4051043184273193e-07, "loss": 0.6907, "step": 8710 }, { "epoch": 0.95, "learning_rate": 1.3992205123651182e-07, "loss": 0.7061, "step": 8711 }, { "epoch": 0.95, "learning_rate": 1.393348964445862e-07, "loss": 0.7686, "step": 8712 }, { "epoch": 0.95, "learning_rate": 1.3874896753995005e-07, "loss": 0.6833, "step": 8713 }, { "epoch": 0.95, "learning_rate": 1.3816426459544507e-07, "loss": 0.6736, "step": 8714 }, { "epoch": 0.95, "learning_rate": 1.3758078768376426e-07, "loss": 0.7209, "step": 8715 }, { "epoch": 0.95, "learning_rate": 1.3699853687744514e-07, "loss": 0.7607, "step": 8716 }, { "epoch": 0.95, "learning_rate": 1.3641751224887313e-07, "loss": 0.6426, "step": 8717 }, { "epoch": 0.95, "learning_rate": 1.3583771387028267e-07, "loss": 0.7378, "step": 8718 }, { "epoch": 0.95, "learning_rate": 1.3525914181375389e-07, "loss": 0.6785, "step": 8719 }, { "epoch": 0.95, "learning_rate": 1.346817961512159e-07, "loss": 0.7034, "step": 8720 }, { "epoch": 0.95, "learning_rate": 1.3410567695444576e-07, "loss": 0.6428, "step": 8721 }, { "epoch": 0.95, "learning_rate": 1.3353078429506506e-07, "loss": 0.6572, "step": 8722 }, { "epoch": 0.95, "learning_rate": 1.329571182445466e-07, "loss": 0.5867, "step": 8723 }, { "epoch": 0.95, "learning_rate": 1.323846788742078e-07, "loss": 0.7319, "step": 8724 }, { "epoch": 0.95, "learning_rate": 1.318134662552173e-07, "loss": 0.6829, "step": 8725 }, { "epoch": 0.95, "learning_rate": 1.3124348045858716e-07, "loss": 0.6516, "step": 8726 }, { "epoch": 0.95, "learning_rate": 1.3067472155517736e-07, "loss": 0.7019, "step": 8727 }, { "epoch": 0.95, "learning_rate": 1.3010718961569913e-07, "loss": 0.6478, "step": 8728 }, { "epoch": 0.95, "learning_rate": 1.2954088471070713e-07, "loss": 0.7158, "step": 8729 }, { "epoch": 0.95, "learning_rate": 1.2897580691060506e-07, "loss": 0.6274, "step": 8730 }, { "epoch": 0.95, "learning_rate": 1.284119562856434e-07, "loss": 0.5642, "step": 8731 }, { "epoch": 0.95, "learning_rate": 1.2784933290592049e-07, "loss": 0.72, "step": 8732 }, { "epoch": 0.95, "learning_rate": 1.2728793684138485e-07, "loss": 0.687, "step": 8733 }, { "epoch": 0.95, "learning_rate": 1.267277681618273e-07, "loss": 0.6868, "step": 8734 }, { "epoch": 0.95, "learning_rate": 1.261688269368877e-07, "loss": 0.6912, "step": 8735 }, { "epoch": 0.95, "learning_rate": 1.2561111323605714e-07, "loss": 0.6921, "step": 8736 }, { "epoch": 0.95, "learning_rate": 1.2505462712866902e-07, "loss": 0.5865, "step": 8737 }, { "epoch": 0.95, "learning_rate": 1.2449936868390578e-07, "loss": 0.7119, "step": 8738 }, { "epoch": 0.95, "learning_rate": 1.2394533797079888e-07, "loss": 0.6782, "step": 8739 }, { "epoch": 0.95, "learning_rate": 1.2339253505822656e-07, "loss": 0.7329, "step": 8740 }, { "epoch": 0.95, "learning_rate": 1.2284096001491275e-07, "loss": 0.6528, "step": 8741 }, { "epoch": 0.95, "learning_rate": 1.2229061290942922e-07, "loss": 0.6187, "step": 8742 }, { "epoch": 0.95, "learning_rate": 1.2174149381019685e-07, "loss": 0.7031, "step": 8743 }, { "epoch": 0.95, "learning_rate": 1.2119360278548209e-07, "loss": 0.6274, "step": 8744 }, { "epoch": 0.95, "learning_rate": 1.2064693990339936e-07, "loss": 0.7075, "step": 8745 }, { "epoch": 0.95, "learning_rate": 1.201015052319099e-07, "loss": 0.686, "step": 8746 }, { "epoch": 0.95, "learning_rate": 1.1955729883882383e-07, "loss": 0.7168, "step": 8747 }, { "epoch": 0.95, "learning_rate": 1.1901432079179709e-07, "loss": 0.6846, "step": 8748 }, { "epoch": 0.95, "learning_rate": 1.1847257115833122e-07, "loss": 0.6558, "step": 8749 }, { "epoch": 0.95, "learning_rate": 1.1793205000577901e-07, "loss": 0.7598, "step": 8750 }, { "epoch": 0.95, "learning_rate": 1.1739275740134004e-07, "loss": 0.6353, "step": 8751 }, { "epoch": 0.95, "learning_rate": 1.1685469341205513e-07, "loss": 0.6367, "step": 8752 }, { "epoch": 0.95, "learning_rate": 1.1631785810482077e-07, "loss": 0.6077, "step": 8753 }, { "epoch": 0.95, "learning_rate": 1.1578225154637579e-07, "loss": 0.7778, "step": 8754 }, { "epoch": 0.95, "learning_rate": 1.1524787380330693e-07, "loss": 0.6494, "step": 8755 }, { "epoch": 0.95, "learning_rate": 1.1471472494204994e-07, "loss": 0.6108, "step": 8756 }, { "epoch": 0.95, "learning_rate": 1.1418280502888401e-07, "loss": 0.7212, "step": 8757 }, { "epoch": 0.95, "learning_rate": 1.1365211412993849e-07, "loss": 0.6899, "step": 8758 }, { "epoch": 0.95, "learning_rate": 1.1312265231119168e-07, "loss": 0.6179, "step": 8759 }, { "epoch": 0.95, "learning_rate": 1.1259441963846429e-07, "loss": 0.7971, "step": 8760 }, { "epoch": 0.95, "learning_rate": 1.1206741617742711e-07, "loss": 0.6689, "step": 8761 }, { "epoch": 0.95, "learning_rate": 1.1154164199359885e-07, "loss": 0.7451, "step": 8762 }, { "epoch": 0.95, "learning_rate": 1.1101709715234388e-07, "loss": 0.6809, "step": 8763 }, { "epoch": 0.95, "learning_rate": 1.1049378171887338e-07, "loss": 0.7822, "step": 8764 }, { "epoch": 0.95, "learning_rate": 1.0997169575824752e-07, "loss": 0.6838, "step": 8765 }, { "epoch": 0.95, "learning_rate": 1.0945083933537104e-07, "loss": 0.7102, "step": 8766 }, { "epoch": 0.95, "learning_rate": 1.0893121251499882e-07, "loss": 0.6353, "step": 8767 }, { "epoch": 0.95, "learning_rate": 1.084128153617292e-07, "loss": 0.7059, "step": 8768 }, { "epoch": 0.95, "learning_rate": 1.0789564794001283e-07, "loss": 0.7725, "step": 8769 }, { "epoch": 0.95, "learning_rate": 1.0737971031414274e-07, "loss": 0.6316, "step": 8770 }, { "epoch": 0.95, "learning_rate": 1.0686500254825983e-07, "loss": 0.6318, "step": 8771 }, { "epoch": 0.95, "learning_rate": 1.0635152470635513e-07, "loss": 0.6899, "step": 8772 }, { "epoch": 0.96, "learning_rate": 1.0583927685226424e-07, "loss": 0.7378, "step": 8773 }, { "epoch": 0.96, "learning_rate": 1.0532825904966848e-07, "loss": 0.7212, "step": 8774 }, { "epoch": 0.96, "learning_rate": 1.0481847136210033e-07, "loss": 0.614, "step": 8775 }, { "epoch": 0.96, "learning_rate": 1.0430991385293576e-07, "loss": 0.658, "step": 8776 }, { "epoch": 0.96, "learning_rate": 1.0380258658539977e-07, "loss": 0.6367, "step": 8777 }, { "epoch": 0.96, "learning_rate": 1.0329648962256411e-07, "loss": 0.6951, "step": 8778 }, { "epoch": 0.96, "learning_rate": 1.0279162302734624e-07, "loss": 0.6255, "step": 8779 }, { "epoch": 0.96, "learning_rate": 1.022879868625115e-07, "loss": 0.7485, "step": 8780 }, { "epoch": 0.96, "learning_rate": 1.0178558119067316e-07, "loss": 0.7214, "step": 8781 }, { "epoch": 0.96, "learning_rate": 1.0128440607429014e-07, "loss": 0.6165, "step": 8782 }, { "epoch": 0.96, "learning_rate": 1.0078446157567034e-07, "loss": 0.6692, "step": 8783 }, { "epoch": 0.96, "learning_rate": 1.0028574775696632e-07, "loss": 0.5874, "step": 8784 }, { "epoch": 0.96, "learning_rate": 9.978826468017844e-08, "loss": 0.6975, "step": 8785 }, { "epoch": 0.96, "learning_rate": 9.929201240715503e-08, "loss": 0.6152, "step": 8786 }, { "epoch": 0.96, "learning_rate": 9.879699099959006e-08, "loss": 0.5872, "step": 8787 }, { "epoch": 0.96, "learning_rate": 9.830320051902542e-08, "loss": 0.7617, "step": 8788 }, { "epoch": 0.96, "learning_rate": 9.781064102684979e-08, "loss": 0.657, "step": 8789 }, { "epoch": 0.96, "learning_rate": 9.731931258429638e-08, "loss": 0.7607, "step": 8790 }, { "epoch": 0.96, "learning_rate": 9.682921525245192e-08, "loss": 0.6841, "step": 8791 }, { "epoch": 0.96, "learning_rate": 9.63403490922421e-08, "loss": 0.6282, "step": 8792 }, { "epoch": 0.96, "learning_rate": 9.585271416444497e-08, "loss": 0.7085, "step": 8793 }, { "epoch": 0.96, "learning_rate": 9.536631052968315e-08, "loss": 0.699, "step": 8794 }, { "epoch": 0.96, "learning_rate": 9.488113824842715e-08, "loss": 0.592, "step": 8795 }, { "epoch": 0.96, "learning_rate": 9.439719738099318e-08, "loss": 0.6377, "step": 8796 }, { "epoch": 0.96, "learning_rate": 9.391448798754643e-08, "loss": 0.6809, "step": 8797 }, { "epoch": 0.96, "learning_rate": 9.34330101280967e-08, "loss": 0.6228, "step": 8798 }, { "epoch": 0.96, "learning_rate": 9.295276386250273e-08, "loss": 0.7397, "step": 8799 }, { "epoch": 0.96, "learning_rate": 9.247374925046903e-08, "loss": 0.583, "step": 8800 }, { "epoch": 0.96, "learning_rate": 9.199596635154684e-08, "loss": 0.575, "step": 8801 }, { "epoch": 0.96, "learning_rate": 9.15194152251353e-08, "loss": 0.6184, "step": 8802 }, { "epoch": 0.96, "learning_rate": 9.104409593047814e-08, "loss": 0.6013, "step": 8803 }, { "epoch": 0.96, "learning_rate": 9.057000852666808e-08, "loss": 0.6326, "step": 8804 }, { "epoch": 0.96, "learning_rate": 9.009715307264577e-08, "loss": 0.6893, "step": 8805 }, { "epoch": 0.96, "learning_rate": 8.962552962719528e-08, "loss": 0.6182, "step": 8806 }, { "epoch": 0.96, "learning_rate": 8.915513824894972e-08, "loss": 0.6233, "step": 8807 }, { "epoch": 0.96, "learning_rate": 8.868597899638897e-08, "loss": 0.752, "step": 8808 }, { "epoch": 0.96, "learning_rate": 8.82180519278375e-08, "loss": 0.6328, "step": 8809 }, { "epoch": 0.96, "learning_rate": 8.775135710147209e-08, "loss": 0.6035, "step": 8810 }, { "epoch": 0.96, "learning_rate": 8.728589457530857e-08, "loss": 0.6716, "step": 8811 }, { "epoch": 0.96, "learning_rate": 8.682166440721729e-08, "loss": 0.655, "step": 8812 }, { "epoch": 0.96, "learning_rate": 8.635866665490988e-08, "loss": 0.7056, "step": 8813 }, { "epoch": 0.96, "learning_rate": 8.589690137594697e-08, "loss": 0.8135, "step": 8814 }, { "epoch": 0.96, "learning_rate": 8.543636862773486e-08, "loss": 0.7261, "step": 8815 }, { "epoch": 0.96, "learning_rate": 8.497706846752885e-08, "loss": 0.6147, "step": 8816 }, { "epoch": 0.96, "learning_rate": 8.451900095242882e-08, "loss": 0.7419, "step": 8817 }, { "epoch": 0.96, "learning_rate": 8.406216613938256e-08, "loss": 0.6855, "step": 8818 }, { "epoch": 0.96, "learning_rate": 8.360656408518353e-08, "loss": 0.7671, "step": 8819 }, { "epoch": 0.96, "learning_rate": 8.315219484647308e-08, "loss": 0.7446, "step": 8820 }, { "epoch": 0.96, "learning_rate": 8.269905847973936e-08, "loss": 0.6782, "step": 8821 }, { "epoch": 0.96, "learning_rate": 8.224715504131508e-08, "loss": 0.689, "step": 8822 }, { "epoch": 0.96, "learning_rate": 8.179648458738309e-08, "loss": 0.5933, "step": 8823 }, { "epoch": 0.96, "learning_rate": 8.134704717397079e-08, "loss": 0.7378, "step": 8824 }, { "epoch": 0.96, "learning_rate": 8.089884285695126e-08, "loss": 0.6755, "step": 8825 }, { "epoch": 0.96, "learning_rate": 8.04518716920466e-08, "loss": 0.5889, "step": 8826 }, { "epoch": 0.96, "learning_rate": 8.00061337348268e-08, "loss": 0.7019, "step": 8827 }, { "epoch": 0.96, "learning_rate": 7.956162904070197e-08, "loss": 0.5918, "step": 8828 }, { "epoch": 0.96, "learning_rate": 7.911835766493792e-08, "loss": 0.6824, "step": 8829 }, { "epoch": 0.96, "learning_rate": 7.867631966263945e-08, "loss": 0.7375, "step": 8830 }, { "epoch": 0.96, "learning_rate": 7.823551508876148e-08, "loss": 0.7019, "step": 8831 }, { "epoch": 0.96, "learning_rate": 7.779594399810685e-08, "loss": 0.6072, "step": 8832 }, { "epoch": 0.96, "learning_rate": 7.735760644532298e-08, "loss": 0.6211, "step": 8833 }, { "epoch": 0.96, "learning_rate": 7.692050248490291e-08, "loss": 0.6045, "step": 8834 }, { "epoch": 0.96, "learning_rate": 7.648463217118985e-08, "loss": 0.6157, "step": 8835 }, { "epoch": 0.96, "learning_rate": 7.604999555837045e-08, "loss": 0.6924, "step": 8836 }, { "epoch": 0.96, "learning_rate": 7.561659270047928e-08, "loss": 0.7329, "step": 8837 }, { "epoch": 0.96, "learning_rate": 7.518442365139767e-08, "loss": 0.6028, "step": 8838 }, { "epoch": 0.96, "learning_rate": 7.475348846485264e-08, "loss": 0.6316, "step": 8839 }, { "epoch": 0.96, "learning_rate": 7.432378719441913e-08, "loss": 0.6919, "step": 8840 }, { "epoch": 0.96, "learning_rate": 7.389531989351773e-08, "loss": 0.6553, "step": 8841 }, { "epoch": 0.96, "learning_rate": 7.346808661541694e-08, "loss": 0.6875, "step": 8842 }, { "epoch": 0.96, "learning_rate": 7.304208741322871e-08, "loss": 0.5886, "step": 8843 }, { "epoch": 0.96, "learning_rate": 7.261732233991514e-08, "loss": 0.6799, "step": 8844 }, { "epoch": 0.96, "learning_rate": 7.219379144828287e-08, "loss": 0.6736, "step": 8845 }, { "epoch": 0.96, "learning_rate": 7.177149479098644e-08, "loss": 0.7007, "step": 8846 }, { "epoch": 0.96, "learning_rate": 7.135043242052497e-08, "loss": 0.6575, "step": 8847 }, { "epoch": 0.96, "learning_rate": 7.093060438924659e-08, "loss": 0.7183, "step": 8848 }, { "epoch": 0.96, "learning_rate": 7.0512010749344e-08, "loss": 0.6729, "step": 8849 }, { "epoch": 0.96, "learning_rate": 7.009465155285777e-08, "loss": 0.729, "step": 8850 }, { "epoch": 0.96, "learning_rate": 6.967852685167309e-08, "loss": 0.5591, "step": 8851 }, { "epoch": 0.96, "learning_rate": 6.926363669752412e-08, "loss": 0.6746, "step": 8852 }, { "epoch": 0.96, "learning_rate": 6.88499811419896e-08, "loss": 0.6328, "step": 8853 }, { "epoch": 0.96, "learning_rate": 6.843756023649728e-08, "loss": 0.6855, "step": 8854 }, { "epoch": 0.96, "learning_rate": 6.802637403231727e-08, "loss": 0.6257, "step": 8855 }, { "epoch": 0.96, "learning_rate": 6.761642258056977e-08, "loss": 0.5613, "step": 8856 }, { "epoch": 0.96, "learning_rate": 6.720770593222181e-08, "loss": 0.7463, "step": 8857 }, { "epoch": 0.96, "learning_rate": 6.680022413808274e-08, "loss": 0.6831, "step": 8858 }, { "epoch": 0.96, "learning_rate": 6.639397724881314e-08, "loss": 0.6594, "step": 8859 }, { "epoch": 0.96, "learning_rate": 6.598896531491706e-08, "loss": 0.656, "step": 8860 }, { "epoch": 0.96, "learning_rate": 6.558518838674533e-08, "loss": 0.6501, "step": 8861 }, { "epoch": 0.96, "learning_rate": 6.51826465144978e-08, "loss": 0.7461, "step": 8862 }, { "epoch": 0.96, "learning_rate": 6.478133974821777e-08, "loss": 0.6785, "step": 8863 }, { "epoch": 0.96, "learning_rate": 6.438126813779533e-08, "loss": 0.6641, "step": 8864 }, { "epoch": 0.97, "learning_rate": 6.398243173296958e-08, "loss": 0.5171, "step": 8865 }, { "epoch": 0.97, "learning_rate": 6.358483058332199e-08, "loss": 0.6973, "step": 8866 }, { "epoch": 0.97, "learning_rate": 6.318846473828522e-08, "loss": 0.6931, "step": 8867 }, { "epoch": 0.97, "learning_rate": 6.27933342471343e-08, "loss": 0.6794, "step": 8868 }, { "epoch": 0.97, "learning_rate": 6.239943915899105e-08, "loss": 0.7766, "step": 8869 }, { "epoch": 0.97, "learning_rate": 6.200677952282852e-08, "loss": 0.7053, "step": 8870 }, { "epoch": 0.97, "learning_rate": 6.161535538745877e-08, "loss": 0.587, "step": 8871 }, { "epoch": 0.97, "learning_rate": 6.122516680154622e-08, "loss": 0.6802, "step": 8872 }, { "epoch": 0.97, "learning_rate": 6.083621381359873e-08, "loss": 0.7324, "step": 8873 }, { "epoch": 0.97, "learning_rate": 6.044849647197093e-08, "loss": 0.6958, "step": 8874 }, { "epoch": 0.97, "learning_rate": 6.00620148248654e-08, "loss": 0.6943, "step": 8875 }, { "epoch": 0.97, "learning_rate": 5.967676892032814e-08, "loss": 0.7144, "step": 8876 }, { "epoch": 0.97, "learning_rate": 5.929275880625529e-08, "loss": 0.6497, "step": 8877 }, { "epoch": 0.97, "learning_rate": 5.890998453038643e-08, "loss": 0.6938, "step": 8878 }, { "epoch": 0.97, "learning_rate": 5.852844614030795e-08, "loss": 0.6077, "step": 8879 }, { "epoch": 0.97, "learning_rate": 5.814814368345412e-08, "loss": 0.7686, "step": 8880 }, { "epoch": 0.97, "learning_rate": 5.7769077207103785e-08, "loss": 0.72, "step": 8881 }, { "epoch": 0.97, "learning_rate": 5.739124675838259e-08, "loss": 0.6626, "step": 8882 }, { "epoch": 0.97, "learning_rate": 5.701465238426296e-08, "loss": 0.656, "step": 8883 }, { "epoch": 0.97, "learning_rate": 5.6639294131564105e-08, "loss": 0.5671, "step": 8884 }, { "epoch": 0.97, "learning_rate": 5.6265172046949815e-08, "loss": 0.6702, "step": 8885 }, { "epoch": 0.97, "learning_rate": 5.5892286176932875e-08, "loss": 0.6096, "step": 8886 }, { "epoch": 0.97, "learning_rate": 5.5520636567869544e-08, "loss": 0.7246, "step": 8887 }, { "epoch": 0.97, "learning_rate": 5.5150223265963974e-08, "loss": 0.7241, "step": 8888 }, { "epoch": 0.97, "learning_rate": 5.4781046317267103e-08, "loss": 0.6077, "step": 8889 }, { "epoch": 0.97, "learning_rate": 5.4413105767673335e-08, "loss": 0.6624, "step": 8890 }, { "epoch": 0.97, "learning_rate": 5.4046401662927185e-08, "loss": 0.6587, "step": 8891 }, { "epoch": 0.97, "learning_rate": 5.368093404861774e-08, "loss": 0.6194, "step": 8892 }, { "epoch": 0.97, "learning_rate": 5.331670297017977e-08, "loss": 0.75, "step": 8893 }, { "epoch": 0.97, "learning_rate": 5.2953708472893715e-08, "loss": 0.6506, "step": 8894 }, { "epoch": 0.97, "learning_rate": 5.259195060188904e-08, "loss": 0.6094, "step": 8895 }, { "epoch": 0.97, "learning_rate": 5.223142940213865e-08, "loss": 0.6802, "step": 8896 }, { "epoch": 0.97, "learning_rate": 5.187214491846338e-08, "loss": 0.6777, "step": 8897 }, { "epoch": 0.97, "learning_rate": 5.15140971955308e-08, "loss": 0.6604, "step": 8898 }, { "epoch": 0.97, "learning_rate": 5.115728627785199e-08, "loss": 0.6157, "step": 8899 }, { "epoch": 0.97, "learning_rate": 5.080171220978813e-08, "loss": 0.5854, "step": 8900 }, { "epoch": 0.97, "learning_rate": 5.044737503554165e-08, "loss": 0.6689, "step": 8901 }, { "epoch": 0.97, "learning_rate": 5.0094274799166175e-08, "loss": 0.7061, "step": 8902 }, { "epoch": 0.97, "learning_rate": 4.974241154455994e-08, "loss": 0.6992, "step": 8903 }, { "epoch": 0.97, "learning_rate": 4.939178531546463e-08, "loss": 0.7705, "step": 8904 }, { "epoch": 0.97, "learning_rate": 4.9042396155472015e-08, "loss": 0.6179, "step": 8905 }, { "epoch": 0.97, "learning_rate": 4.869424410801848e-08, "loss": 0.6233, "step": 8906 }, { "epoch": 0.97, "learning_rate": 4.8347329216387184e-08, "loss": 0.6223, "step": 8907 }, { "epoch": 0.97, "learning_rate": 4.800165152370584e-08, "loss": 0.6543, "step": 8908 }, { "epoch": 0.97, "learning_rate": 4.765721107294896e-08, "loss": 0.6169, "step": 8909 }, { "epoch": 0.97, "learning_rate": 4.731400790693785e-08, "loss": 0.6436, "step": 8910 }, { "epoch": 0.97, "learning_rate": 4.6972042068341714e-08, "loss": 0.6653, "step": 8911 }, { "epoch": 0.97, "learning_rate": 4.6631313599673214e-08, "loss": 0.678, "step": 8912 }, { "epoch": 0.97, "learning_rate": 4.6291822543290676e-08, "loss": 0.8157, "step": 8913 }, { "epoch": 0.97, "learning_rate": 4.595356894140035e-08, "loss": 0.644, "step": 8914 }, { "epoch": 0.97, "learning_rate": 4.561655283605526e-08, "loss": 0.6113, "step": 8915 }, { "epoch": 0.97, "learning_rate": 4.528077426915412e-08, "loss": 0.6968, "step": 8916 }, { "epoch": 0.97, "learning_rate": 4.4946233282439076e-08, "loss": 0.7583, "step": 8917 }, { "epoch": 0.97, "learning_rate": 4.4612929917502433e-08, "loss": 0.7705, "step": 8918 }, { "epoch": 0.97, "learning_rate": 4.428086421577993e-08, "loss": 0.7104, "step": 8919 }, { "epoch": 0.97, "learning_rate": 4.395003621855409e-08, "loss": 0.6768, "step": 8920 }, { "epoch": 0.97, "learning_rate": 4.362044596695425e-08, "loss": 0.8115, "step": 8921 }, { "epoch": 0.97, "learning_rate": 4.329209350195651e-08, "loss": 0.6377, "step": 8922 }, { "epoch": 0.97, "learning_rate": 4.2964978864379336e-08, "loss": 0.6335, "step": 8923 }, { "epoch": 0.97, "learning_rate": 4.26391020948913e-08, "loss": 0.5532, "step": 8924 }, { "epoch": 0.97, "learning_rate": 4.231446323400557e-08, "loss": 0.7607, "step": 8925 }, { "epoch": 0.97, "learning_rate": 4.1991062322082057e-08, "loss": 0.6465, "step": 8926 }, { "epoch": 0.97, "learning_rate": 4.166889939932639e-08, "loss": 0.7366, "step": 8927 }, { "epoch": 0.97, "learning_rate": 4.134797450578987e-08, "loss": 0.5073, "step": 8928 }, { "epoch": 0.97, "learning_rate": 4.102828768136946e-08, "loss": 0.6797, "step": 8929 }, { "epoch": 0.97, "learning_rate": 4.070983896581004e-08, "loss": 0.5989, "step": 8930 }, { "epoch": 0.97, "learning_rate": 4.0392628398699954e-08, "loss": 0.6218, "step": 8931 }, { "epoch": 0.97, "learning_rate": 4.007665601947652e-08, "loss": 0.7881, "step": 8932 }, { "epoch": 0.97, "learning_rate": 3.976192186742167e-08, "loss": 0.5791, "step": 8933 }, { "epoch": 0.97, "learning_rate": 3.9448425981661876e-08, "loss": 0.7058, "step": 8934 }, { "epoch": 0.97, "learning_rate": 3.913616840117374e-08, "loss": 0.7031, "step": 8935 }, { "epoch": 0.97, "learning_rate": 3.88251491647762e-08, "loss": 0.6252, "step": 8936 }, { "epoch": 0.97, "learning_rate": 3.851536831113389e-08, "loss": 0.6353, "step": 8937 }, { "epoch": 0.97, "learning_rate": 3.8206825878762675e-08, "loss": 0.8076, "step": 8938 }, { "epoch": 0.97, "learning_rate": 3.789952190601742e-08, "loss": 0.666, "step": 8939 }, { "epoch": 0.97, "learning_rate": 3.759345643110313e-08, "loss": 0.6008, "step": 8940 }, { "epoch": 0.97, "learning_rate": 3.728862949207268e-08, "loss": 0.6736, "step": 8941 }, { "epoch": 0.97, "learning_rate": 3.698504112681911e-08, "loss": 0.6375, "step": 8942 }, { "epoch": 0.97, "learning_rate": 3.668269137308666e-08, "loss": 0.6631, "step": 8943 }, { "epoch": 0.97, "learning_rate": 3.6381580268463056e-08, "loss": 0.6863, "step": 8944 }, { "epoch": 0.97, "learning_rate": 3.6081707850382785e-08, "loss": 0.6887, "step": 8945 }, { "epoch": 0.97, "learning_rate": 3.578307415612714e-08, "loss": 0.7251, "step": 8946 }, { "epoch": 0.97, "learning_rate": 3.548567922282198e-08, "loss": 0.6602, "step": 8947 }, { "epoch": 0.97, "learning_rate": 3.518952308743884e-08, "loss": 0.7283, "step": 8948 }, { "epoch": 0.97, "learning_rate": 3.489460578679715e-08, "loss": 0.6572, "step": 8949 }, { "epoch": 0.97, "learning_rate": 3.460092735756204e-08, "loss": 0.7158, "step": 8950 }, { "epoch": 0.97, "learning_rate": 3.4308487836242077e-08, "loss": 0.6655, "step": 8951 }, { "epoch": 0.97, "learning_rate": 3.401728725919373e-08, "loss": 0.6487, "step": 8952 }, { "epoch": 0.97, "learning_rate": 3.372732566262138e-08, "loss": 0.637, "step": 8953 }, { "epoch": 0.97, "learning_rate": 3.343860308257174e-08, "loss": 0.6943, "step": 8954 }, { "epoch": 0.97, "learning_rate": 3.315111955493944e-08, "loss": 0.7441, "step": 8955 }, { "epoch": 0.97, "learning_rate": 3.2864875115464765e-08, "loss": 0.7104, "step": 8956 }, { "epoch": 0.98, "learning_rate": 3.257986979973371e-08, "loss": 0.6821, "step": 8957 }, { "epoch": 0.98, "learning_rate": 3.229610364317792e-08, "loss": 0.6885, "step": 8958 }, { "epoch": 0.98, "learning_rate": 3.2013576681075855e-08, "loss": 0.6445, "step": 8959 }, { "epoch": 0.98, "learning_rate": 3.173228894855274e-08, "loss": 0.7153, "step": 8960 }, { "epoch": 0.98, "learning_rate": 3.1452240480577265e-08, "loss": 0.5969, "step": 8961 }, { "epoch": 0.98, "learning_rate": 3.117343131196493e-08, "loss": 0.6846, "step": 8962 }, { "epoch": 0.98, "learning_rate": 3.0895861477377995e-08, "loss": 0.6226, "step": 8963 }, { "epoch": 0.98, "learning_rate": 3.061953101132442e-08, "loss": 0.6914, "step": 8964 }, { "epoch": 0.98, "learning_rate": 3.034443994815894e-08, "loss": 0.6685, "step": 8965 }, { "epoch": 0.98, "learning_rate": 3.0070588322079765e-08, "loss": 0.6348, "step": 8966 }, { "epoch": 0.98, "learning_rate": 2.979797616713187e-08, "loss": 0.5679, "step": 8967 }, { "epoch": 0.98, "learning_rate": 2.952660351720815e-08, "loss": 0.7231, "step": 8968 }, { "epoch": 0.98, "learning_rate": 2.9256470406044958e-08, "loss": 0.6262, "step": 8969 }, { "epoch": 0.98, "learning_rate": 2.898757686722542e-08, "loss": 0.6641, "step": 8970 }, { "epoch": 0.98, "learning_rate": 2.871992293417947e-08, "loss": 0.5935, "step": 8971 }, { "epoch": 0.98, "learning_rate": 2.8453508640181592e-08, "loss": 0.6472, "step": 8972 }, { "epoch": 0.98, "learning_rate": 2.818833401835308e-08, "loss": 0.668, "step": 8973 }, { "epoch": 0.98, "learning_rate": 2.7924399101659783e-08, "loss": 0.7012, "step": 8974 }, { "epoch": 0.98, "learning_rate": 2.766170392291434e-08, "loss": 0.6392, "step": 8975 }, { "epoch": 0.98, "learning_rate": 2.7400248514776184e-08, "loss": 0.7722, "step": 8976 }, { "epoch": 0.98, "learning_rate": 2.7140032909749315e-08, "loss": 0.656, "step": 8977 }, { "epoch": 0.98, "learning_rate": 2.6881057140184518e-08, "loss": 0.658, "step": 8978 }, { "epoch": 0.98, "learning_rate": 2.6623321238277157e-08, "loss": 0.7305, "step": 8979 }, { "epoch": 0.98, "learning_rate": 2.6366825236068262e-08, "loss": 0.7334, "step": 8980 }, { "epoch": 0.98, "learning_rate": 2.6111569165447882e-08, "loss": 0.6904, "step": 8981 }, { "epoch": 0.98, "learning_rate": 2.585755305814841e-08, "loss": 0.6948, "step": 8982 }, { "epoch": 0.98, "learning_rate": 2.5604776945750142e-08, "loss": 0.5989, "step": 8983 }, { "epoch": 0.98, "learning_rate": 2.5353240859676832e-08, "loss": 0.6328, "step": 8984 }, { "epoch": 0.98, "learning_rate": 2.5102944831201238e-08, "loss": 0.6599, "step": 8985 }, { "epoch": 0.98, "learning_rate": 2.4853888891439582e-08, "loss": 0.6975, "step": 8986 }, { "epoch": 0.98, "learning_rate": 2.4606073071355983e-08, "loss": 0.6907, "step": 8987 }, { "epoch": 0.98, "learning_rate": 2.4359497401758026e-08, "loss": 0.7583, "step": 8988 }, { "epoch": 0.98, "learning_rate": 2.4114161913300072e-08, "loss": 0.5708, "step": 8989 }, { "epoch": 0.98, "learning_rate": 2.3870066636482168e-08, "loss": 0.6179, "step": 8990 }, { "epoch": 0.98, "learning_rate": 2.3627211601651157e-08, "loss": 0.594, "step": 8991 }, { "epoch": 0.98, "learning_rate": 2.3385596839000658e-08, "loss": 0.6665, "step": 8992 }, { "epoch": 0.98, "learning_rate": 2.3145222378565535e-08, "loss": 0.6543, "step": 8993 }, { "epoch": 0.98, "learning_rate": 2.2906088250229664e-08, "loss": 0.6357, "step": 8994 }, { "epoch": 0.98, "learning_rate": 2.2668194483724814e-08, "loss": 0.6763, "step": 8995 }, { "epoch": 0.98, "learning_rate": 2.2431541108624e-08, "loss": 0.657, "step": 8996 }, { "epoch": 0.98, "learning_rate": 2.219612815434924e-08, "loss": 0.7175, "step": 8997 }, { "epoch": 0.98, "learning_rate": 2.1961955650167122e-08, "loss": 0.7251, "step": 8998 }, { "epoch": 0.98, "learning_rate": 2.1729023625189916e-08, "loss": 0.7529, "step": 8999 }, { "epoch": 0.98, "learning_rate": 2.1497332108375567e-08, "loss": 0.6235, "step": 9000 }, { "epoch": 0.98, "learning_rate": 2.1266881128528815e-08, "loss": 0.6228, "step": 9001 }, { "epoch": 0.98, "learning_rate": 2.1037670714300072e-08, "loss": 0.478, "step": 9002 }, { "epoch": 0.98, "learning_rate": 2.0809700894183214e-08, "loss": 0.6877, "step": 9003 }, { "epoch": 0.98, "learning_rate": 2.0582971696522237e-08, "loss": 0.6899, "step": 9004 }, { "epoch": 0.98, "learning_rate": 2.0357483149501256e-08, "loss": 0.6475, "step": 9005 }, { "epoch": 0.98, "learning_rate": 2.013323528115674e-08, "loss": 0.6487, "step": 9006 }, { "epoch": 0.98, "learning_rate": 1.9910228119364162e-08, "loss": 0.6343, "step": 9007 }, { "epoch": 0.98, "learning_rate": 1.9688461691849125e-08, "loss": 0.6213, "step": 9008 }, { "epoch": 0.98, "learning_rate": 1.946793602618291e-08, "loss": 0.7856, "step": 9009 }, { "epoch": 0.98, "learning_rate": 1.924865114978025e-08, "loss": 0.6995, "step": 9010 }, { "epoch": 0.98, "learning_rate": 1.9030607089902675e-08, "loss": 0.7441, "step": 9011 }, { "epoch": 0.98, "learning_rate": 1.881380387365961e-08, "loss": 0.7388, "step": 9012 }, { "epoch": 0.98, "learning_rate": 1.8598241528001716e-08, "loss": 0.7422, "step": 9013 }, { "epoch": 0.98, "learning_rate": 1.838392007972867e-08, "loss": 0.6335, "step": 9014 }, { "epoch": 0.98, "learning_rate": 1.817083955548693e-08, "loss": 0.7964, "step": 9015 }, { "epoch": 0.98, "learning_rate": 1.7958999981764203e-08, "loss": 0.6631, "step": 9016 }, { "epoch": 0.98, "learning_rate": 1.7748401384898306e-08, "loss": 0.7446, "step": 9017 }, { "epoch": 0.98, "learning_rate": 1.753904379106941e-08, "loss": 0.6262, "step": 9018 }, { "epoch": 0.98, "learning_rate": 1.7330927226306694e-08, "loss": 0.6741, "step": 9019 }, { "epoch": 0.98, "learning_rate": 1.7124051716483903e-08, "loss": 0.7578, "step": 9020 }, { "epoch": 0.98, "learning_rate": 1.6918417287318245e-08, "loss": 0.6162, "step": 9021 }, { "epoch": 0.98, "learning_rate": 1.6714023964374824e-08, "loss": 0.7439, "step": 9022 }, { "epoch": 0.98, "learning_rate": 1.651087177306443e-08, "loss": 0.7734, "step": 9023 }, { "epoch": 0.98, "learning_rate": 1.630896073864352e-08, "loss": 0.6782, "step": 9024 }, { "epoch": 0.98, "learning_rate": 1.610829088621313e-08, "loss": 0.6213, "step": 9025 }, { "epoch": 0.98, "learning_rate": 1.590886224071997e-08, "loss": 0.678, "step": 9026 }, { "epoch": 0.98, "learning_rate": 1.5710674826959758e-08, "loss": 0.6409, "step": 9027 }, { "epoch": 0.98, "learning_rate": 1.551372866956835e-08, "loss": 0.656, "step": 9028 }, { "epoch": 0.98, "learning_rate": 1.5318023793032823e-08, "loss": 0.7422, "step": 9029 }, { "epoch": 0.98, "learning_rate": 1.5123560221681488e-08, "loss": 0.7441, "step": 9030 }, { "epoch": 0.98, "learning_rate": 1.4930337979691678e-08, "loss": 0.4802, "step": 9031 }, { "epoch": 0.98, "learning_rate": 1.4738357091084177e-08, "loss": 0.5676, "step": 9032 }, { "epoch": 0.98, "learning_rate": 1.4547617579725449e-08, "loss": 0.6924, "step": 9033 }, { "epoch": 0.98, "learning_rate": 1.4358119469329857e-08, "loss": 0.6228, "step": 9034 }, { "epoch": 0.98, "learning_rate": 1.4169862783456335e-08, "loss": 0.6855, "step": 9035 }, { "epoch": 0.98, "learning_rate": 1.3982847545507271e-08, "loss": 0.7734, "step": 9036 }, { "epoch": 0.98, "learning_rate": 1.3797073778734071e-08, "loss": 0.5754, "step": 9037 }, { "epoch": 0.98, "learning_rate": 1.3612541506231592e-08, "loss": 0.573, "step": 9038 }, { "epoch": 0.98, "learning_rate": 1.342925075094148e-08, "loss": 0.5938, "step": 9039 }, { "epoch": 0.98, "learning_rate": 1.3247201535649957e-08, "loss": 0.5291, "step": 9040 }, { "epoch": 0.98, "learning_rate": 1.3066393882990026e-08, "loss": 0.7285, "step": 9041 }, { "epoch": 0.98, "learning_rate": 1.2886827815440373e-08, "loss": 0.6807, "step": 9042 }, { "epoch": 0.98, "learning_rate": 1.2708503355323143e-08, "loss": 0.73, "step": 9043 }, { "epoch": 0.98, "learning_rate": 1.25314205248106e-08, "loss": 0.7542, "step": 9044 }, { "epoch": 0.98, "learning_rate": 1.2355579345915136e-08, "loss": 0.7607, "step": 9045 }, { "epoch": 0.98, "learning_rate": 1.2180979840498153e-08, "loss": 0.6667, "step": 9046 }, { "epoch": 0.98, "learning_rate": 1.200762203026784e-08, "loss": 0.7134, "step": 9047 }, { "epoch": 0.98, "learning_rate": 1.1835505936773628e-08, "loss": 0.6909, "step": 9048 }, { "epoch": 0.99, "learning_rate": 1.1664631581415065e-08, "loss": 0.707, "step": 9049 }, { "epoch": 0.99, "learning_rate": 1.1494998985434047e-08, "loss": 0.5214, "step": 9050 }, { "epoch": 0.99, "learning_rate": 1.1326608169920373e-08, "loss": 0.6624, "step": 9051 }, { "epoch": 0.99, "learning_rate": 1.1159459155808405e-08, "loss": 0.6173, "step": 9052 }, { "epoch": 0.99, "learning_rate": 1.099355196387819e-08, "loss": 0.6992, "step": 9053 }, { "epoch": 0.99, "learning_rate": 1.0828886614754342e-08, "loss": 0.6704, "step": 9054 }, { "epoch": 0.99, "learning_rate": 1.066546312891048e-08, "loss": 0.7144, "step": 9055 }, { "epoch": 0.99, "learning_rate": 1.0503281526662579e-08, "loss": 0.7488, "step": 9056 }, { "epoch": 0.99, "learning_rate": 1.0342341828172287e-08, "loss": 0.6492, "step": 9057 }, { "epoch": 0.99, "learning_rate": 1.0182644053448044e-08, "loss": 0.6233, "step": 9058 }, { "epoch": 0.99, "learning_rate": 1.0024188222345076e-08, "loss": 0.6729, "step": 9059 }, { "epoch": 0.99, "learning_rate": 9.866974354560966e-09, "loss": 0.6309, "step": 9060 }, { "epoch": 0.99, "learning_rate": 9.711002469642294e-09, "loss": 0.71, "step": 9061 }, { "epoch": 0.99, "learning_rate": 9.556272586977999e-09, "loss": 0.7021, "step": 9062 }, { "epoch": 0.99, "learning_rate": 9.402784725806024e-09, "loss": 0.7527, "step": 9063 }, { "epoch": 0.99, "learning_rate": 9.250538905206663e-09, "loss": 0.7036, "step": 9064 }, { "epoch": 0.99, "learning_rate": 9.099535144108107e-09, "loss": 0.6104, "step": 9065 }, { "epoch": 0.99, "learning_rate": 8.949773461282008e-09, "loss": 0.7495, "step": 9066 }, { "epoch": 0.99, "learning_rate": 8.801253875349026e-09, "loss": 0.6599, "step": 9067 }, { "epoch": 0.99, "learning_rate": 8.653976404771059e-09, "loss": 0.6685, "step": 9068 }, { "epoch": 0.99, "learning_rate": 8.507941067859016e-09, "loss": 0.7056, "step": 9069 }, { "epoch": 0.99, "learning_rate": 8.363147882768375e-09, "loss": 0.5739, "step": 9070 }, { "epoch": 0.99, "learning_rate": 8.21959686749918e-09, "loss": 0.7158, "step": 9071 }, { "epoch": 0.99, "learning_rate": 8.077288039898267e-09, "loss": 0.6936, "step": 9072 }, { "epoch": 0.99, "learning_rate": 7.936221417658152e-09, "loss": 0.6799, "step": 9073 }, { "epoch": 0.99, "learning_rate": 7.796397018314804e-09, "loss": 0.6868, "step": 9074 }, { "epoch": 0.99, "learning_rate": 7.657814859252099e-09, "loss": 0.645, "step": 9075 }, { "epoch": 0.99, "learning_rate": 7.520474957699586e-09, "loss": 0.6572, "step": 9076 }, { "epoch": 0.99, "learning_rate": 7.384377330730275e-09, "loss": 0.79, "step": 9077 }, { "epoch": 0.99, "learning_rate": 7.2495219952639636e-09, "loss": 0.7156, "step": 9078 }, { "epoch": 0.99, "learning_rate": 7.115908968067242e-09, "loss": 0.6648, "step": 9079 }, { "epoch": 0.99, "learning_rate": 6.983538265750156e-09, "loss": 0.6235, "step": 9080 }, { "epoch": 0.99, "learning_rate": 6.8524099047695415e-09, "loss": 0.6272, "step": 9081 }, { "epoch": 0.99, "learning_rate": 6.722523901426803e-09, "loss": 0.6472, "step": 9082 }, { "epoch": 0.99, "learning_rate": 6.593880271869024e-09, "loss": 0.6357, "step": 9083 }, { "epoch": 0.99, "learning_rate": 6.4664790320911885e-09, "loss": 0.6814, "step": 9084 }, { "epoch": 0.99, "learning_rate": 6.340320197929517e-09, "loss": 0.6694, "step": 9085 }, { "epoch": 0.99, "learning_rate": 6.2154037850703505e-09, "loss": 0.6772, "step": 9086 }, { "epoch": 0.99, "learning_rate": 6.091729809042379e-09, "loss": 0.6624, "step": 9087 }, { "epoch": 0.99, "learning_rate": 5.969298285221081e-09, "loss": 0.7253, "step": 9088 }, { "epoch": 0.99, "learning_rate": 5.848109228827614e-09, "loss": 0.7083, "step": 9089 }, { "epoch": 0.99, "learning_rate": 5.728162654927705e-09, "loss": 0.6726, "step": 9090 }, { "epoch": 0.99, "learning_rate": 5.609458578432758e-09, "loss": 0.7109, "step": 9091 }, { "epoch": 0.99, "learning_rate": 5.49199701410208e-09, "loss": 0.6508, "step": 9092 }, { "epoch": 0.99, "learning_rate": 5.375777976536211e-09, "loss": 0.6436, "step": 9093 }, { "epoch": 0.99, "learning_rate": 5.260801480185818e-09, "loss": 0.6807, "step": 9094 }, { "epoch": 0.99, "learning_rate": 5.147067539342798e-09, "loss": 0.7961, "step": 9095 }, { "epoch": 0.99, "learning_rate": 5.034576168149175e-09, "loss": 0.5967, "step": 9096 }, { "epoch": 0.99, "learning_rate": 4.923327380587095e-09, "loss": 0.7808, "step": 9097 }, { "epoch": 0.99, "learning_rate": 4.813321190488829e-09, "loss": 0.7373, "step": 9098 }, { "epoch": 0.99, "learning_rate": 4.704557611531213e-09, "loss": 0.7642, "step": 9099 }, { "epoch": 0.99, "learning_rate": 4.597036657233434e-09, "loss": 0.7139, "step": 9100 }, { "epoch": 0.99, "learning_rate": 4.490758340964796e-09, "loss": 0.572, "step": 9101 }, { "epoch": 0.99, "learning_rate": 4.385722675936954e-09, "loss": 0.6282, "step": 9102 }, { "epoch": 0.99, "learning_rate": 4.281929675208351e-09, "loss": 0.7266, "step": 9103 }, { "epoch": 0.99, "learning_rate": 4.1793793516820005e-09, "loss": 0.7939, "step": 9104 }, { "epoch": 0.99, "learning_rate": 4.0780717181077015e-09, "loss": 0.6187, "step": 9105 }, { "epoch": 0.99, "learning_rate": 3.978006787079824e-09, "loss": 0.7354, "step": 9106 }, { "epoch": 0.99, "learning_rate": 3.87918457103953e-09, "loss": 0.6721, "step": 9107 }, { "epoch": 0.99, "learning_rate": 3.7816050822703235e-09, "loss": 0.7656, "step": 9108 }, { "epoch": 0.99, "learning_rate": 3.6852683329058336e-09, "loss": 0.6914, "step": 9109 }, { "epoch": 0.99, "learning_rate": 3.590174334919816e-09, "loss": 0.6616, "step": 9110 }, { "epoch": 0.99, "learning_rate": 3.4963231001383657e-09, "loss": 0.6733, "step": 9111 }, { "epoch": 0.99, "learning_rate": 3.403714640225486e-09, "loss": 0.7217, "step": 9112 }, { "epoch": 0.99, "learning_rate": 3.3123489666964104e-09, "loss": 0.604, "step": 9113 }, { "epoch": 0.99, "learning_rate": 3.22222609090872e-09, "loss": 0.5986, "step": 9114 }, { "epoch": 0.99, "learning_rate": 3.1333460240678958e-09, "loss": 0.7568, "step": 9115 }, { "epoch": 0.99, "learning_rate": 3.0457087772228777e-09, "loss": 0.7339, "step": 9116 }, { "epoch": 0.99, "learning_rate": 2.959314361268284e-09, "loss": 0.6956, "step": 9117 }, { "epoch": 0.99, "learning_rate": 2.8741627869444123e-09, "loss": 0.729, "step": 9118 }, { "epoch": 0.99, "learning_rate": 2.7902540648394593e-09, "loss": 0.6533, "step": 9119 }, { "epoch": 0.99, "learning_rate": 2.7075882053828605e-09, "loss": 0.6533, "step": 9120 }, { "epoch": 0.99, "learning_rate": 2.6261652188530608e-09, "loss": 0.6536, "step": 9121 }, { "epoch": 0.99, "learning_rate": 2.545985115371963e-09, "loss": 0.6643, "step": 9122 }, { "epoch": 0.99, "learning_rate": 2.4670479049082596e-09, "loss": 0.6097, "step": 9123 }, { "epoch": 0.99, "learning_rate": 2.3893535972752126e-09, "loss": 0.656, "step": 9124 }, { "epoch": 0.99, "learning_rate": 2.3129022021317615e-09, "loss": 0.6846, "step": 9125 }, { "epoch": 0.99, "learning_rate": 2.237693728981416e-09, "loss": 0.6345, "step": 9126 }, { "epoch": 0.99, "learning_rate": 2.1637281871766948e-09, "loss": 0.6184, "step": 9127 }, { "epoch": 0.99, "learning_rate": 2.091005585910244e-09, "loss": 0.5669, "step": 9128 }, { "epoch": 0.99, "learning_rate": 2.0195259342248306e-09, "loss": 0.6929, "step": 9129 }, { "epoch": 0.99, "learning_rate": 1.94928924100557e-09, "loss": 0.6245, "step": 9130 }, { "epoch": 0.99, "learning_rate": 1.8802955149865854e-09, "loss": 0.6277, "step": 9131 }, { "epoch": 0.99, "learning_rate": 1.8125447647421302e-09, "loss": 0.6399, "step": 9132 }, { "epoch": 0.99, "learning_rate": 1.7460369986976866e-09, "loss": 0.7256, "step": 9133 }, { "epoch": 0.99, "learning_rate": 1.6807722251199754e-09, "loss": 0.7002, "step": 9134 }, { "epoch": 0.99, "learning_rate": 1.6167504521236166e-09, "loss": 0.6294, "step": 9135 }, { "epoch": 0.99, "learning_rate": 1.553971687667799e-09, "loss": 0.7354, "step": 9136 }, { "epoch": 0.99, "learning_rate": 1.4924359395573907e-09, "loss": 0.751, "step": 9137 }, { "epoch": 0.99, "learning_rate": 1.432143215441828e-09, "loss": 0.7388, "step": 9138 }, { "epoch": 0.99, "learning_rate": 1.3730935228162268e-09, "loss": 0.6985, "step": 9139 }, { "epoch": 0.99, "learning_rate": 1.315286869023602e-09, "loss": 0.7004, "step": 9140 }, { "epoch": 1.0, "learning_rate": 1.2587232612493172e-09, "loss": 0.6365, "step": 9141 }, { "epoch": 1.0, "learning_rate": 1.203402706525525e-09, "loss": 0.7622, "step": 9142 }, { "epoch": 1.0, "learning_rate": 1.149325211730057e-09, "loss": 0.7676, "step": 9143 }, { "epoch": 1.0, "learning_rate": 1.0964907835864235e-09, "loss": 0.6619, "step": 9144 }, { "epoch": 1.0, "learning_rate": 1.0448994286615944e-09, "loss": 0.5964, "step": 9145 }, { "epoch": 1.0, "learning_rate": 9.945511533693275e-10, "loss": 0.6628, "step": 9146 }, { "epoch": 1.0, "learning_rate": 9.45445963971281e-10, "loss": 0.698, "step": 9147 }, { "epoch": 1.0, "learning_rate": 8.975838665703507e-10, "loss": 0.7729, "step": 9148 }, { "epoch": 1.0, "learning_rate": 8.509648671162218e-10, "loss": 0.7468, "step": 9149 }, { "epoch": 1.0, "learning_rate": 8.05588971406479e-10, "loss": 0.6697, "step": 9150 }, { "epoch": 1.0, "learning_rate": 7.614561850821655e-10, "loss": 0.6709, "step": 9151 }, { "epoch": 1.0, "learning_rate": 7.185665136277831e-10, "loss": 0.7109, "step": 9152 }, { "epoch": 1.0, "learning_rate": 6.769199623779532e-10, "loss": 0.7954, "step": 9153 }, { "epoch": 1.0, "learning_rate": 6.365165365085358e-10, "loss": 0.5579, "step": 9154 }, { "epoch": 1.0, "learning_rate": 5.973562410432898e-10, "loss": 0.6497, "step": 9155 }, { "epoch": 1.0, "learning_rate": 5.594390808494332e-10, "loss": 0.6731, "step": 9156 }, { "epoch": 1.0, "learning_rate": 5.227650606431933e-10, "loss": 0.5916, "step": 9157 }, { "epoch": 1.0, "learning_rate": 4.873341849820356e-10, "loss": 0.6782, "step": 9158 }, { "epoch": 1.0, "learning_rate": 4.531464582713252e-10, "loss": 0.6665, "step": 9159 }, { "epoch": 1.0, "learning_rate": 4.2020188476099565e-10, "loss": 0.7261, "step": 9160 }, { "epoch": 1.0, "learning_rate": 3.8850046854777e-10, "loss": 0.6931, "step": 9161 }, { "epoch": 1.0, "learning_rate": 3.580422135718298e-10, "loss": 0.7856, "step": 9162 }, { "epoch": 1.0, "learning_rate": 3.288271236201457e-10, "loss": 0.7202, "step": 9163 }, { "epoch": 1.0, "learning_rate": 3.008552023242572e-10, "loss": 0.5659, "step": 9164 }, { "epoch": 1.0, "learning_rate": 2.741264531624932e-10, "loss": 0.6182, "step": 9165 }, { "epoch": 1.0, "learning_rate": 2.4864087945664085e-10, "loss": 0.6917, "step": 9166 }, { "epoch": 1.0, "learning_rate": 2.243984843763869e-10, "loss": 0.8433, "step": 9167 }, { "epoch": 1.0, "learning_rate": 2.0139927093487666e-10, "loss": 0.5593, "step": 9168 }, { "epoch": 1.0, "learning_rate": 1.7964324199204463e-10, "loss": 0.5991, "step": 9169 }, { "epoch": 1.0, "learning_rate": 1.591304002512839e-10, "loss": 0.6423, "step": 9170 }, { "epoch": 1.0, "learning_rate": 1.3986074826388697e-10, "loss": 0.6851, "step": 9171 }, { "epoch": 1.0, "learning_rate": 1.2183428842460486e-10, "loss": 0.8486, "step": 9172 }, { "epoch": 1.0, "learning_rate": 1.0505102297608815e-10, "loss": 0.6296, "step": 9173 }, { "epoch": 1.0, "learning_rate": 8.951095400333565e-11, "loss": 0.6431, "step": 9174 }, { "epoch": 1.0, "learning_rate": 7.521408343924564e-11, "loss": 0.6792, "step": 9175 }, { "epoch": 1.0, "learning_rate": 6.216041306017495e-11, "loss": 0.6858, "step": 9176 }, { "epoch": 1.0, "learning_rate": 5.034994448926967e-11, "loss": 0.6128, "step": 9177 }, { "epoch": 1.0, "learning_rate": 3.978267919535483e-11, "loss": 0.7646, "step": 9178 }, { "epoch": 1.0, "learning_rate": 3.0458618492934525e-11, "loss": 0.6914, "step": 9179 }, { "epoch": 1.0, "learning_rate": 2.237776353886112e-11, "loss": 0.6655, "step": 9180 }, { "epoch": 1.0, "learning_rate": 1.554011534010691e-11, "loss": 0.7612, "step": 9181 }, { "epoch": 1.0, "learning_rate": 9.945674744882283e-12, "loss": 0.5867, "step": 9182 }, { "epoch": 1.0, "learning_rate": 5.594442449297077e-12, "loss": 0.6682, "step": 9183 }, { "epoch": 1.0, "learning_rate": 2.4864189951401274e-12, "loss": 0.7583, "step": 9184 }, { "epoch": 1.0, "learning_rate": 6.216047676588233e-13, "loss": 0.7192, "step": 9185 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.6372, "step": 9186 }, { "epoch": 1.0, "step": 9186, "total_flos": 4036443115880448.0, "train_loss": 0.7238920225496, "train_runtime": 155543.7253, "train_samples_per_second": 7.559, "train_steps_per_second": 0.059 } ], "max_steps": 9186, "num_train_epochs": 1, "total_flos": 4036443115880448.0, "trial_name": null, "trial_params": null }