{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9566580346190541, "global_step": 14038, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 4.53514739229025e-08, "loss": 1.3926, "step": 1 }, { "epoch": 0.0, "learning_rate": 9.0702947845805e-08, "loss": 1.3477, "step": 2 }, { "epoch": 0.0, "learning_rate": 1.360544217687075e-07, "loss": 1.3555, "step": 3 }, { "epoch": 0.0, "learning_rate": 1.8140589569161e-07, "loss": 1.334, "step": 4 }, { "epoch": 0.0, "learning_rate": 2.267573696145125e-07, "loss": 1.3906, "step": 5 }, { "epoch": 0.0, "learning_rate": 2.72108843537415e-07, "loss": 1.4297, "step": 6 }, { "epoch": 0.0, "learning_rate": 3.174603174603175e-07, "loss": 1.2656, "step": 7 }, { "epoch": 0.0, "learning_rate": 3.6281179138322e-07, "loss": 1.3438, "step": 8 }, { "epoch": 0.0, "learning_rate": 4.0816326530612243e-07, "loss": 1.3809, "step": 9 }, { "epoch": 0.0, "learning_rate": 4.53514739229025e-07, "loss": 1.3672, "step": 10 }, { "epoch": 0.0, "learning_rate": 4.988662131519275e-07, "loss": 1.3887, "step": 11 }, { "epoch": 0.0, "learning_rate": 5.4421768707483e-07, "loss": 1.3516, "step": 12 }, { "epoch": 0.0, "learning_rate": 5.895691609977325e-07, "loss": 1.4375, "step": 13 }, { "epoch": 0.0, "learning_rate": 6.34920634920635e-07, "loss": 1.3633, "step": 14 }, { "epoch": 0.0, "learning_rate": 6.802721088435376e-07, "loss": 1.3633, "step": 15 }, { "epoch": 0.0, "learning_rate": 7.2562358276644e-07, "loss": 1.2695, "step": 16 }, { "epoch": 0.0, "learning_rate": 7.709750566893425e-07, "loss": 1.3711, "step": 17 }, { "epoch": 0.0, "learning_rate": 8.163265306122449e-07, "loss": 1.3711, "step": 18 }, { "epoch": 0.0, "learning_rate": 8.616780045351475e-07, "loss": 1.3887, "step": 19 }, { "epoch": 0.0, "learning_rate": 9.0702947845805e-07, "loss": 1.3984, "step": 20 }, { "epoch": 0.0, "learning_rate": 9.523809523809525e-07, "loss": 1.3574, "step": 21 }, { "epoch": 0.0, "learning_rate": 9.97732426303855e-07, "loss": 1.2578, "step": 22 }, { "epoch": 0.0, "learning_rate": 1.0430839002267576e-06, "loss": 1.3594, "step": 23 }, { "epoch": 0.0, "learning_rate": 1.08843537414966e-06, "loss": 1.2754, "step": 24 }, { "epoch": 0.0, "learning_rate": 1.1337868480725626e-06, "loss": 1.3047, "step": 25 }, { "epoch": 0.0, "learning_rate": 1.179138321995465e-06, "loss": 1.2383, "step": 26 }, { "epoch": 0.0, "learning_rate": 1.2244897959183673e-06, "loss": 1.2051, "step": 27 }, { "epoch": 0.0, "learning_rate": 1.26984126984127e-06, "loss": 1.2051, "step": 28 }, { "epoch": 0.0, "learning_rate": 1.3151927437641723e-06, "loss": 1.2148, "step": 29 }, { "epoch": 0.0, "learning_rate": 1.3605442176870751e-06, "loss": 1.1465, "step": 30 }, { "epoch": 0.0, "learning_rate": 1.4058956916099775e-06, "loss": 1.1836, "step": 31 }, { "epoch": 0.0, "learning_rate": 1.45124716553288e-06, "loss": 1.2402, "step": 32 }, { "epoch": 0.0, "learning_rate": 1.4965986394557825e-06, "loss": 1.2266, "step": 33 }, { "epoch": 0.0, "learning_rate": 1.541950113378685e-06, "loss": 1.168, "step": 34 }, { "epoch": 0.0, "learning_rate": 1.5873015873015873e-06, "loss": 1.2227, "step": 35 }, { "epoch": 0.0, "learning_rate": 1.6326530612244897e-06, "loss": 1.2441, "step": 36 }, { "epoch": 0.0, "learning_rate": 1.6780045351473925e-06, "loss": 1.2227, "step": 37 }, { "epoch": 0.0, "learning_rate": 1.723356009070295e-06, "loss": 1.0801, "step": 38 }, { "epoch": 0.0, "learning_rate": 1.7687074829931975e-06, "loss": 1.1562, "step": 39 }, { "epoch": 0.0, "learning_rate": 1.8140589569161e-06, "loss": 1.1221, "step": 40 }, { "epoch": 0.0, "learning_rate": 1.8594104308390023e-06, "loss": 1.1699, "step": 41 }, { "epoch": 0.0, "learning_rate": 1.904761904761905e-06, "loss": 1.1074, "step": 42 }, { "epoch": 0.0, "learning_rate": 1.9501133786848077e-06, "loss": 1.2422, "step": 43 }, { "epoch": 0.0, "learning_rate": 1.99546485260771e-06, "loss": 1.1367, "step": 44 }, { "epoch": 0.0, "learning_rate": 2.0408163265306125e-06, "loss": 1.083, "step": 45 }, { "epoch": 0.0, "learning_rate": 2.086167800453515e-06, "loss": 1.0762, "step": 46 }, { "epoch": 0.0, "learning_rate": 2.1315192743764173e-06, "loss": 1.0762, "step": 47 }, { "epoch": 0.0, "learning_rate": 2.17687074829932e-06, "loss": 0.9932, "step": 48 }, { "epoch": 0.0, "learning_rate": 2.222222222222222e-06, "loss": 1.0742, "step": 49 }, { "epoch": 0.0, "learning_rate": 2.267573696145125e-06, "loss": 1.0684, "step": 50 }, { "epoch": 0.0, "learning_rate": 2.3129251700680273e-06, "loss": 1.1074, "step": 51 }, { "epoch": 0.0, "learning_rate": 2.35827664399093e-06, "loss": 0.9893, "step": 52 }, { "epoch": 0.0, "learning_rate": 2.4036281179138325e-06, "loss": 1.0723, "step": 53 }, { "epoch": 0.0, "learning_rate": 2.4489795918367347e-06, "loss": 1.0977, "step": 54 }, { "epoch": 0.0, "learning_rate": 2.4943310657596373e-06, "loss": 1.0908, "step": 55 }, { "epoch": 0.0, "learning_rate": 2.53968253968254e-06, "loss": 1.0098, "step": 56 }, { "epoch": 0.0, "learning_rate": 2.5850340136054425e-06, "loss": 1.0684, "step": 57 }, { "epoch": 0.0, "learning_rate": 2.6303854875283447e-06, "loss": 1.0068, "step": 58 }, { "epoch": 0.0, "learning_rate": 2.6757369614512473e-06, "loss": 1.0635, "step": 59 }, { "epoch": 0.0, "learning_rate": 2.7210884353741503e-06, "loss": 1.1211, "step": 60 }, { "epoch": 0.0, "learning_rate": 2.7664399092970525e-06, "loss": 0.9844, "step": 61 }, { "epoch": 0.0, "learning_rate": 2.811791383219955e-06, "loss": 0.9893, "step": 62 }, { "epoch": 0.0, "learning_rate": 2.8571428571428573e-06, "loss": 1.0078, "step": 63 }, { "epoch": 0.0, "learning_rate": 2.90249433106576e-06, "loss": 1.0449, "step": 64 }, { "epoch": 0.0, "learning_rate": 2.947845804988662e-06, "loss": 1.0469, "step": 65 }, { "epoch": 0.0, "learning_rate": 2.993197278911565e-06, "loss": 0.9658, "step": 66 }, { "epoch": 0.0, "learning_rate": 3.0385487528344677e-06, "loss": 0.9531, "step": 67 }, { "epoch": 0.0, "learning_rate": 3.08390022675737e-06, "loss": 0.9893, "step": 68 }, { "epoch": 0.0, "learning_rate": 3.1292517006802725e-06, "loss": 1.1113, "step": 69 }, { "epoch": 0.0, "learning_rate": 3.1746031746031746e-06, "loss": 1.0098, "step": 70 }, { "epoch": 0.0, "learning_rate": 3.2199546485260772e-06, "loss": 1.1094, "step": 71 }, { "epoch": 0.0, "learning_rate": 3.2653061224489794e-06, "loss": 0.9424, "step": 72 }, { "epoch": 0.0, "learning_rate": 3.3106575963718824e-06, "loss": 1.0352, "step": 73 }, { "epoch": 0.01, "learning_rate": 3.356009070294785e-06, "loss": 1.0938, "step": 74 }, { "epoch": 0.01, "learning_rate": 3.4013605442176872e-06, "loss": 1.0186, "step": 75 }, { "epoch": 0.01, "learning_rate": 3.44671201814059e-06, "loss": 1.0322, "step": 76 }, { "epoch": 0.01, "learning_rate": 3.492063492063492e-06, "loss": 1.0566, "step": 77 }, { "epoch": 0.01, "learning_rate": 3.537414965986395e-06, "loss": 1.0566, "step": 78 }, { "epoch": 0.01, "learning_rate": 3.5827664399092976e-06, "loss": 1.0615, "step": 79 }, { "epoch": 0.01, "learning_rate": 3.6281179138322e-06, "loss": 0.9805, "step": 80 }, { "epoch": 0.01, "learning_rate": 3.6734693877551024e-06, "loss": 1.0508, "step": 81 }, { "epoch": 0.01, "learning_rate": 3.7188208616780046e-06, "loss": 1.0625, "step": 82 }, { "epoch": 0.01, "learning_rate": 3.7641723356009076e-06, "loss": 1.0078, "step": 83 }, { "epoch": 0.01, "learning_rate": 3.80952380952381e-06, "loss": 0.9902, "step": 84 }, { "epoch": 0.01, "learning_rate": 3.854875283446712e-06, "loss": 1.0176, "step": 85 }, { "epoch": 0.01, "learning_rate": 3.9002267573696154e-06, "loss": 0.9561, "step": 86 }, { "epoch": 0.01, "learning_rate": 3.945578231292517e-06, "loss": 0.9961, "step": 87 }, { "epoch": 0.01, "learning_rate": 3.99092970521542e-06, "loss": 0.9326, "step": 88 }, { "epoch": 0.01, "learning_rate": 4.036281179138322e-06, "loss": 0.9424, "step": 89 }, { "epoch": 0.01, "learning_rate": 4.081632653061225e-06, "loss": 1.042, "step": 90 }, { "epoch": 0.01, "learning_rate": 4.126984126984127e-06, "loss": 0.9355, "step": 91 }, { "epoch": 0.01, "learning_rate": 4.17233560090703e-06, "loss": 1.0186, "step": 92 }, { "epoch": 0.01, "learning_rate": 4.217687074829933e-06, "loss": 0.9922, "step": 93 }, { "epoch": 0.01, "learning_rate": 4.263038548752835e-06, "loss": 0.9492, "step": 94 }, { "epoch": 0.01, "learning_rate": 4.308390022675737e-06, "loss": 0.9775, "step": 95 }, { "epoch": 0.01, "learning_rate": 4.35374149659864e-06, "loss": 0.9434, "step": 96 }, { "epoch": 0.01, "learning_rate": 4.399092970521542e-06, "loss": 0.9697, "step": 97 }, { "epoch": 0.01, "learning_rate": 4.444444444444444e-06, "loss": 1.041, "step": 98 }, { "epoch": 0.01, "learning_rate": 4.489795918367348e-06, "loss": 1.002, "step": 99 }, { "epoch": 0.01, "learning_rate": 4.53514739229025e-06, "loss": 0.9883, "step": 100 }, { "epoch": 0.01, "learning_rate": 4.580498866213152e-06, "loss": 0.9404, "step": 101 }, { "epoch": 0.01, "learning_rate": 4.6258503401360546e-06, "loss": 0.9453, "step": 102 }, { "epoch": 0.01, "learning_rate": 4.671201814058957e-06, "loss": 0.9883, "step": 103 }, { "epoch": 0.01, "learning_rate": 4.71655328798186e-06, "loss": 0.9316, "step": 104 }, { "epoch": 0.01, "learning_rate": 4.761904761904762e-06, "loss": 1.0352, "step": 105 }, { "epoch": 0.01, "learning_rate": 4.807256235827665e-06, "loss": 1.0029, "step": 106 }, { "epoch": 0.01, "learning_rate": 4.852607709750568e-06, "loss": 0.959, "step": 107 }, { "epoch": 0.01, "learning_rate": 4.897959183673469e-06, "loss": 1.0664, "step": 108 }, { "epoch": 0.01, "learning_rate": 4.943310657596373e-06, "loss": 0.9453, "step": 109 }, { "epoch": 0.01, "learning_rate": 4.9886621315192745e-06, "loss": 0.9131, "step": 110 }, { "epoch": 0.01, "learning_rate": 5.034013605442177e-06, "loss": 0.9912, "step": 111 }, { "epoch": 0.01, "learning_rate": 5.07936507936508e-06, "loss": 0.9893, "step": 112 }, { "epoch": 0.01, "learning_rate": 5.124716553287983e-06, "loss": 1.041, "step": 113 }, { "epoch": 0.01, "learning_rate": 5.170068027210885e-06, "loss": 1.0391, "step": 114 }, { "epoch": 0.01, "learning_rate": 5.2154195011337876e-06, "loss": 0.915, "step": 115 }, { "epoch": 0.01, "learning_rate": 5.260770975056689e-06, "loss": 0.9492, "step": 116 }, { "epoch": 0.01, "learning_rate": 5.306122448979593e-06, "loss": 0.998, "step": 117 }, { "epoch": 0.01, "learning_rate": 5.3514739229024945e-06, "loss": 0.9834, "step": 118 }, { "epoch": 0.01, "learning_rate": 5.396825396825397e-06, "loss": 0.9609, "step": 119 }, { "epoch": 0.01, "learning_rate": 5.442176870748301e-06, "loss": 1.001, "step": 120 }, { "epoch": 0.01, "learning_rate": 5.487528344671202e-06, "loss": 0.959, "step": 121 }, { "epoch": 0.01, "learning_rate": 5.532879818594105e-06, "loss": 0.8428, "step": 122 }, { "epoch": 0.01, "learning_rate": 5.578231292517007e-06, "loss": 0.8887, "step": 123 }, { "epoch": 0.01, "learning_rate": 5.62358276643991e-06, "loss": 1.0703, "step": 124 }, { "epoch": 0.01, "learning_rate": 5.668934240362812e-06, "loss": 0.9512, "step": 125 }, { "epoch": 0.01, "learning_rate": 5.7142857142857145e-06, "loss": 0.9814, "step": 126 }, { "epoch": 0.01, "learning_rate": 5.759637188208618e-06, "loss": 1.0645, "step": 127 }, { "epoch": 0.01, "learning_rate": 5.80498866213152e-06, "loss": 0.9385, "step": 128 }, { "epoch": 0.01, "learning_rate": 5.850340136054422e-06, "loss": 0.959, "step": 129 }, { "epoch": 0.01, "learning_rate": 5.895691609977324e-06, "loss": 0.9512, "step": 130 }, { "epoch": 0.01, "learning_rate": 5.9410430839002275e-06, "loss": 0.9717, "step": 131 }, { "epoch": 0.01, "learning_rate": 5.98639455782313e-06, "loss": 0.9873, "step": 132 }, { "epoch": 0.01, "learning_rate": 6.031746031746032e-06, "loss": 0.8848, "step": 133 }, { "epoch": 0.01, "learning_rate": 6.077097505668935e-06, "loss": 0.8682, "step": 134 }, { "epoch": 0.01, "learning_rate": 6.122448979591837e-06, "loss": 1.0029, "step": 135 }, { "epoch": 0.01, "learning_rate": 6.16780045351474e-06, "loss": 0.9795, "step": 136 }, { "epoch": 0.01, "learning_rate": 6.2131519274376415e-06, "loss": 0.9346, "step": 137 }, { "epoch": 0.01, "learning_rate": 6.258503401360545e-06, "loss": 1.0117, "step": 138 }, { "epoch": 0.01, "learning_rate": 6.3038548752834475e-06, "loss": 1.0283, "step": 139 }, { "epoch": 0.01, "learning_rate": 6.349206349206349e-06, "loss": 0.9316, "step": 140 }, { "epoch": 0.01, "learning_rate": 6.394557823129253e-06, "loss": 0.8994, "step": 141 }, { "epoch": 0.01, "learning_rate": 6.4399092970521545e-06, "loss": 0.96, "step": 142 }, { "epoch": 0.01, "learning_rate": 6.485260770975057e-06, "loss": 1.0186, "step": 143 }, { "epoch": 0.01, "learning_rate": 6.530612244897959e-06, "loss": 0.9941, "step": 144 }, { "epoch": 0.01, "learning_rate": 6.575963718820862e-06, "loss": 0.9004, "step": 145 }, { "epoch": 0.01, "learning_rate": 6.621315192743765e-06, "loss": 0.9922, "step": 146 }, { "epoch": 0.01, "learning_rate": 6.666666666666667e-06, "loss": 0.96, "step": 147 }, { "epoch": 0.01, "learning_rate": 6.71201814058957e-06, "loss": 1.0332, "step": 148 }, { "epoch": 0.01, "learning_rate": 6.757369614512473e-06, "loss": 0.9111, "step": 149 }, { "epoch": 0.01, "learning_rate": 6.8027210884353745e-06, "loss": 0.9297, "step": 150 }, { "epoch": 0.01, "learning_rate": 6.848072562358277e-06, "loss": 1.0234, "step": 151 }, { "epoch": 0.01, "learning_rate": 6.89342403628118e-06, "loss": 0.9434, "step": 152 }, { "epoch": 0.01, "learning_rate": 6.938775510204082e-06, "loss": 0.958, "step": 153 }, { "epoch": 0.01, "learning_rate": 6.984126984126984e-06, "loss": 0.9033, "step": 154 }, { "epoch": 0.01, "learning_rate": 7.0294784580498875e-06, "loss": 0.9775, "step": 155 }, { "epoch": 0.01, "learning_rate": 7.07482993197279e-06, "loss": 0.9199, "step": 156 }, { "epoch": 0.01, "learning_rate": 7.120181405895692e-06, "loss": 0.9648, "step": 157 }, { "epoch": 0.01, "learning_rate": 7.165532879818595e-06, "loss": 0.9971, "step": 158 }, { "epoch": 0.01, "learning_rate": 7.210884353741497e-06, "loss": 0.957, "step": 159 }, { "epoch": 0.01, "learning_rate": 7.2562358276644e-06, "loss": 1.0156, "step": 160 }, { "epoch": 0.01, "learning_rate": 7.301587301587301e-06, "loss": 0.998, "step": 161 }, { "epoch": 0.01, "learning_rate": 7.346938775510205e-06, "loss": 0.9033, "step": 162 }, { "epoch": 0.01, "learning_rate": 7.3922902494331075e-06, "loss": 0.9365, "step": 163 }, { "epoch": 0.01, "learning_rate": 7.437641723356009e-06, "loss": 0.9551, "step": 164 }, { "epoch": 0.01, "learning_rate": 7.482993197278913e-06, "loss": 0.9287, "step": 165 }, { "epoch": 0.01, "learning_rate": 7.528344671201815e-06, "loss": 0.9697, "step": 166 }, { "epoch": 0.01, "learning_rate": 7.573696145124717e-06, "loss": 0.9834, "step": 167 }, { "epoch": 0.01, "learning_rate": 7.61904761904762e-06, "loss": 0.9961, "step": 168 }, { "epoch": 0.01, "learning_rate": 7.664399092970522e-06, "loss": 0.9277, "step": 169 }, { "epoch": 0.01, "learning_rate": 7.709750566893424e-06, "loss": 1.0195, "step": 170 }, { "epoch": 0.01, "learning_rate": 7.755102040816327e-06, "loss": 0.9365, "step": 171 }, { "epoch": 0.01, "learning_rate": 7.800453514739231e-06, "loss": 0.9336, "step": 172 }, { "epoch": 0.01, "learning_rate": 7.845804988662133e-06, "loss": 0.9551, "step": 173 }, { "epoch": 0.01, "learning_rate": 7.891156462585034e-06, "loss": 0.9668, "step": 174 }, { "epoch": 0.01, "learning_rate": 7.936507936507936e-06, "loss": 0.8896, "step": 175 }, { "epoch": 0.01, "learning_rate": 7.98185941043084e-06, "loss": 0.9512, "step": 176 }, { "epoch": 0.01, "learning_rate": 8.027210884353741e-06, "loss": 0.9307, "step": 177 }, { "epoch": 0.01, "learning_rate": 8.072562358276645e-06, "loss": 0.9316, "step": 178 }, { "epoch": 0.01, "learning_rate": 8.117913832199548e-06, "loss": 0.9873, "step": 179 }, { "epoch": 0.01, "learning_rate": 8.16326530612245e-06, "loss": 0.9775, "step": 180 }, { "epoch": 0.01, "learning_rate": 8.208616780045352e-06, "loss": 0.9355, "step": 181 }, { "epoch": 0.01, "learning_rate": 8.253968253968254e-06, "loss": 0.8779, "step": 182 }, { "epoch": 0.01, "learning_rate": 8.299319727891157e-06, "loss": 0.9541, "step": 183 }, { "epoch": 0.01, "learning_rate": 8.34467120181406e-06, "loss": 0.9932, "step": 184 }, { "epoch": 0.01, "learning_rate": 8.390022675736962e-06, "loss": 0.9746, "step": 185 }, { "epoch": 0.01, "learning_rate": 8.435374149659866e-06, "loss": 0.8672, "step": 186 }, { "epoch": 0.01, "learning_rate": 8.480725623582767e-06, "loss": 0.877, "step": 187 }, { "epoch": 0.01, "learning_rate": 8.52607709750567e-06, "loss": 0.9473, "step": 188 }, { "epoch": 0.01, "learning_rate": 8.571428571428571e-06, "loss": 0.9609, "step": 189 }, { "epoch": 0.01, "learning_rate": 8.616780045351474e-06, "loss": 0.8926, "step": 190 }, { "epoch": 0.01, "learning_rate": 8.662131519274378e-06, "loss": 0.9814, "step": 191 }, { "epoch": 0.01, "learning_rate": 8.70748299319728e-06, "loss": 1.0068, "step": 192 }, { "epoch": 0.01, "learning_rate": 8.752834467120183e-06, "loss": 0.9053, "step": 193 }, { "epoch": 0.01, "learning_rate": 8.798185941043085e-06, "loss": 0.8994, "step": 194 }, { "epoch": 0.01, "learning_rate": 8.843537414965987e-06, "loss": 1.0205, "step": 195 }, { "epoch": 0.01, "learning_rate": 8.888888888888888e-06, "loss": 0.9248, "step": 196 }, { "epoch": 0.01, "learning_rate": 8.934240362811792e-06, "loss": 0.9238, "step": 197 }, { "epoch": 0.01, "learning_rate": 8.979591836734695e-06, "loss": 0.8975, "step": 198 }, { "epoch": 0.01, "learning_rate": 9.024943310657597e-06, "loss": 0.9609, "step": 199 }, { "epoch": 0.01, "learning_rate": 9.0702947845805e-06, "loss": 0.9951, "step": 200 }, { "epoch": 0.01, "learning_rate": 9.115646258503402e-06, "loss": 1.0312, "step": 201 }, { "epoch": 0.01, "learning_rate": 9.160997732426304e-06, "loss": 0.8604, "step": 202 }, { "epoch": 0.01, "learning_rate": 9.206349206349207e-06, "loss": 0.9307, "step": 203 }, { "epoch": 0.01, "learning_rate": 9.251700680272109e-06, "loss": 0.9902, "step": 204 }, { "epoch": 0.01, "learning_rate": 9.297052154195013e-06, "loss": 0.9082, "step": 205 }, { "epoch": 0.01, "learning_rate": 9.342403628117914e-06, "loss": 0.9941, "step": 206 }, { "epoch": 0.01, "learning_rate": 9.387755102040818e-06, "loss": 0.9102, "step": 207 }, { "epoch": 0.01, "learning_rate": 9.43310657596372e-06, "loss": 1.0283, "step": 208 }, { "epoch": 0.01, "learning_rate": 9.478458049886621e-06, "loss": 0.9707, "step": 209 }, { "epoch": 0.01, "learning_rate": 9.523809523809525e-06, "loss": 0.9639, "step": 210 }, { "epoch": 0.01, "learning_rate": 9.569160997732427e-06, "loss": 0.9199, "step": 211 }, { "epoch": 0.01, "learning_rate": 9.61451247165533e-06, "loss": 0.9551, "step": 212 }, { "epoch": 0.01, "learning_rate": 9.659863945578232e-06, "loss": 0.9619, "step": 213 }, { "epoch": 0.01, "learning_rate": 9.705215419501135e-06, "loss": 0.9824, "step": 214 }, { "epoch": 0.01, "learning_rate": 9.750566893424037e-06, "loss": 0.9785, "step": 215 }, { "epoch": 0.01, "learning_rate": 9.795918367346939e-06, "loss": 0.9531, "step": 216 }, { "epoch": 0.01, "learning_rate": 9.841269841269842e-06, "loss": 0.9346, "step": 217 }, { "epoch": 0.01, "learning_rate": 9.886621315192746e-06, "loss": 0.8838, "step": 218 }, { "epoch": 0.01, "learning_rate": 9.931972789115647e-06, "loss": 0.9102, "step": 219 }, { "epoch": 0.01, "learning_rate": 9.977324263038549e-06, "loss": 0.958, "step": 220 }, { "epoch": 0.02, "learning_rate": 1.0022675736961451e-05, "loss": 0.9873, "step": 221 }, { "epoch": 0.02, "learning_rate": 1.0068027210884354e-05, "loss": 1.002, "step": 222 }, { "epoch": 0.02, "learning_rate": 1.0113378684807258e-05, "loss": 0.9863, "step": 223 }, { "epoch": 0.02, "learning_rate": 1.015873015873016e-05, "loss": 0.9844, "step": 224 }, { "epoch": 0.02, "learning_rate": 1.0204081632653063e-05, "loss": 0.9414, "step": 225 }, { "epoch": 0.02, "learning_rate": 1.0249433106575966e-05, "loss": 0.9932, "step": 226 }, { "epoch": 0.02, "learning_rate": 1.0294784580498866e-05, "loss": 0.9443, "step": 227 }, { "epoch": 0.02, "learning_rate": 1.034013605442177e-05, "loss": 1.002, "step": 228 }, { "epoch": 0.02, "learning_rate": 1.0385487528344672e-05, "loss": 0.8984, "step": 229 }, { "epoch": 0.02, "learning_rate": 1.0430839002267575e-05, "loss": 0.8447, "step": 230 }, { "epoch": 0.02, "learning_rate": 1.0476190476190477e-05, "loss": 1.0117, "step": 231 }, { "epoch": 0.02, "learning_rate": 1.0521541950113379e-05, "loss": 0.9355, "step": 232 }, { "epoch": 0.02, "learning_rate": 1.0566893424036282e-05, "loss": 0.9814, "step": 233 }, { "epoch": 0.02, "learning_rate": 1.0612244897959186e-05, "loss": 0.9258, "step": 234 }, { "epoch": 0.02, "learning_rate": 1.0657596371882086e-05, "loss": 0.9453, "step": 235 }, { "epoch": 0.02, "learning_rate": 1.0702947845804989e-05, "loss": 0.8701, "step": 236 }, { "epoch": 0.02, "learning_rate": 1.0748299319727893e-05, "loss": 0.8496, "step": 237 }, { "epoch": 0.02, "learning_rate": 1.0793650793650794e-05, "loss": 0.9678, "step": 238 }, { "epoch": 0.02, "learning_rate": 1.0839002267573698e-05, "loss": 0.9219, "step": 239 }, { "epoch": 0.02, "learning_rate": 1.0884353741496601e-05, "loss": 0.9932, "step": 240 }, { "epoch": 0.02, "learning_rate": 1.0929705215419501e-05, "loss": 0.9248, "step": 241 }, { "epoch": 0.02, "learning_rate": 1.0975056689342405e-05, "loss": 0.9482, "step": 242 }, { "epoch": 0.02, "learning_rate": 1.1020408163265306e-05, "loss": 0.9326, "step": 243 }, { "epoch": 0.02, "learning_rate": 1.106575963718821e-05, "loss": 0.9746, "step": 244 }, { "epoch": 0.02, "learning_rate": 1.1111111111111113e-05, "loss": 0.9434, "step": 245 }, { "epoch": 0.02, "learning_rate": 1.1156462585034013e-05, "loss": 0.9785, "step": 246 }, { "epoch": 0.02, "learning_rate": 1.1201814058956917e-05, "loss": 0.9727, "step": 247 }, { "epoch": 0.02, "learning_rate": 1.124716553287982e-05, "loss": 0.8896, "step": 248 }, { "epoch": 0.02, "learning_rate": 1.1292517006802722e-05, "loss": 0.9434, "step": 249 }, { "epoch": 0.02, "learning_rate": 1.1337868480725624e-05, "loss": 0.9854, "step": 250 }, { "epoch": 0.02, "learning_rate": 1.1383219954648527e-05, "loss": 0.9355, "step": 251 }, { "epoch": 0.02, "learning_rate": 1.1428571428571429e-05, "loss": 1.0107, "step": 252 }, { "epoch": 0.02, "learning_rate": 1.1473922902494332e-05, "loss": 0.9258, "step": 253 }, { "epoch": 0.02, "learning_rate": 1.1519274376417236e-05, "loss": 0.9551, "step": 254 }, { "epoch": 0.02, "learning_rate": 1.1564625850340136e-05, "loss": 1.0039, "step": 255 }, { "epoch": 0.02, "learning_rate": 1.160997732426304e-05, "loss": 0.9043, "step": 256 }, { "epoch": 0.02, "learning_rate": 1.1655328798185943e-05, "loss": 0.9229, "step": 257 }, { "epoch": 0.02, "learning_rate": 1.1700680272108845e-05, "loss": 0.9424, "step": 258 }, { "epoch": 0.02, "learning_rate": 1.1746031746031748e-05, "loss": 0.8809, "step": 259 }, { "epoch": 0.02, "learning_rate": 1.1791383219954648e-05, "loss": 0.9199, "step": 260 }, { "epoch": 0.02, "learning_rate": 1.1836734693877552e-05, "loss": 0.9658, "step": 261 }, { "epoch": 0.02, "learning_rate": 1.1882086167800455e-05, "loss": 0.8945, "step": 262 }, { "epoch": 0.02, "learning_rate": 1.1927437641723357e-05, "loss": 0.9326, "step": 263 }, { "epoch": 0.02, "learning_rate": 1.197278911564626e-05, "loss": 0.9336, "step": 264 }, { "epoch": 0.02, "learning_rate": 1.2018140589569162e-05, "loss": 0.8535, "step": 265 }, { "epoch": 0.02, "learning_rate": 1.2063492063492064e-05, "loss": 0.9385, "step": 266 }, { "epoch": 0.02, "learning_rate": 1.2108843537414967e-05, "loss": 0.957, "step": 267 }, { "epoch": 0.02, "learning_rate": 1.215419501133787e-05, "loss": 1.0166, "step": 268 }, { "epoch": 0.02, "learning_rate": 1.219954648526077e-05, "loss": 1.0146, "step": 269 }, { "epoch": 0.02, "learning_rate": 1.2244897959183674e-05, "loss": 0.9131, "step": 270 }, { "epoch": 0.02, "learning_rate": 1.2290249433106578e-05, "loss": 1.0703, "step": 271 }, { "epoch": 0.02, "learning_rate": 1.233560090702948e-05, "loss": 0.8789, "step": 272 }, { "epoch": 0.02, "learning_rate": 1.2380952380952383e-05, "loss": 0.874, "step": 273 }, { "epoch": 0.02, "learning_rate": 1.2426303854875283e-05, "loss": 0.9531, "step": 274 }, { "epoch": 0.02, "learning_rate": 1.2471655328798186e-05, "loss": 0.9756, "step": 275 }, { "epoch": 0.02, "learning_rate": 1.251700680272109e-05, "loss": 0.9658, "step": 276 }, { "epoch": 0.02, "learning_rate": 1.2562358276643992e-05, "loss": 0.9463, "step": 277 }, { "epoch": 0.02, "learning_rate": 1.2607709750566895e-05, "loss": 0.9297, "step": 278 }, { "epoch": 0.02, "learning_rate": 1.2653061224489798e-05, "loss": 0.9717, "step": 279 }, { "epoch": 0.02, "learning_rate": 1.2698412698412699e-05, "loss": 0.9805, "step": 280 }, { "epoch": 0.02, "learning_rate": 1.2743764172335602e-05, "loss": 0.9521, "step": 281 }, { "epoch": 0.02, "learning_rate": 1.2789115646258505e-05, "loss": 0.957, "step": 282 }, { "epoch": 0.02, "learning_rate": 1.2834467120181407e-05, "loss": 0.9883, "step": 283 }, { "epoch": 0.02, "learning_rate": 1.2879818594104309e-05, "loss": 0.9688, "step": 284 }, { "epoch": 0.02, "learning_rate": 1.2925170068027212e-05, "loss": 0.9766, "step": 285 }, { "epoch": 0.02, "learning_rate": 1.2970521541950114e-05, "loss": 0.8711, "step": 286 }, { "epoch": 0.02, "learning_rate": 1.3015873015873018e-05, "loss": 0.8672, "step": 287 }, { "epoch": 0.02, "learning_rate": 1.3061224489795918e-05, "loss": 1.0215, "step": 288 }, { "epoch": 0.02, "learning_rate": 1.3106575963718821e-05, "loss": 0.9316, "step": 289 }, { "epoch": 0.02, "learning_rate": 1.3151927437641725e-05, "loss": 0.9756, "step": 290 }, { "epoch": 0.02, "learning_rate": 1.3197278911564626e-05, "loss": 0.9219, "step": 291 }, { "epoch": 0.02, "learning_rate": 1.324263038548753e-05, "loss": 0.8877, "step": 292 }, { "epoch": 0.02, "learning_rate": 1.3287981859410433e-05, "loss": 0.9736, "step": 293 }, { "epoch": 0.02, "learning_rate": 1.3333333333333333e-05, "loss": 0.9004, "step": 294 }, { "epoch": 0.02, "learning_rate": 1.3378684807256237e-05, "loss": 0.9609, "step": 295 }, { "epoch": 0.02, "learning_rate": 1.342403628117914e-05, "loss": 0.9785, "step": 296 }, { "epoch": 0.02, "learning_rate": 1.3469387755102042e-05, "loss": 0.959, "step": 297 }, { "epoch": 0.02, "learning_rate": 1.3514739229024945e-05, "loss": 0.9531, "step": 298 }, { "epoch": 0.02, "learning_rate": 1.3560090702947847e-05, "loss": 0.9209, "step": 299 }, { "epoch": 0.02, "learning_rate": 1.3605442176870749e-05, "loss": 0.8457, "step": 300 }, { "epoch": 0.02, "learning_rate": 1.3650793650793652e-05, "loss": 0.9668, "step": 301 }, { "epoch": 0.02, "learning_rate": 1.3696145124716554e-05, "loss": 0.8779, "step": 302 }, { "epoch": 0.02, "learning_rate": 1.3741496598639456e-05, "loss": 0.9844, "step": 303 }, { "epoch": 0.02, "learning_rate": 1.378684807256236e-05, "loss": 0.9521, "step": 304 }, { "epoch": 0.02, "learning_rate": 1.3832199546485261e-05, "loss": 0.9395, "step": 305 }, { "epoch": 0.02, "learning_rate": 1.3877551020408165e-05, "loss": 0.9502, "step": 306 }, { "epoch": 0.02, "learning_rate": 1.3922902494331068e-05, "loss": 0.9971, "step": 307 }, { "epoch": 0.02, "learning_rate": 1.3968253968253968e-05, "loss": 0.9219, "step": 308 }, { "epoch": 0.02, "learning_rate": 1.4013605442176872e-05, "loss": 0.9473, "step": 309 }, { "epoch": 0.02, "learning_rate": 1.4058956916099775e-05, "loss": 0.915, "step": 310 }, { "epoch": 0.02, "learning_rate": 1.4104308390022677e-05, "loss": 0.9688, "step": 311 }, { "epoch": 0.02, "learning_rate": 1.414965986394558e-05, "loss": 0.8506, "step": 312 }, { "epoch": 0.02, "learning_rate": 1.4195011337868484e-05, "loss": 1.0137, "step": 313 }, { "epoch": 0.02, "learning_rate": 1.4240362811791384e-05, "loss": 1.0215, "step": 314 }, { "epoch": 0.02, "learning_rate": 1.4285714285714287e-05, "loss": 0.9248, "step": 315 }, { "epoch": 0.02, "learning_rate": 1.433106575963719e-05, "loss": 0.9033, "step": 316 }, { "epoch": 0.02, "learning_rate": 1.4376417233560092e-05, "loss": 0.96, "step": 317 }, { "epoch": 0.02, "learning_rate": 1.4421768707482994e-05, "loss": 0.9883, "step": 318 }, { "epoch": 0.02, "learning_rate": 1.4467120181405896e-05, "loss": 0.9385, "step": 319 }, { "epoch": 0.02, "learning_rate": 1.45124716553288e-05, "loss": 0.9414, "step": 320 }, { "epoch": 0.02, "learning_rate": 1.4557823129251703e-05, "loss": 0.9209, "step": 321 }, { "epoch": 0.02, "learning_rate": 1.4603174603174603e-05, "loss": 0.9316, "step": 322 }, { "epoch": 0.02, "learning_rate": 1.4648526077097506e-05, "loss": 0.8945, "step": 323 }, { "epoch": 0.02, "learning_rate": 1.469387755102041e-05, "loss": 0.8867, "step": 324 }, { "epoch": 0.02, "learning_rate": 1.4739229024943311e-05, "loss": 0.8809, "step": 325 }, { "epoch": 0.02, "learning_rate": 1.4784580498866215e-05, "loss": 0.9365, "step": 326 }, { "epoch": 0.02, "learning_rate": 1.4829931972789118e-05, "loss": 0.918, "step": 327 }, { "epoch": 0.02, "learning_rate": 1.4875283446712018e-05, "loss": 0.8926, "step": 328 }, { "epoch": 0.02, "learning_rate": 1.4920634920634922e-05, "loss": 0.9795, "step": 329 }, { "epoch": 0.02, "learning_rate": 1.4965986394557825e-05, "loss": 0.9746, "step": 330 }, { "epoch": 0.02, "learning_rate": 1.5011337868480727e-05, "loss": 0.9668, "step": 331 }, { "epoch": 0.02, "learning_rate": 1.505668934240363e-05, "loss": 0.9219, "step": 332 }, { "epoch": 0.02, "learning_rate": 1.510204081632653e-05, "loss": 0.874, "step": 333 }, { "epoch": 0.02, "learning_rate": 1.5147392290249434e-05, "loss": 0.917, "step": 334 }, { "epoch": 0.02, "learning_rate": 1.5192743764172338e-05, "loss": 0.9482, "step": 335 }, { "epoch": 0.02, "learning_rate": 1.523809523809524e-05, "loss": 0.9199, "step": 336 }, { "epoch": 0.02, "learning_rate": 1.528344671201814e-05, "loss": 0.9551, "step": 337 }, { "epoch": 0.02, "learning_rate": 1.5328798185941044e-05, "loss": 0.9385, "step": 338 }, { "epoch": 0.02, "learning_rate": 1.5374149659863945e-05, "loss": 0.8916, "step": 339 }, { "epoch": 0.02, "learning_rate": 1.5419501133786848e-05, "loss": 0.9277, "step": 340 }, { "epoch": 0.02, "learning_rate": 1.546485260770975e-05, "loss": 0.9277, "step": 341 }, { "epoch": 0.02, "learning_rate": 1.5510204081632655e-05, "loss": 0.9639, "step": 342 }, { "epoch": 0.02, "learning_rate": 1.555555555555556e-05, "loss": 0.9297, "step": 343 }, { "epoch": 0.02, "learning_rate": 1.5600907029478462e-05, "loss": 1.0107, "step": 344 }, { "epoch": 0.02, "learning_rate": 1.5646258503401362e-05, "loss": 0.9521, "step": 345 }, { "epoch": 0.02, "learning_rate": 1.5691609977324265e-05, "loss": 1.0029, "step": 346 }, { "epoch": 0.02, "learning_rate": 1.5736961451247165e-05, "loss": 1.0, "step": 347 }, { "epoch": 0.02, "learning_rate": 1.578231292517007e-05, "loss": 0.9258, "step": 348 }, { "epoch": 0.02, "learning_rate": 1.5827664399092972e-05, "loss": 1.0273, "step": 349 }, { "epoch": 0.02, "learning_rate": 1.5873015873015872e-05, "loss": 1.0, "step": 350 }, { "epoch": 0.02, "learning_rate": 1.5918367346938776e-05, "loss": 0.9883, "step": 351 }, { "epoch": 0.02, "learning_rate": 1.596371882086168e-05, "loss": 0.9043, "step": 352 }, { "epoch": 0.02, "learning_rate": 1.6009070294784583e-05, "loss": 0.9375, "step": 353 }, { "epoch": 0.02, "learning_rate": 1.6054421768707483e-05, "loss": 0.8916, "step": 354 }, { "epoch": 0.02, "learning_rate": 1.6099773242630386e-05, "loss": 0.9189, "step": 355 }, { "epoch": 0.02, "learning_rate": 1.614512471655329e-05, "loss": 0.9678, "step": 356 }, { "epoch": 0.02, "learning_rate": 1.6190476190476193e-05, "loss": 0.9385, "step": 357 }, { "epoch": 0.02, "learning_rate": 1.6235827664399097e-05, "loss": 0.9482, "step": 358 }, { "epoch": 0.02, "learning_rate": 1.6281179138321997e-05, "loss": 0.9473, "step": 359 }, { "epoch": 0.02, "learning_rate": 1.63265306122449e-05, "loss": 0.9355, "step": 360 }, { "epoch": 0.02, "learning_rate": 1.63718820861678e-05, "loss": 0.9248, "step": 361 }, { "epoch": 0.02, "learning_rate": 1.6417233560090704e-05, "loss": 0.9795, "step": 362 }, { "epoch": 0.02, "learning_rate": 1.6462585034013607e-05, "loss": 0.9775, "step": 363 }, { "epoch": 0.02, "learning_rate": 1.6507936507936507e-05, "loss": 0.8262, "step": 364 }, { "epoch": 0.02, "learning_rate": 1.655328798185941e-05, "loss": 0.958, "step": 365 }, { "epoch": 0.02, "learning_rate": 1.6598639455782314e-05, "loss": 0.8916, "step": 366 }, { "epoch": 0.03, "learning_rate": 1.6643990929705217e-05, "loss": 0.9658, "step": 367 }, { "epoch": 0.03, "learning_rate": 1.668934240362812e-05, "loss": 0.9824, "step": 368 }, { "epoch": 0.03, "learning_rate": 1.673469387755102e-05, "loss": 0.9502, "step": 369 }, { "epoch": 0.03, "learning_rate": 1.6780045351473924e-05, "loss": 0.9922, "step": 370 }, { "epoch": 0.03, "learning_rate": 1.6825396825396828e-05, "loss": 0.9609, "step": 371 }, { "epoch": 0.03, "learning_rate": 1.687074829931973e-05, "loss": 0.9922, "step": 372 }, { "epoch": 0.03, "learning_rate": 1.691609977324263e-05, "loss": 0.9092, "step": 373 }, { "epoch": 0.03, "learning_rate": 1.6961451247165535e-05, "loss": 0.8398, "step": 374 }, { "epoch": 0.03, "learning_rate": 1.7006802721088435e-05, "loss": 0.9258, "step": 375 }, { "epoch": 0.03, "learning_rate": 1.705215419501134e-05, "loss": 0.9238, "step": 376 }, { "epoch": 0.03, "learning_rate": 1.7097505668934242e-05, "loss": 0.9658, "step": 377 }, { "epoch": 0.03, "learning_rate": 1.7142857142857142e-05, "loss": 0.9023, "step": 378 }, { "epoch": 0.03, "learning_rate": 1.7188208616780045e-05, "loss": 0.9375, "step": 379 }, { "epoch": 0.03, "learning_rate": 1.723356009070295e-05, "loss": 0.9492, "step": 380 }, { "epoch": 0.03, "learning_rate": 1.7278911564625852e-05, "loss": 0.8535, "step": 381 }, { "epoch": 0.03, "learning_rate": 1.7324263038548756e-05, "loss": 0.9482, "step": 382 }, { "epoch": 0.03, "learning_rate": 1.736961451247166e-05, "loss": 0.8115, "step": 383 }, { "epoch": 0.03, "learning_rate": 1.741496598639456e-05, "loss": 0.9707, "step": 384 }, { "epoch": 0.03, "learning_rate": 1.7460317460317463e-05, "loss": 0.8906, "step": 385 }, { "epoch": 0.03, "learning_rate": 1.7505668934240366e-05, "loss": 0.874, "step": 386 }, { "epoch": 0.03, "learning_rate": 1.7551020408163266e-05, "loss": 0.9717, "step": 387 }, { "epoch": 0.03, "learning_rate": 1.759637188208617e-05, "loss": 0.959, "step": 388 }, { "epoch": 0.03, "learning_rate": 1.7641723356009073e-05, "loss": 0.8682, "step": 389 }, { "epoch": 0.03, "learning_rate": 1.7687074829931973e-05, "loss": 0.9873, "step": 390 }, { "epoch": 0.03, "learning_rate": 1.7732426303854877e-05, "loss": 0.8994, "step": 391 }, { "epoch": 0.03, "learning_rate": 1.7777777777777777e-05, "loss": 0.9365, "step": 392 }, { "epoch": 0.03, "learning_rate": 1.782312925170068e-05, "loss": 0.832, "step": 393 }, { "epoch": 0.03, "learning_rate": 1.7868480725623583e-05, "loss": 0.9717, "step": 394 }, { "epoch": 0.03, "learning_rate": 1.7913832199546487e-05, "loss": 0.96, "step": 395 }, { "epoch": 0.03, "learning_rate": 1.795918367346939e-05, "loss": 0.8184, "step": 396 }, { "epoch": 0.03, "learning_rate": 1.8004535147392294e-05, "loss": 0.9824, "step": 397 }, { "epoch": 0.03, "learning_rate": 1.8049886621315194e-05, "loss": 0.9531, "step": 398 }, { "epoch": 0.03, "learning_rate": 1.8095238095238097e-05, "loss": 0.9541, "step": 399 }, { "epoch": 0.03, "learning_rate": 1.8140589569161e-05, "loss": 0.9287, "step": 400 }, { "epoch": 0.03, "learning_rate": 1.81859410430839e-05, "loss": 0.9795, "step": 401 }, { "epoch": 0.03, "learning_rate": 1.8231292517006804e-05, "loss": 0.9854, "step": 402 }, { "epoch": 0.03, "learning_rate": 1.8276643990929708e-05, "loss": 0.9014, "step": 403 }, { "epoch": 0.03, "learning_rate": 1.8321995464852608e-05, "loss": 0.9795, "step": 404 }, { "epoch": 0.03, "learning_rate": 1.836734693877551e-05, "loss": 0.9688, "step": 405 }, { "epoch": 0.03, "learning_rate": 1.8412698412698415e-05, "loss": 0.9756, "step": 406 }, { "epoch": 0.03, "learning_rate": 1.8458049886621315e-05, "loss": 0.9727, "step": 407 }, { "epoch": 0.03, "learning_rate": 1.8503401360544218e-05, "loss": 0.9121, "step": 408 }, { "epoch": 0.03, "learning_rate": 1.8548752834467122e-05, "loss": 0.9365, "step": 409 }, { "epoch": 0.03, "learning_rate": 1.8594104308390025e-05, "loss": 0.917, "step": 410 }, { "epoch": 0.03, "learning_rate": 1.863945578231293e-05, "loss": 0.9717, "step": 411 }, { "epoch": 0.03, "learning_rate": 1.868480725623583e-05, "loss": 0.8945, "step": 412 }, { "epoch": 0.03, "learning_rate": 1.8730158730158732e-05, "loss": 0.918, "step": 413 }, { "epoch": 0.03, "learning_rate": 1.8775510204081636e-05, "loss": 0.9922, "step": 414 }, { "epoch": 0.03, "learning_rate": 1.8820861678004536e-05, "loss": 0.9502, "step": 415 }, { "epoch": 0.03, "learning_rate": 1.886621315192744e-05, "loss": 0.8789, "step": 416 }, { "epoch": 0.03, "learning_rate": 1.8911564625850343e-05, "loss": 0.9727, "step": 417 }, { "epoch": 0.03, "learning_rate": 1.8956916099773243e-05, "loss": 0.9189, "step": 418 }, { "epoch": 0.03, "learning_rate": 1.9002267573696146e-05, "loss": 0.8965, "step": 419 }, { "epoch": 0.03, "learning_rate": 1.904761904761905e-05, "loss": 0.9951, "step": 420 }, { "epoch": 0.03, "learning_rate": 1.9092970521541953e-05, "loss": 0.9443, "step": 421 }, { "epoch": 0.03, "learning_rate": 1.9138321995464853e-05, "loss": 0.8691, "step": 422 }, { "epoch": 0.03, "learning_rate": 1.9183673469387756e-05, "loss": 0.9453, "step": 423 }, { "epoch": 0.03, "learning_rate": 1.922902494331066e-05, "loss": 0.9561, "step": 424 }, { "epoch": 0.03, "learning_rate": 1.9274376417233563e-05, "loss": 0.8818, "step": 425 }, { "epoch": 0.03, "learning_rate": 1.9319727891156463e-05, "loss": 1.0293, "step": 426 }, { "epoch": 0.03, "learning_rate": 1.9365079365079367e-05, "loss": 0.9902, "step": 427 }, { "epoch": 0.03, "learning_rate": 1.941043083900227e-05, "loss": 0.9531, "step": 428 }, { "epoch": 0.03, "learning_rate": 1.945578231292517e-05, "loss": 1.0322, "step": 429 }, { "epoch": 0.03, "learning_rate": 1.9501133786848074e-05, "loss": 0.9248, "step": 430 }, { "epoch": 0.03, "learning_rate": 1.9546485260770977e-05, "loss": 0.9453, "step": 431 }, { "epoch": 0.03, "learning_rate": 1.9591836734693877e-05, "loss": 1.0098, "step": 432 }, { "epoch": 0.03, "learning_rate": 1.963718820861678e-05, "loss": 0.8721, "step": 433 }, { "epoch": 0.03, "learning_rate": 1.9682539682539684e-05, "loss": 0.9785, "step": 434 }, { "epoch": 0.03, "learning_rate": 1.9727891156462588e-05, "loss": 0.9414, "step": 435 }, { "epoch": 0.03, "learning_rate": 1.977324263038549e-05, "loss": 0.8613, "step": 436 }, { "epoch": 0.03, "learning_rate": 1.981859410430839e-05, "loss": 0.8799, "step": 437 }, { "epoch": 0.03, "learning_rate": 1.9863945578231295e-05, "loss": 0.9238, "step": 438 }, { "epoch": 0.03, "learning_rate": 1.9909297052154198e-05, "loss": 1.001, "step": 439 }, { "epoch": 0.03, "learning_rate": 1.9954648526077098e-05, "loss": 0.9961, "step": 440 }, { "epoch": 0.03, "learning_rate": 2e-05, "loss": 1.0146, "step": 441 }, { "epoch": 0.03, "learning_rate": 1.9999999756400245e-05, "loss": 0.9854, "step": 442 }, { "epoch": 0.03, "learning_rate": 1.999999902560099e-05, "loss": 0.9834, "step": 443 }, { "epoch": 0.03, "learning_rate": 1.9999997807602266e-05, "loss": 0.9492, "step": 444 }, { "epoch": 0.03, "learning_rate": 1.999999610240414e-05, "loss": 0.9922, "step": 445 }, { "epoch": 0.03, "learning_rate": 1.999999391000669e-05, "loss": 0.9736, "step": 446 }, { "epoch": 0.03, "learning_rate": 1.9999991230410028e-05, "loss": 0.9082, "step": 447 }, { "epoch": 0.03, "learning_rate": 1.9999988063614274e-05, "loss": 0.9131, "step": 448 }, { "epoch": 0.03, "learning_rate": 1.9999984409619595e-05, "loss": 0.9609, "step": 449 }, { "epoch": 0.03, "learning_rate": 1.999998026842616e-05, "loss": 0.917, "step": 450 }, { "epoch": 0.03, "learning_rate": 1.9999975640034175e-05, "loss": 1.0273, "step": 451 }, { "epoch": 0.03, "learning_rate": 1.9999970524443867e-05, "loss": 0.9863, "step": 452 }, { "epoch": 0.03, "learning_rate": 1.999996492165548e-05, "loss": 0.8975, "step": 453 }, { "epoch": 0.03, "learning_rate": 1.9999958831669288e-05, "loss": 0.8672, "step": 454 }, { "epoch": 0.03, "learning_rate": 1.9999952254485594e-05, "loss": 0.96, "step": 455 }, { "epoch": 0.03, "learning_rate": 1.999994519010471e-05, "loss": 0.9609, "step": 456 }, { "epoch": 0.03, "learning_rate": 1.9999937638526984e-05, "loss": 1.0322, "step": 457 }, { "epoch": 0.03, "learning_rate": 1.999992959975279e-05, "loss": 0.9863, "step": 458 }, { "epoch": 0.03, "learning_rate": 1.9999921073782508e-05, "loss": 0.9346, "step": 459 }, { "epoch": 0.03, "learning_rate": 1.999991206061656e-05, "loss": 0.9619, "step": 460 }, { "epoch": 0.03, "learning_rate": 1.999990256025538e-05, "loss": 0.9131, "step": 461 }, { "epoch": 0.03, "learning_rate": 1.999989257269944e-05, "loss": 0.9941, "step": 462 }, { "epoch": 0.03, "learning_rate": 1.9999882097949222e-05, "loss": 0.9219, "step": 463 }, { "epoch": 0.03, "learning_rate": 1.9999871136005233e-05, "loss": 0.918, "step": 464 }, { "epoch": 0.03, "learning_rate": 1.999985968686801e-05, "loss": 1.002, "step": 465 }, { "epoch": 0.03, "learning_rate": 1.9999847750538113e-05, "loss": 0.8877, "step": 466 }, { "epoch": 0.03, "learning_rate": 1.999983532701612e-05, "loss": 0.9033, "step": 467 }, { "epoch": 0.03, "learning_rate": 1.9999822416302638e-05, "loss": 0.9502, "step": 468 }, { "epoch": 0.03, "learning_rate": 1.9999809018398297e-05, "loss": 0.9951, "step": 469 }, { "epoch": 0.03, "learning_rate": 1.9999795133303742e-05, "loss": 0.9531, "step": 470 }, { "epoch": 0.03, "learning_rate": 1.999978076101966e-05, "loss": 1.002, "step": 471 }, { "epoch": 0.03, "learning_rate": 1.999976590154675e-05, "loss": 0.9297, "step": 472 }, { "epoch": 0.03, "learning_rate": 1.9999750554885728e-05, "loss": 0.8672, "step": 473 }, { "epoch": 0.03, "learning_rate": 1.999973472103735e-05, "loss": 0.957, "step": 474 }, { "epoch": 0.03, "learning_rate": 1.9999718400002385e-05, "loss": 0.9326, "step": 475 }, { "epoch": 0.03, "learning_rate": 1.9999701591781622e-05, "loss": 0.96, "step": 476 }, { "epoch": 0.03, "learning_rate": 1.9999684296375887e-05, "loss": 0.9365, "step": 477 }, { "epoch": 0.03, "learning_rate": 1.9999666513786023e-05, "loss": 0.9424, "step": 478 }, { "epoch": 0.03, "learning_rate": 1.999964824401289e-05, "loss": 0.9424, "step": 479 }, { "epoch": 0.03, "learning_rate": 1.9999629487057385e-05, "loss": 0.9639, "step": 480 }, { "epoch": 0.03, "learning_rate": 1.999961024292042e-05, "loss": 0.9922, "step": 481 }, { "epoch": 0.03, "learning_rate": 1.999959051160293e-05, "loss": 0.9492, "step": 482 }, { "epoch": 0.03, "learning_rate": 1.999957029310588e-05, "loss": 0.9492, "step": 483 }, { "epoch": 0.03, "learning_rate": 1.9999549587430252e-05, "loss": 0.958, "step": 484 }, { "epoch": 0.03, "learning_rate": 1.9999528394577058e-05, "loss": 0.9766, "step": 485 }, { "epoch": 0.03, "learning_rate": 1.9999506714547325e-05, "loss": 0.873, "step": 486 }, { "epoch": 0.03, "learning_rate": 1.9999484547342113e-05, "loss": 0.9678, "step": 487 }, { "epoch": 0.03, "learning_rate": 1.99994618929625e-05, "loss": 1.0312, "step": 488 }, { "epoch": 0.03, "learning_rate": 1.9999438751409593e-05, "loss": 0.9922, "step": 489 }, { "epoch": 0.03, "learning_rate": 1.9999415122684514e-05, "loss": 0.9141, "step": 490 }, { "epoch": 0.03, "learning_rate": 1.9999391006788426e-05, "loss": 0.8867, "step": 491 }, { "epoch": 0.03, "learning_rate": 1.999936640372249e-05, "loss": 0.9297, "step": 492 }, { "epoch": 0.03, "learning_rate": 1.9999341313487913e-05, "loss": 1.0059, "step": 493 }, { "epoch": 0.03, "learning_rate": 1.999931573608591e-05, "loss": 0.917, "step": 494 }, { "epoch": 0.03, "learning_rate": 1.9999289671517736e-05, "loss": 1.0283, "step": 495 }, { "epoch": 0.03, "learning_rate": 1.9999263119784657e-05, "loss": 0.8828, "step": 496 }, { "epoch": 0.03, "learning_rate": 1.999923608088797e-05, "loss": 0.9756, "step": 497 }, { "epoch": 0.03, "learning_rate": 1.9999208554828978e-05, "loss": 0.9375, "step": 498 }, { "epoch": 0.03, "learning_rate": 1.999918054160904e-05, "loss": 0.9395, "step": 499 }, { "epoch": 0.03, "learning_rate": 1.9999152041229514e-05, "loss": 0.9385, "step": 500 }, { "epoch": 0.03, "learning_rate": 1.9999123053691788e-05, "loss": 1.0225, "step": 501 }, { "epoch": 0.03, "learning_rate": 1.9999093578997273e-05, "loss": 0.917, "step": 502 }, { "epoch": 0.03, "learning_rate": 1.9999063617147408e-05, "loss": 0.9609, "step": 503 }, { "epoch": 0.03, "learning_rate": 1.999903316814365e-05, "loss": 0.8887, "step": 504 }, { "epoch": 0.03, "learning_rate": 1.9999002231987482e-05, "loss": 1.002, "step": 505 }, { "epoch": 0.03, "learning_rate": 1.9998970808680414e-05, "loss": 0.8945, "step": 506 }, { "epoch": 0.03, "learning_rate": 1.999893889822398e-05, "loss": 0.9307, "step": 507 }, { "epoch": 0.03, "learning_rate": 1.9998906500619727e-05, "loss": 0.9648, "step": 508 }, { "epoch": 0.03, "learning_rate": 1.9998873615869235e-05, "loss": 0.9512, "step": 509 }, { "epoch": 0.03, "learning_rate": 1.999884024397411e-05, "loss": 0.9824, "step": 510 }, { "epoch": 0.03, "learning_rate": 1.9998806384935975e-05, "loss": 1.0527, "step": 511 }, { "epoch": 0.03, "learning_rate": 1.9998772038756483e-05, "loss": 0.8682, "step": 512 }, { "epoch": 0.03, "learning_rate": 1.99987372054373e-05, "loss": 0.8936, "step": 513 }, { "epoch": 0.04, "learning_rate": 1.9998701884980133e-05, "loss": 0.9688, "step": 514 }, { "epoch": 0.04, "learning_rate": 1.9998666077386698e-05, "loss": 0.9736, "step": 515 }, { "epoch": 0.04, "learning_rate": 1.9998629782658736e-05, "loss": 1.002, "step": 516 }, { "epoch": 0.04, "learning_rate": 1.999859300079802e-05, "loss": 0.9766, "step": 517 }, { "epoch": 0.04, "learning_rate": 1.9998555731806338e-05, "loss": 0.9141, "step": 518 }, { "epoch": 0.04, "learning_rate": 1.9998517975685514e-05, "loss": 0.9668, "step": 519 }, { "epoch": 0.04, "learning_rate": 1.9998479732437376e-05, "loss": 0.8691, "step": 520 }, { "epoch": 0.04, "learning_rate": 1.9998441002063796e-05, "loss": 0.9688, "step": 521 }, { "epoch": 0.04, "learning_rate": 1.999840178456666e-05, "loss": 0.9053, "step": 522 }, { "epoch": 0.04, "learning_rate": 1.9998362079947876e-05, "loss": 1.0332, "step": 523 }, { "epoch": 0.04, "learning_rate": 1.9998321888209376e-05, "loss": 0.9053, "step": 524 }, { "epoch": 0.04, "learning_rate": 1.999828120935312e-05, "loss": 0.8193, "step": 525 }, { "epoch": 0.04, "learning_rate": 1.9998240043381094e-05, "loss": 0.9668, "step": 526 }, { "epoch": 0.04, "learning_rate": 1.99981983902953e-05, "loss": 0.9336, "step": 527 }, { "epoch": 0.04, "learning_rate": 1.9998156250097768e-05, "loss": 1.0, "step": 528 }, { "epoch": 0.04, "learning_rate": 1.9998113622790552e-05, "loss": 0.8896, "step": 529 }, { "epoch": 0.04, "learning_rate": 1.999807050837573e-05, "loss": 0.8682, "step": 530 }, { "epoch": 0.04, "learning_rate": 1.9998026906855393e-05, "loss": 0.9238, "step": 531 }, { "epoch": 0.04, "learning_rate": 1.999798281823168e-05, "loss": 1.0068, "step": 532 }, { "epoch": 0.04, "learning_rate": 1.999793824250673e-05, "loss": 0.8438, "step": 533 }, { "epoch": 0.04, "learning_rate": 1.9997893179682713e-05, "loss": 0.9453, "step": 534 }, { "epoch": 0.04, "learning_rate": 1.9997847629761833e-05, "loss": 0.876, "step": 535 }, { "epoch": 0.04, "learning_rate": 1.99978015927463e-05, "loss": 1.0166, "step": 536 }, { "epoch": 0.04, "learning_rate": 1.9997755068638363e-05, "loss": 0.9883, "step": 537 }, { "epoch": 0.04, "learning_rate": 1.9997708057440284e-05, "loss": 0.8994, "step": 538 }, { "epoch": 0.04, "learning_rate": 1.999766055915436e-05, "loss": 0.8711, "step": 539 }, { "epoch": 0.04, "learning_rate": 1.99976125737829e-05, "loss": 0.9473, "step": 540 }, { "epoch": 0.04, "learning_rate": 1.999756410132824e-05, "loss": 0.9717, "step": 541 }, { "epoch": 0.04, "learning_rate": 1.9997515141792747e-05, "loss": 0.9863, "step": 542 }, { "epoch": 0.04, "learning_rate": 1.9997465695178802e-05, "loss": 1.0479, "step": 543 }, { "epoch": 0.04, "learning_rate": 1.999741576148882e-05, "loss": 0.9678, "step": 544 }, { "epoch": 0.04, "learning_rate": 1.9997365340725224e-05, "loss": 0.9551, "step": 545 }, { "epoch": 0.04, "learning_rate": 1.999731443289048e-05, "loss": 0.9463, "step": 546 }, { "epoch": 0.04, "learning_rate": 1.9997263037987064e-05, "loss": 0.9834, "step": 547 }, { "epoch": 0.04, "learning_rate": 1.999721115601748e-05, "loss": 0.9199, "step": 548 }, { "epoch": 0.04, "learning_rate": 1.9997158786984255e-05, "loss": 0.875, "step": 549 }, { "epoch": 0.04, "learning_rate": 1.999710593088994e-05, "loss": 0.9941, "step": 550 }, { "epoch": 0.04, "learning_rate": 1.9997052587737115e-05, "loss": 0.9424, "step": 551 }, { "epoch": 0.04, "learning_rate": 1.999699875752837e-05, "loss": 0.9326, "step": 552 }, { "epoch": 0.04, "learning_rate": 1.9996944440266342e-05, "loss": 0.9443, "step": 553 }, { "epoch": 0.04, "learning_rate": 1.9996889635953663e-05, "loss": 0.9756, "step": 554 }, { "epoch": 0.04, "learning_rate": 1.9996834344593008e-05, "loss": 0.9121, "step": 555 }, { "epoch": 0.04, "learning_rate": 1.9996778566187072e-05, "loss": 0.9043, "step": 556 }, { "epoch": 0.04, "learning_rate": 1.9996722300738575e-05, "loss": 0.9414, "step": 557 }, { "epoch": 0.04, "learning_rate": 1.999666554825025e-05, "loss": 0.9805, "step": 558 }, { "epoch": 0.04, "learning_rate": 1.9996608308724867e-05, "loss": 0.8945, "step": 559 }, { "epoch": 0.04, "learning_rate": 1.9996550582165217e-05, "loss": 0.9023, "step": 560 }, { "epoch": 0.04, "learning_rate": 1.999649236857411e-05, "loss": 1.0273, "step": 561 }, { "epoch": 0.04, "learning_rate": 1.9996433667954384e-05, "loss": 0.8828, "step": 562 }, { "epoch": 0.04, "learning_rate": 1.9996374480308894e-05, "loss": 1.0068, "step": 563 }, { "epoch": 0.04, "learning_rate": 1.9996314805640526e-05, "loss": 0.9229, "step": 564 }, { "epoch": 0.04, "learning_rate": 1.9996254643952195e-05, "loss": 0.9199, "step": 565 }, { "epoch": 0.04, "learning_rate": 1.9996193995246817e-05, "loss": 0.9893, "step": 566 }, { "epoch": 0.04, "learning_rate": 1.9996132859527358e-05, "loss": 0.9287, "step": 567 }, { "epoch": 0.04, "learning_rate": 1.9996071236796796e-05, "loss": 0.8633, "step": 568 }, { "epoch": 0.04, "learning_rate": 1.9996009127058128e-05, "loss": 0.9443, "step": 569 }, { "epoch": 0.04, "learning_rate": 1.9995946530314384e-05, "loss": 0.9277, "step": 570 }, { "epoch": 0.04, "learning_rate": 1.999588344656861e-05, "loss": 1.0244, "step": 571 }, { "epoch": 0.04, "learning_rate": 1.9995819875823886e-05, "loss": 0.9551, "step": 572 }, { "epoch": 0.04, "learning_rate": 1.9995755818083302e-05, "loss": 0.9434, "step": 573 }, { "epoch": 0.04, "learning_rate": 1.9995691273349985e-05, "loss": 0.9238, "step": 574 }, { "epoch": 0.04, "learning_rate": 1.9995626241627075e-05, "loss": 0.8887, "step": 575 }, { "epoch": 0.04, "learning_rate": 1.999556072291774e-05, "loss": 1.0723, "step": 576 }, { "epoch": 0.04, "learning_rate": 1.9995494717225177e-05, "loss": 0.9375, "step": 577 }, { "epoch": 0.04, "learning_rate": 1.9995428224552597e-05, "loss": 0.9834, "step": 578 }, { "epoch": 0.04, "learning_rate": 1.9995361244903244e-05, "loss": 0.9668, "step": 579 }, { "epoch": 0.04, "learning_rate": 1.9995293778280376e-05, "loss": 0.9805, "step": 580 }, { "epoch": 0.04, "learning_rate": 1.9995225824687283e-05, "loss": 0.9121, "step": 581 }, { "epoch": 0.04, "learning_rate": 1.9995157384127273e-05, "loss": 0.9297, "step": 582 }, { "epoch": 0.04, "learning_rate": 1.9995088456603686e-05, "loss": 0.9072, "step": 583 }, { "epoch": 0.04, "learning_rate": 1.9995019042119875e-05, "loss": 0.9219, "step": 584 }, { "epoch": 0.04, "learning_rate": 1.9994949140679228e-05, "loss": 0.9346, "step": 585 }, { "epoch": 0.04, "learning_rate": 1.999487875228514e-05, "loss": 0.9629, "step": 586 }, { "epoch": 0.04, "learning_rate": 1.999480787694105e-05, "loss": 0.9102, "step": 587 }, { "epoch": 0.04, "learning_rate": 1.9994736514650407e-05, "loss": 0.9873, "step": 588 }, { "epoch": 0.04, "learning_rate": 1.999466466541669e-05, "loss": 0.8828, "step": 589 }, { "epoch": 0.04, "learning_rate": 1.9994592329243395e-05, "loss": 0.9463, "step": 590 }, { "epoch": 0.04, "learning_rate": 1.999451950613405e-05, "loss": 0.9053, "step": 591 }, { "epoch": 0.04, "learning_rate": 1.9994446196092205e-05, "loss": 0.9854, "step": 592 }, { "epoch": 0.04, "learning_rate": 1.9994372399121426e-05, "loss": 0.9355, "step": 593 }, { "epoch": 0.04, "learning_rate": 1.999429811522531e-05, "loss": 0.8418, "step": 594 }, { "epoch": 0.04, "learning_rate": 1.999422334440748e-05, "loss": 0.9463, "step": 595 }, { "epoch": 0.04, "learning_rate": 1.9994148086671576e-05, "loss": 1.0342, "step": 596 }, { "epoch": 0.04, "learning_rate": 1.999407234202126e-05, "loss": 0.9775, "step": 597 }, { "epoch": 0.04, "learning_rate": 1.9993996110460233e-05, "loss": 0.9004, "step": 598 }, { "epoch": 0.04, "learning_rate": 1.99939193919922e-05, "loss": 0.9131, "step": 599 }, { "epoch": 0.04, "learning_rate": 1.99938421866209e-05, "loss": 0.9209, "step": 600 }, { "epoch": 0.04, "learning_rate": 1.99937644943501e-05, "loss": 0.9707, "step": 601 }, { "epoch": 0.04, "learning_rate": 1.999368631518358e-05, "loss": 0.9492, "step": 602 }, { "epoch": 0.04, "learning_rate": 1.9993607649125146e-05, "loss": 0.9639, "step": 603 }, { "epoch": 0.04, "learning_rate": 1.9993528496178637e-05, "loss": 0.9678, "step": 604 }, { "epoch": 0.04, "learning_rate": 1.999344885634791e-05, "loss": 0.9092, "step": 605 }, { "epoch": 0.04, "learning_rate": 1.999336872963684e-05, "loss": 0.9551, "step": 606 }, { "epoch": 0.04, "learning_rate": 1.9993288116049332e-05, "loss": 0.9072, "step": 607 }, { "epoch": 0.04, "learning_rate": 1.9993207015589316e-05, "loss": 0.9219, "step": 608 }, { "epoch": 0.04, "learning_rate": 1.9993125428260737e-05, "loss": 0.959, "step": 609 }, { "epoch": 0.04, "learning_rate": 1.999304335406758e-05, "loss": 0.8916, "step": 610 }, { "epoch": 0.04, "learning_rate": 1.9992960793013835e-05, "loss": 0.9082, "step": 611 }, { "epoch": 0.04, "learning_rate": 1.999287774510353e-05, "loss": 0.8926, "step": 612 }, { "epoch": 0.04, "learning_rate": 1.9992794210340707e-05, "loss": 0.9795, "step": 613 }, { "epoch": 0.04, "learning_rate": 1.9992710188729437e-05, "loss": 0.9404, "step": 614 }, { "epoch": 0.04, "learning_rate": 1.9992625680273818e-05, "loss": 0.8691, "step": 615 }, { "epoch": 0.04, "learning_rate": 1.9992540684977958e-05, "loss": 0.8701, "step": 616 }, { "epoch": 0.04, "learning_rate": 1.9992455202846002e-05, "loss": 0.791, "step": 617 }, { "epoch": 0.04, "learning_rate": 1.999236923388212e-05, "loss": 0.9355, "step": 618 }, { "epoch": 0.04, "learning_rate": 1.9992282778090495e-05, "loss": 0.9336, "step": 619 }, { "epoch": 0.04, "learning_rate": 1.999219583547534e-05, "loss": 0.9248, "step": 620 }, { "epoch": 0.04, "learning_rate": 1.999210840604089e-05, "loss": 0.9814, "step": 621 }, { "epoch": 0.04, "learning_rate": 1.9992020489791407e-05, "loss": 0.9717, "step": 622 }, { "epoch": 0.04, "learning_rate": 1.9991932086731175e-05, "loss": 0.9678, "step": 623 }, { "epoch": 0.04, "learning_rate": 1.9991843196864496e-05, "loss": 0.9043, "step": 624 }, { "epoch": 0.04, "learning_rate": 1.9991753820195706e-05, "loss": 0.8838, "step": 625 }, { "epoch": 0.04, "learning_rate": 1.9991663956729154e-05, "loss": 0.8906, "step": 626 }, { "epoch": 0.04, "learning_rate": 1.9991573606469224e-05, "loss": 0.9551, "step": 627 }, { "epoch": 0.04, "learning_rate": 1.9991482769420315e-05, "loss": 0.9375, "step": 628 }, { "epoch": 0.04, "learning_rate": 1.999139144558685e-05, "loss": 0.8916, "step": 629 }, { "epoch": 0.04, "learning_rate": 1.9991299634973285e-05, "loss": 0.9307, "step": 630 }, { "epoch": 0.04, "learning_rate": 1.9991207337584085e-05, "loss": 0.9902, "step": 631 }, { "epoch": 0.04, "learning_rate": 1.9991114553423752e-05, "loss": 1.0166, "step": 632 }, { "epoch": 0.04, "learning_rate": 1.999102128249681e-05, "loss": 0.9258, "step": 633 }, { "epoch": 0.04, "learning_rate": 1.9990927524807793e-05, "loss": 0.8818, "step": 634 }, { "epoch": 0.04, "learning_rate": 1.9990833280361274e-05, "loss": 0.9463, "step": 635 }, { "epoch": 0.04, "learning_rate": 1.9990738549161847e-05, "loss": 0.8945, "step": 636 }, { "epoch": 0.04, "learning_rate": 1.9990643331214127e-05, "loss": 0.873, "step": 637 }, { "epoch": 0.04, "learning_rate": 1.9990547626522746e-05, "loss": 1.0, "step": 638 }, { "epoch": 0.04, "learning_rate": 1.9990451435092375e-05, "loss": 0.9404, "step": 639 }, { "epoch": 0.04, "learning_rate": 1.9990354756927698e-05, "loss": 0.8965, "step": 640 }, { "epoch": 0.04, "learning_rate": 1.999025759203342e-05, "loss": 0.9502, "step": 641 }, { "epoch": 0.04, "learning_rate": 1.9990159940414286e-05, "loss": 0.9033, "step": 642 }, { "epoch": 0.04, "learning_rate": 1.9990061802075044e-05, "loss": 0.9189, "step": 643 }, { "epoch": 0.04, "learning_rate": 1.9989963177020476e-05, "loss": 0.9775, "step": 644 }, { "epoch": 0.04, "learning_rate": 1.9989864065255393e-05, "loss": 0.959, "step": 645 }, { "epoch": 0.04, "learning_rate": 1.9989764466784615e-05, "loss": 1.0439, "step": 646 }, { "epoch": 0.04, "learning_rate": 1.9989664381613002e-05, "loss": 0.9326, "step": 647 }, { "epoch": 0.04, "learning_rate": 1.998956380974543e-05, "loss": 1.0332, "step": 648 }, { "epoch": 0.04, "learning_rate": 1.9989462751186794e-05, "loss": 0.9453, "step": 649 }, { "epoch": 0.04, "learning_rate": 1.9989361205942016e-05, "loss": 1.002, "step": 650 }, { "epoch": 0.04, "learning_rate": 1.9989259174016054e-05, "loss": 0.9756, "step": 651 }, { "epoch": 0.04, "learning_rate": 1.998915665541387e-05, "loss": 0.8545, "step": 652 }, { "epoch": 0.04, "learning_rate": 1.9989053650140457e-05, "loss": 0.8711, "step": 653 }, { "epoch": 0.04, "learning_rate": 1.9988950158200843e-05, "loss": 0.8867, "step": 654 }, { "epoch": 0.04, "learning_rate": 1.998884617960006e-05, "loss": 0.9453, "step": 655 }, { "epoch": 0.04, "learning_rate": 1.998874171434318e-05, "loss": 0.9688, "step": 656 }, { "epoch": 0.04, "learning_rate": 1.998863676243529e-05, "loss": 0.9824, "step": 657 }, { "epoch": 0.04, "learning_rate": 1.9988531323881504e-05, "loss": 0.9316, "step": 658 }, { "epoch": 0.04, "learning_rate": 1.998842539868696e-05, "loss": 0.9375, "step": 659 }, { "epoch": 0.04, "learning_rate": 1.998831898685682e-05, "loss": 0.9102, "step": 660 }, { "epoch": 0.05, "learning_rate": 1.9988212088396262e-05, "loss": 0.9395, "step": 661 }, { "epoch": 0.05, "learning_rate": 1.99881047033105e-05, "loss": 0.8877, "step": 662 }, { "epoch": 0.05, "learning_rate": 1.9987996831604762e-05, "loss": 0.9375, "step": 663 }, { "epoch": 0.05, "learning_rate": 1.998788847328431e-05, "loss": 0.9619, "step": 664 }, { "epoch": 0.05, "learning_rate": 1.9987779628354412e-05, "loss": 0.9824, "step": 665 }, { "epoch": 0.05, "learning_rate": 1.9987670296820382e-05, "loss": 0.8857, "step": 666 }, { "epoch": 0.05, "learning_rate": 1.9987560478687543e-05, "loss": 0.8984, "step": 667 }, { "epoch": 0.05, "learning_rate": 1.9987450173961243e-05, "loss": 0.8955, "step": 668 }, { "epoch": 0.05, "learning_rate": 1.9987339382646857e-05, "loss": 0.9648, "step": 669 }, { "epoch": 0.05, "learning_rate": 1.9987228104749784e-05, "loss": 0.9658, "step": 670 }, { "epoch": 0.05, "learning_rate": 1.9987116340275447e-05, "loss": 0.874, "step": 671 }, { "epoch": 0.05, "learning_rate": 1.9987004089229284e-05, "loss": 0.9863, "step": 672 }, { "epoch": 0.05, "learning_rate": 1.9986891351616772e-05, "loss": 0.9707, "step": 673 }, { "epoch": 0.05, "learning_rate": 1.99867781274434e-05, "loss": 0.8906, "step": 674 }, { "epoch": 0.05, "learning_rate": 1.9986664416714685e-05, "loss": 0.9355, "step": 675 }, { "epoch": 0.05, "learning_rate": 1.9986550219436166e-05, "loss": 0.8828, "step": 676 }, { "epoch": 0.05, "learning_rate": 1.9986435535613408e-05, "loss": 1.0332, "step": 677 }, { "epoch": 0.05, "learning_rate": 1.9986320365251998e-05, "loss": 0.8652, "step": 678 }, { "epoch": 0.05, "learning_rate": 1.9986204708357543e-05, "loss": 0.8779, "step": 679 }, { "epoch": 0.05, "learning_rate": 1.9986088564935687e-05, "loss": 0.9268, "step": 680 }, { "epoch": 0.05, "learning_rate": 1.998597193499208e-05, "loss": 0.9082, "step": 681 }, { "epoch": 0.05, "learning_rate": 1.9985854818532408e-05, "loss": 1.0615, "step": 682 }, { "epoch": 0.05, "learning_rate": 1.998573721556238e-05, "loss": 0.8994, "step": 683 }, { "epoch": 0.05, "learning_rate": 1.9985619126087714e-05, "loss": 0.9219, "step": 684 }, { "epoch": 0.05, "learning_rate": 1.9985500550114178e-05, "loss": 0.876, "step": 685 }, { "epoch": 0.05, "learning_rate": 1.998538148764754e-05, "loss": 0.8643, "step": 686 }, { "epoch": 0.05, "learning_rate": 1.9985261938693598e-05, "loss": 0.9111, "step": 687 }, { "epoch": 0.05, "learning_rate": 1.9985141903258186e-05, "loss": 0.8467, "step": 688 }, { "epoch": 0.05, "learning_rate": 1.998502138134715e-05, "loss": 0.9873, "step": 689 }, { "epoch": 0.05, "learning_rate": 1.9984900372966356e-05, "loss": 0.8555, "step": 690 }, { "epoch": 0.05, "learning_rate": 1.99847788781217e-05, "loss": 0.998, "step": 691 }, { "epoch": 0.05, "learning_rate": 1.998465689681911e-05, "loss": 0.9248, "step": 692 }, { "epoch": 0.05, "learning_rate": 1.9984534429064517e-05, "loss": 0.8701, "step": 693 }, { "epoch": 0.05, "learning_rate": 1.9984411474863897e-05, "loss": 0.9521, "step": 694 }, { "epoch": 0.05, "learning_rate": 1.9984288034223236e-05, "loss": 1.0088, "step": 695 }, { "epoch": 0.05, "learning_rate": 1.998416410714855e-05, "loss": 0.9062, "step": 696 }, { "epoch": 0.05, "learning_rate": 1.9984039693645876e-05, "loss": 0.9727, "step": 697 }, { "epoch": 0.05, "learning_rate": 1.998391479372127e-05, "loss": 0.9053, "step": 698 }, { "epoch": 0.05, "learning_rate": 1.9983789407380828e-05, "loss": 0.9844, "step": 699 }, { "epoch": 0.05, "learning_rate": 1.998366353463065e-05, "loss": 0.9619, "step": 700 }, { "epoch": 0.05, "learning_rate": 1.9983537175476875e-05, "loss": 0.9248, "step": 701 }, { "epoch": 0.05, "learning_rate": 1.998341032992565e-05, "loss": 0.915, "step": 702 }, { "epoch": 0.05, "learning_rate": 1.9983282997983163e-05, "loss": 1.0127, "step": 703 }, { "epoch": 0.05, "learning_rate": 1.998315517965562e-05, "loss": 0.832, "step": 704 }, { "epoch": 0.05, "learning_rate": 1.9983026874949235e-05, "loss": 0.8984, "step": 705 }, { "epoch": 0.05, "learning_rate": 1.9982898083870274e-05, "loss": 0.7852, "step": 706 }, { "epoch": 0.05, "learning_rate": 1.9982768806425002e-05, "loss": 0.9092, "step": 707 }, { "epoch": 0.05, "learning_rate": 1.9982639042619724e-05, "loss": 1.0146, "step": 708 }, { "epoch": 0.05, "learning_rate": 1.998250879246075e-05, "loss": 0.9395, "step": 709 }, { "epoch": 0.05, "learning_rate": 1.9982378055954444e-05, "loss": 0.9824, "step": 710 }, { "epoch": 0.05, "learning_rate": 1.9982246833107162e-05, "loss": 0.9883, "step": 711 }, { "epoch": 0.05, "learning_rate": 1.9982115123925302e-05, "loss": 0.9824, "step": 712 }, { "epoch": 0.05, "learning_rate": 1.998198292841528e-05, "loss": 0.8037, "step": 713 }, { "epoch": 0.05, "learning_rate": 1.9981850246583535e-05, "loss": 0.9463, "step": 714 }, { "epoch": 0.05, "learning_rate": 1.9981717078436534e-05, "loss": 0.8994, "step": 715 }, { "epoch": 0.05, "learning_rate": 1.9981583423980765e-05, "loss": 0.8945, "step": 716 }, { "epoch": 0.05, "learning_rate": 1.9981449283222737e-05, "loss": 0.9023, "step": 717 }, { "epoch": 0.05, "learning_rate": 1.9981314656168983e-05, "loss": 0.9746, "step": 718 }, { "epoch": 0.05, "learning_rate": 1.9981179542826072e-05, "loss": 0.9189, "step": 719 }, { "epoch": 0.05, "learning_rate": 1.9981043943200577e-05, "loss": 0.9961, "step": 720 }, { "epoch": 0.05, "learning_rate": 1.998090785729911e-05, "loss": 1.0244, "step": 721 }, { "epoch": 0.05, "learning_rate": 1.9980771285128296e-05, "loss": 0.9043, "step": 722 }, { "epoch": 0.05, "learning_rate": 1.998063422669479e-05, "loss": 0.9736, "step": 723 }, { "epoch": 0.05, "learning_rate": 1.998049668200528e-05, "loss": 0.7998, "step": 724 }, { "epoch": 0.05, "learning_rate": 1.9980358651066448e-05, "loss": 0.9258, "step": 725 }, { "epoch": 0.05, "learning_rate": 1.9980220133885037e-05, "loss": 0.9502, "step": 726 }, { "epoch": 0.05, "learning_rate": 1.9980081130467784e-05, "loss": 0.9336, "step": 727 }, { "epoch": 0.05, "learning_rate": 1.9979941640821465e-05, "loss": 0.9375, "step": 728 }, { "epoch": 0.05, "learning_rate": 1.997980166495288e-05, "loss": 0.998, "step": 729 }, { "epoch": 0.05, "learning_rate": 1.997966120286884e-05, "loss": 0.8721, "step": 730 }, { "epoch": 0.05, "learning_rate": 1.9979520254576195e-05, "loss": 0.8193, "step": 731 }, { "epoch": 0.05, "learning_rate": 1.9979378820081806e-05, "loss": 0.9453, "step": 732 }, { "epoch": 0.05, "learning_rate": 1.9979236899392572e-05, "loss": 0.9043, "step": 733 }, { "epoch": 0.05, "learning_rate": 1.99790944925154e-05, "loss": 0.9824, "step": 734 }, { "epoch": 0.05, "learning_rate": 1.9978951599457233e-05, "loss": 0.9248, "step": 735 }, { "epoch": 0.05, "learning_rate": 1.997880822022503e-05, "loss": 0.9521, "step": 736 }, { "epoch": 0.05, "learning_rate": 1.9978664354825778e-05, "loss": 0.9053, "step": 737 }, { "epoch": 0.05, "learning_rate": 1.9978520003266488e-05, "loss": 0.8896, "step": 738 }, { "epoch": 0.05, "learning_rate": 1.9978375165554182e-05, "loss": 0.918, "step": 739 }, { "epoch": 0.05, "learning_rate": 1.9978229841695932e-05, "loss": 0.9238, "step": 740 }, { "epoch": 0.05, "learning_rate": 1.997808403169881e-05, "loss": 0.9219, "step": 741 }, { "epoch": 0.05, "learning_rate": 1.9977937735569915e-05, "loss": 0.9189, "step": 742 }, { "epoch": 0.05, "learning_rate": 1.997779095331638e-05, "loss": 1.0244, "step": 743 }, { "epoch": 0.05, "learning_rate": 1.9977643684945364e-05, "loss": 0.9541, "step": 744 }, { "epoch": 0.05, "learning_rate": 1.9977495930464032e-05, "loss": 0.959, "step": 745 }, { "epoch": 0.05, "learning_rate": 1.997734768987958e-05, "loss": 0.8467, "step": 746 }, { "epoch": 0.05, "learning_rate": 1.9977198963199237e-05, "loss": 1.0049, "step": 747 }, { "epoch": 0.05, "learning_rate": 1.997704975043025e-05, "loss": 0.9346, "step": 748 }, { "epoch": 0.05, "learning_rate": 1.9976900051579883e-05, "loss": 0.9678, "step": 749 }, { "epoch": 0.05, "learning_rate": 1.9976749866655433e-05, "loss": 0.9932, "step": 750 }, { "epoch": 0.05, "learning_rate": 1.9976599195664216e-05, "loss": 0.9521, "step": 751 }, { "epoch": 0.05, "learning_rate": 1.9976448038613574e-05, "loss": 0.9463, "step": 752 }, { "epoch": 0.05, "learning_rate": 1.9976296395510867e-05, "loss": 0.874, "step": 753 }, { "epoch": 0.05, "learning_rate": 1.997614426636349e-05, "loss": 0.8604, "step": 754 }, { "epoch": 0.05, "learning_rate": 1.9975991651178847e-05, "loss": 0.9814, "step": 755 }, { "epoch": 0.05, "learning_rate": 1.9975838549964378e-05, "loss": 0.8516, "step": 756 }, { "epoch": 0.05, "learning_rate": 1.9975684962727543e-05, "loss": 0.8477, "step": 757 }, { "epoch": 0.05, "learning_rate": 1.9975530889475824e-05, "loss": 0.9033, "step": 758 }, { "epoch": 0.05, "learning_rate": 1.9975376330216726e-05, "loss": 0.8691, "step": 759 }, { "epoch": 0.05, "learning_rate": 1.9975221284957776e-05, "loss": 0.9551, "step": 760 }, { "epoch": 0.05, "learning_rate": 1.9975065753706534e-05, "loss": 0.9971, "step": 761 }, { "epoch": 0.05, "learning_rate": 1.9974909736470572e-05, "loss": 0.9307, "step": 762 }, { "epoch": 0.05, "learning_rate": 1.99747532332575e-05, "loss": 0.8838, "step": 763 }, { "epoch": 0.05, "learning_rate": 1.9974596244074935e-05, "loss": 1.0029, "step": 764 }, { "epoch": 0.05, "learning_rate": 1.9974438768930526e-05, "loss": 0.9541, "step": 765 }, { "epoch": 0.05, "learning_rate": 1.997428080783195e-05, "loss": 0.9971, "step": 766 }, { "epoch": 0.05, "learning_rate": 1.9974122360786893e-05, "loss": 0.9688, "step": 767 }, { "epoch": 0.05, "learning_rate": 1.9973963427803085e-05, "loss": 0.9307, "step": 768 }, { "epoch": 0.05, "learning_rate": 1.9973804008888265e-05, "loss": 0.9336, "step": 769 }, { "epoch": 0.05, "learning_rate": 1.99736441040502e-05, "loss": 0.9424, "step": 770 }, { "epoch": 0.05, "learning_rate": 1.997348371329668e-05, "loss": 0.8662, "step": 771 }, { "epoch": 0.05, "learning_rate": 1.9973322836635517e-05, "loss": 0.9736, "step": 772 }, { "epoch": 0.05, "learning_rate": 1.9973161474074556e-05, "loss": 0.8486, "step": 773 }, { "epoch": 0.05, "learning_rate": 1.9972999625621653e-05, "loss": 0.9453, "step": 774 }, { "epoch": 0.05, "learning_rate": 1.9972837291284697e-05, "loss": 0.9863, "step": 775 }, { "epoch": 0.05, "learning_rate": 1.997267447107159e-05, "loss": 0.9629, "step": 776 }, { "epoch": 0.05, "learning_rate": 1.9972511164990274e-05, "loss": 0.9619, "step": 777 }, { "epoch": 0.05, "learning_rate": 1.9972347373048696e-05, "loss": 0.9092, "step": 778 }, { "epoch": 0.05, "learning_rate": 1.9972183095254844e-05, "loss": 0.9004, "step": 779 }, { "epoch": 0.05, "learning_rate": 1.9972018331616713e-05, "loss": 0.9717, "step": 780 }, { "epoch": 0.05, "learning_rate": 1.9971853082142337e-05, "loss": 0.8721, "step": 781 }, { "epoch": 0.05, "learning_rate": 1.9971687346839766e-05, "loss": 0.9326, "step": 782 }, { "epoch": 0.05, "learning_rate": 1.9971521125717078e-05, "loss": 0.9277, "step": 783 }, { "epoch": 0.05, "learning_rate": 1.997135441878236e-05, "loss": 0.9053, "step": 784 }, { "epoch": 0.05, "learning_rate": 1.9971187226043746e-05, "loss": 0.8281, "step": 785 }, { "epoch": 0.05, "learning_rate": 1.9971019547509372e-05, "loss": 0.8906, "step": 786 }, { "epoch": 0.05, "learning_rate": 1.9970851383187417e-05, "loss": 0.9824, "step": 787 }, { "epoch": 0.05, "learning_rate": 1.9970682733086066e-05, "loss": 0.9561, "step": 788 }, { "epoch": 0.05, "learning_rate": 1.9970513597213543e-05, "loss": 0.9424, "step": 789 }, { "epoch": 0.05, "learning_rate": 1.9970343975578076e-05, "loss": 0.9248, "step": 790 }, { "epoch": 0.05, "learning_rate": 1.997017386818794e-05, "loss": 0.8848, "step": 791 }, { "epoch": 0.05, "learning_rate": 1.997000327505142e-05, "loss": 0.8936, "step": 792 }, { "epoch": 0.05, "learning_rate": 1.9969832196176826e-05, "loss": 0.9258, "step": 793 }, { "epoch": 0.05, "learning_rate": 1.9969660631572492e-05, "loss": 0.9473, "step": 794 }, { "epoch": 0.05, "learning_rate": 1.9969488581246785e-05, "loss": 0.8828, "step": 795 }, { "epoch": 0.05, "learning_rate": 1.9969316045208072e-05, "loss": 0.9248, "step": 796 }, { "epoch": 0.05, "learning_rate": 1.9969143023464774e-05, "loss": 1.001, "step": 797 }, { "epoch": 0.05, "learning_rate": 1.9968969516025312e-05, "loss": 0.9492, "step": 798 }, { "epoch": 0.05, "learning_rate": 1.996879552289814e-05, "loss": 1.0254, "step": 799 }, { "epoch": 0.05, "learning_rate": 1.9968621044091736e-05, "loss": 0.9502, "step": 800 }, { "epoch": 0.05, "learning_rate": 1.99684460796146e-05, "loss": 0.8828, "step": 801 }, { "epoch": 0.05, "learning_rate": 1.996827062947526e-05, "loss": 0.957, "step": 802 }, { "epoch": 0.05, "learning_rate": 1.996809469368226e-05, "loss": 0.9277, "step": 803 }, { "epoch": 0.05, "learning_rate": 1.9967918272244173e-05, "loss": 0.9678, "step": 804 }, { "epoch": 0.05, "learning_rate": 1.9967741365169596e-05, "loss": 0.9307, "step": 805 }, { "epoch": 0.05, "learning_rate": 1.996756397246714e-05, "loss": 0.833, "step": 806 }, { "epoch": 0.05, "learning_rate": 1.996738609414546e-05, "loss": 1.0723, "step": 807 }, { "epoch": 0.06, "learning_rate": 1.996720773021321e-05, "loss": 0.9795, "step": 808 }, { "epoch": 0.06, "learning_rate": 1.996702888067909e-05, "loss": 0.9492, "step": 809 }, { "epoch": 0.06, "learning_rate": 1.9966849545551804e-05, "loss": 1.0029, "step": 810 }, { "epoch": 0.06, "learning_rate": 1.9966669724840098e-05, "loss": 0.8672, "step": 811 }, { "epoch": 0.06, "learning_rate": 1.9966489418552724e-05, "loss": 0.9268, "step": 812 }, { "epoch": 0.06, "learning_rate": 1.996630862669848e-05, "loss": 0.8955, "step": 813 }, { "epoch": 0.06, "learning_rate": 1.9966127349286158e-05, "loss": 0.9316, "step": 814 }, { "epoch": 0.06, "learning_rate": 1.99659455863246e-05, "loss": 1.0195, "step": 815 }, { "epoch": 0.06, "learning_rate": 1.9965763337822662e-05, "loss": 0.9443, "step": 816 }, { "epoch": 0.06, "learning_rate": 1.9965580603789218e-05, "loss": 0.833, "step": 817 }, { "epoch": 0.06, "learning_rate": 1.996539738423317e-05, "loss": 0.9873, "step": 818 }, { "epoch": 0.06, "learning_rate": 1.996521367916345e-05, "loss": 0.918, "step": 819 }, { "epoch": 0.06, "learning_rate": 1.996502948858901e-05, "loss": 0.9307, "step": 820 }, { "epoch": 0.06, "learning_rate": 1.9964844812518814e-05, "loss": 0.9424, "step": 821 }, { "epoch": 0.06, "learning_rate": 1.9964659650961866e-05, "loss": 0.8867, "step": 822 }, { "epoch": 0.06, "learning_rate": 1.9964474003927184e-05, "loss": 0.9346, "step": 823 }, { "epoch": 0.06, "learning_rate": 1.9964287871423816e-05, "loss": 0.9561, "step": 824 }, { "epoch": 0.06, "learning_rate": 1.996410125346083e-05, "loss": 0.8311, "step": 825 }, { "epoch": 0.06, "learning_rate": 1.9963914150047315e-05, "loss": 0.9062, "step": 826 }, { "epoch": 0.06, "learning_rate": 1.996372656119239e-05, "loss": 0.8555, "step": 827 }, { "epoch": 0.06, "learning_rate": 1.996353848690519e-05, "loss": 0.9678, "step": 828 }, { "epoch": 0.06, "learning_rate": 1.9963349927194885e-05, "loss": 0.8379, "step": 829 }, { "epoch": 0.06, "learning_rate": 1.9963160882070654e-05, "loss": 0.9121, "step": 830 }, { "epoch": 0.06, "learning_rate": 1.996297135154171e-05, "loss": 0.9072, "step": 831 }, { "epoch": 0.06, "learning_rate": 1.9962781335617292e-05, "loss": 0.9082, "step": 832 }, { "epoch": 0.06, "learning_rate": 1.996259083430665e-05, "loss": 0.9385, "step": 833 }, { "epoch": 0.06, "learning_rate": 1.9962399847619068e-05, "loss": 0.9502, "step": 834 }, { "epoch": 0.06, "learning_rate": 1.9962208375563853e-05, "loss": 0.8486, "step": 835 }, { "epoch": 0.06, "learning_rate": 1.996201641815033e-05, "loss": 0.9541, "step": 836 }, { "epoch": 0.06, "learning_rate": 1.9961823975387857e-05, "loss": 0.9248, "step": 837 }, { "epoch": 0.06, "learning_rate": 1.99616310472858e-05, "loss": 0.8955, "step": 838 }, { "epoch": 0.06, "learning_rate": 1.9961437633853568e-05, "loss": 0.9551, "step": 839 }, { "epoch": 0.06, "learning_rate": 1.9961243735100578e-05, "loss": 0.8467, "step": 840 }, { "epoch": 0.06, "learning_rate": 1.9961049351036283e-05, "loss": 1.0352, "step": 841 }, { "epoch": 0.06, "learning_rate": 1.9960854481670145e-05, "loss": 0.8721, "step": 842 }, { "epoch": 0.06, "learning_rate": 1.9960659127011667e-05, "loss": 0.9619, "step": 843 }, { "epoch": 0.06, "learning_rate": 1.9960463287070357e-05, "loss": 0.9619, "step": 844 }, { "epoch": 0.06, "learning_rate": 1.9960266961855764e-05, "loss": 0.9307, "step": 845 }, { "epoch": 0.06, "learning_rate": 1.996007015137745e-05, "loss": 0.9229, "step": 846 }, { "epoch": 0.06, "learning_rate": 1.9959872855645e-05, "loss": 1.0039, "step": 847 }, { "epoch": 0.06, "learning_rate": 1.9959675074668038e-05, "loss": 0.8652, "step": 848 }, { "epoch": 0.06, "learning_rate": 1.9959476808456185e-05, "loss": 0.9482, "step": 849 }, { "epoch": 0.06, "learning_rate": 1.995927805701911e-05, "loss": 0.959, "step": 850 }, { "epoch": 0.06, "learning_rate": 1.9959078820366497e-05, "loss": 0.9404, "step": 851 }, { "epoch": 0.06, "learning_rate": 1.9958879098508047e-05, "loss": 0.875, "step": 852 }, { "epoch": 0.06, "learning_rate": 1.9958678891453492e-05, "loss": 0.9541, "step": 853 }, { "epoch": 0.06, "learning_rate": 1.9958478199212586e-05, "loss": 0.9395, "step": 854 }, { "epoch": 0.06, "learning_rate": 1.9958277021795112e-05, "loss": 0.96, "step": 855 }, { "epoch": 0.06, "learning_rate": 1.9958075359210863e-05, "loss": 0.9062, "step": 856 }, { "epoch": 0.06, "learning_rate": 1.9957873211469673e-05, "loss": 0.9365, "step": 857 }, { "epoch": 0.06, "learning_rate": 1.995767057858138e-05, "loss": 0.918, "step": 858 }, { "epoch": 0.06, "learning_rate": 1.9957467460555865e-05, "loss": 0.8955, "step": 859 }, { "epoch": 0.06, "learning_rate": 1.995726385740302e-05, "loss": 0.9648, "step": 860 }, { "epoch": 0.06, "learning_rate": 1.9957059769132767e-05, "loss": 0.9424, "step": 861 }, { "epoch": 0.06, "learning_rate": 1.9956855195755046e-05, "loss": 0.9121, "step": 862 }, { "epoch": 0.06, "learning_rate": 1.9956650137279827e-05, "loss": 0.875, "step": 863 }, { "epoch": 0.06, "learning_rate": 1.9956444593717097e-05, "loss": 0.8887, "step": 864 }, { "epoch": 0.06, "learning_rate": 1.9956238565076873e-05, "loss": 0.875, "step": 865 }, { "epoch": 0.06, "learning_rate": 1.995603205136919e-05, "loss": 0.9707, "step": 866 }, { "epoch": 0.06, "learning_rate": 1.9955825052604115e-05, "loss": 0.8877, "step": 867 }, { "epoch": 0.06, "learning_rate": 1.9955617568791727e-05, "loss": 0.9229, "step": 868 }, { "epoch": 0.06, "learning_rate": 1.9955409599942137e-05, "loss": 0.9502, "step": 869 }, { "epoch": 0.06, "learning_rate": 1.9955201146065476e-05, "loss": 0.9141, "step": 870 }, { "epoch": 0.06, "learning_rate": 1.9954992207171898e-05, "loss": 0.8926, "step": 871 }, { "epoch": 0.06, "learning_rate": 1.9954782783271588e-05, "loss": 0.9033, "step": 872 }, { "epoch": 0.06, "learning_rate": 1.9954572874374748e-05, "loss": 1.0215, "step": 873 }, { "epoch": 0.06, "learning_rate": 1.99543624804916e-05, "loss": 0.959, "step": 874 }, { "epoch": 0.06, "learning_rate": 1.9954151601632397e-05, "loss": 0.9434, "step": 875 }, { "epoch": 0.06, "learning_rate": 1.9953940237807415e-05, "loss": 0.9707, "step": 876 }, { "epoch": 0.06, "learning_rate": 1.995372838902695e-05, "loss": 0.9717, "step": 877 }, { "epoch": 0.06, "learning_rate": 1.9953516055301323e-05, "loss": 0.9863, "step": 878 }, { "epoch": 0.06, "learning_rate": 1.995330323664088e-05, "loss": 0.9482, "step": 879 }, { "epoch": 0.06, "learning_rate": 1.9953089933055987e-05, "loss": 0.9873, "step": 880 }, { "epoch": 0.06, "learning_rate": 1.995287614455704e-05, "loss": 0.9531, "step": 881 }, { "epoch": 0.06, "learning_rate": 1.995266187115445e-05, "loss": 0.9551, "step": 882 }, { "epoch": 0.06, "learning_rate": 1.995244711285866e-05, "loss": 0.8525, "step": 883 }, { "epoch": 0.06, "learning_rate": 1.9952231869680135e-05, "loss": 0.9248, "step": 884 }, { "epoch": 0.06, "learning_rate": 1.9952016141629352e-05, "loss": 0.8975, "step": 885 }, { "epoch": 0.06, "learning_rate": 1.9951799928716835e-05, "loss": 0.8594, "step": 886 }, { "epoch": 0.06, "learning_rate": 1.9951583230953105e-05, "loss": 0.8857, "step": 887 }, { "epoch": 0.06, "learning_rate": 1.995136604834873e-05, "loss": 0.958, "step": 888 }, { "epoch": 0.06, "learning_rate": 1.9951148380914285e-05, "loss": 0.9463, "step": 889 }, { "epoch": 0.06, "learning_rate": 1.9950930228660374e-05, "loss": 0.9287, "step": 890 }, { "epoch": 0.06, "learning_rate": 1.9950711591597628e-05, "loss": 0.8682, "step": 891 }, { "epoch": 0.06, "learning_rate": 1.99504924697367e-05, "loss": 0.8838, "step": 892 }, { "epoch": 0.06, "learning_rate": 1.9950272863088265e-05, "loss": 0.9805, "step": 893 }, { "epoch": 0.06, "learning_rate": 1.995005277166302e-05, "loss": 0.9424, "step": 894 }, { "epoch": 0.06, "learning_rate": 1.994983219547169e-05, "loss": 0.9629, "step": 895 }, { "epoch": 0.06, "learning_rate": 1.9949611134525017e-05, "loss": 0.8711, "step": 896 }, { "epoch": 0.06, "learning_rate": 1.994938958883378e-05, "loss": 0.8975, "step": 897 }, { "epoch": 0.06, "learning_rate": 1.9949167558408766e-05, "loss": 0.8564, "step": 898 }, { "epoch": 0.06, "learning_rate": 1.9948945043260793e-05, "loss": 0.9531, "step": 899 }, { "epoch": 0.06, "learning_rate": 1.9948722043400702e-05, "loss": 0.9434, "step": 900 }, { "epoch": 0.06, "learning_rate": 1.9948498558839357e-05, "loss": 0.9463, "step": 901 }, { "epoch": 0.06, "learning_rate": 1.994827458958765e-05, "loss": 0.9414, "step": 902 }, { "epoch": 0.06, "learning_rate": 1.994805013565649e-05, "loss": 0.8535, "step": 903 }, { "epoch": 0.06, "learning_rate": 1.9947825197056812e-05, "loss": 0.9014, "step": 904 }, { "epoch": 0.06, "learning_rate": 1.9947599773799572e-05, "loss": 0.9414, "step": 905 }, { "epoch": 0.06, "learning_rate": 1.9947373865895762e-05, "loss": 0.8623, "step": 906 }, { "epoch": 0.06, "learning_rate": 1.994714747335638e-05, "loss": 0.8711, "step": 907 }, { "epoch": 0.06, "learning_rate": 1.994692059619246e-05, "loss": 0.9238, "step": 908 }, { "epoch": 0.06, "learning_rate": 1.9946693234415048e-05, "loss": 1.0088, "step": 909 }, { "epoch": 0.06, "learning_rate": 1.9946465388035233e-05, "loss": 0.8926, "step": 910 }, { "epoch": 0.06, "learning_rate": 1.9946237057064105e-05, "loss": 0.9346, "step": 911 }, { "epoch": 0.06, "learning_rate": 1.9946008241512797e-05, "loss": 0.9658, "step": 912 }, { "epoch": 0.06, "learning_rate": 1.9945778941392446e-05, "loss": 0.8838, "step": 913 }, { "epoch": 0.06, "learning_rate": 1.9945549156714236e-05, "loss": 0.9287, "step": 914 }, { "epoch": 0.06, "learning_rate": 1.9945318887489355e-05, "loss": 0.917, "step": 915 }, { "epoch": 0.06, "learning_rate": 1.9945088133729017e-05, "loss": 0.9658, "step": 916 }, { "epoch": 0.06, "learning_rate": 1.9944856895444474e-05, "loss": 0.9746, "step": 917 }, { "epoch": 0.06, "learning_rate": 1.9944625172646992e-05, "loss": 0.9473, "step": 918 }, { "epoch": 0.06, "learning_rate": 1.994439296534785e-05, "loss": 0.9521, "step": 919 }, { "epoch": 0.06, "learning_rate": 1.9944160273558376e-05, "loss": 0.9209, "step": 920 }, { "epoch": 0.06, "learning_rate": 1.994392709728989e-05, "loss": 0.96, "step": 921 }, { "epoch": 0.06, "learning_rate": 1.9943693436553765e-05, "loss": 0.9004, "step": 922 }, { "epoch": 0.06, "learning_rate": 1.994345929136138e-05, "loss": 0.9658, "step": 923 }, { "epoch": 0.06, "learning_rate": 1.9943224661724142e-05, "loss": 0.9639, "step": 924 }, { "epoch": 0.06, "learning_rate": 1.9942989547653487e-05, "loss": 0.9629, "step": 925 }, { "epoch": 0.06, "learning_rate": 1.994275394916086e-05, "loss": 0.9424, "step": 926 }, { "epoch": 0.06, "learning_rate": 1.994251786625775e-05, "loss": 0.9531, "step": 927 }, { "epoch": 0.06, "learning_rate": 1.9942281298955656e-05, "loss": 0.9482, "step": 928 }, { "epoch": 0.06, "learning_rate": 1.99420442472661e-05, "loss": 0.959, "step": 929 }, { "epoch": 0.06, "learning_rate": 1.9941806711200632e-05, "loss": 0.9023, "step": 930 }, { "epoch": 0.06, "learning_rate": 1.9941568690770827e-05, "loss": 0.8623, "step": 931 }, { "epoch": 0.06, "learning_rate": 1.9941330185988276e-05, "loss": 0.9941, "step": 932 }, { "epoch": 0.06, "learning_rate": 1.994109119686461e-05, "loss": 0.9102, "step": 933 }, { "epoch": 0.06, "learning_rate": 1.994085172341146e-05, "loss": 0.958, "step": 934 }, { "epoch": 0.06, "learning_rate": 1.99406117656405e-05, "loss": 0.9678, "step": 935 }, { "epoch": 0.06, "learning_rate": 1.9940371323563422e-05, "loss": 0.8428, "step": 936 }, { "epoch": 0.06, "learning_rate": 1.9940130397191938e-05, "loss": 0.9355, "step": 937 }, { "epoch": 0.06, "learning_rate": 1.9939888986537785e-05, "loss": 0.9053, "step": 938 }, { "epoch": 0.06, "learning_rate": 1.9939647091612725e-05, "loss": 0.9326, "step": 939 }, { "epoch": 0.06, "learning_rate": 1.993940471242854e-05, "loss": 0.8613, "step": 940 }, { "epoch": 0.06, "learning_rate": 1.9939161848997048e-05, "loss": 0.9287, "step": 941 }, { "epoch": 0.06, "learning_rate": 1.9938918501330073e-05, "loss": 0.9473, "step": 942 }, { "epoch": 0.06, "learning_rate": 1.9938674669439474e-05, "loss": 0.917, "step": 943 }, { "epoch": 0.06, "learning_rate": 1.9938430353337128e-05, "loss": 0.9053, "step": 944 }, { "epoch": 0.06, "learning_rate": 1.993818555303494e-05, "loss": 0.9209, "step": 945 }, { "epoch": 0.06, "learning_rate": 1.993794026854484e-05, "loss": 0.918, "step": 946 }, { "epoch": 0.06, "learning_rate": 1.993769449987877e-05, "loss": 0.8867, "step": 947 }, { "epoch": 0.06, "learning_rate": 1.993744824704871e-05, "loss": 0.8936, "step": 948 }, { "epoch": 0.06, "learning_rate": 1.9937201510066658e-05, "loss": 0.9033, "step": 949 }, { "epoch": 0.06, "learning_rate": 1.993695428894463e-05, "loss": 0.8887, "step": 950 }, { "epoch": 0.06, "learning_rate": 1.9936706583694674e-05, "loss": 0.9521, "step": 951 }, { "epoch": 0.06, "learning_rate": 1.993645839432886e-05, "loss": 0.9746, "step": 952 }, { "epoch": 0.06, "learning_rate": 1.9936209720859277e-05, "loss": 0.9961, "step": 953 }, { "epoch": 0.07, "learning_rate": 1.9935960563298043e-05, "loss": 0.8711, "step": 954 }, { "epoch": 0.07, "learning_rate": 1.9935710921657292e-05, "loss": 0.9326, "step": 955 }, { "epoch": 0.07, "learning_rate": 1.993546079594919e-05, "loss": 0.8809, "step": 956 }, { "epoch": 0.07, "learning_rate": 1.993521018618592e-05, "loss": 0.8408, "step": 957 }, { "epoch": 0.07, "learning_rate": 1.9934959092379696e-05, "loss": 0.9492, "step": 958 }, { "epoch": 0.07, "learning_rate": 1.9934707514542754e-05, "loss": 0.9043, "step": 959 }, { "epoch": 0.07, "learning_rate": 1.9934455452687344e-05, "loss": 0.874, "step": 960 }, { "epoch": 0.07, "learning_rate": 1.9934202906825747e-05, "loss": 0.9434, "step": 961 }, { "epoch": 0.07, "learning_rate": 1.9933949876970266e-05, "loss": 0.8799, "step": 962 }, { "epoch": 0.07, "learning_rate": 1.9933696363133234e-05, "loss": 0.958, "step": 963 }, { "epoch": 0.07, "learning_rate": 1.9933442365327004e-05, "loss": 0.9893, "step": 964 }, { "epoch": 0.07, "learning_rate": 1.993318788356394e-05, "loss": 0.9404, "step": 965 }, { "epoch": 0.07, "learning_rate": 1.9932932917856453e-05, "loss": 0.8477, "step": 966 }, { "epoch": 0.07, "learning_rate": 1.9932677468216954e-05, "loss": 0.9336, "step": 967 }, { "epoch": 0.07, "learning_rate": 1.9932421534657893e-05, "loss": 0.8613, "step": 968 }, { "epoch": 0.07, "learning_rate": 1.993216511719174e-05, "loss": 0.8887, "step": 969 }, { "epoch": 0.07, "learning_rate": 1.9931908215830988e-05, "loss": 0.957, "step": 970 }, { "epoch": 0.07, "learning_rate": 1.993165083058815e-05, "loss": 0.9492, "step": 971 }, { "epoch": 0.07, "learning_rate": 1.993139296147577e-05, "loss": 0.9297, "step": 972 }, { "epoch": 0.07, "learning_rate": 1.993113460850641e-05, "loss": 0.9023, "step": 973 }, { "epoch": 0.07, "learning_rate": 1.9930875771692654e-05, "loss": 0.9248, "step": 974 }, { "epoch": 0.07, "learning_rate": 1.9930616451047114e-05, "loss": 0.877, "step": 975 }, { "epoch": 0.07, "learning_rate": 1.993035664658243e-05, "loss": 0.9502, "step": 976 }, { "epoch": 0.07, "learning_rate": 1.9930096358311247e-05, "loss": 0.9238, "step": 977 }, { "epoch": 0.07, "learning_rate": 1.9929835586246254e-05, "loss": 0.9219, "step": 978 }, { "epoch": 0.07, "learning_rate": 1.992957433040016e-05, "loss": 0.9746, "step": 979 }, { "epoch": 0.07, "learning_rate": 1.992931259078569e-05, "loss": 0.877, "step": 980 }, { "epoch": 0.07, "learning_rate": 1.9929050367415593e-05, "loss": 0.8818, "step": 981 }, { "epoch": 0.07, "learning_rate": 1.9928787660302643e-05, "loss": 0.8145, "step": 982 }, { "epoch": 0.07, "learning_rate": 1.9928524469459645e-05, "loss": 0.8926, "step": 983 }, { "epoch": 0.07, "learning_rate": 1.992826079489942e-05, "loss": 0.9404, "step": 984 }, { "epoch": 0.07, "learning_rate": 1.9927996636634814e-05, "loss": 0.8691, "step": 985 }, { "epoch": 0.07, "learning_rate": 1.992773199467869e-05, "loss": 0.9648, "step": 986 }, { "epoch": 0.07, "learning_rate": 1.9927466869043954e-05, "loss": 0.9092, "step": 987 }, { "epoch": 0.07, "learning_rate": 1.9927201259743515e-05, "loss": 0.9814, "step": 988 }, { "epoch": 0.07, "learning_rate": 1.9926935166790314e-05, "loss": 0.9463, "step": 989 }, { "epoch": 0.07, "learning_rate": 1.9926668590197314e-05, "loss": 0.9814, "step": 990 }, { "epoch": 0.07, "learning_rate": 1.992640152997751e-05, "loss": 0.8672, "step": 991 }, { "epoch": 0.07, "learning_rate": 1.99261339861439e-05, "loss": 0.9668, "step": 992 }, { "epoch": 0.07, "learning_rate": 1.9925865958709528e-05, "loss": 0.96, "step": 993 }, { "epoch": 0.07, "learning_rate": 1.9925597447687456e-05, "loss": 0.918, "step": 994 }, { "epoch": 0.07, "learning_rate": 1.9925328453090755e-05, "loss": 0.9473, "step": 995 }, { "epoch": 0.07, "learning_rate": 1.9925058974932535e-05, "loss": 0.9092, "step": 996 }, { "epoch": 0.07, "learning_rate": 1.992478901322593e-05, "loss": 0.8926, "step": 997 }, { "epoch": 0.07, "learning_rate": 1.9924518567984087e-05, "loss": 0.9385, "step": 998 }, { "epoch": 0.07, "learning_rate": 1.9924247639220183e-05, "loss": 0.8896, "step": 999 }, { "epoch": 0.07, "learning_rate": 1.9923976226947417e-05, "loss": 0.9277, "step": 1000 }, { "epoch": 0.07, "learning_rate": 1.9923704331179015e-05, "loss": 0.9307, "step": 1001 }, { "epoch": 0.07, "learning_rate": 1.992343195192822e-05, "loss": 0.9297, "step": 1002 }, { "epoch": 0.07, "learning_rate": 1.9923159089208304e-05, "loss": 0.9238, "step": 1003 }, { "epoch": 0.07, "learning_rate": 1.9922885743032562e-05, "loss": 0.9238, "step": 1004 }, { "epoch": 0.07, "learning_rate": 1.992261191341431e-05, "loss": 1.0029, "step": 1005 }, { "epoch": 0.07, "learning_rate": 1.9922337600366892e-05, "loss": 0.8906, "step": 1006 }, { "epoch": 0.07, "learning_rate": 1.992206280390367e-05, "loss": 0.8457, "step": 1007 }, { "epoch": 0.07, "learning_rate": 1.992178752403803e-05, "loss": 0.9287, "step": 1008 }, { "epoch": 0.07, "learning_rate": 1.9921511760783386e-05, "loss": 0.9102, "step": 1009 }, { "epoch": 0.07, "learning_rate": 1.992123551415317e-05, "loss": 0.8848, "step": 1010 }, { "epoch": 0.07, "learning_rate": 1.992095878416085e-05, "loss": 0.9209, "step": 1011 }, { "epoch": 0.07, "learning_rate": 1.9920681570819896e-05, "loss": 0.8584, "step": 1012 }, { "epoch": 0.07, "learning_rate": 1.992040387414382e-05, "loss": 0.9453, "step": 1013 }, { "epoch": 0.07, "learning_rate": 1.9920125694146154e-05, "loss": 0.9219, "step": 1014 }, { "epoch": 0.07, "learning_rate": 1.9919847030840446e-05, "loss": 0.9336, "step": 1015 }, { "epoch": 0.07, "learning_rate": 1.9919567884240277e-05, "loss": 0.9189, "step": 1016 }, { "epoch": 0.07, "learning_rate": 1.9919288254359242e-05, "loss": 0.9316, "step": 1017 }, { "epoch": 0.07, "learning_rate": 1.9919008141210965e-05, "loss": 0.9141, "step": 1018 }, { "epoch": 0.07, "learning_rate": 1.99187275448091e-05, "loss": 0.9756, "step": 1019 }, { "epoch": 0.07, "learning_rate": 1.9918446465167308e-05, "loss": 0.8779, "step": 1020 }, { "epoch": 0.07, "learning_rate": 1.9918164902299292e-05, "loss": 0.9277, "step": 1021 }, { "epoch": 0.07, "learning_rate": 1.9917882856218767e-05, "loss": 0.8623, "step": 1022 }, { "epoch": 0.07, "learning_rate": 1.9917600326939468e-05, "loss": 0.9258, "step": 1023 }, { "epoch": 0.07, "learning_rate": 1.9917317314475167e-05, "loss": 0.9512, "step": 1024 }, { "epoch": 0.07, "learning_rate": 1.9917033818839648e-05, "loss": 1.0127, "step": 1025 }, { "epoch": 0.07, "learning_rate": 1.9916749840046727e-05, "loss": 0.9746, "step": 1026 }, { "epoch": 0.07, "learning_rate": 1.9916465378110238e-05, "loss": 0.9326, "step": 1027 }, { "epoch": 0.07, "learning_rate": 1.9916180433044035e-05, "loss": 0.8506, "step": 1028 }, { "epoch": 0.07, "learning_rate": 1.9915895004862013e-05, "loss": 0.9678, "step": 1029 }, { "epoch": 0.07, "learning_rate": 1.9915609093578063e-05, "loss": 0.9775, "step": 1030 }, { "epoch": 0.07, "learning_rate": 1.9915322699206127e-05, "loss": 0.9404, "step": 1031 }, { "epoch": 0.07, "learning_rate": 1.9915035821760148e-05, "loss": 0.9082, "step": 1032 }, { "epoch": 0.07, "learning_rate": 1.9914748461254108e-05, "loss": 0.8369, "step": 1033 }, { "epoch": 0.07, "learning_rate": 1.9914460617702003e-05, "loss": 0.8926, "step": 1034 }, { "epoch": 0.07, "learning_rate": 1.9914172291117868e-05, "loss": 0.9004, "step": 1035 }, { "epoch": 0.07, "learning_rate": 1.991388348151574e-05, "loss": 0.8984, "step": 1036 }, { "epoch": 0.07, "learning_rate": 1.9913594188909688e-05, "loss": 0.9785, "step": 1037 }, { "epoch": 0.07, "learning_rate": 1.9913304413313815e-05, "loss": 0.9678, "step": 1038 }, { "epoch": 0.07, "learning_rate": 1.9913014154742236e-05, "loss": 0.8604, "step": 1039 }, { "epoch": 0.07, "learning_rate": 1.9912723413209085e-05, "loss": 0.918, "step": 1040 }, { "epoch": 0.07, "learning_rate": 1.9912432188728536e-05, "loss": 0.9824, "step": 1041 }, { "epoch": 0.07, "learning_rate": 1.9912140481314774e-05, "loss": 0.9434, "step": 1042 }, { "epoch": 0.07, "learning_rate": 1.991184829098201e-05, "loss": 0.8408, "step": 1043 }, { "epoch": 0.07, "learning_rate": 1.9911555617744484e-05, "loss": 0.876, "step": 1044 }, { "epoch": 0.07, "learning_rate": 1.991126246161645e-05, "loss": 0.9121, "step": 1045 }, { "epoch": 0.07, "learning_rate": 1.991096882261219e-05, "loss": 0.9463, "step": 1046 }, { "epoch": 0.07, "learning_rate": 1.9910674700746015e-05, "loss": 0.8848, "step": 1047 }, { "epoch": 0.07, "learning_rate": 1.9910380096032245e-05, "loss": 0.9414, "step": 1048 }, { "epoch": 0.07, "learning_rate": 1.991008500848525e-05, "loss": 0.9873, "step": 1049 }, { "epoch": 0.07, "learning_rate": 1.990978943811939e-05, "loss": 0.8477, "step": 1050 }, { "epoch": 0.07, "learning_rate": 1.9909493384949075e-05, "loss": 0.9629, "step": 1051 }, { "epoch": 0.07, "learning_rate": 1.9909196848988724e-05, "loss": 0.9258, "step": 1052 }, { "epoch": 0.07, "learning_rate": 1.9908899830252786e-05, "loss": 0.9678, "step": 1053 }, { "epoch": 0.07, "learning_rate": 1.9908602328755733e-05, "loss": 0.9854, "step": 1054 }, { "epoch": 0.07, "learning_rate": 1.990830434451206e-05, "loss": 0.8232, "step": 1055 }, { "epoch": 0.07, "learning_rate": 1.9908005877536274e-05, "loss": 0.9453, "step": 1056 }, { "epoch": 0.07, "learning_rate": 1.9907706927842932e-05, "loss": 0.9043, "step": 1057 }, { "epoch": 0.07, "learning_rate": 1.9907407495446587e-05, "loss": 0.957, "step": 1058 }, { "epoch": 0.07, "learning_rate": 1.9907107580361836e-05, "loss": 0.9385, "step": 1059 }, { "epoch": 0.07, "learning_rate": 1.9906807182603285e-05, "loss": 0.9189, "step": 1060 }, { "epoch": 0.07, "learning_rate": 1.990650630218557e-05, "loss": 0.9717, "step": 1061 }, { "epoch": 0.07, "learning_rate": 1.9906204939123355e-05, "loss": 0.8086, "step": 1062 }, { "epoch": 0.07, "learning_rate": 1.9905903093431315e-05, "loss": 0.8008, "step": 1063 }, { "epoch": 0.07, "learning_rate": 1.990560076512416e-05, "loss": 0.8975, "step": 1064 }, { "epoch": 0.07, "learning_rate": 1.990529795421662e-05, "loss": 0.915, "step": 1065 }, { "epoch": 0.07, "learning_rate": 1.9904994660723446e-05, "loss": 0.8867, "step": 1066 }, { "epoch": 0.07, "learning_rate": 1.9904690884659413e-05, "loss": 0.9648, "step": 1067 }, { "epoch": 0.07, "learning_rate": 1.9904386626039328e-05, "loss": 0.8721, "step": 1068 }, { "epoch": 0.07, "learning_rate": 1.9904081884878006e-05, "loss": 0.9463, "step": 1069 }, { "epoch": 0.07, "learning_rate": 1.99037766611903e-05, "loss": 0.9688, "step": 1070 }, { "epoch": 0.07, "learning_rate": 1.9903470954991076e-05, "loss": 1.0195, "step": 1071 }, { "epoch": 0.07, "learning_rate": 1.990316476629523e-05, "loss": 0.9111, "step": 1072 }, { "epoch": 0.07, "learning_rate": 1.990285809511768e-05, "loss": 0.9824, "step": 1073 }, { "epoch": 0.07, "learning_rate": 1.9902550941473365e-05, "loss": 0.917, "step": 1074 }, { "epoch": 0.07, "learning_rate": 1.9902243305377253e-05, "loss": 0.8838, "step": 1075 }, { "epoch": 0.07, "learning_rate": 1.990193518684433e-05, "loss": 0.8721, "step": 1076 }, { "epoch": 0.07, "learning_rate": 1.9901626585889607e-05, "loss": 0.8623, "step": 1077 }, { "epoch": 0.07, "learning_rate": 1.990131750252812e-05, "loss": 0.8447, "step": 1078 }, { "epoch": 0.07, "learning_rate": 1.9901007936774926e-05, "loss": 0.9023, "step": 1079 }, { "epoch": 0.07, "learning_rate": 1.990069788864511e-05, "loss": 0.8721, "step": 1080 }, { "epoch": 0.07, "learning_rate": 1.9900387358153775e-05, "loss": 0.8643, "step": 1081 }, { "epoch": 0.07, "learning_rate": 1.990007634531605e-05, "loss": 0.9502, "step": 1082 }, { "epoch": 0.07, "learning_rate": 1.989976485014709e-05, "loss": 0.9912, "step": 1083 }, { "epoch": 0.07, "learning_rate": 1.9899452872662067e-05, "loss": 0.9541, "step": 1084 }, { "epoch": 0.07, "learning_rate": 1.9899140412876185e-05, "loss": 0.9092, "step": 1085 }, { "epoch": 0.07, "learning_rate": 1.9898827470804663e-05, "loss": 0.8486, "step": 1086 }, { "epoch": 0.07, "learning_rate": 1.989851404646275e-05, "loss": 0.8701, "step": 1087 }, { "epoch": 0.07, "learning_rate": 1.9898200139865714e-05, "loss": 0.7754, "step": 1088 }, { "epoch": 0.07, "learning_rate": 1.9897885751028854e-05, "loss": 0.8457, "step": 1089 }, { "epoch": 0.07, "learning_rate": 1.9897570879967477e-05, "loss": 0.999, "step": 1090 }, { "epoch": 0.07, "learning_rate": 1.9897255526696935e-05, "loss": 0.9297, "step": 1091 }, { "epoch": 0.07, "learning_rate": 1.9896939691232583e-05, "loss": 0.9209, "step": 1092 }, { "epoch": 0.07, "learning_rate": 1.9896623373589815e-05, "loss": 0.9678, "step": 1093 }, { "epoch": 0.07, "learning_rate": 1.9896306573784033e-05, "loss": 0.9121, "step": 1094 }, { "epoch": 0.07, "learning_rate": 1.9895989291830684e-05, "loss": 0.9561, "step": 1095 }, { "epoch": 0.07, "learning_rate": 1.9895671527745217e-05, "loss": 0.9922, "step": 1096 }, { "epoch": 0.07, "learning_rate": 1.9895353281543114e-05, "loss": 0.9258, "step": 1097 }, { "epoch": 0.07, "learning_rate": 1.9895034553239883e-05, "loss": 0.9082, "step": 1098 }, { "epoch": 0.07, "learning_rate": 1.9894715342851048e-05, "loss": 0.9355, "step": 1099 }, { "epoch": 0.07, "learning_rate": 1.989439565039217e-05, "loss": 0.9414, "step": 1100 }, { "epoch": 0.08, "learning_rate": 1.9894075475878812e-05, "loss": 0.9443, "step": 1101 }, { "epoch": 0.08, "learning_rate": 1.9893754819326584e-05, "loss": 0.9004, "step": 1102 }, { "epoch": 0.08, "learning_rate": 1.9893433680751105e-05, "loss": 0.9082, "step": 1103 }, { "epoch": 0.08, "learning_rate": 1.9893112060168014e-05, "loss": 0.9414, "step": 1104 }, { "epoch": 0.08, "learning_rate": 1.989278995759299e-05, "loss": 0.9297, "step": 1105 }, { "epoch": 0.08, "learning_rate": 1.9892467373041722e-05, "loss": 0.8613, "step": 1106 }, { "epoch": 0.08, "learning_rate": 1.9892144306529923e-05, "loss": 0.8975, "step": 1107 }, { "epoch": 0.08, "learning_rate": 1.989182075807334e-05, "loss": 0.9111, "step": 1108 }, { "epoch": 0.08, "learning_rate": 1.9891496727687726e-05, "loss": 0.9072, "step": 1109 }, { "epoch": 0.08, "learning_rate": 1.9891172215388878e-05, "loss": 0.8818, "step": 1110 }, { "epoch": 0.08, "learning_rate": 1.9890847221192603e-05, "loss": 0.9424, "step": 1111 }, { "epoch": 0.08, "learning_rate": 1.989052174511473e-05, "loss": 0.9219, "step": 1112 }, { "epoch": 0.08, "learning_rate": 1.989019578717112e-05, "loss": 0.958, "step": 1113 }, { "epoch": 0.08, "learning_rate": 1.9889869347377657e-05, "loss": 0.9434, "step": 1114 }, { "epoch": 0.08, "learning_rate": 1.988954242575024e-05, "loss": 0.8896, "step": 1115 }, { "epoch": 0.08, "learning_rate": 1.98892150223048e-05, "loss": 0.96, "step": 1116 }, { "epoch": 0.08, "learning_rate": 1.9888887137057283e-05, "loss": 0.835, "step": 1117 }, { "epoch": 0.08, "learning_rate": 1.988855877002367e-05, "loss": 0.9443, "step": 1118 }, { "epoch": 0.08, "learning_rate": 1.988822992121995e-05, "loss": 0.9062, "step": 1119 }, { "epoch": 0.08, "learning_rate": 1.988790059066216e-05, "loss": 0.9521, "step": 1120 }, { "epoch": 0.08, "learning_rate": 1.988757077836633e-05, "loss": 0.9062, "step": 1121 }, { "epoch": 0.08, "learning_rate": 1.9887240484348534e-05, "loss": 0.9619, "step": 1122 }, { "epoch": 0.08, "learning_rate": 1.9886909708624866e-05, "loss": 0.9072, "step": 1123 }, { "epoch": 0.08, "learning_rate": 1.9886578451211436e-05, "loss": 0.9316, "step": 1124 }, { "epoch": 0.08, "learning_rate": 1.9886246712124385e-05, "loss": 0.8818, "step": 1125 }, { "epoch": 0.08, "learning_rate": 1.988591449137988e-05, "loss": 0.8662, "step": 1126 }, { "epoch": 0.08, "learning_rate": 1.98855817889941e-05, "loss": 0.8613, "step": 1127 }, { "epoch": 0.08, "learning_rate": 1.988524860498326e-05, "loss": 0.9668, "step": 1128 }, { "epoch": 0.08, "learning_rate": 1.988491493936359e-05, "loss": 0.9727, "step": 1129 }, { "epoch": 0.08, "learning_rate": 1.9884580792151346e-05, "loss": 0.8623, "step": 1130 }, { "epoch": 0.08, "learning_rate": 1.9884246163362807e-05, "loss": 0.8857, "step": 1131 }, { "epoch": 0.08, "learning_rate": 1.988391105301428e-05, "loss": 0.9238, "step": 1132 }, { "epoch": 0.08, "learning_rate": 1.9883575461122082e-05, "loss": 0.9688, "step": 1133 }, { "epoch": 0.08, "learning_rate": 1.9883239387702572e-05, "loss": 0.9531, "step": 1134 }, { "epoch": 0.08, "learning_rate": 1.9882902832772122e-05, "loss": 0.9141, "step": 1135 }, { "epoch": 0.08, "learning_rate": 1.988256579634713e-05, "loss": 0.9707, "step": 1136 }, { "epoch": 0.08, "learning_rate": 1.988222827844401e-05, "loss": 0.9033, "step": 1137 }, { "epoch": 0.08, "learning_rate": 1.9881890279079212e-05, "loss": 0.9111, "step": 1138 }, { "epoch": 0.08, "learning_rate": 1.9881551798269205e-05, "loss": 0.9092, "step": 1139 }, { "epoch": 0.08, "learning_rate": 1.9881212836030472e-05, "loss": 0.8467, "step": 1140 }, { "epoch": 0.08, "learning_rate": 1.9880873392379533e-05, "loss": 0.8662, "step": 1141 }, { "epoch": 0.08, "learning_rate": 1.9880533467332923e-05, "loss": 0.917, "step": 1142 }, { "epoch": 0.08, "learning_rate": 1.9880193060907206e-05, "loss": 0.835, "step": 1143 }, { "epoch": 0.08, "learning_rate": 1.9879852173118963e-05, "loss": 0.8594, "step": 1144 }, { "epoch": 0.08, "learning_rate": 1.9879510803984807e-05, "loss": 0.8926, "step": 1145 }, { "epoch": 0.08, "learning_rate": 1.9879168953521364e-05, "loss": 0.9707, "step": 1146 }, { "epoch": 0.08, "learning_rate": 1.987882662174529e-05, "loss": 0.8877, "step": 1147 }, { "epoch": 0.08, "learning_rate": 1.9878483808673268e-05, "loss": 0.9658, "step": 1148 }, { "epoch": 0.08, "learning_rate": 1.9878140514321995e-05, "loss": 0.9375, "step": 1149 }, { "epoch": 0.08, "learning_rate": 1.9877796738708198e-05, "loss": 0.9736, "step": 1150 }, { "epoch": 0.08, "learning_rate": 1.9877452481848627e-05, "loss": 0.9404, "step": 1151 }, { "epoch": 0.08, "learning_rate": 1.987710774376005e-05, "loss": 0.8242, "step": 1152 }, { "epoch": 0.08, "learning_rate": 1.987676252445927e-05, "loss": 0.9121, "step": 1153 }, { "epoch": 0.08, "learning_rate": 1.9876416823963096e-05, "loss": 0.8926, "step": 1154 }, { "epoch": 0.08, "learning_rate": 1.987607064228838e-05, "loss": 0.876, "step": 1155 }, { "epoch": 0.08, "learning_rate": 1.987572397945198e-05, "loss": 1.0, "step": 1156 }, { "epoch": 0.08, "learning_rate": 1.9875376835470792e-05, "loss": 0.8857, "step": 1157 }, { "epoch": 0.08, "learning_rate": 1.9875029210361725e-05, "loss": 0.9873, "step": 1158 }, { "epoch": 0.08, "learning_rate": 1.987468110414172e-05, "loss": 0.8555, "step": 1159 }, { "epoch": 0.08, "learning_rate": 1.987433251682773e-05, "loss": 0.9248, "step": 1160 }, { "epoch": 0.08, "learning_rate": 1.987398344843674e-05, "loss": 0.958, "step": 1161 }, { "epoch": 0.08, "learning_rate": 1.987363389898576e-05, "loss": 0.8213, "step": 1162 }, { "epoch": 0.08, "learning_rate": 1.9873283868491817e-05, "loss": 0.9346, "step": 1163 }, { "epoch": 0.08, "learning_rate": 1.9872933356971967e-05, "loss": 0.9512, "step": 1164 }, { "epoch": 0.08, "learning_rate": 1.9872582364443285e-05, "loss": 0.9287, "step": 1165 }, { "epoch": 0.08, "learning_rate": 1.987223089092287e-05, "loss": 0.9248, "step": 1166 }, { "epoch": 0.08, "learning_rate": 1.9871878936427847e-05, "loss": 0.9248, "step": 1167 }, { "epoch": 0.08, "learning_rate": 1.9871526500975365e-05, "loss": 0.9629, "step": 1168 }, { "epoch": 0.08, "learning_rate": 1.9871173584582594e-05, "loss": 0.9385, "step": 1169 }, { "epoch": 0.08, "learning_rate": 1.9870820187266727e-05, "loss": 0.9434, "step": 1170 }, { "epoch": 0.08, "learning_rate": 1.987046630904498e-05, "loss": 0.874, "step": 1171 }, { "epoch": 0.08, "learning_rate": 1.9870111949934597e-05, "loss": 0.9365, "step": 1172 }, { "epoch": 0.08, "learning_rate": 1.9869757109952842e-05, "loss": 0.9854, "step": 1173 }, { "epoch": 0.08, "learning_rate": 1.9869401789117e-05, "loss": 0.9395, "step": 1174 }, { "epoch": 0.08, "learning_rate": 1.9869045987444385e-05, "loss": 0.8779, "step": 1175 }, { "epoch": 0.08, "learning_rate": 1.9868689704952333e-05, "loss": 0.8926, "step": 1176 }, { "epoch": 0.08, "learning_rate": 1.9868332941658198e-05, "loss": 0.9062, "step": 1177 }, { "epoch": 0.08, "learning_rate": 1.9867975697579363e-05, "loss": 0.9512, "step": 1178 }, { "epoch": 0.08, "learning_rate": 1.9867617972733235e-05, "loss": 0.8838, "step": 1179 }, { "epoch": 0.08, "learning_rate": 1.986725976713724e-05, "loss": 0.8496, "step": 1180 }, { "epoch": 0.08, "learning_rate": 1.9866901080808828e-05, "loss": 0.9414, "step": 1181 }, { "epoch": 0.08, "learning_rate": 1.9866541913765478e-05, "loss": 0.8516, "step": 1182 }, { "epoch": 0.08, "learning_rate": 1.9866182266024687e-05, "loss": 0.9395, "step": 1183 }, { "epoch": 0.08, "learning_rate": 1.9865822137603977e-05, "loss": 0.9102, "step": 1184 }, { "epoch": 0.08, "learning_rate": 1.9865461528520896e-05, "loss": 0.915, "step": 1185 }, { "epoch": 0.08, "learning_rate": 1.9865100438793008e-05, "loss": 0.9316, "step": 1186 }, { "epoch": 0.08, "learning_rate": 1.9864738868437907e-05, "loss": 0.916, "step": 1187 }, { "epoch": 0.08, "learning_rate": 1.986437681747321e-05, "loss": 0.9297, "step": 1188 }, { "epoch": 0.08, "learning_rate": 1.9864014285916554e-05, "loss": 0.9121, "step": 1189 }, { "epoch": 0.08, "learning_rate": 1.9863651273785606e-05, "loss": 0.9502, "step": 1190 }, { "epoch": 0.08, "learning_rate": 1.9863287781098047e-05, "loss": 0.9609, "step": 1191 }, { "epoch": 0.08, "learning_rate": 1.986292380787159e-05, "loss": 0.8691, "step": 1192 }, { "epoch": 0.08, "learning_rate": 1.9862559354123963e-05, "loss": 0.8486, "step": 1193 }, { "epoch": 0.08, "learning_rate": 1.9862194419872932e-05, "loss": 0.9258, "step": 1194 }, { "epoch": 0.08, "learning_rate": 1.9861829005136265e-05, "loss": 1.0098, "step": 1195 }, { "epoch": 0.08, "learning_rate": 1.986146310993177e-05, "loss": 0.957, "step": 1196 }, { "epoch": 0.08, "learning_rate": 1.986109673427727e-05, "loss": 0.8867, "step": 1197 }, { "epoch": 0.08, "learning_rate": 1.9860729878190624e-05, "loss": 0.9316, "step": 1198 }, { "epoch": 0.08, "learning_rate": 1.9860362541689696e-05, "loss": 0.8408, "step": 1199 }, { "epoch": 0.08, "learning_rate": 1.9859994724792388e-05, "loss": 1.0, "step": 1200 }, { "epoch": 0.08, "learning_rate": 1.9859626427516614e-05, "loss": 0.9385, "step": 1201 }, { "epoch": 0.08, "learning_rate": 1.9859257649880324e-05, "loss": 0.9053, "step": 1202 }, { "epoch": 0.08, "learning_rate": 1.985888839190148e-05, "loss": 0.9287, "step": 1203 }, { "epoch": 0.08, "learning_rate": 1.985851865359808e-05, "loss": 0.9277, "step": 1204 }, { "epoch": 0.08, "learning_rate": 1.9858148434988126e-05, "loss": 0.9033, "step": 1205 }, { "epoch": 0.08, "learning_rate": 1.985777773608966e-05, "loss": 0.9727, "step": 1206 }, { "epoch": 0.08, "learning_rate": 1.9857406556920748e-05, "loss": 0.9092, "step": 1207 }, { "epoch": 0.08, "learning_rate": 1.9857034897499468e-05, "loss": 0.8916, "step": 1208 }, { "epoch": 0.08, "learning_rate": 1.9856662757843927e-05, "loss": 0.9346, "step": 1209 }, { "epoch": 0.08, "learning_rate": 1.985629013797226e-05, "loss": 0.8984, "step": 1210 }, { "epoch": 0.08, "learning_rate": 1.9855917037902614e-05, "loss": 0.8867, "step": 1211 }, { "epoch": 0.08, "learning_rate": 1.9855543457653176e-05, "loss": 0.9189, "step": 1212 }, { "epoch": 0.08, "learning_rate": 1.9855169397242136e-05, "loss": 0.9258, "step": 1213 }, { "epoch": 0.08, "learning_rate": 1.9854794856687726e-05, "loss": 0.9072, "step": 1214 }, { "epoch": 0.08, "learning_rate": 1.985441983600819e-05, "loss": 0.9404, "step": 1215 }, { "epoch": 0.08, "learning_rate": 1.98540443352218e-05, "loss": 0.8652, "step": 1216 }, { "epoch": 0.08, "learning_rate": 1.9853668354346854e-05, "loss": 0.8779, "step": 1217 }, { "epoch": 0.08, "learning_rate": 1.9853291893401662e-05, "loss": 0.9941, "step": 1218 }, { "epoch": 0.08, "learning_rate": 1.9852914952404574e-05, "loss": 0.9404, "step": 1219 }, { "epoch": 0.08, "learning_rate": 1.9852537531373944e-05, "loss": 0.9639, "step": 1220 }, { "epoch": 0.08, "learning_rate": 1.985215963032817e-05, "loss": 0.9258, "step": 1221 }, { "epoch": 0.08, "learning_rate": 1.985178124928566e-05, "loss": 0.8906, "step": 1222 }, { "epoch": 0.08, "learning_rate": 1.9851402388264846e-05, "loss": 0.9092, "step": 1223 }, { "epoch": 0.08, "learning_rate": 1.985102304728419e-05, "loss": 0.915, "step": 1224 }, { "epoch": 0.08, "learning_rate": 1.985064322636217e-05, "loss": 0.8809, "step": 1225 }, { "epoch": 0.08, "learning_rate": 1.985026292551729e-05, "loss": 0.9785, "step": 1226 }, { "epoch": 0.08, "learning_rate": 1.9849882144768083e-05, "loss": 0.8994, "step": 1227 }, { "epoch": 0.08, "learning_rate": 1.9849500884133102e-05, "loss": 0.9453, "step": 1228 }, { "epoch": 0.08, "learning_rate": 1.9849119143630914e-05, "loss": 0.8965, "step": 1229 }, { "epoch": 0.08, "learning_rate": 1.9848736923280123e-05, "loss": 0.8994, "step": 1230 }, { "epoch": 0.08, "learning_rate": 1.9848354223099346e-05, "loss": 0.9834, "step": 1231 }, { "epoch": 0.08, "learning_rate": 1.9847971043107236e-05, "loss": 0.9131, "step": 1232 }, { "epoch": 0.08, "learning_rate": 1.9847587383322454e-05, "loss": 0.9229, "step": 1233 }, { "epoch": 0.08, "learning_rate": 1.98472032437637e-05, "loss": 0.9238, "step": 1234 }, { "epoch": 0.08, "learning_rate": 1.9846818624449677e-05, "loss": 0.8672, "step": 1235 }, { "epoch": 0.08, "learning_rate": 1.9846433525399135e-05, "loss": 0.9238, "step": 1236 }, { "epoch": 0.08, "learning_rate": 1.984604794663083e-05, "loss": 0.8359, "step": 1237 }, { "epoch": 0.08, "learning_rate": 1.984566188816355e-05, "loss": 0.8838, "step": 1238 }, { "epoch": 0.08, "learning_rate": 1.98452753500161e-05, "loss": 0.9414, "step": 1239 }, { "epoch": 0.08, "learning_rate": 1.9844888332207322e-05, "loss": 0.9443, "step": 1240 }, { "epoch": 0.08, "learning_rate": 1.984450083475606e-05, "loss": 0.96, "step": 1241 }, { "epoch": 0.08, "learning_rate": 1.98441128576812e-05, "loss": 0.8926, "step": 1242 }, { "epoch": 0.08, "learning_rate": 1.984372440100164e-05, "loss": 0.8975, "step": 1243 }, { "epoch": 0.08, "learning_rate": 1.9843335464736305e-05, "loss": 0.8838, "step": 1244 }, { "epoch": 0.08, "learning_rate": 1.984294604890415e-05, "loss": 0.9111, "step": 1245 }, { "epoch": 0.08, "learning_rate": 1.984255615352414e-05, "loss": 0.8516, "step": 1246 }, { "epoch": 0.08, "learning_rate": 1.9842165778615276e-05, "loss": 0.9512, "step": 1247 }, { "epoch": 0.09, "learning_rate": 1.9841774924196574e-05, "loss": 0.9082, "step": 1248 }, { "epoch": 0.09, "learning_rate": 1.984138359028708e-05, "loss": 0.8789, "step": 1249 }, { "epoch": 0.09, "learning_rate": 1.9840991776905857e-05, "loss": 0.9541, "step": 1250 }, { "epoch": 0.09, "learning_rate": 1.9840599484071992e-05, "loss": 0.916, "step": 1251 }, { "epoch": 0.09, "learning_rate": 1.9840206711804605e-05, "loss": 0.917, "step": 1252 }, { "epoch": 0.09, "learning_rate": 1.983981346012282e-05, "loss": 0.832, "step": 1253 }, { "epoch": 0.09, "learning_rate": 1.983941972904581e-05, "loss": 0.9355, "step": 1254 }, { "epoch": 0.09, "learning_rate": 1.9839025518592747e-05, "loss": 0.9453, "step": 1255 }, { "epoch": 0.09, "learning_rate": 1.983863082878284e-05, "loss": 0.9551, "step": 1256 }, { "epoch": 0.09, "learning_rate": 1.983823565963532e-05, "loss": 0.8896, "step": 1257 }, { "epoch": 0.09, "learning_rate": 1.983784001116944e-05, "loss": 0.918, "step": 1258 }, { "epoch": 0.09, "learning_rate": 1.983744388340447e-05, "loss": 0.8906, "step": 1259 }, { "epoch": 0.09, "learning_rate": 1.9837047276359717e-05, "loss": 0.9258, "step": 1260 }, { "epoch": 0.09, "learning_rate": 1.98366501900545e-05, "loss": 0.8721, "step": 1261 }, { "epoch": 0.09, "learning_rate": 1.9836252624508167e-05, "loss": 0.958, "step": 1262 }, { "epoch": 0.09, "learning_rate": 1.9835854579740085e-05, "loss": 0.9082, "step": 1263 }, { "epoch": 0.09, "learning_rate": 1.9835456055769645e-05, "loss": 0.9111, "step": 1264 }, { "epoch": 0.09, "learning_rate": 1.9835057052616265e-05, "loss": 0.9756, "step": 1265 }, { "epoch": 0.09, "learning_rate": 1.9834657570299386e-05, "loss": 0.9561, "step": 1266 }, { "epoch": 0.09, "learning_rate": 1.9834257608838473e-05, "loss": 0.8887, "step": 1267 }, { "epoch": 0.09, "learning_rate": 1.9833857168253007e-05, "loss": 0.9873, "step": 1268 }, { "epoch": 0.09, "learning_rate": 1.9833456248562498e-05, "loss": 0.9805, "step": 1269 }, { "epoch": 0.09, "learning_rate": 1.983305484978648e-05, "loss": 1.0, "step": 1270 }, { "epoch": 0.09, "learning_rate": 1.9832652971944513e-05, "loss": 0.8887, "step": 1271 }, { "epoch": 0.09, "learning_rate": 1.983225061505617e-05, "loss": 0.9072, "step": 1272 }, { "epoch": 0.09, "learning_rate": 1.983184777914106e-05, "loss": 0.8916, "step": 1273 }, { "epoch": 0.09, "learning_rate": 1.9831444464218797e-05, "loss": 0.8682, "step": 1274 }, { "epoch": 0.09, "learning_rate": 1.9831040670309047e-05, "loss": 0.876, "step": 1275 }, { "epoch": 0.09, "learning_rate": 1.9830636397431472e-05, "loss": 0.8857, "step": 1276 }, { "epoch": 0.09, "learning_rate": 1.983023164560577e-05, "loss": 0.8486, "step": 1277 }, { "epoch": 0.09, "learning_rate": 1.9829826414851664e-05, "loss": 0.8896, "step": 1278 }, { "epoch": 0.09, "learning_rate": 1.9829420705188896e-05, "loss": 0.9697, "step": 1279 }, { "epoch": 0.09, "learning_rate": 1.9829014516637227e-05, "loss": 0.8389, "step": 1280 }, { "epoch": 0.09, "learning_rate": 1.9828607849216454e-05, "loss": 0.9531, "step": 1281 }, { "epoch": 0.09, "learning_rate": 1.982820070294638e-05, "loss": 0.8691, "step": 1282 }, { "epoch": 0.09, "learning_rate": 1.9827793077846852e-05, "loss": 0.874, "step": 1283 }, { "epoch": 0.09, "learning_rate": 1.9827384973937723e-05, "loss": 0.8916, "step": 1284 }, { "epoch": 0.09, "learning_rate": 1.9826976391238877e-05, "loss": 0.9297, "step": 1285 }, { "epoch": 0.09, "learning_rate": 1.982656732977022e-05, "loss": 0.9346, "step": 1286 }, { "epoch": 0.09, "learning_rate": 1.982615778955168e-05, "loss": 0.916, "step": 1287 }, { "epoch": 0.09, "learning_rate": 1.9825747770603217e-05, "loss": 0.9248, "step": 1288 }, { "epoch": 0.09, "learning_rate": 1.98253372729448e-05, "loss": 0.8809, "step": 1289 }, { "epoch": 0.09, "learning_rate": 1.982492629659643e-05, "loss": 0.873, "step": 1290 }, { "epoch": 0.09, "learning_rate": 1.9824514841578128e-05, "loss": 0.8984, "step": 1291 }, { "epoch": 0.09, "learning_rate": 1.9824102907909945e-05, "loss": 1.0029, "step": 1292 }, { "epoch": 0.09, "learning_rate": 1.982369049561194e-05, "loss": 0.958, "step": 1293 }, { "epoch": 0.09, "learning_rate": 1.982327760470422e-05, "loss": 0.9141, "step": 1294 }, { "epoch": 0.09, "learning_rate": 1.9822864235206895e-05, "loss": 0.8691, "step": 1295 }, { "epoch": 0.09, "learning_rate": 1.9822450387140104e-05, "loss": 0.9795, "step": 1296 }, { "epoch": 0.09, "learning_rate": 1.9822036060524e-05, "loss": 0.8369, "step": 1297 }, { "epoch": 0.09, "learning_rate": 1.9821621255378788e-05, "loss": 0.9121, "step": 1298 }, { "epoch": 0.09, "learning_rate": 1.9821205971724664e-05, "loss": 0.959, "step": 1299 }, { "epoch": 0.09, "learning_rate": 1.9820790209581865e-05, "loss": 0.9023, "step": 1300 }, { "epoch": 0.09, "learning_rate": 1.9820373968970642e-05, "loss": 0.8535, "step": 1301 }, { "epoch": 0.09, "learning_rate": 1.981995724991128e-05, "loss": 0.9775, "step": 1302 }, { "epoch": 0.09, "learning_rate": 1.9819540052424084e-05, "loss": 0.8633, "step": 1303 }, { "epoch": 0.09, "learning_rate": 1.9819122376529372e-05, "loss": 0.9785, "step": 1304 }, { "epoch": 0.09, "learning_rate": 1.9818704222247498e-05, "loss": 0.8926, "step": 1305 }, { "epoch": 0.09, "learning_rate": 1.981828558959883e-05, "loss": 0.8125, "step": 1306 }, { "epoch": 0.09, "learning_rate": 1.981786647860377e-05, "loss": 0.8145, "step": 1307 }, { "epoch": 0.09, "learning_rate": 1.981744688928273e-05, "loss": 0.9375, "step": 1308 }, { "epoch": 0.09, "learning_rate": 1.981702682165616e-05, "loss": 0.8281, "step": 1309 }, { "epoch": 0.09, "learning_rate": 1.9816606275744524e-05, "loss": 0.8809, "step": 1310 }, { "epoch": 0.09, "learning_rate": 1.9816185251568305e-05, "loss": 0.8916, "step": 1311 }, { "epoch": 0.09, "learning_rate": 1.981576374914802e-05, "loss": 0.9189, "step": 1312 }, { "epoch": 0.09, "learning_rate": 1.9815341768504203e-05, "loss": 0.9062, "step": 1313 }, { "epoch": 0.09, "learning_rate": 1.9814919309657418e-05, "loss": 0.9414, "step": 1314 }, { "epoch": 0.09, "learning_rate": 1.981449637262824e-05, "loss": 0.9209, "step": 1315 }, { "epoch": 0.09, "learning_rate": 1.9814072957437272e-05, "loss": 0.877, "step": 1316 }, { "epoch": 0.09, "learning_rate": 1.9813649064105154e-05, "loss": 0.9082, "step": 1317 }, { "epoch": 0.09, "learning_rate": 1.9813224692652534e-05, "loss": 0.9248, "step": 1318 }, { "epoch": 0.09, "learning_rate": 1.981279984310008e-05, "loss": 0.916, "step": 1319 }, { "epoch": 0.09, "learning_rate": 1.98123745154685e-05, "loss": 0.8643, "step": 1320 }, { "epoch": 0.09, "learning_rate": 1.9811948709778513e-05, "loss": 0.9258, "step": 1321 }, { "epoch": 0.09, "learning_rate": 1.9811522426050862e-05, "loss": 0.8467, "step": 1322 }, { "epoch": 0.09, "learning_rate": 1.9811095664306315e-05, "loss": 0.8945, "step": 1323 }, { "epoch": 0.09, "learning_rate": 1.9810668424565665e-05, "loss": 0.9258, "step": 1324 }, { "epoch": 0.09, "learning_rate": 1.981024070684973e-05, "loss": 0.877, "step": 1325 }, { "epoch": 0.09, "learning_rate": 1.980981251117935e-05, "loss": 0.957, "step": 1326 }, { "epoch": 0.09, "learning_rate": 1.9809383837575378e-05, "loss": 0.8623, "step": 1327 }, { "epoch": 0.09, "learning_rate": 1.9808954686058707e-05, "loss": 0.8926, "step": 1328 }, { "epoch": 0.09, "learning_rate": 1.9808525056650238e-05, "loss": 0.8525, "step": 1329 }, { "epoch": 0.09, "learning_rate": 1.980809494937091e-05, "loss": 0.8506, "step": 1330 }, { "epoch": 0.09, "learning_rate": 1.9807664364241672e-05, "loss": 0.9395, "step": 1331 }, { "epoch": 0.09, "learning_rate": 1.9807233301283503e-05, "loss": 0.9473, "step": 1332 }, { "epoch": 0.09, "learning_rate": 1.980680176051741e-05, "loss": 0.8672, "step": 1333 }, { "epoch": 0.09, "learning_rate": 1.980636974196441e-05, "loss": 0.8887, "step": 1334 }, { "epoch": 0.09, "learning_rate": 1.9805937245645556e-05, "loss": 0.9766, "step": 1335 }, { "epoch": 0.09, "learning_rate": 1.9805504271581917e-05, "loss": 0.9385, "step": 1336 }, { "epoch": 0.09, "learning_rate": 1.980507081979459e-05, "loss": 0.9287, "step": 1337 }, { "epoch": 0.09, "learning_rate": 1.9804636890304688e-05, "loss": 0.9082, "step": 1338 }, { "epoch": 0.09, "learning_rate": 1.9804202483133358e-05, "loss": 0.9551, "step": 1339 }, { "epoch": 0.09, "learning_rate": 1.980376759830176e-05, "loss": 0.915, "step": 1340 }, { "epoch": 0.09, "learning_rate": 1.980333223583108e-05, "loss": 0.9092, "step": 1341 }, { "epoch": 0.09, "learning_rate": 1.9802896395742533e-05, "loss": 0.9385, "step": 1342 }, { "epoch": 0.09, "learning_rate": 1.9802460078057355e-05, "loss": 0.9619, "step": 1343 }, { "epoch": 0.09, "learning_rate": 1.9802023282796797e-05, "loss": 0.8232, "step": 1344 }, { "epoch": 0.09, "learning_rate": 1.9801586009982143e-05, "loss": 0.8105, "step": 1345 }, { "epoch": 0.09, "learning_rate": 1.9801148259634698e-05, "loss": 0.9053, "step": 1346 }, { "epoch": 0.09, "learning_rate": 1.9800710031775786e-05, "loss": 0.8975, "step": 1347 }, { "epoch": 0.09, "learning_rate": 1.980027132642676e-05, "loss": 0.9004, "step": 1348 }, { "epoch": 0.09, "learning_rate": 1.979983214360899e-05, "loss": 0.918, "step": 1349 }, { "epoch": 0.09, "learning_rate": 1.9799392483343878e-05, "loss": 0.8496, "step": 1350 }, { "epoch": 0.09, "learning_rate": 1.979895234565284e-05, "loss": 0.8662, "step": 1351 }, { "epoch": 0.09, "learning_rate": 1.9798511730557325e-05, "loss": 0.873, "step": 1352 }, { "epoch": 0.09, "learning_rate": 1.9798070638078797e-05, "loss": 0.9404, "step": 1353 }, { "epoch": 0.09, "learning_rate": 1.9797629068238744e-05, "loss": 0.8906, "step": 1354 }, { "epoch": 0.09, "learning_rate": 1.9797187021058678e-05, "loss": 0.9248, "step": 1355 }, { "epoch": 0.09, "learning_rate": 1.979674449656014e-05, "loss": 0.9443, "step": 1356 }, { "epoch": 0.09, "learning_rate": 1.979630149476469e-05, "loss": 0.9482, "step": 1357 }, { "epoch": 0.09, "learning_rate": 1.9795858015693908e-05, "loss": 0.9375, "step": 1358 }, { "epoch": 0.09, "learning_rate": 1.97954140593694e-05, "loss": 0.8857, "step": 1359 }, { "epoch": 0.09, "learning_rate": 1.9794969625812798e-05, "loss": 0.9072, "step": 1360 }, { "epoch": 0.09, "learning_rate": 1.9794524715045753e-05, "loss": 0.917, "step": 1361 }, { "epoch": 0.09, "learning_rate": 1.9794079327089938e-05, "loss": 0.957, "step": 1362 }, { "epoch": 0.09, "learning_rate": 1.979363346196706e-05, "loss": 0.8926, "step": 1363 }, { "epoch": 0.09, "learning_rate": 1.9793187119698837e-05, "loss": 0.9141, "step": 1364 }, { "epoch": 0.09, "learning_rate": 1.9792740300307014e-05, "loss": 0.9766, "step": 1365 }, { "epoch": 0.09, "learning_rate": 1.979229300381336e-05, "loss": 0.8818, "step": 1366 }, { "epoch": 0.09, "learning_rate": 1.979184523023967e-05, "loss": 0.9092, "step": 1367 }, { "epoch": 0.09, "learning_rate": 1.979139697960776e-05, "loss": 0.8975, "step": 1368 }, { "epoch": 0.09, "learning_rate": 1.9790948251939462e-05, "loss": 0.9248, "step": 1369 }, { "epoch": 0.09, "learning_rate": 1.9790499047256646e-05, "loss": 0.8516, "step": 1370 }, { "epoch": 0.09, "learning_rate": 1.9790049365581195e-05, "loss": 0.9121, "step": 1371 }, { "epoch": 0.09, "learning_rate": 1.9789599206935013e-05, "loss": 0.8672, "step": 1372 }, { "epoch": 0.09, "learning_rate": 1.9789148571340035e-05, "loss": 0.9629, "step": 1373 }, { "epoch": 0.09, "learning_rate": 1.978869745881822e-05, "loss": 0.877, "step": 1374 }, { "epoch": 0.09, "learning_rate": 1.978824586939154e-05, "loss": 0.9414, "step": 1375 }, { "epoch": 0.09, "learning_rate": 1.9787793803081995e-05, "loss": 0.9023, "step": 1376 }, { "epoch": 0.09, "learning_rate": 1.9787341259911618e-05, "loss": 0.874, "step": 1377 }, { "epoch": 0.09, "learning_rate": 1.978688823990245e-05, "loss": 0.9326, "step": 1378 }, { "epoch": 0.09, "learning_rate": 1.9786434743076564e-05, "loss": 0.9102, "step": 1379 }, { "epoch": 0.09, "learning_rate": 1.9785980769456054e-05, "loss": 0.9648, "step": 1380 }, { "epoch": 0.09, "learning_rate": 1.978552631906304e-05, "loss": 0.958, "step": 1381 }, { "epoch": 0.09, "learning_rate": 1.978507139191966e-05, "loss": 0.9199, "step": 1382 }, { "epoch": 0.09, "learning_rate": 1.9784615988048078e-05, "loss": 0.9541, "step": 1383 }, { "epoch": 0.09, "learning_rate": 1.9784160107470483e-05, "loss": 0.959, "step": 1384 }, { "epoch": 0.09, "learning_rate": 1.9783703750209085e-05, "loss": 0.9463, "step": 1385 }, { "epoch": 0.09, "learning_rate": 1.978324691628612e-05, "loss": 0.9131, "step": 1386 }, { "epoch": 0.09, "learning_rate": 1.978278960572384e-05, "loss": 0.8652, "step": 1387 }, { "epoch": 0.09, "learning_rate": 1.9782331818544526e-05, "loss": 0.8076, "step": 1388 }, { "epoch": 0.09, "learning_rate": 1.9781873554770484e-05, "loss": 0.8975, "step": 1389 }, { "epoch": 0.09, "learning_rate": 1.9781414814424044e-05, "loss": 0.9541, "step": 1390 }, { "epoch": 0.09, "learning_rate": 1.9780955597527544e-05, "loss": 0.9033, "step": 1391 }, { "epoch": 0.09, "learning_rate": 1.978049590410337e-05, "loss": 0.9697, "step": 1392 }, { "epoch": 0.09, "learning_rate": 1.9780035734173907e-05, "loss": 0.9072, "step": 1393 }, { "epoch": 0.09, "learning_rate": 1.9779575087761583e-05, "loss": 0.9199, "step": 1394 }, { "epoch": 0.1, "learning_rate": 1.9779113964888838e-05, "loss": 0.9219, "step": 1395 }, { "epoch": 0.1, "learning_rate": 1.9778652365578135e-05, "loss": 0.9463, "step": 1396 }, { "epoch": 0.1, "learning_rate": 1.977819028985197e-05, "loss": 0.9277, "step": 1397 }, { "epoch": 0.1, "learning_rate": 1.9777727737732845e-05, "loss": 0.9053, "step": 1398 }, { "epoch": 0.1, "learning_rate": 1.9777264709243305e-05, "loss": 0.9512, "step": 1399 }, { "epoch": 0.1, "learning_rate": 1.9776801204405906e-05, "loss": 0.8994, "step": 1400 }, { "epoch": 0.1, "learning_rate": 1.9776337223243228e-05, "loss": 0.9512, "step": 1401 }, { "epoch": 0.1, "learning_rate": 1.9775872765777878e-05, "loss": 0.9365, "step": 1402 }, { "epoch": 0.1, "learning_rate": 1.977540783203248e-05, "loss": 0.874, "step": 1403 }, { "epoch": 0.1, "learning_rate": 1.9774942422029695e-05, "loss": 0.957, "step": 1404 }, { "epoch": 0.1, "learning_rate": 1.9774476535792188e-05, "loss": 0.8662, "step": 1405 }, { "epoch": 0.1, "learning_rate": 1.977401017334266e-05, "loss": 0.9443, "step": 1406 }, { "epoch": 0.1, "learning_rate": 1.9773543334703836e-05, "loss": 0.9355, "step": 1407 }, { "epoch": 0.1, "learning_rate": 1.9773076019898457e-05, "loss": 0.9502, "step": 1408 }, { "epoch": 0.1, "learning_rate": 1.9772608228949292e-05, "loss": 0.874, "step": 1409 }, { "epoch": 0.1, "learning_rate": 1.9772139961879126e-05, "loss": 0.9424, "step": 1410 }, { "epoch": 0.1, "learning_rate": 1.977167121871078e-05, "loss": 0.9033, "step": 1411 }, { "epoch": 0.1, "learning_rate": 1.9771201999467088e-05, "loss": 0.9277, "step": 1412 }, { "epoch": 0.1, "learning_rate": 1.9770732304170915e-05, "loss": 0.8701, "step": 1413 }, { "epoch": 0.1, "learning_rate": 1.9770262132845136e-05, "loss": 0.9492, "step": 1414 }, { "epoch": 0.1, "learning_rate": 1.9769791485512665e-05, "loss": 0.9102, "step": 1415 }, { "epoch": 0.1, "learning_rate": 1.976932036219643e-05, "loss": 1.0049, "step": 1416 }, { "epoch": 0.1, "learning_rate": 1.976884876291938e-05, "loss": 0.832, "step": 1417 }, { "epoch": 0.1, "learning_rate": 1.9768376687704494e-05, "loss": 0.792, "step": 1418 }, { "epoch": 0.1, "learning_rate": 1.9767904136574778e-05, "loss": 0.874, "step": 1419 }, { "epoch": 0.1, "learning_rate": 1.9767431109553247e-05, "loss": 0.7822, "step": 1420 }, { "epoch": 0.1, "learning_rate": 1.9766957606662945e-05, "loss": 0.9023, "step": 1421 }, { "epoch": 0.1, "learning_rate": 1.976648362792695e-05, "loss": 0.8955, "step": 1422 }, { "epoch": 0.1, "learning_rate": 1.9766009173368344e-05, "loss": 0.918, "step": 1423 }, { "epoch": 0.1, "learning_rate": 1.9765534243010248e-05, "loss": 0.9141, "step": 1424 }, { "epoch": 0.1, "learning_rate": 1.9765058836875802e-05, "loss": 0.9102, "step": 1425 }, { "epoch": 0.1, "learning_rate": 1.976458295498816e-05, "loss": 0.9893, "step": 1426 }, { "epoch": 0.1, "learning_rate": 1.976410659737052e-05, "loss": 0.9014, "step": 1427 }, { "epoch": 0.1, "learning_rate": 1.976362976404608e-05, "loss": 0.9023, "step": 1428 }, { "epoch": 0.1, "learning_rate": 1.9763152455038076e-05, "loss": 0.916, "step": 1429 }, { "epoch": 0.1, "learning_rate": 1.9762674670369757e-05, "loss": 0.998, "step": 1430 }, { "epoch": 0.1, "learning_rate": 1.9762196410064406e-05, "loss": 0.9443, "step": 1431 }, { "epoch": 0.1, "learning_rate": 1.976171767414532e-05, "loss": 0.9258, "step": 1432 }, { "epoch": 0.1, "learning_rate": 1.9761238462635827e-05, "loss": 0.8408, "step": 1433 }, { "epoch": 0.1, "learning_rate": 1.9760758775559275e-05, "loss": 0.9004, "step": 1434 }, { "epoch": 0.1, "learning_rate": 1.976027861293903e-05, "loss": 0.916, "step": 1435 }, { "epoch": 0.1, "learning_rate": 1.9759797974798484e-05, "loss": 0.8594, "step": 1436 }, { "epoch": 0.1, "learning_rate": 1.9759316861161056e-05, "loss": 0.957, "step": 1437 }, { "epoch": 0.1, "learning_rate": 1.9758835272050188e-05, "loss": 0.9268, "step": 1438 }, { "epoch": 0.1, "learning_rate": 1.9758353207489342e-05, "loss": 0.9277, "step": 1439 }, { "epoch": 0.1, "learning_rate": 1.9757870667502e-05, "loss": 0.8672, "step": 1440 }, { "epoch": 0.1, "learning_rate": 1.9757387652111682e-05, "loss": 0.958, "step": 1441 }, { "epoch": 0.1, "learning_rate": 1.975690416134191e-05, "loss": 0.8145, "step": 1442 }, { "epoch": 0.1, "learning_rate": 1.9756420195216243e-05, "loss": 0.9355, "step": 1443 }, { "epoch": 0.1, "learning_rate": 1.9755935753758256e-05, "loss": 0.9707, "step": 1444 }, { "epoch": 0.1, "learning_rate": 1.9755450836991562e-05, "loss": 0.8623, "step": 1445 }, { "epoch": 0.1, "learning_rate": 1.9754965444939774e-05, "loss": 0.9199, "step": 1446 }, { "epoch": 0.1, "learning_rate": 1.9754479577626547e-05, "loss": 0.8965, "step": 1447 }, { "epoch": 0.1, "learning_rate": 1.975399323507555e-05, "loss": 0.9268, "step": 1448 }, { "epoch": 0.1, "learning_rate": 1.9753506417310476e-05, "loss": 0.8906, "step": 1449 }, { "epoch": 0.1, "learning_rate": 1.975301912435505e-05, "loss": 0.9102, "step": 1450 }, { "epoch": 0.1, "learning_rate": 1.9752531356233007e-05, "loss": 0.8369, "step": 1451 }, { "epoch": 0.1, "learning_rate": 1.9752043112968107e-05, "loss": 0.9102, "step": 1452 }, { "epoch": 0.1, "learning_rate": 1.9751554394584146e-05, "loss": 0.9639, "step": 1453 }, { "epoch": 0.1, "learning_rate": 1.975106520110493e-05, "loss": 0.9844, "step": 1454 }, { "epoch": 0.1, "learning_rate": 1.975057553255429e-05, "loss": 0.9336, "step": 1455 }, { "epoch": 0.1, "learning_rate": 1.975008538895609e-05, "loss": 0.8828, "step": 1456 }, { "epoch": 0.1, "learning_rate": 1.9749594770334207e-05, "loss": 0.9541, "step": 1457 }, { "epoch": 0.1, "learning_rate": 1.9749103676712537e-05, "loss": 0.8955, "step": 1458 }, { "epoch": 0.1, "learning_rate": 1.9748612108115016e-05, "loss": 0.9727, "step": 1459 }, { "epoch": 0.1, "learning_rate": 1.9748120064565587e-05, "loss": 0.9404, "step": 1460 }, { "epoch": 0.1, "learning_rate": 1.974762754608822e-05, "loss": 0.7588, "step": 1461 }, { "epoch": 0.1, "learning_rate": 1.9747134552706917e-05, "loss": 0.8594, "step": 1462 }, { "epoch": 0.1, "learning_rate": 1.9746641084445692e-05, "loss": 0.874, "step": 1463 }, { "epoch": 0.1, "learning_rate": 1.974614714132859e-05, "loss": 0.8809, "step": 1464 }, { "epoch": 0.1, "learning_rate": 1.9745652723379674e-05, "loss": 0.9434, "step": 1465 }, { "epoch": 0.1, "learning_rate": 1.974515783062304e-05, "loss": 0.877, "step": 1466 }, { "epoch": 0.1, "learning_rate": 1.9744662463082782e-05, "loss": 0.8896, "step": 1467 }, { "epoch": 0.1, "learning_rate": 1.9744166620783047e-05, "loss": 1.0244, "step": 1468 }, { "epoch": 0.1, "learning_rate": 1.974367030374799e-05, "loss": 0.8945, "step": 1469 }, { "epoch": 0.1, "learning_rate": 1.974317351200179e-05, "loss": 0.8877, "step": 1470 }, { "epoch": 0.1, "learning_rate": 1.9742676245568652e-05, "loss": 0.8896, "step": 1471 }, { "epoch": 0.1, "learning_rate": 1.9742178504472805e-05, "loss": 0.8857, "step": 1472 }, { "epoch": 0.1, "learning_rate": 1.9741680288738495e-05, "loss": 0.9531, "step": 1473 }, { "epoch": 0.1, "learning_rate": 1.9741181598389995e-05, "loss": 0.9521, "step": 1474 }, { "epoch": 0.1, "learning_rate": 1.9740682433451604e-05, "loss": 0.8867, "step": 1475 }, { "epoch": 0.1, "learning_rate": 1.9740182793947636e-05, "loss": 0.8857, "step": 1476 }, { "epoch": 0.1, "learning_rate": 1.973968267990244e-05, "loss": 0.9805, "step": 1477 }, { "epoch": 0.1, "learning_rate": 1.973918209134038e-05, "loss": 0.9873, "step": 1478 }, { "epoch": 0.1, "learning_rate": 1.9738681028285845e-05, "loss": 0.9453, "step": 1479 }, { "epoch": 0.1, "learning_rate": 1.9738179490763242e-05, "loss": 0.9619, "step": 1480 }, { "epoch": 0.1, "learning_rate": 1.973767747879701e-05, "loss": 0.9658, "step": 1481 }, { "epoch": 0.1, "learning_rate": 1.9737174992411608e-05, "loss": 0.9326, "step": 1482 }, { "epoch": 0.1, "learning_rate": 1.973667203163151e-05, "loss": 0.9072, "step": 1483 }, { "epoch": 0.1, "learning_rate": 1.973616859648123e-05, "loss": 0.9717, "step": 1484 }, { "epoch": 0.1, "learning_rate": 1.973566468698529e-05, "loss": 0.8848, "step": 1485 }, { "epoch": 0.1, "learning_rate": 1.9735160303168238e-05, "loss": 0.9717, "step": 1486 }, { "epoch": 0.1, "learning_rate": 1.9734655445054654e-05, "loss": 0.9043, "step": 1487 }, { "epoch": 0.1, "learning_rate": 1.9734150112669132e-05, "loss": 0.8691, "step": 1488 }, { "epoch": 0.1, "learning_rate": 1.973364430603629e-05, "loss": 0.7881, "step": 1489 }, { "epoch": 0.1, "learning_rate": 1.9733138025180775e-05, "loss": 0.874, "step": 1490 }, { "epoch": 0.1, "learning_rate": 1.9732631270127246e-05, "loss": 0.9043, "step": 1491 }, { "epoch": 0.1, "learning_rate": 1.9732124040900395e-05, "loss": 0.8721, "step": 1492 }, { "epoch": 0.1, "learning_rate": 1.973161633752494e-05, "loss": 0.9297, "step": 1493 }, { "epoch": 0.1, "learning_rate": 1.9731108160025608e-05, "loss": 0.9482, "step": 1494 }, { "epoch": 0.1, "learning_rate": 1.9730599508427164e-05, "loss": 0.8848, "step": 1495 }, { "epoch": 0.1, "learning_rate": 1.9730090382754384e-05, "loss": 0.8682, "step": 1496 }, { "epoch": 0.1, "learning_rate": 1.9729580783032077e-05, "loss": 0.8984, "step": 1497 }, { "epoch": 0.1, "learning_rate": 1.9729070709285066e-05, "loss": 0.8994, "step": 1498 }, { "epoch": 0.1, "learning_rate": 1.972856016153821e-05, "loss": 0.9902, "step": 1499 }, { "epoch": 0.1, "learning_rate": 1.9728049139816373e-05, "loss": 0.8262, "step": 1500 }, { "epoch": 0.1, "learning_rate": 1.9727537644144455e-05, "loss": 0.9248, "step": 1501 }, { "epoch": 0.1, "learning_rate": 1.972702567454738e-05, "loss": 0.8916, "step": 1502 }, { "epoch": 0.1, "learning_rate": 1.9726513231050087e-05, "loss": 0.9219, "step": 1503 }, { "epoch": 0.1, "learning_rate": 1.972600031367754e-05, "loss": 0.8994, "step": 1504 }, { "epoch": 0.1, "learning_rate": 1.972548692245474e-05, "loss": 0.9785, "step": 1505 }, { "epoch": 0.1, "learning_rate": 1.9724973057406687e-05, "loss": 0.9863, "step": 1506 }, { "epoch": 0.1, "learning_rate": 1.9724458718558424e-05, "loss": 0.9707, "step": 1507 }, { "epoch": 0.1, "learning_rate": 1.9723943905935002e-05, "loss": 0.9365, "step": 1508 }, { "epoch": 0.1, "learning_rate": 1.972342861956151e-05, "loss": 0.9268, "step": 1509 }, { "epoch": 0.1, "learning_rate": 1.9722912859463047e-05, "loss": 0.8906, "step": 1510 }, { "epoch": 0.1, "learning_rate": 1.9722396625664747e-05, "loss": 0.8701, "step": 1511 }, { "epoch": 0.1, "learning_rate": 1.972187991819176e-05, "loss": 0.8975, "step": 1512 }, { "epoch": 0.1, "learning_rate": 1.9721362737069253e-05, "loss": 0.9609, "step": 1513 }, { "epoch": 0.1, "learning_rate": 1.9720845082322426e-05, "loss": 0.9424, "step": 1514 }, { "epoch": 0.1, "learning_rate": 1.9720326953976504e-05, "loss": 0.9727, "step": 1515 }, { "epoch": 0.1, "learning_rate": 1.9719808352056728e-05, "loss": 0.9775, "step": 1516 }, { "epoch": 0.1, "learning_rate": 1.971928927658836e-05, "loss": 0.9404, "step": 1517 }, { "epoch": 0.1, "learning_rate": 1.971876972759669e-05, "loss": 0.917, "step": 1518 }, { "epoch": 0.1, "learning_rate": 1.971824970510704e-05, "loss": 0.8613, "step": 1519 }, { "epoch": 0.1, "learning_rate": 1.9717729209144732e-05, "loss": 0.9922, "step": 1520 }, { "epoch": 0.1, "learning_rate": 1.9717208239735135e-05, "loss": 0.9238, "step": 1521 }, { "epoch": 0.1, "learning_rate": 1.9716686796903622e-05, "loss": 0.8613, "step": 1522 }, { "epoch": 0.1, "learning_rate": 1.9716164880675606e-05, "loss": 0.998, "step": 1523 }, { "epoch": 0.1, "learning_rate": 1.971564249107651e-05, "loss": 0.8828, "step": 1524 }, { "epoch": 0.1, "learning_rate": 1.9715119628131786e-05, "loss": 0.9082, "step": 1525 }, { "epoch": 0.1, "learning_rate": 1.9714596291866905e-05, "loss": 0.9043, "step": 1526 }, { "epoch": 0.1, "learning_rate": 1.971407248230737e-05, "loss": 0.9453, "step": 1527 }, { "epoch": 0.1, "learning_rate": 1.9713548199478697e-05, "loss": 0.8447, "step": 1528 }, { "epoch": 0.1, "learning_rate": 1.9713023443406425e-05, "loss": 0.9072, "step": 1529 }, { "epoch": 0.1, "learning_rate": 1.971249821411613e-05, "loss": 0.8945, "step": 1530 }, { "epoch": 0.1, "learning_rate": 1.971197251163339e-05, "loss": 0.8623, "step": 1531 }, { "epoch": 0.1, "learning_rate": 1.9711446335983826e-05, "loss": 0.9072, "step": 1532 }, { "epoch": 0.1, "learning_rate": 1.971091968719307e-05, "loss": 0.9512, "step": 1533 }, { "epoch": 0.1, "learning_rate": 1.9710392565286782e-05, "loss": 0.8223, "step": 1534 }, { "epoch": 0.1, "learning_rate": 1.970986497029064e-05, "loss": 0.8984, "step": 1535 }, { "epoch": 0.1, "learning_rate": 1.970933690223035e-05, "loss": 0.8086, "step": 1536 }, { "epoch": 0.1, "learning_rate": 1.970880836113164e-05, "loss": 0.9062, "step": 1537 }, { "epoch": 0.1, "learning_rate": 1.970827934702026e-05, "loss": 0.8926, "step": 1538 }, { "epoch": 0.1, "learning_rate": 1.9707749859921982e-05, "loss": 0.9346, "step": 1539 }, { "epoch": 0.1, "learning_rate": 1.9707219899862608e-05, "loss": 0.8867, "step": 1540 }, { "epoch": 0.11, "learning_rate": 1.970668946686795e-05, "loss": 0.9551, "step": 1541 }, { "epoch": 0.11, "learning_rate": 1.970615856096386e-05, "loss": 0.9062, "step": 1542 }, { "epoch": 0.11, "learning_rate": 1.9705627182176194e-05, "loss": 0.9014, "step": 1543 }, { "epoch": 0.11, "learning_rate": 1.9705095330530845e-05, "loss": 0.7646, "step": 1544 }, { "epoch": 0.11, "learning_rate": 1.9704563006053724e-05, "loss": 0.9092, "step": 1545 }, { "epoch": 0.11, "learning_rate": 1.9704030208770767e-05, "loss": 0.8467, "step": 1546 }, { "epoch": 0.11, "learning_rate": 1.9703496938707934e-05, "loss": 0.8857, "step": 1547 }, { "epoch": 0.11, "learning_rate": 1.9702963195891202e-05, "loss": 0.7852, "step": 1548 }, { "epoch": 0.11, "learning_rate": 1.9702428980346578e-05, "loss": 0.9385, "step": 1549 }, { "epoch": 0.11, "learning_rate": 1.9701894292100087e-05, "loss": 0.8477, "step": 1550 }, { "epoch": 0.11, "learning_rate": 1.9701359131177775e-05, "loss": 0.8838, "step": 1551 }, { "epoch": 0.11, "learning_rate": 1.9700823497605723e-05, "loss": 0.8789, "step": 1552 }, { "epoch": 0.11, "learning_rate": 1.970028739141002e-05, "loss": 0.8965, "step": 1553 }, { "epoch": 0.11, "learning_rate": 1.9699750812616793e-05, "loss": 0.8887, "step": 1554 }, { "epoch": 0.11, "learning_rate": 1.9699213761252177e-05, "loss": 0.9473, "step": 1555 }, { "epoch": 0.11, "learning_rate": 1.9698676237342338e-05, "loss": 0.8848, "step": 1556 }, { "epoch": 0.11, "learning_rate": 1.9698138240913468e-05, "loss": 0.9658, "step": 1557 }, { "epoch": 0.11, "learning_rate": 1.9697599771991774e-05, "loss": 0.9043, "step": 1558 }, { "epoch": 0.11, "learning_rate": 1.9697060830603495e-05, "loss": 0.9512, "step": 1559 }, { "epoch": 0.11, "learning_rate": 1.9696521416774882e-05, "loss": 0.8818, "step": 1560 }, { "epoch": 0.11, "learning_rate": 1.969598153053222e-05, "loss": 0.9746, "step": 1561 }, { "epoch": 0.11, "learning_rate": 1.969544117190181e-05, "loss": 0.9121, "step": 1562 }, { "epoch": 0.11, "learning_rate": 1.969490034090998e-05, "loss": 0.8945, "step": 1563 }, { "epoch": 0.11, "learning_rate": 1.9694359037583076e-05, "loss": 0.9062, "step": 1564 }, { "epoch": 0.11, "learning_rate": 1.9693817261947474e-05, "loss": 0.9336, "step": 1565 }, { "epoch": 0.11, "learning_rate": 1.9693275014029568e-05, "loss": 0.9473, "step": 1566 }, { "epoch": 0.11, "learning_rate": 1.9692732293855777e-05, "loss": 0.8359, "step": 1567 }, { "epoch": 0.11, "learning_rate": 1.9692189101452535e-05, "loss": 0.8652, "step": 1568 }, { "epoch": 0.11, "learning_rate": 1.9691645436846322e-05, "loss": 0.9443, "step": 1569 }, { "epoch": 0.11, "learning_rate": 1.969110130006361e-05, "loss": 0.8838, "step": 1570 }, { "epoch": 0.11, "learning_rate": 1.9690556691130916e-05, "loss": 1.0449, "step": 1571 }, { "epoch": 0.11, "learning_rate": 1.9690011610074772e-05, "loss": 0.9707, "step": 1572 }, { "epoch": 0.11, "learning_rate": 1.9689466056921738e-05, "loss": 0.8418, "step": 1573 }, { "epoch": 0.11, "learning_rate": 1.968892003169839e-05, "loss": 0.9541, "step": 1574 }, { "epoch": 0.11, "learning_rate": 1.9688373534431327e-05, "loss": 0.9082, "step": 1575 }, { "epoch": 0.11, "learning_rate": 1.968782656514718e-05, "loss": 0.8838, "step": 1576 }, { "epoch": 0.11, "learning_rate": 1.9687279123872595e-05, "loss": 0.9258, "step": 1577 }, { "epoch": 0.11, "learning_rate": 1.968673121063425e-05, "loss": 0.8018, "step": 1578 }, { "epoch": 0.11, "learning_rate": 1.968618282545882e-05, "loss": 0.8887, "step": 1579 }, { "epoch": 0.11, "learning_rate": 1.9685633968373043e-05, "loss": 0.8906, "step": 1580 }, { "epoch": 0.11, "learning_rate": 1.968508463940365e-05, "loss": 0.9141, "step": 1581 }, { "epoch": 0.11, "learning_rate": 1.9684534838577404e-05, "loss": 0.8701, "step": 1582 }, { "epoch": 0.11, "learning_rate": 1.9683984565921096e-05, "loss": 0.9375, "step": 1583 }, { "epoch": 0.11, "learning_rate": 1.968343382146153e-05, "loss": 0.9053, "step": 1584 }, { "epoch": 0.11, "learning_rate": 1.968288260522554e-05, "loss": 0.9072, "step": 1585 }, { "epoch": 0.11, "learning_rate": 1.9682330917239983e-05, "loss": 0.915, "step": 1586 }, { "epoch": 0.11, "learning_rate": 1.9681778757531738e-05, "loss": 0.9492, "step": 1587 }, { "epoch": 0.11, "learning_rate": 1.96812261261277e-05, "loss": 0.9512, "step": 1588 }, { "epoch": 0.11, "learning_rate": 1.9680673023054803e-05, "loss": 0.9658, "step": 1589 }, { "epoch": 0.11, "learning_rate": 1.9680119448339984e-05, "loss": 0.8975, "step": 1590 }, { "epoch": 0.11, "learning_rate": 1.9679565402010217e-05, "loss": 0.9346, "step": 1591 }, { "epoch": 0.11, "learning_rate": 1.96790108840925e-05, "loss": 0.876, "step": 1592 }, { "epoch": 0.11, "learning_rate": 1.967845589461384e-05, "loss": 0.9102, "step": 1593 }, { "epoch": 0.11, "learning_rate": 1.9677900433601282e-05, "loss": 0.8604, "step": 1594 }, { "epoch": 0.11, "learning_rate": 1.9677344501081885e-05, "loss": 0.9541, "step": 1595 }, { "epoch": 0.11, "learning_rate": 1.9676788097082737e-05, "loss": 0.8945, "step": 1596 }, { "epoch": 0.11, "learning_rate": 1.9676231221630946e-05, "loss": 0.8994, "step": 1597 }, { "epoch": 0.11, "learning_rate": 1.9675673874753644e-05, "loss": 0.875, "step": 1598 }, { "epoch": 0.11, "learning_rate": 1.967511605647798e-05, "loss": 0.8701, "step": 1599 }, { "epoch": 0.11, "learning_rate": 1.9674557766831133e-05, "loss": 0.8857, "step": 1600 }, { "epoch": 0.11, "learning_rate": 1.9673999005840305e-05, "loss": 0.9395, "step": 1601 }, { "epoch": 0.11, "learning_rate": 1.9673439773532714e-05, "loss": 0.9736, "step": 1602 }, { "epoch": 0.11, "learning_rate": 1.9672880069935615e-05, "loss": 0.9248, "step": 1603 }, { "epoch": 0.11, "learning_rate": 1.9672319895076266e-05, "loss": 0.9492, "step": 1604 }, { "epoch": 0.11, "learning_rate": 1.9671759248981962e-05, "loss": 0.9375, "step": 1605 }, { "epoch": 0.11, "learning_rate": 1.9671198131680023e-05, "loss": 0.8584, "step": 1606 }, { "epoch": 0.11, "learning_rate": 1.967063654319778e-05, "loss": 0.8848, "step": 1607 }, { "epoch": 0.11, "learning_rate": 1.9670074483562597e-05, "loss": 0.9092, "step": 1608 }, { "epoch": 0.11, "learning_rate": 1.966951195280186e-05, "loss": 0.9229, "step": 1609 }, { "epoch": 0.11, "learning_rate": 1.9668948950942967e-05, "loss": 0.8271, "step": 1610 }, { "epoch": 0.11, "learning_rate": 1.9668385478013356e-05, "loss": 0.8877, "step": 1611 }, { "epoch": 0.11, "learning_rate": 1.9667821534040476e-05, "loss": 0.9189, "step": 1612 }, { "epoch": 0.11, "learning_rate": 1.96672571190518e-05, "loss": 0.8389, "step": 1613 }, { "epoch": 0.11, "learning_rate": 1.9666692233074828e-05, "loss": 0.8711, "step": 1614 }, { "epoch": 0.11, "learning_rate": 1.9666126876137083e-05, "loss": 0.9814, "step": 1615 }, { "epoch": 0.11, "learning_rate": 1.966556104826611e-05, "loss": 0.9209, "step": 1616 }, { "epoch": 0.11, "learning_rate": 1.9664994749489472e-05, "loss": 0.9248, "step": 1617 }, { "epoch": 0.11, "learning_rate": 1.9664427979834762e-05, "loss": 0.8066, "step": 1618 }, { "epoch": 0.11, "learning_rate": 1.9663860739329595e-05, "loss": 0.8428, "step": 1619 }, { "epoch": 0.11, "learning_rate": 1.96632930280016e-05, "loss": 0.8936, "step": 1620 }, { "epoch": 0.11, "learning_rate": 1.966272484587844e-05, "loss": 0.9102, "step": 1621 }, { "epoch": 0.11, "learning_rate": 1.96621561929878e-05, "loss": 0.8906, "step": 1622 }, { "epoch": 0.11, "learning_rate": 1.9661587069357378e-05, "loss": 0.9316, "step": 1623 }, { "epoch": 0.11, "learning_rate": 1.9661017475014905e-05, "loss": 0.8809, "step": 1624 }, { "epoch": 0.11, "learning_rate": 1.9660447409988132e-05, "loss": 0.9561, "step": 1625 }, { "epoch": 0.11, "learning_rate": 1.9659876874304835e-05, "loss": 0.9639, "step": 1626 }, { "epoch": 0.11, "learning_rate": 1.9659305867992805e-05, "loss": 0.9717, "step": 1627 }, { "epoch": 0.11, "learning_rate": 1.9658734391079867e-05, "loss": 0.9785, "step": 1628 }, { "epoch": 0.11, "learning_rate": 1.965816244359386e-05, "loss": 0.8701, "step": 1629 }, { "epoch": 0.11, "learning_rate": 1.9657590025562647e-05, "loss": 0.8535, "step": 1630 }, { "epoch": 0.11, "learning_rate": 1.965701713701412e-05, "loss": 0.8574, "step": 1631 }, { "epoch": 0.11, "learning_rate": 1.965644377797619e-05, "loss": 0.8525, "step": 1632 }, { "epoch": 0.11, "learning_rate": 1.965586994847679e-05, "loss": 0.9492, "step": 1633 }, { "epoch": 0.11, "learning_rate": 1.9655295648543876e-05, "loss": 0.9775, "step": 1634 }, { "epoch": 0.11, "learning_rate": 1.965472087820543e-05, "loss": 0.918, "step": 1635 }, { "epoch": 0.11, "learning_rate": 1.9654145637489453e-05, "loss": 0.8516, "step": 1636 }, { "epoch": 0.11, "learning_rate": 1.9653569926423973e-05, "loss": 0.8877, "step": 1637 }, { "epoch": 0.11, "learning_rate": 1.965299374503703e-05, "loss": 0.9229, "step": 1638 }, { "epoch": 0.11, "learning_rate": 1.965241709335671e-05, "loss": 0.8984, "step": 1639 }, { "epoch": 0.11, "learning_rate": 1.96518399714111e-05, "loss": 0.8711, "step": 1640 }, { "epoch": 0.11, "learning_rate": 1.9651262379228315e-05, "loss": 0.8438, "step": 1641 }, { "epoch": 0.11, "learning_rate": 1.9650684316836493e-05, "loss": 0.9941, "step": 1642 }, { "epoch": 0.11, "learning_rate": 1.9650105784263812e-05, "loss": 0.8369, "step": 1643 }, { "epoch": 0.11, "learning_rate": 1.964952678153844e-05, "loss": 0.9072, "step": 1644 }, { "epoch": 0.11, "learning_rate": 1.9648947308688594e-05, "loss": 0.9316, "step": 1645 }, { "epoch": 0.11, "learning_rate": 1.9648367365742507e-05, "loss": 0.8721, "step": 1646 }, { "epoch": 0.11, "learning_rate": 1.9647786952728433e-05, "loss": 0.8955, "step": 1647 }, { "epoch": 0.11, "learning_rate": 1.964720606967465e-05, "loss": 0.8037, "step": 1648 }, { "epoch": 0.11, "learning_rate": 1.964662471660946e-05, "loss": 0.8242, "step": 1649 }, { "epoch": 0.11, "learning_rate": 1.9646042893561178e-05, "loss": 0.959, "step": 1650 }, { "epoch": 0.11, "learning_rate": 1.9645460600558158e-05, "loss": 0.8154, "step": 1651 }, { "epoch": 0.11, "learning_rate": 1.964487783762877e-05, "loss": 0.8428, "step": 1652 }, { "epoch": 0.11, "learning_rate": 1.9644294604801407e-05, "loss": 0.8291, "step": 1653 }, { "epoch": 0.11, "learning_rate": 1.9643710902104475e-05, "loss": 0.9082, "step": 1654 }, { "epoch": 0.11, "learning_rate": 1.964312672956642e-05, "loss": 0.917, "step": 1655 }, { "epoch": 0.11, "learning_rate": 1.9642542087215705e-05, "loss": 0.8672, "step": 1656 }, { "epoch": 0.11, "learning_rate": 1.9641956975080807e-05, "loss": 0.8594, "step": 1657 }, { "epoch": 0.11, "learning_rate": 1.9641371393190236e-05, "loss": 0.8418, "step": 1658 }, { "epoch": 0.11, "learning_rate": 1.964078534157252e-05, "loss": 0.9219, "step": 1659 }, { "epoch": 0.11, "learning_rate": 1.964019882025621e-05, "loss": 0.8965, "step": 1660 }, { "epoch": 0.11, "learning_rate": 1.9639611829269888e-05, "loss": 0.8408, "step": 1661 }, { "epoch": 0.11, "learning_rate": 1.9639024368642144e-05, "loss": 0.9492, "step": 1662 }, { "epoch": 0.11, "learning_rate": 1.9638436438401607e-05, "loss": 0.8916, "step": 1663 }, { "epoch": 0.11, "learning_rate": 1.963784803857691e-05, "loss": 0.9678, "step": 1664 }, { "epoch": 0.11, "learning_rate": 1.9637259169196736e-05, "loss": 0.9219, "step": 1665 }, { "epoch": 0.11, "learning_rate": 1.963666983028976e-05, "loss": 0.8037, "step": 1666 }, { "epoch": 0.11, "learning_rate": 1.9636080021884697e-05, "loss": 0.9023, "step": 1667 }, { "epoch": 0.11, "learning_rate": 1.963548974401029e-05, "loss": 0.915, "step": 1668 }, { "epoch": 0.11, "learning_rate": 1.9634898996695292e-05, "loss": 0.9902, "step": 1669 }, { "epoch": 0.11, "learning_rate": 1.9634307779968482e-05, "loss": 0.8857, "step": 1670 }, { "epoch": 0.11, "learning_rate": 1.963371609385867e-05, "loss": 0.8955, "step": 1671 }, { "epoch": 0.11, "learning_rate": 1.9633123938394676e-05, "loss": 0.9131, "step": 1672 }, { "epoch": 0.11, "learning_rate": 1.9632531313605357e-05, "loss": 0.8877, "step": 1673 }, { "epoch": 0.11, "learning_rate": 1.963193821951958e-05, "loss": 0.9316, "step": 1674 }, { "epoch": 0.11, "learning_rate": 1.9631344656166243e-05, "loss": 0.9131, "step": 1675 }, { "epoch": 0.11, "learning_rate": 1.9630750623574263e-05, "loss": 0.8613, "step": 1676 }, { "epoch": 0.11, "learning_rate": 1.9630156121772584e-05, "loss": 0.9111, "step": 1677 }, { "epoch": 0.11, "learning_rate": 1.962956115079017e-05, "loss": 0.9512, "step": 1678 }, { "epoch": 0.11, "learning_rate": 1.9628965710656007e-05, "loss": 0.8486, "step": 1679 }, { "epoch": 0.11, "learning_rate": 1.96283698013991e-05, "loss": 0.9375, "step": 1680 }, { "epoch": 0.11, "learning_rate": 1.9627773423048486e-05, "loss": 0.9697, "step": 1681 }, { "epoch": 0.11, "learning_rate": 1.962717657563322e-05, "loss": 0.9268, "step": 1682 }, { "epoch": 0.11, "learning_rate": 1.9626579259182384e-05, "loss": 0.9365, "step": 1683 }, { "epoch": 0.11, "learning_rate": 1.9625981473725076e-05, "loss": 0.832, "step": 1684 }, { "epoch": 0.11, "learning_rate": 1.9625383219290417e-05, "loss": 0.8359, "step": 1685 }, { "epoch": 0.11, "learning_rate": 1.9624784495907557e-05, "loss": 0.9629, "step": 1686 }, { "epoch": 0.11, "learning_rate": 1.9624185303605668e-05, "loss": 0.9395, "step": 1687 }, { "epoch": 0.12, "learning_rate": 1.962358564241394e-05, "loss": 0.8633, "step": 1688 }, { "epoch": 0.12, "learning_rate": 1.9622985512361587e-05, "loss": 0.9121, "step": 1689 }, { "epoch": 0.12, "learning_rate": 1.962238491347785e-05, "loss": 0.915, "step": 1690 }, { "epoch": 0.12, "learning_rate": 1.962178384579199e-05, "loss": 0.8799, "step": 1691 }, { "epoch": 0.12, "learning_rate": 1.962118230933329e-05, "loss": 1.0039, "step": 1692 }, { "epoch": 0.12, "learning_rate": 1.9620580304131058e-05, "loss": 0.833, "step": 1693 }, { "epoch": 0.12, "learning_rate": 1.9619977830214623e-05, "loss": 0.8154, "step": 1694 }, { "epoch": 0.12, "learning_rate": 1.9619374887613333e-05, "loss": 0.8398, "step": 1695 }, { "epoch": 0.12, "learning_rate": 1.961877147635657e-05, "loss": 0.9971, "step": 1696 }, { "epoch": 0.12, "learning_rate": 1.961816759647373e-05, "loss": 0.8555, "step": 1697 }, { "epoch": 0.12, "learning_rate": 1.9617563247994237e-05, "loss": 0.959, "step": 1698 }, { "epoch": 0.12, "learning_rate": 1.9616958430947528e-05, "loss": 0.8613, "step": 1699 }, { "epoch": 0.12, "learning_rate": 1.961635314536307e-05, "loss": 0.8779, "step": 1700 }, { "epoch": 0.12, "learning_rate": 1.9615747391270364e-05, "loss": 0.8633, "step": 1701 }, { "epoch": 0.12, "learning_rate": 1.961514116869891e-05, "loss": 0.8945, "step": 1702 }, { "epoch": 0.12, "learning_rate": 1.9614534477678243e-05, "loss": 0.9521, "step": 1703 }, { "epoch": 0.12, "learning_rate": 1.961392731823793e-05, "loss": 0.8232, "step": 1704 }, { "epoch": 0.12, "learning_rate": 1.961331969040755e-05, "loss": 0.8779, "step": 1705 }, { "epoch": 0.12, "learning_rate": 1.9612711594216695e-05, "loss": 0.9004, "step": 1706 }, { "epoch": 0.12, "learning_rate": 1.9612103029695006e-05, "loss": 0.8828, "step": 1707 }, { "epoch": 0.12, "learning_rate": 1.9611493996872125e-05, "loss": 0.9512, "step": 1708 }, { "epoch": 0.12, "learning_rate": 1.9610884495777724e-05, "loss": 0.9395, "step": 1709 }, { "epoch": 0.12, "learning_rate": 1.96102745264415e-05, "loss": 0.916, "step": 1710 }, { "epoch": 0.12, "learning_rate": 1.9609664088893168e-05, "loss": 0.8613, "step": 1711 }, { "epoch": 0.12, "learning_rate": 1.9609053183162472e-05, "loss": 0.8477, "step": 1712 }, { "epoch": 0.12, "learning_rate": 1.960844180927917e-05, "loss": 0.9062, "step": 1713 }, { "epoch": 0.12, "learning_rate": 1.9607829967273057e-05, "loss": 0.9229, "step": 1714 }, { "epoch": 0.12, "learning_rate": 1.9607217657173935e-05, "loss": 0.9346, "step": 1715 }, { "epoch": 0.12, "learning_rate": 1.9606604879011633e-05, "loss": 0.9043, "step": 1716 }, { "epoch": 0.12, "learning_rate": 1.9605991632816015e-05, "loss": 0.9053, "step": 1717 }, { "epoch": 0.12, "learning_rate": 1.9605377918616953e-05, "loss": 0.8018, "step": 1718 }, { "epoch": 0.12, "learning_rate": 1.9604763736444344e-05, "loss": 0.8438, "step": 1719 }, { "epoch": 0.12, "learning_rate": 1.9604149086328116e-05, "loss": 0.8408, "step": 1720 }, { "epoch": 0.12, "learning_rate": 1.9603533968298212e-05, "loss": 0.9297, "step": 1721 }, { "epoch": 0.12, "learning_rate": 1.9602918382384602e-05, "loss": 0.9434, "step": 1722 }, { "epoch": 0.12, "learning_rate": 1.9602302328617276e-05, "loss": 0.8887, "step": 1723 }, { "epoch": 0.12, "learning_rate": 1.960168580702625e-05, "loss": 0.8838, "step": 1724 }, { "epoch": 0.12, "learning_rate": 1.9601068817641558e-05, "loss": 0.915, "step": 1725 }, { "epoch": 0.12, "learning_rate": 1.9600451360493264e-05, "loss": 0.9004, "step": 1726 }, { "epoch": 0.12, "learning_rate": 1.959983343561145e-05, "loss": 0.8779, "step": 1727 }, { "epoch": 0.12, "learning_rate": 1.9599215043026212e-05, "loss": 0.7705, "step": 1728 }, { "epoch": 0.12, "learning_rate": 1.959859618276769e-05, "loss": 0.8613, "step": 1729 }, { "epoch": 0.12, "learning_rate": 1.959797685486603e-05, "loss": 0.9961, "step": 1730 }, { "epoch": 0.12, "learning_rate": 1.9597357059351404e-05, "loss": 0.8018, "step": 1731 }, { "epoch": 0.12, "learning_rate": 1.959673679625401e-05, "loss": 0.8799, "step": 1732 }, { "epoch": 0.12, "learning_rate": 1.9596116065604068e-05, "loss": 0.9102, "step": 1733 }, { "epoch": 0.12, "learning_rate": 1.959549486743182e-05, "loss": 0.9639, "step": 1734 }, { "epoch": 0.12, "learning_rate": 1.959487320176753e-05, "loss": 0.9678, "step": 1735 }, { "epoch": 0.12, "learning_rate": 1.9594251068641482e-05, "loss": 0.9199, "step": 1736 }, { "epoch": 0.12, "learning_rate": 1.9593628468083995e-05, "loss": 0.959, "step": 1737 }, { "epoch": 0.12, "learning_rate": 1.9593005400125392e-05, "loss": 0.9775, "step": 1738 }, { "epoch": 0.12, "learning_rate": 1.9592381864796038e-05, "loss": 0.8838, "step": 1739 }, { "epoch": 0.12, "learning_rate": 1.9591757862126305e-05, "loss": 0.8604, "step": 1740 }, { "epoch": 0.12, "learning_rate": 1.9591133392146598e-05, "loss": 0.8828, "step": 1741 }, { "epoch": 0.12, "learning_rate": 1.959050845488734e-05, "loss": 0.8623, "step": 1742 }, { "epoch": 0.12, "learning_rate": 1.9589883050378976e-05, "loss": 0.8828, "step": 1743 }, { "epoch": 0.12, "learning_rate": 1.958925717865198e-05, "loss": 0.8037, "step": 1744 }, { "epoch": 0.12, "learning_rate": 1.958863083973684e-05, "loss": 0.7656, "step": 1745 }, { "epoch": 0.12, "learning_rate": 1.958800403366407e-05, "loss": 0.8594, "step": 1746 }, { "epoch": 0.12, "learning_rate": 1.9587376760464218e-05, "loss": 0.9814, "step": 1747 }, { "epoch": 0.12, "learning_rate": 1.958674902016783e-05, "loss": 0.8184, "step": 1748 }, { "epoch": 0.12, "learning_rate": 1.9586120812805505e-05, "loss": 0.8877, "step": 1749 }, { "epoch": 0.12, "learning_rate": 1.9585492138407835e-05, "loss": 0.873, "step": 1750 }, { "epoch": 0.12, "learning_rate": 1.958486299700546e-05, "loss": 0.8574, "step": 1751 }, { "epoch": 0.12, "learning_rate": 1.9584233388629024e-05, "loss": 0.8398, "step": 1752 }, { "epoch": 0.12, "learning_rate": 1.9583603313309208e-05, "loss": 0.9287, "step": 1753 }, { "epoch": 0.12, "learning_rate": 1.9582972771076706e-05, "loss": 0.9111, "step": 1754 }, { "epoch": 0.12, "learning_rate": 1.9582341761962236e-05, "loss": 0.8896, "step": 1755 }, { "epoch": 0.12, "learning_rate": 1.958171028599654e-05, "loss": 0.9277, "step": 1756 }, { "epoch": 0.12, "learning_rate": 1.9581078343210392e-05, "loss": 0.999, "step": 1757 }, { "epoch": 0.12, "learning_rate": 1.9580445933634568e-05, "loss": 0.9951, "step": 1758 }, { "epoch": 0.12, "learning_rate": 1.957981305729989e-05, "loss": 0.8408, "step": 1759 }, { "epoch": 0.12, "learning_rate": 1.9579179714237185e-05, "loss": 0.8916, "step": 1760 }, { "epoch": 0.12, "learning_rate": 1.9578545904477314e-05, "loss": 0.9092, "step": 1761 }, { "epoch": 0.12, "learning_rate": 1.957791162805115e-05, "loss": 0.8613, "step": 1762 }, { "epoch": 0.12, "learning_rate": 1.95772768849896e-05, "loss": 0.9434, "step": 1763 }, { "epoch": 0.12, "learning_rate": 1.9576641675323587e-05, "loss": 0.8643, "step": 1764 }, { "epoch": 0.12, "learning_rate": 1.957600599908406e-05, "loss": 0.8359, "step": 1765 }, { "epoch": 0.12, "learning_rate": 1.9575369856301986e-05, "loss": 0.9492, "step": 1766 }, { "epoch": 0.12, "learning_rate": 1.9574733247008364e-05, "loss": 1.0107, "step": 1767 }, { "epoch": 0.12, "learning_rate": 1.95740961712342e-05, "loss": 0.8125, "step": 1768 }, { "epoch": 0.12, "learning_rate": 1.957345862901054e-05, "loss": 0.8574, "step": 1769 }, { "epoch": 0.12, "learning_rate": 1.957282062036844e-05, "loss": 0.9287, "step": 1770 }, { "epoch": 0.12, "learning_rate": 1.9572182145338988e-05, "loss": 0.9648, "step": 1771 }, { "epoch": 0.12, "learning_rate": 1.9571543203953287e-05, "loss": 0.8799, "step": 1772 }, { "epoch": 0.12, "learning_rate": 1.957090379624247e-05, "loss": 0.9199, "step": 1773 }, { "epoch": 0.12, "learning_rate": 1.9570263922237686e-05, "loss": 0.9082, "step": 1774 }, { "epoch": 0.12, "learning_rate": 1.9569623581970113e-05, "loss": 0.8584, "step": 1775 }, { "epoch": 0.12, "learning_rate": 1.956898277547094e-05, "loss": 0.8828, "step": 1776 }, { "epoch": 0.12, "learning_rate": 1.9568341502771397e-05, "loss": 0.9043, "step": 1777 }, { "epoch": 0.12, "learning_rate": 1.9567699763902724e-05, "loss": 0.8799, "step": 1778 }, { "epoch": 0.12, "learning_rate": 1.956705755889618e-05, "loss": 0.8818, "step": 1779 }, { "epoch": 0.12, "learning_rate": 1.9566414887783063e-05, "loss": 0.9072, "step": 1780 }, { "epoch": 0.12, "learning_rate": 1.9565771750594674e-05, "loss": 0.9688, "step": 1781 }, { "epoch": 0.12, "learning_rate": 1.9565128147362357e-05, "loss": 0.8838, "step": 1782 }, { "epoch": 0.12, "learning_rate": 1.956448407811746e-05, "loss": 0.8369, "step": 1783 }, { "epoch": 0.12, "learning_rate": 1.956383954289137e-05, "loss": 0.834, "step": 1784 }, { "epoch": 0.12, "learning_rate": 1.956319454171548e-05, "loss": 0.918, "step": 1785 }, { "epoch": 0.12, "learning_rate": 1.9562549074621216e-05, "loss": 0.9209, "step": 1786 }, { "epoch": 0.12, "learning_rate": 1.9561903141640028e-05, "loss": 0.876, "step": 1787 }, { "epoch": 0.12, "learning_rate": 1.956125674280339e-05, "loss": 0.8682, "step": 1788 }, { "epoch": 0.12, "learning_rate": 1.9560609878142785e-05, "loss": 0.8438, "step": 1789 }, { "epoch": 0.12, "learning_rate": 1.9559962547689734e-05, "loss": 0.9326, "step": 1790 }, { "epoch": 0.12, "learning_rate": 1.9559314751475775e-05, "loss": 0.8369, "step": 1791 }, { "epoch": 0.12, "learning_rate": 1.9558666489532466e-05, "loss": 0.835, "step": 1792 }, { "epoch": 0.12, "learning_rate": 1.9558017761891396e-05, "loss": 0.915, "step": 1793 }, { "epoch": 0.12, "learning_rate": 1.9557368568584164e-05, "loss": 0.8691, "step": 1794 }, { "epoch": 0.12, "learning_rate": 1.9556718909642402e-05, "loss": 0.7764, "step": 1795 }, { "epoch": 0.12, "learning_rate": 1.9556068785097756e-05, "loss": 0.8779, "step": 1796 }, { "epoch": 0.12, "learning_rate": 1.955541819498191e-05, "loss": 0.7891, "step": 1797 }, { "epoch": 0.12, "learning_rate": 1.9554767139326553e-05, "loss": 0.8379, "step": 1798 }, { "epoch": 0.12, "learning_rate": 1.955411561816341e-05, "loss": 0.9492, "step": 1799 }, { "epoch": 0.12, "learning_rate": 1.9553463631524215e-05, "loss": 0.9189, "step": 1800 }, { "epoch": 0.12, "learning_rate": 1.9552811179440745e-05, "loss": 0.8438, "step": 1801 }, { "epoch": 0.12, "learning_rate": 1.9552158261944774e-05, "loss": 0.8691, "step": 1802 }, { "epoch": 0.12, "learning_rate": 1.955150487906812e-05, "loss": 0.8867, "step": 1803 }, { "epoch": 0.12, "learning_rate": 1.9550851030842616e-05, "loss": 0.9883, "step": 1804 }, { "epoch": 0.12, "learning_rate": 1.9550196717300114e-05, "loss": 0.9102, "step": 1805 }, { "epoch": 0.12, "learning_rate": 1.9549541938472494e-05, "loss": 0.9121, "step": 1806 }, { "epoch": 0.12, "learning_rate": 1.9548886694391654e-05, "loss": 0.8818, "step": 1807 }, { "epoch": 0.12, "learning_rate": 1.9548230985089525e-05, "loss": 0.957, "step": 1808 }, { "epoch": 0.12, "learning_rate": 1.9547574810598043e-05, "loss": 0.9277, "step": 1809 }, { "epoch": 0.12, "learning_rate": 1.9546918170949186e-05, "loss": 0.8926, "step": 1810 }, { "epoch": 0.12, "learning_rate": 1.954626106617494e-05, "loss": 0.9873, "step": 1811 }, { "epoch": 0.12, "learning_rate": 1.9545603496307317e-05, "loss": 0.877, "step": 1812 }, { "epoch": 0.12, "learning_rate": 1.9544945461378358e-05, "loss": 0.8945, "step": 1813 }, { "epoch": 0.12, "learning_rate": 1.9544286961420126e-05, "loss": 0.9062, "step": 1814 }, { "epoch": 0.12, "learning_rate": 1.9543627996464695e-05, "loss": 0.9316, "step": 1815 }, { "epoch": 0.12, "learning_rate": 1.9542968566544175e-05, "loss": 0.8691, "step": 1816 }, { "epoch": 0.12, "learning_rate": 1.954230867169069e-05, "loss": 0.9297, "step": 1817 }, { "epoch": 0.12, "learning_rate": 1.9541648311936394e-05, "loss": 0.8877, "step": 1818 }, { "epoch": 0.12, "learning_rate": 1.9540987487313456e-05, "loss": 0.8525, "step": 1819 }, { "epoch": 0.12, "learning_rate": 1.9540326197854073e-05, "loss": 0.8867, "step": 1820 }, { "epoch": 0.12, "learning_rate": 1.9539664443590463e-05, "loss": 0.8389, "step": 1821 }, { "epoch": 0.12, "learning_rate": 1.953900222455487e-05, "loss": 0.8936, "step": 1822 }, { "epoch": 0.12, "learning_rate": 1.953833954077955e-05, "loss": 0.8584, "step": 1823 }, { "epoch": 0.12, "learning_rate": 1.9537676392296793e-05, "loss": 0.8564, "step": 1824 }, { "epoch": 0.12, "learning_rate": 1.953701277913891e-05, "loss": 0.8613, "step": 1825 }, { "epoch": 0.12, "learning_rate": 1.9536348701338224e-05, "loss": 0.9033, "step": 1826 }, { "epoch": 0.12, "learning_rate": 1.95356841589271e-05, "loss": 0.9619, "step": 1827 }, { "epoch": 0.12, "learning_rate": 1.9535019151937908e-05, "loss": 0.9668, "step": 1828 }, { "epoch": 0.12, "learning_rate": 1.9534353680403046e-05, "loss": 0.9268, "step": 1829 }, { "epoch": 0.12, "learning_rate": 1.9533687744354936e-05, "loss": 0.8574, "step": 1830 }, { "epoch": 0.12, "learning_rate": 1.9533021343826027e-05, "loss": 0.8398, "step": 1831 }, { "epoch": 0.12, "learning_rate": 1.953235447884878e-05, "loss": 0.9814, "step": 1832 }, { "epoch": 0.12, "learning_rate": 1.9531687149455693e-05, "loss": 0.8604, "step": 1833 }, { "epoch": 0.12, "learning_rate": 1.9531019355679267e-05, "loss": 0.8945, "step": 1834 }, { "epoch": 0.13, "learning_rate": 1.9530351097552044e-05, "loss": 0.8701, "step": 1835 }, { "epoch": 0.13, "learning_rate": 1.9529682375106584e-05, "loss": 0.791, "step": 1836 }, { "epoch": 0.13, "learning_rate": 1.952901318837546e-05, "loss": 0.8965, "step": 1837 }, { "epoch": 0.13, "learning_rate": 1.952834353739128e-05, "loss": 0.917, "step": 1838 }, { "epoch": 0.13, "learning_rate": 1.9527673422186665e-05, "loss": 0.9434, "step": 1839 }, { "epoch": 0.13, "learning_rate": 1.952700284279427e-05, "loss": 0.9043, "step": 1840 }, { "epoch": 0.13, "learning_rate": 1.9526331799246758e-05, "loss": 0.9385, "step": 1841 }, { "epoch": 0.13, "learning_rate": 1.9525660291576827e-05, "loss": 0.8223, "step": 1842 }, { "epoch": 0.13, "learning_rate": 1.952498831981719e-05, "loss": 0.833, "step": 1843 }, { "epoch": 0.13, "learning_rate": 1.9524315884000585e-05, "loss": 1.0146, "step": 1844 }, { "epoch": 0.13, "learning_rate": 1.9523642984159777e-05, "loss": 0.8994, "step": 1845 }, { "epoch": 0.13, "learning_rate": 1.9522969620327545e-05, "loss": 0.8379, "step": 1846 }, { "epoch": 0.13, "learning_rate": 1.95222957925367e-05, "loss": 0.8721, "step": 1847 }, { "epoch": 0.13, "learning_rate": 1.9521621500820065e-05, "loss": 0.8838, "step": 1848 }, { "epoch": 0.13, "learning_rate": 1.9520946745210497e-05, "loss": 0.8174, "step": 1849 }, { "epoch": 0.13, "learning_rate": 1.952027152574087e-05, "loss": 0.9463, "step": 1850 }, { "epoch": 0.13, "learning_rate": 1.9519595842444077e-05, "loss": 0.9033, "step": 1851 }, { "epoch": 0.13, "learning_rate": 1.9518919695353035e-05, "loss": 0.8994, "step": 1852 }, { "epoch": 0.13, "learning_rate": 1.9518243084500694e-05, "loss": 0.9609, "step": 1853 }, { "epoch": 0.13, "learning_rate": 1.9517566009920014e-05, "loss": 0.915, "step": 1854 }, { "epoch": 0.13, "learning_rate": 1.951688847164398e-05, "loss": 0.8486, "step": 1855 }, { "epoch": 0.13, "learning_rate": 1.9516210469705606e-05, "loss": 0.9746, "step": 1856 }, { "epoch": 0.13, "learning_rate": 1.951553200413792e-05, "loss": 0.7314, "step": 1857 }, { "epoch": 0.13, "learning_rate": 1.951485307497398e-05, "loss": 0.8359, "step": 1858 }, { "epoch": 0.13, "learning_rate": 1.951417368224686e-05, "loss": 0.8701, "step": 1859 }, { "epoch": 0.13, "learning_rate": 1.9513493825989664e-05, "loss": 0.9043, "step": 1860 }, { "epoch": 0.13, "learning_rate": 1.9512813506235515e-05, "loss": 0.9014, "step": 1861 }, { "epoch": 0.13, "learning_rate": 1.9512132723017552e-05, "loss": 0.8799, "step": 1862 }, { "epoch": 0.13, "learning_rate": 1.9511451476368948e-05, "loss": 0.8994, "step": 1863 }, { "epoch": 0.13, "learning_rate": 1.9510769766322893e-05, "loss": 0.8555, "step": 1864 }, { "epoch": 0.13, "learning_rate": 1.9510087592912596e-05, "loss": 0.9297, "step": 1865 }, { "epoch": 0.13, "learning_rate": 1.9509404956171297e-05, "loss": 0.8779, "step": 1866 }, { "epoch": 0.13, "learning_rate": 1.9508721856132252e-05, "loss": 0.9746, "step": 1867 }, { "epoch": 0.13, "learning_rate": 1.9508038292828744e-05, "loss": 0.8379, "step": 1868 }, { "epoch": 0.13, "learning_rate": 1.9507354266294073e-05, "loss": 0.9268, "step": 1869 }, { "epoch": 0.13, "learning_rate": 1.9506669776561567e-05, "loss": 0.9141, "step": 1870 }, { "epoch": 0.13, "learning_rate": 1.950598482366457e-05, "loss": 0.8838, "step": 1871 }, { "epoch": 0.13, "learning_rate": 1.9505299407636457e-05, "loss": 0.8232, "step": 1872 }, { "epoch": 0.13, "learning_rate": 1.950461352851062e-05, "loss": 0.9648, "step": 1873 }, { "epoch": 0.13, "learning_rate": 1.9503927186320477e-05, "loss": 0.8369, "step": 1874 }, { "epoch": 0.13, "learning_rate": 1.9503240381099462e-05, "loss": 0.9072, "step": 1875 }, { "epoch": 0.13, "learning_rate": 1.9502553112881042e-05, "loss": 0.959, "step": 1876 }, { "epoch": 0.13, "learning_rate": 1.9501865381698696e-05, "loss": 0.8555, "step": 1877 }, { "epoch": 0.13, "learning_rate": 1.9501177187585935e-05, "loss": 0.8525, "step": 1878 }, { "epoch": 0.13, "learning_rate": 1.950048853057628e-05, "loss": 0.8857, "step": 1879 }, { "epoch": 0.13, "learning_rate": 1.949979941070329e-05, "loss": 0.9199, "step": 1880 }, { "epoch": 0.13, "learning_rate": 1.9499109828000536e-05, "loss": 0.9658, "step": 1881 }, { "epoch": 0.13, "learning_rate": 1.9498419782501615e-05, "loss": 0.8848, "step": 1882 }, { "epoch": 0.13, "learning_rate": 1.9497729274240145e-05, "loss": 0.8359, "step": 1883 }, { "epoch": 0.13, "learning_rate": 1.9497038303249766e-05, "loss": 0.9287, "step": 1884 }, { "epoch": 0.13, "learning_rate": 1.9496346869564143e-05, "loss": 0.8701, "step": 1885 }, { "epoch": 0.13, "learning_rate": 1.9495654973216968e-05, "loss": 0.8447, "step": 1886 }, { "epoch": 0.13, "learning_rate": 1.9494962614241942e-05, "loss": 0.9785, "step": 1887 }, { "epoch": 0.13, "learning_rate": 1.9494269792672805e-05, "loss": 0.8574, "step": 1888 }, { "epoch": 0.13, "learning_rate": 1.94935765085433e-05, "loss": 0.9746, "step": 1889 }, { "epoch": 0.13, "learning_rate": 1.949288276188722e-05, "loss": 0.9297, "step": 1890 }, { "epoch": 0.13, "learning_rate": 1.9492188552738346e-05, "loss": 0.7676, "step": 1891 }, { "epoch": 0.13, "learning_rate": 1.949149388113051e-05, "loss": 0.8857, "step": 1892 }, { "epoch": 0.13, "learning_rate": 1.949079874709756e-05, "loss": 0.9629, "step": 1893 }, { "epoch": 0.13, "learning_rate": 1.9490103150673355e-05, "loss": 0.8369, "step": 1894 }, { "epoch": 0.13, "learning_rate": 1.9489407091891785e-05, "loss": 0.9092, "step": 1895 }, { "epoch": 0.13, "learning_rate": 1.9488710570786768e-05, "loss": 0.9658, "step": 1896 }, { "epoch": 0.13, "learning_rate": 1.9488013587392232e-05, "loss": 1.0146, "step": 1897 }, { "epoch": 0.13, "learning_rate": 1.9487316141742137e-05, "loss": 0.8389, "step": 1898 }, { "epoch": 0.13, "learning_rate": 1.9486618233870462e-05, "loss": 1.0205, "step": 1899 }, { "epoch": 0.13, "learning_rate": 1.948591986381121e-05, "loss": 0.8203, "step": 1900 }, { "epoch": 0.13, "learning_rate": 1.9485221031598403e-05, "loss": 0.9004, "step": 1901 }, { "epoch": 0.13, "learning_rate": 1.9484521737266094e-05, "loss": 0.8975, "step": 1902 }, { "epoch": 0.13, "learning_rate": 1.9483821980848346e-05, "loss": 0.8809, "step": 1903 }, { "epoch": 0.13, "learning_rate": 1.9483121762379255e-05, "loss": 0.8984, "step": 1904 }, { "epoch": 0.13, "learning_rate": 1.9482421081892933e-05, "loss": 0.8877, "step": 1905 }, { "epoch": 0.13, "learning_rate": 1.948171993942352e-05, "loss": 0.8779, "step": 1906 }, { "epoch": 0.13, "learning_rate": 1.948101833500517e-05, "loss": 0.8701, "step": 1907 }, { "epoch": 0.13, "learning_rate": 1.9480316268672072e-05, "loss": 0.8896, "step": 1908 }, { "epoch": 0.13, "learning_rate": 1.9479613740458426e-05, "loss": 0.8428, "step": 1909 }, { "epoch": 0.13, "learning_rate": 1.9478910750398463e-05, "loss": 0.8467, "step": 1910 }, { "epoch": 0.13, "learning_rate": 1.947820729852643e-05, "loss": 0.9219, "step": 1911 }, { "epoch": 0.13, "learning_rate": 1.94775033848766e-05, "loss": 0.9375, "step": 1912 }, { "epoch": 0.13, "learning_rate": 1.9476799009483266e-05, "loss": 0.9639, "step": 1913 }, { "epoch": 0.13, "learning_rate": 1.9476094172380747e-05, "loss": 0.9297, "step": 1914 }, { "epoch": 0.13, "learning_rate": 1.9475388873603382e-05, "loss": 0.9854, "step": 1915 }, { "epoch": 0.13, "learning_rate": 1.947468311318553e-05, "loss": 0.9473, "step": 1916 }, { "epoch": 0.13, "learning_rate": 1.9473976891161586e-05, "loss": 0.8398, "step": 1917 }, { "epoch": 0.13, "learning_rate": 1.9473270207565945e-05, "loss": 0.8936, "step": 1918 }, { "epoch": 0.13, "learning_rate": 1.947256306243304e-05, "loss": 0.8418, "step": 1919 }, { "epoch": 0.13, "learning_rate": 1.947185545579733e-05, "loss": 0.8848, "step": 1920 }, { "epoch": 0.13, "learning_rate": 1.9471147387693278e-05, "loss": 0.9082, "step": 1921 }, { "epoch": 0.13, "learning_rate": 1.947043885815539e-05, "loss": 0.8955, "step": 1922 }, { "epoch": 0.13, "learning_rate": 1.9469729867218183e-05, "loss": 0.916, "step": 1923 }, { "epoch": 0.13, "learning_rate": 1.9469020414916197e-05, "loss": 0.8477, "step": 1924 }, { "epoch": 0.13, "learning_rate": 1.9468310501284004e-05, "loss": 0.9072, "step": 1925 }, { "epoch": 0.13, "learning_rate": 1.946760012635618e-05, "loss": 0.8252, "step": 1926 }, { "epoch": 0.13, "learning_rate": 1.946688929016734e-05, "loss": 0.9043, "step": 1927 }, { "epoch": 0.13, "learning_rate": 1.9466177992752112e-05, "loss": 0.9092, "step": 1928 }, { "epoch": 0.13, "learning_rate": 1.9465466234145157e-05, "loss": 0.8779, "step": 1929 }, { "epoch": 0.13, "learning_rate": 1.9464754014381154e-05, "loss": 0.9316, "step": 1930 }, { "epoch": 0.13, "learning_rate": 1.946404133349479e-05, "loss": 0.876, "step": 1931 }, { "epoch": 0.13, "learning_rate": 1.9463328191520797e-05, "loss": 0.9434, "step": 1932 }, { "epoch": 0.13, "learning_rate": 1.9462614588493915e-05, "loss": 0.875, "step": 1933 }, { "epoch": 0.13, "learning_rate": 1.946190052444891e-05, "loss": 0.8896, "step": 1934 }, { "epoch": 0.13, "learning_rate": 1.9461185999420573e-05, "loss": 0.8887, "step": 1935 }, { "epoch": 0.13, "learning_rate": 1.946047101344372e-05, "loss": 0.8105, "step": 1936 }, { "epoch": 0.13, "learning_rate": 1.9459755566553176e-05, "loss": 0.9414, "step": 1937 }, { "epoch": 0.13, "learning_rate": 1.9459039658783806e-05, "loss": 0.9502, "step": 1938 }, { "epoch": 0.13, "learning_rate": 1.945832329017048e-05, "loss": 0.9141, "step": 1939 }, { "epoch": 0.13, "learning_rate": 1.9457606460748106e-05, "loss": 0.9043, "step": 1940 }, { "epoch": 0.13, "learning_rate": 1.945688917055161e-05, "loss": 0.8145, "step": 1941 }, { "epoch": 0.13, "learning_rate": 1.9456171419615933e-05, "loss": 0.8857, "step": 1942 }, { "epoch": 0.13, "learning_rate": 1.9455453207976043e-05, "loss": 0.9141, "step": 1943 }, { "epoch": 0.13, "learning_rate": 1.9454734535666934e-05, "loss": 0.957, "step": 1944 }, { "epoch": 0.13, "learning_rate": 1.9454015402723626e-05, "loss": 0.916, "step": 1945 }, { "epoch": 0.13, "learning_rate": 1.9453295809181144e-05, "loss": 0.9248, "step": 1946 }, { "epoch": 0.13, "learning_rate": 1.945257575507455e-05, "loss": 0.9102, "step": 1947 }, { "epoch": 0.13, "learning_rate": 1.9451855240438928e-05, "loss": 0.9521, "step": 1948 }, { "epoch": 0.13, "learning_rate": 1.9451134265309378e-05, "loss": 0.9121, "step": 1949 }, { "epoch": 0.13, "learning_rate": 1.945041282972103e-05, "loss": 0.7627, "step": 1950 }, { "epoch": 0.13, "learning_rate": 1.9449690933709026e-05, "loss": 0.9141, "step": 1951 }, { "epoch": 0.13, "learning_rate": 1.9448968577308545e-05, "loss": 0.8535, "step": 1952 }, { "epoch": 0.13, "learning_rate": 1.944824576055477e-05, "loss": 0.9219, "step": 1953 }, { "epoch": 0.13, "learning_rate": 1.9447522483482927e-05, "loss": 0.9521, "step": 1954 }, { "epoch": 0.13, "learning_rate": 1.944679874612825e-05, "loss": 0.8262, "step": 1955 }, { "epoch": 0.13, "learning_rate": 1.9446074548525996e-05, "loss": 0.8916, "step": 1956 }, { "epoch": 0.13, "learning_rate": 1.944534989071145e-05, "loss": 0.9355, "step": 1957 }, { "epoch": 0.13, "learning_rate": 1.944462477271992e-05, "loss": 0.7441, "step": 1958 }, { "epoch": 0.13, "learning_rate": 1.9443899194586734e-05, "loss": 0.8896, "step": 1959 }, { "epoch": 0.13, "learning_rate": 1.944317315634724e-05, "loss": 0.9043, "step": 1960 }, { "epoch": 0.13, "learning_rate": 1.94424466580368e-05, "loss": 0.8945, "step": 1961 }, { "epoch": 0.13, "learning_rate": 1.944171969969083e-05, "loss": 1.0498, "step": 1962 }, { "epoch": 0.13, "learning_rate": 1.944099228134473e-05, "loss": 0.8604, "step": 1963 }, { "epoch": 0.13, "learning_rate": 1.9440264403033952e-05, "loss": 0.9268, "step": 1964 }, { "epoch": 0.13, "learning_rate": 1.9439536064793952e-05, "loss": 0.8799, "step": 1965 }, { "epoch": 0.13, "learning_rate": 1.9438807266660212e-05, "loss": 0.8652, "step": 1966 }, { "epoch": 0.13, "learning_rate": 1.9438078008668243e-05, "loss": 0.8447, "step": 1967 }, { "epoch": 0.13, "learning_rate": 1.9437348290853576e-05, "loss": 0.8916, "step": 1968 }, { "epoch": 0.13, "learning_rate": 1.943661811325176e-05, "loss": 0.8447, "step": 1969 }, { "epoch": 0.13, "learning_rate": 1.943588747589837e-05, "loss": 0.8867, "step": 1970 }, { "epoch": 0.13, "learning_rate": 1.9435156378829e-05, "loss": 0.873, "step": 1971 }, { "epoch": 0.13, "learning_rate": 1.9434424822079272e-05, "loss": 0.8584, "step": 1972 }, { "epoch": 0.13, "learning_rate": 1.943369280568483e-05, "loss": 0.8652, "step": 1973 }, { "epoch": 0.13, "learning_rate": 1.943296032968133e-05, "loss": 0.874, "step": 1974 }, { "epoch": 0.13, "learning_rate": 1.9432227394104465e-05, "loss": 0.8623, "step": 1975 }, { "epoch": 0.13, "learning_rate": 1.9431493998989942e-05, "loss": 0.8477, "step": 1976 }, { "epoch": 0.13, "learning_rate": 1.9430760144373487e-05, "loss": 0.8984, "step": 1977 }, { "epoch": 0.13, "learning_rate": 1.943002583029086e-05, "loss": 0.9248, "step": 1978 }, { "epoch": 0.13, "learning_rate": 1.9429291056777837e-05, "loss": 0.9072, "step": 1979 }, { "epoch": 0.13, "learning_rate": 1.942855582387021e-05, "loss": 0.9131, "step": 1980 }, { "epoch": 0.14, "learning_rate": 1.9427820131603806e-05, "loss": 0.8486, "step": 1981 }, { "epoch": 0.14, "learning_rate": 1.9427083980014466e-05, "loss": 0.9844, "step": 1982 }, { "epoch": 0.14, "learning_rate": 1.9426347369138052e-05, "loss": 0.8369, "step": 1983 }, { "epoch": 0.14, "learning_rate": 1.9425610299010453e-05, "loss": 0.9062, "step": 1984 }, { "epoch": 0.14, "learning_rate": 1.942487276966758e-05, "loss": 0.9258, "step": 1985 }, { "epoch": 0.14, "learning_rate": 1.9424134781145367e-05, "loss": 0.8965, "step": 1986 }, { "epoch": 0.14, "learning_rate": 1.9423396333479765e-05, "loss": 0.9658, "step": 1987 }, { "epoch": 0.14, "learning_rate": 1.9422657426706754e-05, "loss": 0.7744, "step": 1988 }, { "epoch": 0.14, "learning_rate": 1.9421918060862333e-05, "loss": 0.8965, "step": 1989 }, { "epoch": 0.14, "learning_rate": 1.9421178235982525e-05, "loss": 0.8525, "step": 1990 }, { "epoch": 0.14, "learning_rate": 1.9420437952103372e-05, "loss": 0.998, "step": 1991 }, { "epoch": 0.14, "learning_rate": 1.9419697209260938e-05, "loss": 0.8506, "step": 1992 }, { "epoch": 0.14, "learning_rate": 1.941895600749132e-05, "loss": 0.8887, "step": 1993 }, { "epoch": 0.14, "learning_rate": 1.9418214346830622e-05, "loss": 0.9014, "step": 1994 }, { "epoch": 0.14, "learning_rate": 1.941747222731498e-05, "loss": 0.9424, "step": 1995 }, { "epoch": 0.14, "learning_rate": 1.9416729648980553e-05, "loss": 0.8809, "step": 1996 }, { "epoch": 0.14, "learning_rate": 1.9415986611863516e-05, "loss": 0.8955, "step": 1997 }, { "epoch": 0.14, "learning_rate": 1.941524311600007e-05, "loss": 0.8564, "step": 1998 }, { "epoch": 0.14, "learning_rate": 1.9414499161426437e-05, "loss": 0.8369, "step": 1999 }, { "epoch": 0.14, "learning_rate": 1.9413754748178864e-05, "loss": 0.9033, "step": 2000 }, { "epoch": 0.14, "learning_rate": 1.941300987629362e-05, "loss": 0.8809, "step": 2001 }, { "epoch": 0.14, "learning_rate": 1.9412264545806993e-05, "loss": 0.9033, "step": 2002 }, { "epoch": 0.14, "learning_rate": 1.94115187567553e-05, "loss": 0.9414, "step": 2003 }, { "epoch": 0.14, "learning_rate": 1.941077250917487e-05, "loss": 0.8438, "step": 2004 }, { "epoch": 0.14, "learning_rate": 1.941002580310206e-05, "loss": 0.8896, "step": 2005 }, { "epoch": 0.14, "learning_rate": 1.9409278638573254e-05, "loss": 0.9648, "step": 2006 }, { "epoch": 0.14, "learning_rate": 1.940853101562485e-05, "loss": 0.8691, "step": 2007 }, { "epoch": 0.14, "learning_rate": 1.9407782934293273e-05, "loss": 0.8232, "step": 2008 }, { "epoch": 0.14, "learning_rate": 1.9407034394614973e-05, "loss": 0.9268, "step": 2009 }, { "epoch": 0.14, "learning_rate": 1.9406285396626413e-05, "loss": 0.9902, "step": 2010 }, { "epoch": 0.14, "learning_rate": 1.940553594036409e-05, "loss": 0.9062, "step": 2011 }, { "epoch": 0.14, "learning_rate": 1.9404786025864513e-05, "loss": 0.8232, "step": 2012 }, { "epoch": 0.14, "learning_rate": 1.940403565316422e-05, "loss": 0.9443, "step": 2013 }, { "epoch": 0.14, "learning_rate": 1.9403284822299772e-05, "loss": 0.8555, "step": 2014 }, { "epoch": 0.14, "learning_rate": 1.940253353330774e-05, "loss": 0.9805, "step": 2015 }, { "epoch": 0.14, "learning_rate": 1.9401781786224736e-05, "loss": 0.7559, "step": 2016 }, { "epoch": 0.14, "learning_rate": 1.9401029581087382e-05, "loss": 0.9443, "step": 2017 }, { "epoch": 0.14, "learning_rate": 1.9400276917932325e-05, "loss": 0.8584, "step": 2018 }, { "epoch": 0.14, "learning_rate": 1.9399523796796232e-05, "loss": 0.8105, "step": 2019 }, { "epoch": 0.14, "learning_rate": 1.93987702177158e-05, "loss": 0.8174, "step": 2020 }, { "epoch": 0.14, "learning_rate": 1.9398016180727747e-05, "loss": 0.9277, "step": 2021 }, { "epoch": 0.14, "learning_rate": 1.9397261685868796e-05, "loss": 0.8652, "step": 2022 }, { "epoch": 0.14, "learning_rate": 1.9396506733175716e-05, "loss": 0.9629, "step": 2023 }, { "epoch": 0.14, "learning_rate": 1.9395751322685286e-05, "loss": 0.8203, "step": 2024 }, { "epoch": 0.14, "learning_rate": 1.9394995454434314e-05, "loss": 0.9746, "step": 2025 }, { "epoch": 0.14, "learning_rate": 1.939423912845962e-05, "loss": 0.8789, "step": 2026 }, { "epoch": 0.14, "learning_rate": 1.939348234479805e-05, "loss": 0.9688, "step": 2027 }, { "epoch": 0.14, "learning_rate": 1.939272510348648e-05, "loss": 0.9473, "step": 2028 }, { "epoch": 0.14, "learning_rate": 1.9391967404561804e-05, "loss": 0.832, "step": 2029 }, { "epoch": 0.14, "learning_rate": 1.939120924806093e-05, "loss": 0.9014, "step": 2030 }, { "epoch": 0.14, "learning_rate": 1.93904506340208e-05, "loss": 0.8857, "step": 2031 }, { "epoch": 0.14, "learning_rate": 1.9389691562478375e-05, "loss": 0.9111, "step": 2032 }, { "epoch": 0.14, "learning_rate": 1.9388932033470633e-05, "loss": 0.8711, "step": 2033 }, { "epoch": 0.14, "learning_rate": 1.9388172047034583e-05, "loss": 0.9287, "step": 2034 }, { "epoch": 0.14, "learning_rate": 1.9387411603207246e-05, "loss": 0.9111, "step": 2035 }, { "epoch": 0.14, "learning_rate": 1.9386650702025672e-05, "loss": 0.8701, "step": 2036 }, { "epoch": 0.14, "learning_rate": 1.9385889343526938e-05, "loss": 0.9512, "step": 2037 }, { "epoch": 0.14, "learning_rate": 1.9385127527748132e-05, "loss": 0.9004, "step": 2038 }, { "epoch": 0.14, "learning_rate": 1.938436525472637e-05, "loss": 0.9639, "step": 2039 }, { "epoch": 0.14, "learning_rate": 1.9383602524498787e-05, "loss": 0.8926, "step": 2040 }, { "epoch": 0.14, "learning_rate": 1.938283933710255e-05, "loss": 0.9316, "step": 2041 }, { "epoch": 0.14, "learning_rate": 1.9382075692574836e-05, "loss": 0.9473, "step": 2042 }, { "epoch": 0.14, "learning_rate": 1.9381311590952855e-05, "loss": 0.8027, "step": 2043 }, { "epoch": 0.14, "learning_rate": 1.938054703227383e-05, "loss": 0.8857, "step": 2044 }, { "epoch": 0.14, "learning_rate": 1.937978201657501e-05, "loss": 0.835, "step": 2045 }, { "epoch": 0.14, "learning_rate": 1.9379016543893668e-05, "loss": 0.9492, "step": 2046 }, { "epoch": 0.14, "learning_rate": 1.9378250614267098e-05, "loss": 0.9629, "step": 2047 }, { "epoch": 0.14, "learning_rate": 1.9377484227732612e-05, "loss": 0.9717, "step": 2048 }, { "epoch": 0.14, "learning_rate": 1.9376717384327556e-05, "loss": 0.8867, "step": 2049 }, { "epoch": 0.14, "learning_rate": 1.9375950084089283e-05, "loss": 0.9482, "step": 2050 }, { "epoch": 0.14, "learning_rate": 1.937518232705518e-05, "loss": 0.8691, "step": 2051 }, { "epoch": 0.14, "learning_rate": 1.9374414113262654e-05, "loss": 0.9766, "step": 2052 }, { "epoch": 0.14, "learning_rate": 1.9373645442749126e-05, "loss": 0.8916, "step": 2053 }, { "epoch": 0.14, "learning_rate": 1.937287631555205e-05, "loss": 0.832, "step": 2054 }, { "epoch": 0.14, "learning_rate": 1.9372106731708897e-05, "loss": 0.8252, "step": 2055 }, { "epoch": 0.14, "learning_rate": 1.9371336691257165e-05, "loss": 0.9307, "step": 2056 }, { "epoch": 0.14, "learning_rate": 1.9370566194234363e-05, "loss": 0.8125, "step": 2057 }, { "epoch": 0.14, "learning_rate": 1.936979524067803e-05, "loss": 0.8701, "step": 2058 }, { "epoch": 0.14, "learning_rate": 1.9369023830625736e-05, "loss": 0.8125, "step": 2059 }, { "epoch": 0.14, "learning_rate": 1.9368251964115054e-05, "loss": 0.8936, "step": 2060 }, { "epoch": 0.14, "learning_rate": 1.936747964118359e-05, "loss": 0.9375, "step": 2061 }, { "epoch": 0.14, "learning_rate": 1.936670686186898e-05, "loss": 0.8857, "step": 2062 }, { "epoch": 0.14, "learning_rate": 1.9365933626208867e-05, "loss": 0.9219, "step": 2063 }, { "epoch": 0.14, "learning_rate": 1.9365159934240925e-05, "loss": 0.8652, "step": 2064 }, { "epoch": 0.14, "learning_rate": 1.9364385786002847e-05, "loss": 0.8506, "step": 2065 }, { "epoch": 0.14, "learning_rate": 1.9363611181532353e-05, "loss": 0.8408, "step": 2066 }, { "epoch": 0.14, "learning_rate": 1.9362836120867175e-05, "loss": 0.9316, "step": 2067 }, { "epoch": 0.14, "learning_rate": 1.936206060404508e-05, "loss": 0.7959, "step": 2068 }, { "epoch": 0.14, "learning_rate": 1.9361284631103846e-05, "loss": 0.9131, "step": 2069 }, { "epoch": 0.14, "learning_rate": 1.9360508202081286e-05, "loss": 0.9521, "step": 2070 }, { "epoch": 0.14, "learning_rate": 1.935973131701522e-05, "loss": 0.877, "step": 2071 }, { "epoch": 0.14, "learning_rate": 1.9358953975943498e-05, "loss": 0.959, "step": 2072 }, { "epoch": 0.14, "learning_rate": 1.9358176178904e-05, "loss": 0.9609, "step": 2073 }, { "epoch": 0.14, "learning_rate": 1.9357397925934612e-05, "loss": 0.875, "step": 2074 }, { "epoch": 0.14, "learning_rate": 1.9356619217073252e-05, "loss": 0.8428, "step": 2075 }, { "epoch": 0.14, "learning_rate": 1.9355840052357862e-05, "loss": 0.8291, "step": 2076 }, { "epoch": 0.14, "learning_rate": 1.9355060431826403e-05, "loss": 0.8223, "step": 2077 }, { "epoch": 0.14, "learning_rate": 1.9354280355516852e-05, "loss": 0.8184, "step": 2078 }, { "epoch": 0.14, "learning_rate": 1.935349982346722e-05, "loss": 0.9209, "step": 2079 }, { "epoch": 0.14, "learning_rate": 1.9352718835715535e-05, "loss": 0.8457, "step": 2080 }, { "epoch": 0.14, "learning_rate": 1.935193739229984e-05, "loss": 0.9062, "step": 2081 }, { "epoch": 0.14, "learning_rate": 1.9351155493258214e-05, "loss": 0.8398, "step": 2082 }, { "epoch": 0.14, "learning_rate": 1.935037313862875e-05, "loss": 0.915, "step": 2083 }, { "epoch": 0.14, "learning_rate": 1.934959032844956e-05, "loss": 0.8057, "step": 2084 }, { "epoch": 0.14, "learning_rate": 1.9348807062758785e-05, "loss": 0.9512, "step": 2085 }, { "epoch": 0.14, "learning_rate": 1.9348023341594586e-05, "loss": 0.8135, "step": 2086 }, { "epoch": 0.14, "learning_rate": 1.9347239164995147e-05, "loss": 0.9375, "step": 2087 }, { "epoch": 0.14, "learning_rate": 1.934645453299867e-05, "loss": 0.9678, "step": 2088 }, { "epoch": 0.14, "learning_rate": 1.9345669445643385e-05, "loss": 0.9541, "step": 2089 }, { "epoch": 0.14, "learning_rate": 1.9344883902967542e-05, "loss": 0.8779, "step": 2090 }, { "epoch": 0.14, "learning_rate": 1.934409790500941e-05, "loss": 0.9043, "step": 2091 }, { "epoch": 0.14, "learning_rate": 1.934331145180728e-05, "loss": 0.9199, "step": 2092 }, { "epoch": 0.14, "learning_rate": 1.9342524543399475e-05, "loss": 0.9033, "step": 2093 }, { "epoch": 0.14, "learning_rate": 1.9341737179824332e-05, "loss": 0.9404, "step": 2094 }, { "epoch": 0.14, "learning_rate": 1.9340949361120205e-05, "loss": 0.9033, "step": 2095 }, { "epoch": 0.14, "learning_rate": 1.9340161087325483e-05, "loss": 0.9619, "step": 2096 }, { "epoch": 0.14, "learning_rate": 1.9339372358478567e-05, "loss": 0.8867, "step": 2097 }, { "epoch": 0.14, "learning_rate": 1.9338583174617883e-05, "loss": 0.916, "step": 2098 }, { "epoch": 0.14, "learning_rate": 1.9337793535781886e-05, "loss": 0.9092, "step": 2099 }, { "epoch": 0.14, "learning_rate": 1.9337003442009042e-05, "loss": 0.7959, "step": 2100 }, { "epoch": 0.14, "learning_rate": 1.9336212893337846e-05, "loss": 0.9277, "step": 2101 }, { "epoch": 0.14, "learning_rate": 1.9335421889806812e-05, "loss": 0.8467, "step": 2102 }, { "epoch": 0.14, "learning_rate": 1.9334630431454482e-05, "loss": 0.8965, "step": 2103 }, { "epoch": 0.14, "learning_rate": 1.933383851831941e-05, "loss": 0.9521, "step": 2104 }, { "epoch": 0.14, "learning_rate": 1.9333046150440182e-05, "loss": 0.877, "step": 2105 }, { "epoch": 0.14, "learning_rate": 1.9332253327855398e-05, "loss": 0.835, "step": 2106 }, { "epoch": 0.14, "learning_rate": 1.933146005060369e-05, "loss": 0.875, "step": 2107 }, { "epoch": 0.14, "learning_rate": 1.93306663187237e-05, "loss": 0.9199, "step": 2108 }, { "epoch": 0.14, "learning_rate": 1.9329872132254108e-05, "loss": 0.9326, "step": 2109 }, { "epoch": 0.14, "learning_rate": 1.9329077491233595e-05, "loss": 0.9072, "step": 2110 }, { "epoch": 0.14, "learning_rate": 1.932828239570088e-05, "loss": 0.917, "step": 2111 }, { "epoch": 0.14, "learning_rate": 1.932748684569471e-05, "loss": 0.8584, "step": 2112 }, { "epoch": 0.14, "learning_rate": 1.9326690841253826e-05, "loss": 0.8867, "step": 2113 }, { "epoch": 0.14, "learning_rate": 1.9325894382417027e-05, "loss": 0.8799, "step": 2114 }, { "epoch": 0.14, "learning_rate": 1.9325097469223104e-05, "loss": 0.835, "step": 2115 }, { "epoch": 0.14, "learning_rate": 1.9324300101710887e-05, "loss": 0.9229, "step": 2116 }, { "epoch": 0.14, "learning_rate": 1.9323502279919223e-05, "loss": 0.9111, "step": 2117 }, { "epoch": 0.14, "learning_rate": 1.9322704003886988e-05, "loss": 0.8672, "step": 2118 }, { "epoch": 0.14, "learning_rate": 1.9321905273653065e-05, "loss": 0.8438, "step": 2119 }, { "epoch": 0.14, "learning_rate": 1.9321106089256368e-05, "loss": 0.9326, "step": 2120 }, { "epoch": 0.14, "learning_rate": 1.9320306450735845e-05, "loss": 0.9199, "step": 2121 }, { "epoch": 0.14, "learning_rate": 1.9319506358130443e-05, "loss": 0.9189, "step": 2122 }, { "epoch": 0.14, "learning_rate": 1.9318705811479145e-05, "loss": 0.9189, "step": 2123 }, { "epoch": 0.14, "learning_rate": 1.931790481082095e-05, "loss": 0.9893, "step": 2124 }, { "epoch": 0.14, "learning_rate": 1.931710335619489e-05, "loss": 0.9355, "step": 2125 }, { "epoch": 0.14, "learning_rate": 1.9316301447640012e-05, "loss": 0.7969, "step": 2126 }, { "epoch": 0.14, "learning_rate": 1.931549908519538e-05, "loss": 0.8027, "step": 2127 }, { "epoch": 0.15, "learning_rate": 1.9314696268900085e-05, "loss": 0.8809, "step": 2128 }, { "epoch": 0.15, "learning_rate": 1.9313892998793245e-05, "loss": 0.918, "step": 2129 }, { "epoch": 0.15, "learning_rate": 1.931308927491399e-05, "loss": 0.9336, "step": 2130 }, { "epoch": 0.15, "learning_rate": 1.931228509730148e-05, "loss": 0.9355, "step": 2131 }, { "epoch": 0.15, "learning_rate": 1.9311480465994896e-05, "loss": 0.8818, "step": 2132 }, { "epoch": 0.15, "learning_rate": 1.9310675381033434e-05, "loss": 0.9326, "step": 2133 }, { "epoch": 0.15, "learning_rate": 1.9309869842456325e-05, "loss": 0.9062, "step": 2134 }, { "epoch": 0.15, "learning_rate": 1.930906385030281e-05, "loss": 0.8857, "step": 2135 }, { "epoch": 0.15, "learning_rate": 1.930825740461216e-05, "loss": 0.8799, "step": 2136 }, { "epoch": 0.15, "learning_rate": 1.930745050542366e-05, "loss": 0.7979, "step": 2137 }, { "epoch": 0.15, "learning_rate": 1.930664315277663e-05, "loss": 0.9893, "step": 2138 }, { "epoch": 0.15, "learning_rate": 1.9305835346710396e-05, "loss": 0.9219, "step": 2139 }, { "epoch": 0.15, "learning_rate": 1.9305027087264315e-05, "loss": 0.8975, "step": 2140 }, { "epoch": 0.15, "learning_rate": 1.9304218374477772e-05, "loss": 0.9307, "step": 2141 }, { "epoch": 0.15, "learning_rate": 1.9303409208390163e-05, "loss": 0.877, "step": 2142 }, { "epoch": 0.15, "learning_rate": 1.930259958904091e-05, "loss": 0.9512, "step": 2143 }, { "epoch": 0.15, "learning_rate": 1.930178951646946e-05, "loss": 0.9434, "step": 2144 }, { "epoch": 0.15, "learning_rate": 1.930097899071528e-05, "loss": 0.8525, "step": 2145 }, { "epoch": 0.15, "learning_rate": 1.9300168011817852e-05, "loss": 0.8672, "step": 2146 }, { "epoch": 0.15, "learning_rate": 1.9299356579816695e-05, "loss": 0.8564, "step": 2147 }, { "epoch": 0.15, "learning_rate": 1.9298544694751337e-05, "loss": 0.8389, "step": 2148 }, { "epoch": 0.15, "learning_rate": 1.929773235666134e-05, "loss": 0.8926, "step": 2149 }, { "epoch": 0.15, "learning_rate": 1.929691956558627e-05, "loss": 0.7744, "step": 2150 }, { "epoch": 0.15, "learning_rate": 1.9296106321565738e-05, "loss": 0.8408, "step": 2151 }, { "epoch": 0.15, "learning_rate": 1.9295292624639354e-05, "loss": 0.8672, "step": 2152 }, { "epoch": 0.15, "learning_rate": 1.9294478474846768e-05, "loss": 0.8613, "step": 2153 }, { "epoch": 0.15, "learning_rate": 1.9293663872227648e-05, "loss": 0.9033, "step": 2154 }, { "epoch": 0.15, "learning_rate": 1.9292848816821675e-05, "loss": 0.8965, "step": 2155 }, { "epoch": 0.15, "learning_rate": 1.9292033308668555e-05, "loss": 0.8672, "step": 2156 }, { "epoch": 0.15, "learning_rate": 1.9291217347808034e-05, "loss": 0.9512, "step": 2157 }, { "epoch": 0.15, "learning_rate": 1.9290400934279852e-05, "loss": 0.8877, "step": 2158 }, { "epoch": 0.15, "learning_rate": 1.9289584068123792e-05, "loss": 0.9385, "step": 2159 }, { "epoch": 0.15, "learning_rate": 1.9288766749379645e-05, "loss": 0.8184, "step": 2160 }, { "epoch": 0.15, "learning_rate": 1.928794897808724e-05, "loss": 0.9131, "step": 2161 }, { "epoch": 0.15, "learning_rate": 1.9287130754286413e-05, "loss": 0.9697, "step": 2162 }, { "epoch": 0.15, "learning_rate": 1.9286312078017028e-05, "loss": 0.8652, "step": 2163 }, { "epoch": 0.15, "learning_rate": 1.928549294931897e-05, "loss": 0.8955, "step": 2164 }, { "epoch": 0.15, "learning_rate": 1.928467336823215e-05, "loss": 0.8828, "step": 2165 }, { "epoch": 0.15, "learning_rate": 1.9283853334796493e-05, "loss": 0.8838, "step": 2166 }, { "epoch": 0.15, "learning_rate": 1.9283032849051958e-05, "loss": 0.8574, "step": 2167 }, { "epoch": 0.15, "learning_rate": 1.9282211911038514e-05, "loss": 0.8643, "step": 2168 }, { "epoch": 0.15, "learning_rate": 1.928139052079616e-05, "loss": 0.8145, "step": 2169 }, { "epoch": 0.15, "learning_rate": 1.928056867836491e-05, "loss": 0.8926, "step": 2170 }, { "epoch": 0.15, "learning_rate": 1.9279746383784804e-05, "loss": 0.7871, "step": 2171 }, { "epoch": 0.15, "learning_rate": 1.927892363709591e-05, "loss": 0.833, "step": 2172 }, { "epoch": 0.15, "learning_rate": 1.927810043833831e-05, "loss": 0.9023, "step": 2173 }, { "epoch": 0.15, "learning_rate": 1.927727678755211e-05, "loss": 0.9521, "step": 2174 }, { "epoch": 0.15, "learning_rate": 1.9276452684777433e-05, "loss": 0.8818, "step": 2175 }, { "epoch": 0.15, "learning_rate": 1.9275628130054437e-05, "loss": 0.8984, "step": 2176 }, { "epoch": 0.15, "learning_rate": 1.927480312342329e-05, "loss": 0.9062, "step": 2177 }, { "epoch": 0.15, "learning_rate": 1.9273977664924187e-05, "loss": 0.874, "step": 2178 }, { "epoch": 0.15, "learning_rate": 1.9273151754597343e-05, "loss": 0.834, "step": 2179 }, { "epoch": 0.15, "learning_rate": 1.9272325392483e-05, "loss": 0.8311, "step": 2180 }, { "epoch": 0.15, "learning_rate": 1.9271498578621414e-05, "loss": 0.8145, "step": 2181 }, { "epoch": 0.15, "learning_rate": 1.927067131305287e-05, "loss": 0.8809, "step": 2182 }, { "epoch": 0.15, "learning_rate": 1.9269843595817674e-05, "loss": 0.9033, "step": 2183 }, { "epoch": 0.15, "learning_rate": 1.9269015426956148e-05, "loss": 0.8926, "step": 2184 }, { "epoch": 0.15, "learning_rate": 1.9268186806508643e-05, "loss": 0.8662, "step": 2185 }, { "epoch": 0.15, "learning_rate": 1.9267357734515527e-05, "loss": 0.8936, "step": 2186 }, { "epoch": 0.15, "learning_rate": 1.9266528211017197e-05, "loss": 0.8535, "step": 2187 }, { "epoch": 0.15, "learning_rate": 1.926569823605406e-05, "loss": 0.9316, "step": 2188 }, { "epoch": 0.15, "learning_rate": 1.9264867809666562e-05, "loss": 0.8936, "step": 2189 }, { "epoch": 0.15, "learning_rate": 1.9264036931895155e-05, "loss": 0.9395, "step": 2190 }, { "epoch": 0.15, "learning_rate": 1.926320560278032e-05, "loss": 0.9053, "step": 2191 }, { "epoch": 0.15, "learning_rate": 1.9262373822362557e-05, "loss": 0.9023, "step": 2192 }, { "epoch": 0.15, "learning_rate": 1.9261541590682394e-05, "loss": 0.9336, "step": 2193 }, { "epoch": 0.15, "learning_rate": 1.926070890778038e-05, "loss": 0.8682, "step": 2194 }, { "epoch": 0.15, "learning_rate": 1.925987577369708e-05, "loss": 0.8779, "step": 2195 }, { "epoch": 0.15, "learning_rate": 1.925904218847308e-05, "loss": 0.9014, "step": 2196 }, { "epoch": 0.15, "learning_rate": 1.9258208152148994e-05, "loss": 0.8604, "step": 2197 }, { "epoch": 0.15, "learning_rate": 1.9257373664765463e-05, "loss": 0.9727, "step": 2198 }, { "epoch": 0.15, "learning_rate": 1.9256538726363138e-05, "loss": 0.8301, "step": 2199 }, { "epoch": 0.15, "learning_rate": 1.9255703336982698e-05, "loss": 0.915, "step": 2200 }, { "epoch": 0.15, "learning_rate": 1.925486749666484e-05, "loss": 0.9297, "step": 2201 }, { "epoch": 0.15, "learning_rate": 1.925403120545029e-05, "loss": 0.7773, "step": 2202 }, { "epoch": 0.15, "learning_rate": 1.9253194463379793e-05, "loss": 0.9043, "step": 2203 }, { "epoch": 0.15, "learning_rate": 1.9252357270494108e-05, "loss": 0.8398, "step": 2204 }, { "epoch": 0.15, "learning_rate": 1.9251519626834033e-05, "loss": 0.9043, "step": 2205 }, { "epoch": 0.15, "learning_rate": 1.925068153244037e-05, "loss": 0.8037, "step": 2206 }, { "epoch": 0.15, "learning_rate": 1.9249842987353958e-05, "loss": 0.8994, "step": 2207 }, { "epoch": 0.15, "learning_rate": 1.9249003991615643e-05, "loss": 0.8594, "step": 2208 }, { "epoch": 0.15, "learning_rate": 1.9248164545266307e-05, "loss": 0.8906, "step": 2209 }, { "epoch": 0.15, "learning_rate": 1.9247324648346845e-05, "loss": 0.8535, "step": 2210 }, { "epoch": 0.15, "learning_rate": 1.924648430089817e-05, "loss": 0.8359, "step": 2211 }, { "epoch": 0.15, "learning_rate": 1.924564350296124e-05, "loss": 0.9258, "step": 2212 }, { "epoch": 0.15, "learning_rate": 1.9244802254577007e-05, "loss": 0.8418, "step": 2213 }, { "epoch": 0.15, "learning_rate": 1.9243960555786457e-05, "loss": 0.9521, "step": 2214 }, { "epoch": 0.15, "learning_rate": 1.9243118406630602e-05, "loss": 0.873, "step": 2215 }, { "epoch": 0.15, "learning_rate": 1.9242275807150464e-05, "loss": 0.8965, "step": 2216 }, { "epoch": 0.15, "learning_rate": 1.9241432757387106e-05, "loss": 0.9043, "step": 2217 }, { "epoch": 0.15, "learning_rate": 1.9240589257381593e-05, "loss": 0.9404, "step": 2218 }, { "epoch": 0.15, "learning_rate": 1.923974530717502e-05, "loss": 0.8828, "step": 2219 }, { "epoch": 0.15, "learning_rate": 1.9238900906808506e-05, "loss": 0.8916, "step": 2220 }, { "epoch": 0.15, "learning_rate": 1.9238056056323193e-05, "loss": 0.8447, "step": 2221 }, { "epoch": 0.15, "learning_rate": 1.9237210755760234e-05, "loss": 0.8594, "step": 2222 }, { "epoch": 0.15, "learning_rate": 1.923636500516082e-05, "loss": 0.8477, "step": 2223 }, { "epoch": 0.15, "learning_rate": 1.923551880456616e-05, "loss": 0.873, "step": 2224 }, { "epoch": 0.15, "learning_rate": 1.9234672154017465e-05, "loss": 0.9414, "step": 2225 }, { "epoch": 0.15, "learning_rate": 1.9233825053556e-05, "loss": 0.9092, "step": 2226 }, { "epoch": 0.15, "learning_rate": 1.9232977503223024e-05, "loss": 0.8604, "step": 2227 }, { "epoch": 0.15, "learning_rate": 1.9232129503059834e-05, "loss": 0.9658, "step": 2228 }, { "epoch": 0.15, "learning_rate": 1.9231281053107747e-05, "loss": 0.8516, "step": 2229 }, { "epoch": 0.15, "learning_rate": 1.9230432153408098e-05, "loss": 0.8555, "step": 2230 }, { "epoch": 0.15, "learning_rate": 1.9229582804002244e-05, "loss": 0.874, "step": 2231 }, { "epoch": 0.15, "learning_rate": 1.9228733004931566e-05, "loss": 0.8955, "step": 2232 }, { "epoch": 0.15, "learning_rate": 1.9227882756237463e-05, "loss": 0.8125, "step": 2233 }, { "epoch": 0.15, "learning_rate": 1.9227032057961365e-05, "loss": 0.9297, "step": 2234 }, { "epoch": 0.15, "learning_rate": 1.9226180910144716e-05, "loss": 0.877, "step": 2235 }, { "epoch": 0.15, "learning_rate": 1.9225329312828983e-05, "loss": 0.8438, "step": 2236 }, { "epoch": 0.15, "learning_rate": 1.9224477266055653e-05, "loss": 0.8105, "step": 2237 }, { "epoch": 0.15, "learning_rate": 1.9223624769866242e-05, "loss": 0.8809, "step": 2238 }, { "epoch": 0.15, "learning_rate": 1.9222771824302282e-05, "loss": 0.8643, "step": 2239 }, { "epoch": 0.15, "learning_rate": 1.9221918429405327e-05, "loss": 0.9209, "step": 2240 }, { "epoch": 0.15, "learning_rate": 1.9221064585216957e-05, "loss": 0.8926, "step": 2241 }, { "epoch": 0.15, "learning_rate": 1.922021029177877e-05, "loss": 0.9365, "step": 2242 }, { "epoch": 0.15, "learning_rate": 1.921935554913239e-05, "loss": 0.8721, "step": 2243 }, { "epoch": 0.15, "learning_rate": 1.9218500357319455e-05, "loss": 0.8652, "step": 2244 }, { "epoch": 0.15, "learning_rate": 1.9217644716381633e-05, "loss": 0.8242, "step": 2245 }, { "epoch": 0.15, "learning_rate": 1.9216788626360606e-05, "loss": 0.9316, "step": 2246 }, { "epoch": 0.15, "learning_rate": 1.9215932087298093e-05, "loss": 0.877, "step": 2247 }, { "epoch": 0.15, "learning_rate": 1.9215075099235815e-05, "loss": 0.9258, "step": 2248 }, { "epoch": 0.15, "learning_rate": 1.9214217662215525e-05, "loss": 0.8047, "step": 2249 }, { "epoch": 0.15, "learning_rate": 1.9213359776279e-05, "loss": 0.8896, "step": 2250 }, { "epoch": 0.15, "learning_rate": 1.921250144146804e-05, "loss": 0.9004, "step": 2251 }, { "epoch": 0.15, "learning_rate": 1.9211642657824458e-05, "loss": 0.8994, "step": 2252 }, { "epoch": 0.15, "learning_rate": 1.9210783425390093e-05, "loss": 0.9551, "step": 2253 }, { "epoch": 0.15, "learning_rate": 1.920992374420681e-05, "loss": 0.8838, "step": 2254 }, { "epoch": 0.15, "learning_rate": 1.9209063614316494e-05, "loss": 0.9141, "step": 2255 }, { "epoch": 0.15, "learning_rate": 1.920820303576104e-05, "loss": 0.917, "step": 2256 }, { "epoch": 0.15, "learning_rate": 1.9207342008582392e-05, "loss": 0.958, "step": 2257 }, { "epoch": 0.15, "learning_rate": 1.9206480532822486e-05, "loss": 0.9043, "step": 2258 }, { "epoch": 0.15, "learning_rate": 1.9205618608523296e-05, "loss": 0.9531, "step": 2259 }, { "epoch": 0.15, "learning_rate": 1.920475623572682e-05, "loss": 0.8604, "step": 2260 }, { "epoch": 0.15, "learning_rate": 1.9203893414475066e-05, "loss": 0.8994, "step": 2261 }, { "epoch": 0.15, "learning_rate": 1.920303014481007e-05, "loss": 0.9121, "step": 2262 }, { "epoch": 0.15, "learning_rate": 1.9202166426773902e-05, "loss": 0.9346, "step": 2263 }, { "epoch": 0.15, "learning_rate": 1.9201302260408632e-05, "loss": 0.832, "step": 2264 }, { "epoch": 0.15, "learning_rate": 1.9200437645756365e-05, "loss": 0.9131, "step": 2265 }, { "epoch": 0.15, "learning_rate": 1.9199572582859222e-05, "loss": 0.8613, "step": 2266 }, { "epoch": 0.15, "learning_rate": 1.9198707071759353e-05, "loss": 0.8779, "step": 2267 }, { "epoch": 0.15, "learning_rate": 1.9197841112498925e-05, "loss": 0.9072, "step": 2268 }, { "epoch": 0.15, "learning_rate": 1.9196974705120124e-05, "loss": 0.9424, "step": 2269 }, { "epoch": 0.15, "learning_rate": 1.9196107849665166e-05, "loss": 0.8154, "step": 2270 }, { "epoch": 0.15, "learning_rate": 1.9195240546176285e-05, "loss": 0.8877, "step": 2271 }, { "epoch": 0.15, "learning_rate": 1.9194372794695727e-05, "loss": 0.8701, "step": 2272 }, { "epoch": 0.15, "learning_rate": 1.9193504595265776e-05, "loss": 0.9258, "step": 2273 }, { "epoch": 0.15, "learning_rate": 1.9192635947928733e-05, "loss": 0.8721, "step": 2274 }, { "epoch": 0.16, "learning_rate": 1.919176685272691e-05, "loss": 0.7754, "step": 2275 }, { "epoch": 0.16, "learning_rate": 1.9190897309702657e-05, "loss": 0.9062, "step": 2276 }, { "epoch": 0.16, "learning_rate": 1.9190027318898338e-05, "loss": 0.8828, "step": 2277 }, { "epoch": 0.16, "learning_rate": 1.9189156880356334e-05, "loss": 0.9004, "step": 2278 }, { "epoch": 0.16, "learning_rate": 1.9188285994119053e-05, "loss": 0.9463, "step": 2279 }, { "epoch": 0.16, "learning_rate": 1.9187414660228928e-05, "loss": 0.8584, "step": 2280 }, { "epoch": 0.16, "learning_rate": 1.9186542878728407e-05, "loss": 0.8447, "step": 2281 }, { "epoch": 0.16, "learning_rate": 1.9185670649659965e-05, "loss": 0.8555, "step": 2282 }, { "epoch": 0.16, "learning_rate": 1.91847979730661e-05, "loss": 0.9141, "step": 2283 }, { "epoch": 0.16, "learning_rate": 1.9183924848989326e-05, "loss": 0.8838, "step": 2284 }, { "epoch": 0.16, "learning_rate": 1.9183051277472176e-05, "loss": 0.7646, "step": 2285 }, { "epoch": 0.16, "learning_rate": 1.918217725855722e-05, "loss": 0.8711, "step": 2286 }, { "epoch": 0.16, "learning_rate": 1.9181302792287037e-05, "loss": 0.9053, "step": 2287 }, { "epoch": 0.16, "learning_rate": 1.9180427878704225e-05, "loss": 0.8818, "step": 2288 }, { "epoch": 0.16, "learning_rate": 1.9179552517851418e-05, "loss": 0.833, "step": 2289 }, { "epoch": 0.16, "learning_rate": 1.917867670977126e-05, "loss": 0.8721, "step": 2290 }, { "epoch": 0.16, "learning_rate": 1.9177800454506415e-05, "loss": 0.9209, "step": 2291 }, { "epoch": 0.16, "learning_rate": 1.9176923752099584e-05, "loss": 0.8818, "step": 2292 }, { "epoch": 0.16, "learning_rate": 1.9176046602593475e-05, "loss": 0.9727, "step": 2293 }, { "epoch": 0.16, "learning_rate": 1.9175169006030825e-05, "loss": 0.7422, "step": 2294 }, { "epoch": 0.16, "learning_rate": 1.9174290962454386e-05, "loss": 0.9102, "step": 2295 }, { "epoch": 0.16, "learning_rate": 1.917341247190694e-05, "loss": 0.8857, "step": 2296 }, { "epoch": 0.16, "learning_rate": 1.9172533534431284e-05, "loss": 0.9385, "step": 2297 }, { "epoch": 0.16, "learning_rate": 1.9171654150070242e-05, "loss": 0.9541, "step": 2298 }, { "epoch": 0.16, "learning_rate": 1.9170774318866656e-05, "loss": 0.9014, "step": 2299 }, { "epoch": 0.16, "learning_rate": 1.916989404086339e-05, "loss": 0.8896, "step": 2300 }, { "epoch": 0.16, "learning_rate": 1.9169013316103342e-05, "loss": 0.9248, "step": 2301 }, { "epoch": 0.16, "learning_rate": 1.9168132144629407e-05, "loss": 0.8467, "step": 2302 }, { "epoch": 0.16, "learning_rate": 1.916725052648452e-05, "loss": 0.8428, "step": 2303 }, { "epoch": 0.16, "learning_rate": 1.9166368461711638e-05, "loss": 0.7812, "step": 2304 }, { "epoch": 0.16, "learning_rate": 1.916548595035373e-05, "loss": 0.9219, "step": 2305 }, { "epoch": 0.16, "learning_rate": 1.916460299245379e-05, "loss": 0.875, "step": 2306 }, { "epoch": 0.16, "learning_rate": 1.9163719588054842e-05, "loss": 0.877, "step": 2307 }, { "epoch": 0.16, "learning_rate": 1.9162835737199924e-05, "loss": 0.9746, "step": 2308 }, { "epoch": 0.16, "learning_rate": 1.9161951439932097e-05, "loss": 0.8301, "step": 2309 }, { "epoch": 0.16, "learning_rate": 1.9161066696294438e-05, "loss": 0.873, "step": 2310 }, { "epoch": 0.16, "learning_rate": 1.916018150633006e-05, "loss": 0.8643, "step": 2311 }, { "epoch": 0.16, "learning_rate": 1.9159295870082084e-05, "loss": 0.8301, "step": 2312 }, { "epoch": 0.16, "learning_rate": 1.9158409787593658e-05, "loss": 0.8486, "step": 2313 }, { "epoch": 0.16, "learning_rate": 1.9157523258907957e-05, "loss": 0.8643, "step": 2314 }, { "epoch": 0.16, "learning_rate": 1.915663628406817e-05, "loss": 0.8545, "step": 2315 }, { "epoch": 0.16, "learning_rate": 1.9155748863117508e-05, "loss": 0.7988, "step": 2316 }, { "epoch": 0.16, "learning_rate": 1.9154860996099205e-05, "loss": 0.8662, "step": 2317 }, { "epoch": 0.16, "learning_rate": 1.9153972683056527e-05, "loss": 0.8486, "step": 2318 }, { "epoch": 0.16, "learning_rate": 1.915308392403274e-05, "loss": 0.9004, "step": 2319 }, { "epoch": 0.16, "learning_rate": 1.9152194719071154e-05, "loss": 0.8623, "step": 2320 }, { "epoch": 0.16, "learning_rate": 1.9151305068215085e-05, "loss": 0.9404, "step": 2321 }, { "epoch": 0.16, "learning_rate": 1.915041497150788e-05, "loss": 0.8965, "step": 2322 }, { "epoch": 0.16, "learning_rate": 1.9149524428992907e-05, "loss": 0.8418, "step": 2323 }, { "epoch": 0.16, "learning_rate": 1.9148633440713548e-05, "loss": 0.749, "step": 2324 }, { "epoch": 0.16, "learning_rate": 1.9147742006713215e-05, "loss": 0.873, "step": 2325 }, { "epoch": 0.16, "learning_rate": 1.9146850127035336e-05, "loss": 0.8125, "step": 2326 }, { "epoch": 0.16, "learning_rate": 1.9145957801723364e-05, "loss": 0.8809, "step": 2327 }, { "epoch": 0.16, "learning_rate": 1.9145065030820776e-05, "loss": 0.9043, "step": 2328 }, { "epoch": 0.16, "learning_rate": 1.9144171814371065e-05, "loss": 0.9385, "step": 2329 }, { "epoch": 0.16, "learning_rate": 1.914327815241775e-05, "loss": 0.9414, "step": 2330 }, { "epoch": 0.16, "learning_rate": 1.914238404500437e-05, "loss": 0.9258, "step": 2331 }, { "epoch": 0.16, "learning_rate": 1.9141489492174484e-05, "loss": 0.8525, "step": 2332 }, { "epoch": 0.16, "learning_rate": 1.9140594493971676e-05, "loss": 0.9941, "step": 2333 }, { "epoch": 0.16, "learning_rate": 1.9139699050439548e-05, "loss": 0.958, "step": 2334 }, { "epoch": 0.16, "learning_rate": 1.9138803161621732e-05, "loss": 0.9424, "step": 2335 }, { "epoch": 0.16, "learning_rate": 1.9137906827561867e-05, "loss": 0.8916, "step": 2336 }, { "epoch": 0.16, "learning_rate": 1.913701004830363e-05, "loss": 0.9141, "step": 2337 }, { "epoch": 0.16, "learning_rate": 1.913611282389071e-05, "loss": 0.8672, "step": 2338 }, { "epoch": 0.16, "learning_rate": 1.9135215154366812e-05, "loss": 0.8232, "step": 2339 }, { "epoch": 0.16, "learning_rate": 1.9134317039775685e-05, "loss": 0.9453, "step": 2340 }, { "epoch": 0.16, "learning_rate": 1.913341848016107e-05, "loss": 0.8789, "step": 2341 }, { "epoch": 0.16, "learning_rate": 1.913251947556676e-05, "loss": 0.8721, "step": 2342 }, { "epoch": 0.16, "learning_rate": 1.9131620026036542e-05, "loss": 0.8066, "step": 2343 }, { "epoch": 0.16, "learning_rate": 1.9130720131614244e-05, "loss": 0.8711, "step": 2344 }, { "epoch": 0.16, "learning_rate": 1.9129819792343706e-05, "loss": 0.8584, "step": 2345 }, { "epoch": 0.16, "learning_rate": 1.912891900826879e-05, "loss": 0.8789, "step": 2346 }, { "epoch": 0.16, "learning_rate": 1.9128017779433386e-05, "loss": 0.7959, "step": 2347 }, { "epoch": 0.16, "learning_rate": 1.9127116105881404e-05, "loss": 0.8076, "step": 2348 }, { "epoch": 0.16, "learning_rate": 1.9126213987656766e-05, "loss": 0.9141, "step": 2349 }, { "epoch": 0.16, "learning_rate": 1.9125311424803433e-05, "loss": 0.874, "step": 2350 }, { "epoch": 0.16, "learning_rate": 1.912440841736537e-05, "loss": 0.8838, "step": 2351 }, { "epoch": 0.16, "learning_rate": 1.912350496538657e-05, "loss": 0.8877, "step": 2352 }, { "epoch": 0.16, "learning_rate": 1.9122601068911058e-05, "loss": 0.8613, "step": 2353 }, { "epoch": 0.16, "learning_rate": 1.9121696727982866e-05, "loss": 0.8467, "step": 2354 }, { "epoch": 0.16, "learning_rate": 1.9120791942646054e-05, "loss": 0.9219, "step": 2355 }, { "epoch": 0.16, "learning_rate": 1.91198867129447e-05, "loss": 0.9004, "step": 2356 }, { "epoch": 0.16, "learning_rate": 1.911898103892291e-05, "loss": 0.8965, "step": 2357 }, { "epoch": 0.16, "learning_rate": 1.9118074920624818e-05, "loss": 0.7939, "step": 2358 }, { "epoch": 0.16, "learning_rate": 1.9117168358094552e-05, "loss": 0.9082, "step": 2359 }, { "epoch": 0.16, "learning_rate": 1.911626135137629e-05, "loss": 0.916, "step": 2360 }, { "epoch": 0.16, "learning_rate": 1.9115353900514216e-05, "loss": 0.9473, "step": 2361 }, { "epoch": 0.16, "learning_rate": 1.911444600555255e-05, "loss": 0.9385, "step": 2362 }, { "epoch": 0.16, "learning_rate": 1.911353766653552e-05, "loss": 0.8887, "step": 2363 }, { "epoch": 0.16, "learning_rate": 1.9112628883507372e-05, "loss": 0.9219, "step": 2364 }, { "epoch": 0.16, "learning_rate": 1.9111719656512395e-05, "loss": 0.8701, "step": 2365 }, { "epoch": 0.16, "learning_rate": 1.9110809985594877e-05, "loss": 0.8838, "step": 2366 }, { "epoch": 0.16, "learning_rate": 1.9109899870799145e-05, "loss": 0.8281, "step": 2367 }, { "epoch": 0.16, "learning_rate": 1.9108989312169533e-05, "loss": 0.9404, "step": 2368 }, { "epoch": 0.16, "learning_rate": 1.9108078309750405e-05, "loss": 0.8867, "step": 2369 }, { "epoch": 0.16, "learning_rate": 1.910716686358615e-05, "loss": 0.8389, "step": 2370 }, { "epoch": 0.16, "learning_rate": 1.910625497372117e-05, "loss": 0.9043, "step": 2371 }, { "epoch": 0.16, "learning_rate": 1.9105342640199885e-05, "loss": 0.9121, "step": 2372 }, { "epoch": 0.16, "learning_rate": 1.9104429863066755e-05, "loss": 0.9316, "step": 2373 }, { "epoch": 0.16, "learning_rate": 1.9103516642366248e-05, "loss": 0.874, "step": 2374 }, { "epoch": 0.16, "learning_rate": 1.910260297814285e-05, "loss": 0.8457, "step": 2375 }, { "epoch": 0.16, "learning_rate": 1.910168887044108e-05, "loss": 0.8906, "step": 2376 }, { "epoch": 0.16, "learning_rate": 1.9100774319305472e-05, "loss": 0.9199, "step": 2377 }, { "epoch": 0.16, "learning_rate": 1.909985932478058e-05, "loss": 0.876, "step": 2378 }, { "epoch": 0.16, "learning_rate": 1.9098943886910993e-05, "loss": 0.9033, "step": 2379 }, { "epoch": 0.16, "learning_rate": 1.9098028005741297e-05, "loss": 0.9551, "step": 2380 }, { "epoch": 0.16, "learning_rate": 1.9097111681316125e-05, "loss": 0.8955, "step": 2381 }, { "epoch": 0.16, "learning_rate": 1.9096194913680114e-05, "loss": 0.7998, "step": 2382 }, { "epoch": 0.16, "learning_rate": 1.909527770287793e-05, "loss": 0.8516, "step": 2383 }, { "epoch": 0.16, "learning_rate": 1.9094360048954258e-05, "loss": 0.8154, "step": 2384 }, { "epoch": 0.16, "learning_rate": 1.909344195195381e-05, "loss": 0.8799, "step": 2385 }, { "epoch": 0.16, "learning_rate": 1.909252341192131e-05, "loss": 0.8818, "step": 2386 }, { "epoch": 0.16, "learning_rate": 1.909160442890152e-05, "loss": 0.8496, "step": 2387 }, { "epoch": 0.16, "learning_rate": 1.90906850029392e-05, "loss": 0.9004, "step": 2388 }, { "epoch": 0.16, "learning_rate": 1.908976513407915e-05, "loss": 0.9111, "step": 2389 }, { "epoch": 0.16, "learning_rate": 1.908884482236619e-05, "loss": 0.8613, "step": 2390 }, { "epoch": 0.16, "learning_rate": 1.908792406784515e-05, "loss": 0.9434, "step": 2391 }, { "epoch": 0.16, "learning_rate": 1.9087002870560894e-05, "loss": 0.8594, "step": 2392 }, { "epoch": 0.16, "learning_rate": 1.9086081230558297e-05, "loss": 0.8818, "step": 2393 }, { "epoch": 0.16, "learning_rate": 1.9085159147882272e-05, "loss": 0.8701, "step": 2394 }, { "epoch": 0.16, "learning_rate": 1.9084236622577732e-05, "loss": 0.9248, "step": 2395 }, { "epoch": 0.16, "learning_rate": 1.9083313654689627e-05, "loss": 0.9014, "step": 2396 }, { "epoch": 0.16, "learning_rate": 1.9082390244262928e-05, "loss": 0.874, "step": 2397 }, { "epoch": 0.16, "learning_rate": 1.9081466391342615e-05, "loss": 0.8135, "step": 2398 }, { "epoch": 0.16, "learning_rate": 1.9080542095973705e-05, "loss": 0.8076, "step": 2399 }, { "epoch": 0.16, "learning_rate": 1.9079617358201227e-05, "loss": 0.9131, "step": 2400 }, { "epoch": 0.16, "learning_rate": 1.907869217807023e-05, "loss": 0.8848, "step": 2401 }, { "epoch": 0.16, "learning_rate": 1.9077766555625796e-05, "loss": 0.8896, "step": 2402 }, { "epoch": 0.16, "learning_rate": 1.9076840490913014e-05, "loss": 0.8262, "step": 2403 }, { "epoch": 0.16, "learning_rate": 1.9075913983977013e-05, "loss": 0.958, "step": 2404 }, { "epoch": 0.16, "learning_rate": 1.907498703486292e-05, "loss": 0.8594, "step": 2405 }, { "epoch": 0.16, "learning_rate": 1.9074059643615903e-05, "loss": 0.8271, "step": 2406 }, { "epoch": 0.16, "learning_rate": 1.9073131810281143e-05, "loss": 0.8926, "step": 2407 }, { "epoch": 0.16, "learning_rate": 1.9072203534903842e-05, "loss": 0.9287, "step": 2408 }, { "epoch": 0.16, "learning_rate": 1.907127481752923e-05, "loss": 0.9385, "step": 2409 }, { "epoch": 0.16, "learning_rate": 1.907034565820255e-05, "loss": 0.873, "step": 2410 }, { "epoch": 0.16, "learning_rate": 1.9069416056969072e-05, "loss": 0.9053, "step": 2411 }, { "epoch": 0.16, "learning_rate": 1.9068486013874085e-05, "loss": 0.8828, "step": 2412 }, { "epoch": 0.16, "learning_rate": 1.90675555289629e-05, "loss": 0.9297, "step": 2413 }, { "epoch": 0.16, "learning_rate": 1.9066624602280853e-05, "loss": 0.9385, "step": 2414 }, { "epoch": 0.16, "learning_rate": 1.9065693233873302e-05, "loss": 0.8721, "step": 2415 }, { "epoch": 0.16, "learning_rate": 1.9064761423785614e-05, "loss": 0.8223, "step": 2416 }, { "epoch": 0.16, "learning_rate": 1.9063829172063194e-05, "loss": 0.9629, "step": 2417 }, { "epoch": 0.16, "learning_rate": 1.9062896478751457e-05, "loss": 0.9473, "step": 2418 }, { "epoch": 0.16, "learning_rate": 1.9061963343895848e-05, "loss": 0.8271, "step": 2419 }, { "epoch": 0.16, "learning_rate": 1.9061029767541824e-05, "loss": 0.8955, "step": 2420 }, { "epoch": 0.16, "learning_rate": 1.9060095749734873e-05, "loss": 0.8877, "step": 2421 }, { "epoch": 0.17, "learning_rate": 1.9059161290520495e-05, "loss": 0.916, "step": 2422 }, { "epoch": 0.17, "learning_rate": 1.9058226389944226e-05, "loss": 0.8604, "step": 2423 }, { "epoch": 0.17, "learning_rate": 1.9057291048051607e-05, "loss": 0.8301, "step": 2424 }, { "epoch": 0.17, "learning_rate": 1.905635526488821e-05, "loss": 0.9629, "step": 2425 }, { "epoch": 0.17, "learning_rate": 1.9055419040499626e-05, "loss": 0.8408, "step": 2426 }, { "epoch": 0.17, "learning_rate": 1.905448237493147e-05, "loss": 0.9062, "step": 2427 }, { "epoch": 0.17, "learning_rate": 1.905354526822937e-05, "loss": 0.8789, "step": 2428 }, { "epoch": 0.17, "learning_rate": 1.9052607720438988e-05, "loss": 0.8271, "step": 2429 }, { "epoch": 0.17, "learning_rate": 1.9051669731606e-05, "loss": 0.8721, "step": 2430 }, { "epoch": 0.17, "learning_rate": 1.9050731301776103e-05, "loss": 0.8799, "step": 2431 }, { "epoch": 0.17, "learning_rate": 1.904979243099502e-05, "loss": 0.8877, "step": 2432 }, { "epoch": 0.17, "learning_rate": 1.904885311930849e-05, "loss": 0.8184, "step": 2433 }, { "epoch": 0.17, "learning_rate": 1.9047913366762278e-05, "loss": 0.9316, "step": 2434 }, { "epoch": 0.17, "learning_rate": 1.9046973173402164e-05, "loss": 0.835, "step": 2435 }, { "epoch": 0.17, "learning_rate": 1.9046032539273966e-05, "loss": 0.8311, "step": 2436 }, { "epoch": 0.17, "learning_rate": 1.90450914644235e-05, "loss": 0.8584, "step": 2437 }, { "epoch": 0.17, "learning_rate": 1.9044149948896615e-05, "loss": 0.8906, "step": 2438 }, { "epoch": 0.17, "learning_rate": 1.904320799273919e-05, "loss": 0.8545, "step": 2439 }, { "epoch": 0.17, "learning_rate": 1.904226559599711e-05, "loss": 0.9111, "step": 2440 }, { "epoch": 0.17, "learning_rate": 1.9041322758716295e-05, "loss": 0.9668, "step": 2441 }, { "epoch": 0.17, "learning_rate": 1.9040379480942676e-05, "loss": 0.9062, "step": 2442 }, { "epoch": 0.17, "learning_rate": 1.9039435762722203e-05, "loss": 0.9102, "step": 2443 }, { "epoch": 0.17, "learning_rate": 1.903849160410087e-05, "loss": 0.8438, "step": 2444 }, { "epoch": 0.17, "learning_rate": 1.9037547005124658e-05, "loss": 0.9023, "step": 2445 }, { "epoch": 0.17, "learning_rate": 1.90366019658396e-05, "loss": 0.9502, "step": 2446 }, { "epoch": 0.17, "learning_rate": 1.9035656486291736e-05, "loss": 0.8672, "step": 2447 }, { "epoch": 0.17, "learning_rate": 1.9034710566527128e-05, "loss": 0.8682, "step": 2448 }, { "epoch": 0.17, "learning_rate": 1.903376420659186e-05, "loss": 0.873, "step": 2449 }, { "epoch": 0.17, "learning_rate": 1.9032817406532045e-05, "loss": 0.8643, "step": 2450 }, { "epoch": 0.17, "learning_rate": 1.9031870166393803e-05, "loss": 0.8916, "step": 2451 }, { "epoch": 0.17, "learning_rate": 1.9030922486223286e-05, "loss": 0.8457, "step": 2452 }, { "epoch": 0.17, "learning_rate": 1.902997436606667e-05, "loss": 0.8809, "step": 2453 }, { "epoch": 0.17, "learning_rate": 1.9029025805970137e-05, "loss": 0.8613, "step": 2454 }, { "epoch": 0.17, "learning_rate": 1.9028076805979913e-05, "loss": 0.8506, "step": 2455 }, { "epoch": 0.17, "learning_rate": 1.9027127366142223e-05, "loss": 0.9131, "step": 2456 }, { "epoch": 0.17, "learning_rate": 1.9026177486503332e-05, "loss": 0.8799, "step": 2457 }, { "epoch": 0.17, "learning_rate": 1.902522716710951e-05, "loss": 0.9229, "step": 2458 }, { "epoch": 0.17, "learning_rate": 1.9024276408007064e-05, "loss": 0.8838, "step": 2459 }, { "epoch": 0.17, "learning_rate": 1.9023325209242308e-05, "loss": 0.8838, "step": 2460 }, { "epoch": 0.17, "learning_rate": 1.902237357086159e-05, "loss": 0.8232, "step": 2461 }, { "epoch": 0.17, "learning_rate": 1.9021421492911272e-05, "loss": 0.9336, "step": 2462 }, { "epoch": 0.17, "learning_rate": 1.902046897543774e-05, "loss": 0.8975, "step": 2463 }, { "epoch": 0.17, "learning_rate": 1.9019516018487396e-05, "loss": 0.9697, "step": 2464 }, { "epoch": 0.17, "learning_rate": 1.9018562622106672e-05, "loss": 0.9531, "step": 2465 }, { "epoch": 0.17, "learning_rate": 1.9017608786342018e-05, "loss": 0.8818, "step": 2466 }, { "epoch": 0.17, "learning_rate": 1.9016654511239906e-05, "loss": 0.8984, "step": 2467 }, { "epoch": 0.17, "learning_rate": 1.9015699796846823e-05, "loss": 0.8896, "step": 2468 }, { "epoch": 0.17, "learning_rate": 1.9014744643209285e-05, "loss": 0.8691, "step": 2469 }, { "epoch": 0.17, "learning_rate": 1.9013789050373826e-05, "loss": 0.8008, "step": 2470 }, { "epoch": 0.17, "learning_rate": 1.901283301838701e-05, "loss": 0.8838, "step": 2471 }, { "epoch": 0.17, "learning_rate": 1.901187654729541e-05, "loss": 0.8926, "step": 2472 }, { "epoch": 0.17, "learning_rate": 1.9010919637145616e-05, "loss": 0.8691, "step": 2473 }, { "epoch": 0.17, "learning_rate": 1.900996228798426e-05, "loss": 0.9268, "step": 2474 }, { "epoch": 0.17, "learning_rate": 1.9009004499857982e-05, "loss": 0.8223, "step": 2475 }, { "epoch": 0.17, "learning_rate": 1.9008046272813443e-05, "loss": 0.8711, "step": 2476 }, { "epoch": 0.17, "learning_rate": 1.900708760689733e-05, "loss": 0.8604, "step": 2477 }, { "epoch": 0.17, "learning_rate": 1.9006128502156345e-05, "loss": 0.9121, "step": 2478 }, { "epoch": 0.17, "learning_rate": 1.900516895863722e-05, "loss": 0.9688, "step": 2479 }, { "epoch": 0.17, "learning_rate": 1.90042089763867e-05, "loss": 0.9219, "step": 2480 }, { "epoch": 0.17, "learning_rate": 1.9003248555451565e-05, "loss": 0.9775, "step": 2481 }, { "epoch": 0.17, "learning_rate": 1.9002287695878597e-05, "loss": 0.8613, "step": 2482 }, { "epoch": 0.17, "learning_rate": 1.9001326397714608e-05, "loss": 0.7686, "step": 2483 }, { "epoch": 0.17, "learning_rate": 1.900036466100644e-05, "loss": 0.8438, "step": 2484 }, { "epoch": 0.17, "learning_rate": 1.899940248580094e-05, "loss": 0.8721, "step": 2485 }, { "epoch": 0.17, "learning_rate": 1.8998439872144995e-05, "loss": 0.8115, "step": 2486 }, { "epoch": 0.17, "learning_rate": 1.8997476820085495e-05, "loss": 0.9189, "step": 2487 }, { "epoch": 0.17, "learning_rate": 1.8996513329669362e-05, "loss": 0.8896, "step": 2488 }, { "epoch": 0.17, "learning_rate": 1.899554940094354e-05, "loss": 0.9443, "step": 2489 }, { "epoch": 0.17, "learning_rate": 1.8994585033954988e-05, "loss": 0.9014, "step": 2490 }, { "epoch": 0.17, "learning_rate": 1.8993620228750695e-05, "loss": 0.9346, "step": 2491 }, { "epoch": 0.17, "learning_rate": 1.8992654985377662e-05, "loss": 0.8906, "step": 2492 }, { "epoch": 0.17, "learning_rate": 1.8991689303882915e-05, "loss": 0.8604, "step": 2493 }, { "epoch": 0.17, "learning_rate": 1.8990723184313506e-05, "loss": 0.873, "step": 2494 }, { "epoch": 0.17, "learning_rate": 1.8989756626716498e-05, "loss": 0.8994, "step": 2495 }, { "epoch": 0.17, "learning_rate": 1.8988789631138987e-05, "loss": 0.8369, "step": 2496 }, { "epoch": 0.17, "learning_rate": 1.898782219762809e-05, "loss": 0.9004, "step": 2497 }, { "epoch": 0.17, "learning_rate": 1.8986854326230925e-05, "loss": 0.8916, "step": 2498 }, { "epoch": 0.17, "learning_rate": 1.898588601699466e-05, "loss": 0.8652, "step": 2499 }, { "epoch": 0.17, "learning_rate": 1.8984917269966465e-05, "loss": 0.8604, "step": 2500 }, { "epoch": 0.17, "learning_rate": 1.898394808519354e-05, "loss": 0.9395, "step": 2501 }, { "epoch": 0.17, "learning_rate": 1.8982978462723102e-05, "loss": 0.8496, "step": 2502 }, { "epoch": 0.17, "learning_rate": 1.898200840260239e-05, "loss": 0.9941, "step": 2503 }, { "epoch": 0.17, "learning_rate": 1.8981037904878668e-05, "loss": 0.8857, "step": 2504 }, { "epoch": 0.17, "learning_rate": 1.8980066969599216e-05, "loss": 0.8896, "step": 2505 }, { "epoch": 0.17, "learning_rate": 1.897909559681134e-05, "loss": 0.8643, "step": 2506 }, { "epoch": 0.17, "learning_rate": 1.8978123786562367e-05, "loss": 0.9375, "step": 2507 }, { "epoch": 0.17, "learning_rate": 1.8977151538899635e-05, "loss": 0.8682, "step": 2508 }, { "epoch": 0.17, "learning_rate": 1.8976178853870522e-05, "loss": 0.8633, "step": 2509 }, { "epoch": 0.17, "learning_rate": 1.8975205731522415e-05, "loss": 0.9219, "step": 2510 }, { "epoch": 0.17, "learning_rate": 1.8974232171902717e-05, "loss": 0.8379, "step": 2511 }, { "epoch": 0.17, "learning_rate": 1.897325817505887e-05, "loss": 0.9062, "step": 2512 }, { "epoch": 0.17, "learning_rate": 1.897228374103832e-05, "loss": 0.793, "step": 2513 }, { "epoch": 0.17, "learning_rate": 1.8971308869888543e-05, "loss": 0.9248, "step": 2514 }, { "epoch": 0.17, "learning_rate": 1.8970333561657038e-05, "loss": 0.9111, "step": 2515 }, { "epoch": 0.17, "learning_rate": 1.8969357816391318e-05, "loss": 0.8945, "step": 2516 }, { "epoch": 0.17, "learning_rate": 1.896838163413892e-05, "loss": 0.8174, "step": 2517 }, { "epoch": 0.17, "learning_rate": 1.896740501494741e-05, "loss": 0.8604, "step": 2518 }, { "epoch": 0.17, "learning_rate": 1.8966427958864362e-05, "loss": 0.9443, "step": 2519 }, { "epoch": 0.17, "learning_rate": 1.896545046593738e-05, "loss": 0.9209, "step": 2520 }, { "epoch": 0.17, "learning_rate": 1.8964472536214093e-05, "loss": 0.8896, "step": 2521 }, { "epoch": 0.17, "learning_rate": 1.896349416974214e-05, "loss": 0.8184, "step": 2522 }, { "epoch": 0.17, "learning_rate": 1.8962515366569186e-05, "loss": 0.8965, "step": 2523 }, { "epoch": 0.17, "learning_rate": 1.8961536126742922e-05, "loss": 0.8701, "step": 2524 }, { "epoch": 0.17, "learning_rate": 1.8960556450311055e-05, "loss": 0.8633, "step": 2525 }, { "epoch": 0.17, "learning_rate": 1.8959576337321315e-05, "loss": 0.9561, "step": 2526 }, { "epoch": 0.17, "learning_rate": 1.8958595787821453e-05, "loss": 0.9453, "step": 2527 }, { "epoch": 0.17, "learning_rate": 1.8957614801859238e-05, "loss": 0.8887, "step": 2528 }, { "epoch": 0.17, "learning_rate": 1.895663337948247e-05, "loss": 0.9189, "step": 2529 }, { "epoch": 0.17, "learning_rate": 1.8955651520738957e-05, "loss": 0.9434, "step": 2530 }, { "epoch": 0.17, "learning_rate": 1.8954669225676542e-05, "loss": 0.9258, "step": 2531 }, { "epoch": 0.17, "learning_rate": 1.895368649434308e-05, "loss": 0.9131, "step": 2532 }, { "epoch": 0.17, "learning_rate": 1.8952703326786447e-05, "loss": 0.915, "step": 2533 }, { "epoch": 0.17, "learning_rate": 1.8951719723054546e-05, "loss": 0.8398, "step": 2534 }, { "epoch": 0.17, "learning_rate": 1.8950735683195295e-05, "loss": 0.9922, "step": 2535 }, { "epoch": 0.17, "learning_rate": 1.8949751207256635e-05, "loss": 0.8613, "step": 2536 }, { "epoch": 0.17, "learning_rate": 1.8948766295286535e-05, "loss": 0.8398, "step": 2537 }, { "epoch": 0.17, "learning_rate": 1.894778094733298e-05, "loss": 0.8975, "step": 2538 }, { "epoch": 0.17, "learning_rate": 1.894679516344397e-05, "loss": 0.9199, "step": 2539 }, { "epoch": 0.17, "learning_rate": 1.8945808943667537e-05, "loss": 0.873, "step": 2540 }, { "epoch": 0.17, "learning_rate": 1.8944822288051733e-05, "loss": 0.8662, "step": 2541 }, { "epoch": 0.17, "learning_rate": 1.8943835196644617e-05, "loss": 0.8457, "step": 2542 }, { "epoch": 0.17, "learning_rate": 1.894284766949429e-05, "loss": 0.9424, "step": 2543 }, { "epoch": 0.17, "learning_rate": 1.8941859706648858e-05, "loss": 0.7656, "step": 2544 }, { "epoch": 0.17, "learning_rate": 1.894087130815646e-05, "loss": 0.9561, "step": 2545 }, { "epoch": 0.17, "learning_rate": 1.8939882474065244e-05, "loss": 0.8857, "step": 2546 }, { "epoch": 0.17, "learning_rate": 1.8938893204423396e-05, "loss": 0.8701, "step": 2547 }, { "epoch": 0.17, "learning_rate": 1.8937903499279104e-05, "loss": 0.8408, "step": 2548 }, { "epoch": 0.17, "learning_rate": 1.8936913358680588e-05, "loss": 0.8447, "step": 2549 }, { "epoch": 0.17, "learning_rate": 1.8935922782676088e-05, "loss": 0.9229, "step": 2550 }, { "epoch": 0.17, "learning_rate": 1.893493177131387e-05, "loss": 0.8613, "step": 2551 }, { "epoch": 0.17, "learning_rate": 1.8933940324642207e-05, "loss": 0.8447, "step": 2552 }, { "epoch": 0.17, "learning_rate": 1.8932948442709408e-05, "loss": 0.9033, "step": 2553 }, { "epoch": 0.17, "learning_rate": 1.89319561255638e-05, "loss": 0.9541, "step": 2554 }, { "epoch": 0.17, "learning_rate": 1.8930963373253722e-05, "loss": 0.9248, "step": 2555 }, { "epoch": 0.17, "learning_rate": 1.8929970185827544e-05, "loss": 0.8447, "step": 2556 }, { "epoch": 0.17, "learning_rate": 1.8928976563333657e-05, "loss": 0.834, "step": 2557 }, { "epoch": 0.17, "learning_rate": 1.8927982505820463e-05, "loss": 0.8516, "step": 2558 }, { "epoch": 0.17, "learning_rate": 1.8926988013336402e-05, "loss": 0.8672, "step": 2559 }, { "epoch": 0.17, "learning_rate": 1.8925993085929916e-05, "loss": 0.8438, "step": 2560 }, { "epoch": 0.17, "learning_rate": 1.8924997723649484e-05, "loss": 0.8936, "step": 2561 }, { "epoch": 0.17, "learning_rate": 1.8924001926543598e-05, "loss": 0.915, "step": 2562 }, { "epoch": 0.17, "learning_rate": 1.8923005694660772e-05, "loss": 0.9707, "step": 2563 }, { "epoch": 0.17, "learning_rate": 1.8922009028049548e-05, "loss": 0.8105, "step": 2564 }, { "epoch": 0.17, "learning_rate": 1.8921011926758474e-05, "loss": 0.876, "step": 2565 }, { "epoch": 0.17, "learning_rate": 1.8920014390836137e-05, "loss": 0.7852, "step": 2566 }, { "epoch": 0.17, "learning_rate": 1.8919016420331132e-05, "loss": 0.8223, "step": 2567 }, { "epoch": 0.18, "learning_rate": 1.8918018015292082e-05, "loss": 0.8867, "step": 2568 }, { "epoch": 0.18, "learning_rate": 1.891701917576763e-05, "loss": 0.834, "step": 2569 }, { "epoch": 0.18, "learning_rate": 1.891601990180644e-05, "loss": 0.8213, "step": 2570 }, { "epoch": 0.18, "learning_rate": 1.891502019345719e-05, "loss": 0.8447, "step": 2571 }, { "epoch": 0.18, "learning_rate": 1.8914020050768597e-05, "loss": 0.9404, "step": 2572 }, { "epoch": 0.18, "learning_rate": 1.891301947378938e-05, "loss": 0.916, "step": 2573 }, { "epoch": 0.18, "learning_rate": 1.8912018462568288e-05, "loss": 0.8799, "step": 2574 }, { "epoch": 0.18, "learning_rate": 1.8911017017154093e-05, "loss": 0.9043, "step": 2575 }, { "epoch": 0.18, "learning_rate": 1.891001513759558e-05, "loss": 0.8613, "step": 2576 }, { "epoch": 0.18, "learning_rate": 1.8909012823941566e-05, "loss": 0.915, "step": 2577 }, { "epoch": 0.18, "learning_rate": 1.8908010076240883e-05, "loss": 0.8867, "step": 2578 }, { "epoch": 0.18, "learning_rate": 1.890700689454238e-05, "loss": 0.9189, "step": 2579 }, { "epoch": 0.18, "learning_rate": 1.890600327889494e-05, "loss": 0.8604, "step": 2580 }, { "epoch": 0.18, "learning_rate": 1.8904999229347452e-05, "loss": 0.8301, "step": 2581 }, { "epoch": 0.18, "learning_rate": 1.8903994745948836e-05, "loss": 0.8496, "step": 2582 }, { "epoch": 0.18, "learning_rate": 1.8902989828748032e-05, "loss": 0.9023, "step": 2583 }, { "epoch": 0.18, "learning_rate": 1.890198447779399e-05, "loss": 0.9131, "step": 2584 }, { "epoch": 0.18, "learning_rate": 1.890097869313571e-05, "loss": 0.8682, "step": 2585 }, { "epoch": 0.18, "learning_rate": 1.8899972474822176e-05, "loss": 0.8809, "step": 2586 }, { "epoch": 0.18, "learning_rate": 1.8898965822902416e-05, "loss": 0.9219, "step": 2587 }, { "epoch": 0.18, "learning_rate": 1.8897958737425477e-05, "loss": 0.8701, "step": 2588 }, { "epoch": 0.18, "learning_rate": 1.8896951218440424e-05, "loss": 0.8496, "step": 2589 }, { "epoch": 0.18, "learning_rate": 1.8895943265996336e-05, "loss": 0.8721, "step": 2590 }, { "epoch": 0.18, "learning_rate": 1.889493488014233e-05, "loss": 0.8154, "step": 2591 }, { "epoch": 0.18, "learning_rate": 1.889392606092753e-05, "loss": 0.9443, "step": 2592 }, { "epoch": 0.18, "learning_rate": 1.8892916808401086e-05, "loss": 0.8691, "step": 2593 }, { "epoch": 0.18, "learning_rate": 1.889190712261217e-05, "loss": 0.9609, "step": 2594 }, { "epoch": 0.18, "learning_rate": 1.889089700360997e-05, "loss": 0.875, "step": 2595 }, { "epoch": 0.18, "learning_rate": 1.88898864514437e-05, "loss": 0.8809, "step": 2596 }, { "epoch": 0.18, "learning_rate": 1.88888754661626e-05, "loss": 0.8438, "step": 2597 }, { "epoch": 0.18, "learning_rate": 1.888786404781592e-05, "loss": 0.9082, "step": 2598 }, { "epoch": 0.18, "learning_rate": 1.8886852196452933e-05, "loss": 0.8213, "step": 2599 }, { "epoch": 0.18, "learning_rate": 1.8885839912122948e-05, "loss": 0.8926, "step": 2600 }, { "epoch": 0.18, "learning_rate": 1.8884827194875267e-05, "loss": 0.8564, "step": 2601 }, { "epoch": 0.18, "learning_rate": 1.8883814044759242e-05, "loss": 0.8291, "step": 2602 }, { "epoch": 0.18, "learning_rate": 1.8882800461824235e-05, "loss": 0.9619, "step": 2603 }, { "epoch": 0.18, "learning_rate": 1.8881786446119617e-05, "loss": 0.9004, "step": 2604 }, { "epoch": 0.18, "learning_rate": 1.8880771997694797e-05, "loss": 0.9639, "step": 2605 }, { "epoch": 0.18, "learning_rate": 1.88797571165992e-05, "loss": 0.8418, "step": 2606 }, { "epoch": 0.18, "learning_rate": 1.8878741802882268e-05, "loss": 0.8691, "step": 2607 }, { "epoch": 0.18, "learning_rate": 1.8877726056593468e-05, "loss": 0.9258, "step": 2608 }, { "epoch": 0.18, "learning_rate": 1.887670987778229e-05, "loss": 0.8525, "step": 2609 }, { "epoch": 0.18, "learning_rate": 1.8875693266498236e-05, "loss": 0.8828, "step": 2610 }, { "epoch": 0.18, "learning_rate": 1.887467622279084e-05, "loss": 0.9023, "step": 2611 }, { "epoch": 0.18, "learning_rate": 1.8873658746709654e-05, "loss": 0.835, "step": 2612 }, { "epoch": 0.18, "learning_rate": 1.8872640838304245e-05, "loss": 0.9023, "step": 2613 }, { "epoch": 0.18, "learning_rate": 1.8871622497624207e-05, "loss": 0.9043, "step": 2614 }, { "epoch": 0.18, "learning_rate": 1.8870603724719154e-05, "loss": 0.8545, "step": 2615 }, { "epoch": 0.18, "learning_rate": 1.8869584519638717e-05, "loss": 0.8574, "step": 2616 }, { "epoch": 0.18, "learning_rate": 1.8868564882432557e-05, "loss": 0.9102, "step": 2617 }, { "epoch": 0.18, "learning_rate": 1.8867544813150348e-05, "loss": 0.835, "step": 2618 }, { "epoch": 0.18, "learning_rate": 1.886652431184179e-05, "loss": 0.8291, "step": 2619 }, { "epoch": 0.18, "learning_rate": 1.8865503378556597e-05, "loss": 0.8965, "step": 2620 }, { "epoch": 0.18, "learning_rate": 1.8864482013344512e-05, "loss": 0.8945, "step": 2621 }, { "epoch": 0.18, "learning_rate": 1.8863460216255298e-05, "loss": 0.9229, "step": 2622 }, { "epoch": 0.18, "learning_rate": 1.8862437987338733e-05, "loss": 0.8994, "step": 2623 }, { "epoch": 0.18, "learning_rate": 1.8861415326644622e-05, "loss": 0.874, "step": 2624 }, { "epoch": 0.18, "learning_rate": 1.886039223422279e-05, "loss": 0.8408, "step": 2625 }, { "epoch": 0.18, "learning_rate": 1.885936871012308e-05, "loss": 0.8613, "step": 2626 }, { "epoch": 0.18, "learning_rate": 1.8858344754395355e-05, "loss": 0.9297, "step": 2627 }, { "epoch": 0.18, "learning_rate": 1.8857320367089508e-05, "loss": 0.8701, "step": 2628 }, { "epoch": 0.18, "learning_rate": 1.8856295548255445e-05, "loss": 0.8154, "step": 2629 }, { "epoch": 0.18, "learning_rate": 1.8855270297943094e-05, "loss": 0.8662, "step": 2630 }, { "epoch": 0.18, "learning_rate": 1.8854244616202405e-05, "loss": 0.8652, "step": 2631 }, { "epoch": 0.18, "learning_rate": 1.8853218503083354e-05, "loss": 0.9795, "step": 2632 }, { "epoch": 0.18, "learning_rate": 1.8852191958635922e-05, "loss": 0.8984, "step": 2633 }, { "epoch": 0.18, "learning_rate": 1.8851164982910135e-05, "loss": 0.8174, "step": 2634 }, { "epoch": 0.18, "learning_rate": 1.8850137575956023e-05, "loss": 0.8613, "step": 2635 }, { "epoch": 0.18, "learning_rate": 1.8849109737823634e-05, "loss": 0.8594, "step": 2636 }, { "epoch": 0.18, "learning_rate": 1.8848081468563056e-05, "loss": 0.8809, "step": 2637 }, { "epoch": 0.18, "learning_rate": 1.884705276822438e-05, "loss": 0.9336, "step": 2638 }, { "epoch": 0.18, "learning_rate": 1.884602363685772e-05, "loss": 0.9092, "step": 2639 }, { "epoch": 0.18, "learning_rate": 1.884499407451322e-05, "loss": 0.834, "step": 2640 }, { "epoch": 0.18, "learning_rate": 1.8843964081241044e-05, "loss": 0.8926, "step": 2641 }, { "epoch": 0.18, "learning_rate": 1.8842933657091368e-05, "loss": 0.8574, "step": 2642 }, { "epoch": 0.18, "learning_rate": 1.8841902802114396e-05, "loss": 0.8779, "step": 2643 }, { "epoch": 0.18, "learning_rate": 1.884087151636035e-05, "loss": 0.9482, "step": 2644 }, { "epoch": 0.18, "learning_rate": 1.8839839799879472e-05, "loss": 0.834, "step": 2645 }, { "epoch": 0.18, "learning_rate": 1.8838807652722036e-05, "loss": 0.8994, "step": 2646 }, { "epoch": 0.18, "learning_rate": 1.883777507493832e-05, "loss": 0.9404, "step": 2647 }, { "epoch": 0.18, "learning_rate": 1.883674206657863e-05, "loss": 0.7998, "step": 2648 }, { "epoch": 0.18, "learning_rate": 1.88357086276933e-05, "loss": 0.8301, "step": 2649 }, { "epoch": 0.18, "learning_rate": 1.8834674758332677e-05, "loss": 0.998, "step": 2650 }, { "epoch": 0.18, "learning_rate": 1.883364045854713e-05, "loss": 0.8662, "step": 2651 }, { "epoch": 0.18, "learning_rate": 1.8832605728387047e-05, "loss": 0.875, "step": 2652 }, { "epoch": 0.18, "learning_rate": 1.8831570567902847e-05, "loss": 1.0107, "step": 2653 }, { "epoch": 0.18, "learning_rate": 1.8830534977144962e-05, "loss": 0.9355, "step": 2654 }, { "epoch": 0.18, "learning_rate": 1.882949895616384e-05, "loss": 0.9072, "step": 2655 }, { "epoch": 0.18, "learning_rate": 1.882846250500996e-05, "loss": 0.9111, "step": 2656 }, { "epoch": 0.18, "learning_rate": 1.8827425623733816e-05, "loss": 0.8408, "step": 2657 }, { "epoch": 0.18, "learning_rate": 1.882638831238593e-05, "loss": 0.8457, "step": 2658 }, { "epoch": 0.18, "learning_rate": 1.8825350571016834e-05, "loss": 0.8926, "step": 2659 }, { "epoch": 0.18, "learning_rate": 1.882431239967709e-05, "loss": 0.8271, "step": 2660 }, { "epoch": 0.18, "learning_rate": 1.8823273798417274e-05, "loss": 0.9248, "step": 2661 }, { "epoch": 0.18, "learning_rate": 1.882223476728799e-05, "loss": 0.8438, "step": 2662 }, { "epoch": 0.18, "learning_rate": 1.8821195306339855e-05, "loss": 0.8984, "step": 2663 }, { "epoch": 0.18, "learning_rate": 1.882015541562352e-05, "loss": 0.9326, "step": 2664 }, { "epoch": 0.18, "learning_rate": 1.8819115095189642e-05, "loss": 0.8252, "step": 2665 }, { "epoch": 0.18, "learning_rate": 1.8818074345088904e-05, "loss": 0.9238, "step": 2666 }, { "epoch": 0.18, "learning_rate": 1.8817033165372016e-05, "loss": 0.8242, "step": 2667 }, { "epoch": 0.18, "learning_rate": 1.8815991556089703e-05, "loss": 0.9414, "step": 2668 }, { "epoch": 0.18, "learning_rate": 1.881494951729271e-05, "loss": 0.8633, "step": 2669 }, { "epoch": 0.18, "learning_rate": 1.8813907049031805e-05, "loss": 0.9307, "step": 2670 }, { "epoch": 0.18, "learning_rate": 1.881286415135778e-05, "loss": 0.8359, "step": 2671 }, { "epoch": 0.18, "learning_rate": 1.8811820824321442e-05, "loss": 0.7852, "step": 2672 }, { "epoch": 0.18, "learning_rate": 1.8810777067973628e-05, "loss": 0.8506, "step": 2673 }, { "epoch": 0.18, "learning_rate": 1.880973288236518e-05, "loss": 0.9053, "step": 2674 }, { "epoch": 0.18, "learning_rate": 1.8808688267546977e-05, "loss": 0.792, "step": 2675 }, { "epoch": 0.18, "learning_rate": 1.880764322356991e-05, "loss": 0.9131, "step": 2676 }, { "epoch": 0.18, "learning_rate": 1.8806597750484895e-05, "loss": 0.9346, "step": 2677 }, { "epoch": 0.18, "learning_rate": 1.8805551848342868e-05, "loss": 0.8848, "step": 2678 }, { "epoch": 0.18, "learning_rate": 1.8804505517194783e-05, "loss": 0.8926, "step": 2679 }, { "epoch": 0.18, "learning_rate": 1.880345875709162e-05, "loss": 0.9268, "step": 2680 }, { "epoch": 0.18, "learning_rate": 1.880241156808438e-05, "loss": 0.9482, "step": 2681 }, { "epoch": 0.18, "learning_rate": 1.880136395022407e-05, "loss": 0.8916, "step": 2682 }, { "epoch": 0.18, "learning_rate": 1.8800315903561742e-05, "loss": 0.9629, "step": 2683 }, { "epoch": 0.18, "learning_rate": 1.879926742814845e-05, "loss": 0.8857, "step": 2684 }, { "epoch": 0.18, "learning_rate": 1.8798218524035278e-05, "loss": 0.8232, "step": 2685 }, { "epoch": 0.18, "learning_rate": 1.879716919127333e-05, "loss": 0.9277, "step": 2686 }, { "epoch": 0.18, "learning_rate": 1.8796119429913727e-05, "loss": 0.8457, "step": 2687 }, { "epoch": 0.18, "learning_rate": 1.8795069240007617e-05, "loss": 0.9248, "step": 2688 }, { "epoch": 0.18, "learning_rate": 1.879401862160616e-05, "loss": 0.9189, "step": 2689 }, { "epoch": 0.18, "learning_rate": 1.8792967574760543e-05, "loss": 0.8027, "step": 2690 }, { "epoch": 0.18, "learning_rate": 1.879191609952198e-05, "loss": 0.8867, "step": 2691 }, { "epoch": 0.18, "learning_rate": 1.8790864195941687e-05, "loss": 0.8711, "step": 2692 }, { "epoch": 0.18, "learning_rate": 1.878981186407092e-05, "loss": 0.8848, "step": 2693 }, { "epoch": 0.18, "learning_rate": 1.878875910396095e-05, "loss": 0.8916, "step": 2694 }, { "epoch": 0.18, "learning_rate": 1.8787705915663067e-05, "loss": 0.8701, "step": 2695 }, { "epoch": 0.18, "learning_rate": 1.8786652299228578e-05, "loss": 0.9072, "step": 2696 }, { "epoch": 0.18, "learning_rate": 1.8785598254708817e-05, "loss": 0.9639, "step": 2697 }, { "epoch": 0.18, "learning_rate": 1.8784543782155137e-05, "loss": 0.8711, "step": 2698 }, { "epoch": 0.18, "learning_rate": 1.8783488881618913e-05, "loss": 0.8359, "step": 2699 }, { "epoch": 0.18, "learning_rate": 1.878243355315154e-05, "loss": 0.8584, "step": 2700 }, { "epoch": 0.18, "learning_rate": 1.8781377796804432e-05, "loss": 0.9014, "step": 2701 }, { "epoch": 0.18, "learning_rate": 1.878032161262903e-05, "loss": 0.8828, "step": 2702 }, { "epoch": 0.18, "learning_rate": 1.8779265000676782e-05, "loss": 0.8799, "step": 2703 }, { "epoch": 0.18, "learning_rate": 1.8778207960999172e-05, "loss": 0.876, "step": 2704 }, { "epoch": 0.18, "learning_rate": 1.8777150493647695e-05, "loss": 0.9062, "step": 2705 }, { "epoch": 0.18, "learning_rate": 1.8776092598673878e-05, "loss": 0.7822, "step": 2706 }, { "epoch": 0.18, "learning_rate": 1.877503427612926e-05, "loss": 0.8096, "step": 2707 }, { "epoch": 0.18, "learning_rate": 1.8773975526065396e-05, "loss": 0.8711, "step": 2708 }, { "epoch": 0.18, "learning_rate": 1.8772916348533873e-05, "loss": 0.8457, "step": 2709 }, { "epoch": 0.18, "learning_rate": 1.8771856743586293e-05, "loss": 0.8291, "step": 2710 }, { "epoch": 0.18, "learning_rate": 1.8770796711274283e-05, "loss": 0.8369, "step": 2711 }, { "epoch": 0.18, "learning_rate": 1.8769736251649483e-05, "loss": 0.8467, "step": 2712 }, { "epoch": 0.18, "learning_rate": 1.8768675364763558e-05, "loss": 0.8818, "step": 2713 }, { "epoch": 0.18, "learning_rate": 1.87676140506682e-05, "loss": 0.833, "step": 2714 }, { "epoch": 0.19, "learning_rate": 1.8766552309415114e-05, "loss": 0.8857, "step": 2715 }, { "epoch": 0.19, "learning_rate": 1.8765490141056025e-05, "loss": 0.876, "step": 2716 }, { "epoch": 0.19, "learning_rate": 1.8764427545642683e-05, "loss": 0.9033, "step": 2717 }, { "epoch": 0.19, "learning_rate": 1.876336452322686e-05, "loss": 0.873, "step": 2718 }, { "epoch": 0.19, "learning_rate": 1.8762301073860346e-05, "loss": 0.8604, "step": 2719 }, { "epoch": 0.19, "learning_rate": 1.8761237197594945e-05, "loss": 0.8291, "step": 2720 }, { "epoch": 0.19, "learning_rate": 1.87601728944825e-05, "loss": 0.8945, "step": 2721 }, { "epoch": 0.19, "learning_rate": 1.875910816457486e-05, "loss": 0.9023, "step": 2722 }, { "epoch": 0.19, "learning_rate": 1.8758043007923895e-05, "loss": 0.9014, "step": 2723 }, { "epoch": 0.19, "learning_rate": 1.8756977424581503e-05, "loss": 0.9102, "step": 2724 }, { "epoch": 0.19, "learning_rate": 1.8755911414599596e-05, "loss": 0.8125, "step": 2725 }, { "epoch": 0.19, "learning_rate": 1.8754844978030112e-05, "loss": 0.9355, "step": 2726 }, { "epoch": 0.19, "learning_rate": 1.875377811492501e-05, "loss": 0.8662, "step": 2727 }, { "epoch": 0.19, "learning_rate": 1.8752710825336264e-05, "loss": 0.8623, "step": 2728 }, { "epoch": 0.19, "learning_rate": 1.8751643109315873e-05, "loss": 0.915, "step": 2729 }, { "epoch": 0.19, "learning_rate": 1.8750574966915857e-05, "loss": 0.9131, "step": 2730 }, { "epoch": 0.19, "learning_rate": 1.8749506398188254e-05, "loss": 0.9434, "step": 2731 }, { "epoch": 0.19, "learning_rate": 1.8748437403185128e-05, "loss": 0.8896, "step": 2732 }, { "epoch": 0.19, "learning_rate": 1.8747367981958556e-05, "loss": 0.8975, "step": 2733 }, { "epoch": 0.19, "learning_rate": 1.8746298134560645e-05, "loss": 0.9023, "step": 2734 }, { "epoch": 0.19, "learning_rate": 1.8745227861043514e-05, "loss": 0.8848, "step": 2735 }, { "epoch": 0.19, "learning_rate": 1.8744157161459308e-05, "loss": 0.8262, "step": 2736 }, { "epoch": 0.19, "learning_rate": 1.8743086035860192e-05, "loss": 0.9932, "step": 2737 }, { "epoch": 0.19, "learning_rate": 1.874201448429835e-05, "loss": 0.9756, "step": 2738 }, { "epoch": 0.19, "learning_rate": 1.874094250682599e-05, "loss": 0.8105, "step": 2739 }, { "epoch": 0.19, "learning_rate": 1.8739870103495335e-05, "loss": 0.8887, "step": 2740 }, { "epoch": 0.19, "learning_rate": 1.8738797274358636e-05, "loss": 0.9209, "step": 2741 }, { "epoch": 0.19, "learning_rate": 1.8737724019468162e-05, "loss": 0.8643, "step": 2742 }, { "epoch": 0.19, "learning_rate": 1.8736650338876198e-05, "loss": 0.8174, "step": 2743 }, { "epoch": 0.19, "learning_rate": 1.8735576232635056e-05, "loss": 0.8828, "step": 2744 }, { "epoch": 0.19, "learning_rate": 1.8734501700797064e-05, "loss": 0.8701, "step": 2745 }, { "epoch": 0.19, "learning_rate": 1.8733426743414577e-05, "loss": 0.8945, "step": 2746 }, { "epoch": 0.19, "learning_rate": 1.8732351360539963e-05, "loss": 0.8408, "step": 2747 }, { "epoch": 0.19, "learning_rate": 1.873127555222562e-05, "loss": 0.8535, "step": 2748 }, { "epoch": 0.19, "learning_rate": 1.8730199318523958e-05, "loss": 0.9443, "step": 2749 }, { "epoch": 0.19, "learning_rate": 1.8729122659487408e-05, "loss": 0.8916, "step": 2750 }, { "epoch": 0.19, "learning_rate": 1.872804557516843e-05, "loss": 0.8594, "step": 2751 }, { "epoch": 0.19, "learning_rate": 1.8726968065619495e-05, "loss": 0.8174, "step": 2752 }, { "epoch": 0.19, "learning_rate": 1.87258901308931e-05, "loss": 0.9414, "step": 2753 }, { "epoch": 0.19, "learning_rate": 1.872481177104177e-05, "loss": 0.8809, "step": 2754 }, { "epoch": 0.19, "learning_rate": 1.872373298611803e-05, "loss": 0.9219, "step": 2755 }, { "epoch": 0.19, "learning_rate": 1.8722653776174448e-05, "loss": 0.8066, "step": 2756 }, { "epoch": 0.19, "learning_rate": 1.8721574141263597e-05, "loss": 0.8848, "step": 2757 }, { "epoch": 0.19, "learning_rate": 1.872049408143808e-05, "loss": 0.9668, "step": 2758 }, { "epoch": 0.19, "learning_rate": 1.871941359675051e-05, "loss": 0.8604, "step": 2759 }, { "epoch": 0.19, "learning_rate": 1.8718332687253545e-05, "loss": 0.874, "step": 2760 }, { "epoch": 0.19, "learning_rate": 1.8717251352999833e-05, "loss": 0.8457, "step": 2761 }, { "epoch": 0.19, "learning_rate": 1.871616959404206e-05, "loss": 0.8818, "step": 2762 }, { "epoch": 0.19, "learning_rate": 1.871508741043293e-05, "loss": 0.876, "step": 2763 }, { "epoch": 0.19, "learning_rate": 1.8714004802225167e-05, "loss": 0.8691, "step": 2764 }, { "epoch": 0.19, "learning_rate": 1.871292176947151e-05, "loss": 0.9033, "step": 2765 }, { "epoch": 0.19, "learning_rate": 1.8711838312224733e-05, "loss": 0.8809, "step": 2766 }, { "epoch": 0.19, "learning_rate": 1.8710754430537623e-05, "loss": 0.8652, "step": 2767 }, { "epoch": 0.19, "learning_rate": 1.8709670124462973e-05, "loss": 0.8428, "step": 2768 }, { "epoch": 0.19, "learning_rate": 1.8708585394053623e-05, "loss": 0.8447, "step": 2769 }, { "epoch": 0.19, "learning_rate": 1.870750023936242e-05, "loss": 0.9219, "step": 2770 }, { "epoch": 0.19, "learning_rate": 1.8706414660442227e-05, "loss": 0.8018, "step": 2771 }, { "epoch": 0.19, "learning_rate": 1.8705328657345938e-05, "loss": 0.7861, "step": 2772 }, { "epoch": 0.19, "learning_rate": 1.870424223012646e-05, "loss": 0.8193, "step": 2773 }, { "epoch": 0.19, "learning_rate": 1.8703155378836727e-05, "loss": 0.8662, "step": 2774 }, { "epoch": 0.19, "learning_rate": 1.8702068103529684e-05, "loss": 0.835, "step": 2775 }, { "epoch": 0.19, "learning_rate": 1.870098040425831e-05, "loss": 0.8623, "step": 2776 }, { "epoch": 0.19, "learning_rate": 1.8699892281075597e-05, "loss": 0.8418, "step": 2777 }, { "epoch": 0.19, "learning_rate": 1.869880373403455e-05, "loss": 0.8311, "step": 2778 }, { "epoch": 0.19, "learning_rate": 1.8697714763188216e-05, "loss": 0.8477, "step": 2779 }, { "epoch": 0.19, "learning_rate": 1.869662536858964e-05, "loss": 0.8398, "step": 2780 }, { "epoch": 0.19, "learning_rate": 1.8695535550291905e-05, "loss": 0.8389, "step": 2781 }, { "epoch": 0.19, "learning_rate": 1.8694445308348096e-05, "loss": 0.8691, "step": 2782 }, { "epoch": 0.19, "learning_rate": 1.8693354642811336e-05, "loss": 0.9189, "step": 2783 }, { "epoch": 0.19, "learning_rate": 1.8692263553734765e-05, "loss": 0.9482, "step": 2784 }, { "epoch": 0.19, "learning_rate": 1.8691172041171536e-05, "loss": 0.9004, "step": 2785 }, { "epoch": 0.19, "learning_rate": 1.869008010517483e-05, "loss": 0.8799, "step": 2786 }, { "epoch": 0.19, "learning_rate": 1.868898774579784e-05, "loss": 0.8486, "step": 2787 }, { "epoch": 0.19, "learning_rate": 1.8687894963093796e-05, "loss": 0.9531, "step": 2788 }, { "epoch": 0.19, "learning_rate": 1.8686801757115932e-05, "loss": 0.8955, "step": 2789 }, { "epoch": 0.19, "learning_rate": 1.868570812791751e-05, "loss": 0.9131, "step": 2790 }, { "epoch": 0.19, "learning_rate": 1.868461407555181e-05, "loss": 0.8633, "step": 2791 }, { "epoch": 0.19, "learning_rate": 1.868351960007214e-05, "loss": 0.9502, "step": 2792 }, { "epoch": 0.19, "learning_rate": 1.8682424701531814e-05, "loss": 0.873, "step": 2793 }, { "epoch": 0.19, "learning_rate": 1.868132937998418e-05, "loss": 0.8691, "step": 2794 }, { "epoch": 0.19, "learning_rate": 1.8680233635482604e-05, "loss": 0.8818, "step": 2795 }, { "epoch": 0.19, "learning_rate": 1.867913746808047e-05, "loss": 0.9014, "step": 2796 }, { "epoch": 0.19, "learning_rate": 1.867804087783118e-05, "loss": 0.8652, "step": 2797 }, { "epoch": 0.19, "learning_rate": 1.867694386478816e-05, "loss": 0.8477, "step": 2798 }, { "epoch": 0.19, "learning_rate": 1.8675846429004862e-05, "loss": 0.8193, "step": 2799 }, { "epoch": 0.19, "learning_rate": 1.8674748570534743e-05, "loss": 0.9766, "step": 2800 }, { "epoch": 0.19, "learning_rate": 1.86736502894313e-05, "loss": 0.8447, "step": 2801 }, { "epoch": 0.19, "learning_rate": 1.867255158574804e-05, "loss": 0.9395, "step": 2802 }, { "epoch": 0.19, "learning_rate": 1.867145245953849e-05, "loss": 0.8594, "step": 2803 }, { "epoch": 0.19, "learning_rate": 1.8670352910856194e-05, "loss": 0.8926, "step": 2804 }, { "epoch": 0.19, "learning_rate": 1.8669252939754733e-05, "loss": 0.8477, "step": 2805 }, { "epoch": 0.19, "learning_rate": 1.8668152546287686e-05, "loss": 0.8525, "step": 2806 }, { "epoch": 0.19, "learning_rate": 1.8667051730508673e-05, "loss": 0.8613, "step": 2807 }, { "epoch": 0.19, "learning_rate": 1.8665950492471322e-05, "loss": 0.8711, "step": 2808 }, { "epoch": 0.19, "learning_rate": 1.8664848832229284e-05, "loss": 0.8496, "step": 2809 }, { "epoch": 0.19, "learning_rate": 1.8663746749836233e-05, "loss": 1.0029, "step": 2810 }, { "epoch": 0.19, "learning_rate": 1.8662644245345865e-05, "loss": 0.8916, "step": 2811 }, { "epoch": 0.19, "learning_rate": 1.866154131881189e-05, "loss": 0.9609, "step": 2812 }, { "epoch": 0.19, "learning_rate": 1.866043797028805e-05, "loss": 0.8105, "step": 2813 }, { "epoch": 0.19, "learning_rate": 1.865933419982809e-05, "loss": 0.9229, "step": 2814 }, { "epoch": 0.19, "learning_rate": 1.8658230007485788e-05, "loss": 0.9141, "step": 2815 }, { "epoch": 0.19, "learning_rate": 1.8657125393314944e-05, "loss": 0.8223, "step": 2816 }, { "epoch": 0.19, "learning_rate": 1.8656020357369374e-05, "loss": 0.7773, "step": 2817 }, { "epoch": 0.19, "learning_rate": 1.865491489970291e-05, "loss": 0.8428, "step": 2818 }, { "epoch": 0.19, "learning_rate": 1.8653809020369423e-05, "loss": 0.8555, "step": 2819 }, { "epoch": 0.19, "learning_rate": 1.8652702719422776e-05, "loss": 0.9248, "step": 2820 }, { "epoch": 0.19, "learning_rate": 1.8651595996916873e-05, "loss": 0.9121, "step": 2821 }, { "epoch": 0.19, "learning_rate": 1.865048885290564e-05, "loss": 0.9365, "step": 2822 }, { "epoch": 0.19, "learning_rate": 1.864938128744301e-05, "loss": 0.834, "step": 2823 }, { "epoch": 0.19, "learning_rate": 1.8648273300582945e-05, "loss": 0.8125, "step": 2824 }, { "epoch": 0.19, "learning_rate": 1.8647164892379427e-05, "loss": 0.9727, "step": 2825 }, { "epoch": 0.19, "learning_rate": 1.8646056062886457e-05, "loss": 0.9102, "step": 2826 }, { "epoch": 0.19, "learning_rate": 1.8644946812158057e-05, "loss": 0.8477, "step": 2827 }, { "epoch": 0.19, "learning_rate": 1.864383714024827e-05, "loss": 0.8779, "step": 2828 }, { "epoch": 0.19, "learning_rate": 1.864272704721116e-05, "loss": 0.8838, "step": 2829 }, { "epoch": 0.19, "learning_rate": 1.8641616533100807e-05, "loss": 0.876, "step": 2830 }, { "epoch": 0.19, "learning_rate": 1.864050559797132e-05, "loss": 0.8887, "step": 2831 }, { "epoch": 0.19, "learning_rate": 1.863939424187682e-05, "loss": 0.918, "step": 2832 }, { "epoch": 0.19, "learning_rate": 1.8638282464871456e-05, "loss": 0.875, "step": 2833 }, { "epoch": 0.19, "learning_rate": 1.8637170267009393e-05, "loss": 0.8604, "step": 2834 }, { "epoch": 0.19, "learning_rate": 1.8636057648344813e-05, "loss": 0.8867, "step": 2835 }, { "epoch": 0.19, "learning_rate": 1.8634944608931925e-05, "loss": 0.833, "step": 2836 }, { "epoch": 0.19, "learning_rate": 1.863383114882496e-05, "loss": 0.9248, "step": 2837 }, { "epoch": 0.19, "learning_rate": 1.863271726807816e-05, "loss": 0.8604, "step": 2838 }, { "epoch": 0.19, "learning_rate": 1.8631602966745793e-05, "loss": 0.8652, "step": 2839 }, { "epoch": 0.19, "learning_rate": 1.8630488244882156e-05, "loss": 0.8848, "step": 2840 }, { "epoch": 0.19, "learning_rate": 1.862937310254155e-05, "loss": 0.8652, "step": 2841 }, { "epoch": 0.19, "learning_rate": 1.8628257539778307e-05, "loss": 0.9189, "step": 2842 }, { "epoch": 0.19, "learning_rate": 1.862714155664678e-05, "loss": 0.8516, "step": 2843 }, { "epoch": 0.19, "learning_rate": 1.8626025153201334e-05, "loss": 0.8672, "step": 2844 }, { "epoch": 0.19, "learning_rate": 1.8624908329496362e-05, "loss": 0.9023, "step": 2845 }, { "epoch": 0.19, "learning_rate": 1.8623791085586277e-05, "loss": 0.8154, "step": 2846 }, { "epoch": 0.19, "learning_rate": 1.8622673421525516e-05, "loss": 0.8975, "step": 2847 }, { "epoch": 0.19, "learning_rate": 1.8621555337368522e-05, "loss": 0.8271, "step": 2848 }, { "epoch": 0.19, "learning_rate": 1.8620436833169773e-05, "loss": 0.9131, "step": 2849 }, { "epoch": 0.19, "learning_rate": 1.8619317908983764e-05, "loss": 0.8691, "step": 2850 }, { "epoch": 0.19, "learning_rate": 1.8618198564865004e-05, "loss": 0.9004, "step": 2851 }, { "epoch": 0.19, "learning_rate": 1.861707880086803e-05, "loss": 0.915, "step": 2852 }, { "epoch": 0.19, "learning_rate": 1.86159586170474e-05, "loss": 0.8828, "step": 2853 }, { "epoch": 0.19, "learning_rate": 1.8614838013457684e-05, "loss": 0.9229, "step": 2854 }, { "epoch": 0.19, "learning_rate": 1.861371699015348e-05, "loss": 0.8447, "step": 2855 }, { "epoch": 0.19, "learning_rate": 1.8612595547189408e-05, "loss": 0.7969, "step": 2856 }, { "epoch": 0.19, "learning_rate": 1.8611473684620094e-05, "loss": 0.8789, "step": 2857 }, { "epoch": 0.19, "learning_rate": 1.8610351402500207e-05, "loss": 0.9424, "step": 2858 }, { "epoch": 0.19, "learning_rate": 1.860922870088442e-05, "loss": 0.8613, "step": 2859 }, { "epoch": 0.19, "learning_rate": 1.8608105579827428e-05, "loss": 0.9268, "step": 2860 }, { "epoch": 0.19, "learning_rate": 1.8606982039383953e-05, "loss": 0.8994, "step": 2861 }, { "epoch": 0.2, "learning_rate": 1.8605858079608733e-05, "loss": 0.8477, "step": 2862 }, { "epoch": 0.2, "learning_rate": 1.8604733700556528e-05, "loss": 0.8506, "step": 2863 }, { "epoch": 0.2, "learning_rate": 1.860360890228212e-05, "loss": 0.8027, "step": 2864 }, { "epoch": 0.2, "learning_rate": 1.8602483684840297e-05, "loss": 0.9619, "step": 2865 }, { "epoch": 0.2, "learning_rate": 1.8601358048285892e-05, "loss": 0.8584, "step": 2866 }, { "epoch": 0.2, "learning_rate": 1.8600231992673744e-05, "loss": 0.8066, "step": 2867 }, { "epoch": 0.2, "learning_rate": 1.8599105518058713e-05, "loss": 0.792, "step": 2868 }, { "epoch": 0.2, "learning_rate": 1.8597978624495678e-05, "loss": 0.917, "step": 2869 }, { "epoch": 0.2, "learning_rate": 1.859685131203955e-05, "loss": 0.835, "step": 2870 }, { "epoch": 0.2, "learning_rate": 1.859572358074524e-05, "loss": 0.8721, "step": 2871 }, { "epoch": 0.2, "learning_rate": 1.8594595430667694e-05, "loss": 0.9033, "step": 2872 }, { "epoch": 0.2, "learning_rate": 1.859346686186188e-05, "loss": 0.832, "step": 2873 }, { "epoch": 0.2, "learning_rate": 1.859233787438278e-05, "loss": 0.8789, "step": 2874 }, { "epoch": 0.2, "learning_rate": 1.8591208468285398e-05, "loss": 0.8652, "step": 2875 }, { "epoch": 0.2, "learning_rate": 1.859007864362476e-05, "loss": 0.7764, "step": 2876 }, { "epoch": 0.2, "learning_rate": 1.858894840045591e-05, "loss": 0.9238, "step": 2877 }, { "epoch": 0.2, "learning_rate": 1.858781773883391e-05, "loss": 0.791, "step": 2878 }, { "epoch": 0.2, "learning_rate": 1.8586686658813845e-05, "loss": 0.8701, "step": 2879 }, { "epoch": 0.2, "learning_rate": 1.8585555160450833e-05, "loss": 0.8711, "step": 2880 }, { "epoch": 0.2, "learning_rate": 1.8584423243799986e-05, "loss": 0.9434, "step": 2881 }, { "epoch": 0.2, "learning_rate": 1.8583290908916458e-05, "loss": 0.8809, "step": 2882 }, { "epoch": 0.2, "learning_rate": 1.858215815585542e-05, "loss": 0.9404, "step": 2883 }, { "epoch": 0.2, "learning_rate": 1.858102498467205e-05, "loss": 0.8926, "step": 2884 }, { "epoch": 0.2, "learning_rate": 1.8579891395421563e-05, "loss": 0.9248, "step": 2885 }, { "epoch": 0.2, "learning_rate": 1.857875738815919e-05, "loss": 0.8623, "step": 2886 }, { "epoch": 0.2, "learning_rate": 1.8577622962940167e-05, "loss": 0.8506, "step": 2887 }, { "epoch": 0.2, "learning_rate": 1.8576488119819774e-05, "loss": 0.9062, "step": 2888 }, { "epoch": 0.2, "learning_rate": 1.8575352858853303e-05, "loss": 0.8789, "step": 2889 }, { "epoch": 0.2, "learning_rate": 1.8574217180096056e-05, "loss": 0.8877, "step": 2890 }, { "epoch": 0.2, "learning_rate": 1.8573081083603366e-05, "loss": 0.915, "step": 2891 }, { "epoch": 0.2, "learning_rate": 1.8571944569430582e-05, "loss": 0.8994, "step": 2892 }, { "epoch": 0.2, "learning_rate": 1.8570807637633078e-05, "loss": 0.8643, "step": 2893 }, { "epoch": 0.2, "learning_rate": 1.8569670288266245e-05, "loss": 0.8926, "step": 2894 }, { "epoch": 0.2, "learning_rate": 1.856853252138549e-05, "loss": 0.8438, "step": 2895 }, { "epoch": 0.2, "learning_rate": 1.8567394337046253e-05, "loss": 0.8008, "step": 2896 }, { "epoch": 0.2, "learning_rate": 1.856625573530398e-05, "loss": 0.834, "step": 2897 }, { "epoch": 0.2, "learning_rate": 1.8565116716214143e-05, "loss": 0.8789, "step": 2898 }, { "epoch": 0.2, "learning_rate": 1.856397727983224e-05, "loss": 0.8125, "step": 2899 }, { "epoch": 0.2, "learning_rate": 1.856283742621378e-05, "loss": 0.958, "step": 2900 }, { "epoch": 0.2, "learning_rate": 1.85616971554143e-05, "loss": 0.8828, "step": 2901 }, { "epoch": 0.2, "learning_rate": 1.856055646748935e-05, "loss": 0.8428, "step": 2902 }, { "epoch": 0.2, "learning_rate": 1.8559415362494507e-05, "loss": 0.9385, "step": 2903 }, { "epoch": 0.2, "learning_rate": 1.8558273840485367e-05, "loss": 0.8945, "step": 2904 }, { "epoch": 0.2, "learning_rate": 1.8557131901517542e-05, "loss": 0.8691, "step": 2905 }, { "epoch": 0.2, "learning_rate": 1.8555989545646668e-05, "loss": 0.9336, "step": 2906 }, { "epoch": 0.2, "learning_rate": 1.85548467729284e-05, "loss": 0.8652, "step": 2907 }, { "epoch": 0.2, "learning_rate": 1.8553703583418415e-05, "loss": 0.8242, "step": 2908 }, { "epoch": 0.2, "learning_rate": 1.8552559977172408e-05, "loss": 0.7969, "step": 2909 }, { "epoch": 0.2, "learning_rate": 1.8551415954246096e-05, "loss": 0.915, "step": 2910 }, { "epoch": 0.2, "learning_rate": 1.855027151469521e-05, "loss": 0.8428, "step": 2911 }, { "epoch": 0.2, "learning_rate": 1.854912665857552e-05, "loss": 0.8604, "step": 2912 }, { "epoch": 0.2, "learning_rate": 1.8547981385942794e-05, "loss": 0.8887, "step": 2913 }, { "epoch": 0.2, "learning_rate": 1.8546835696852833e-05, "loss": 0.8818, "step": 2914 }, { "epoch": 0.2, "learning_rate": 1.8545689591361454e-05, "loss": 0.8662, "step": 2915 }, { "epoch": 0.2, "learning_rate": 1.8544543069524494e-05, "loss": 0.8623, "step": 2916 }, { "epoch": 0.2, "learning_rate": 1.8543396131397814e-05, "loss": 0.9512, "step": 2917 }, { "epoch": 0.2, "learning_rate": 1.8542248777037287e-05, "loss": 0.9238, "step": 2918 }, { "epoch": 0.2, "learning_rate": 1.8541101006498817e-05, "loss": 0.9023, "step": 2919 }, { "epoch": 0.2, "learning_rate": 1.8539952819838325e-05, "loss": 0.8418, "step": 2920 }, { "epoch": 0.2, "learning_rate": 1.8538804217111746e-05, "loss": 0.8809, "step": 2921 }, { "epoch": 0.2, "learning_rate": 1.8537655198375046e-05, "loss": 0.8467, "step": 2922 }, { "epoch": 0.2, "learning_rate": 1.8536505763684195e-05, "loss": 0.8916, "step": 2923 }, { "epoch": 0.2, "learning_rate": 1.85353559130952e-05, "loss": 0.8926, "step": 2924 }, { "epoch": 0.2, "learning_rate": 1.8534205646664088e-05, "loss": 0.8018, "step": 2925 }, { "epoch": 0.2, "learning_rate": 1.8533054964446887e-05, "loss": 0.8486, "step": 2926 }, { "epoch": 0.2, "learning_rate": 1.8531903866499665e-05, "loss": 0.8838, "step": 2927 }, { "epoch": 0.2, "learning_rate": 1.8530752352878504e-05, "loss": 0.9004, "step": 2928 }, { "epoch": 0.2, "learning_rate": 1.8529600423639503e-05, "loss": 0.8516, "step": 2929 }, { "epoch": 0.2, "learning_rate": 1.852844807883879e-05, "loss": 0.8516, "step": 2930 }, { "epoch": 0.2, "learning_rate": 1.8527295318532497e-05, "loss": 0.957, "step": 2931 }, { "epoch": 0.2, "learning_rate": 1.8526142142776792e-05, "loss": 0.7979, "step": 2932 }, { "epoch": 0.2, "learning_rate": 1.852498855162786e-05, "loss": 0.9062, "step": 2933 }, { "epoch": 0.2, "learning_rate": 1.85238345451419e-05, "loss": 0.9434, "step": 2934 }, { "epoch": 0.2, "learning_rate": 1.852268012337514e-05, "loss": 0.9512, "step": 2935 }, { "epoch": 0.2, "learning_rate": 1.8521525286383815e-05, "loss": 0.8555, "step": 2936 }, { "epoch": 0.2, "learning_rate": 1.8520370034224194e-05, "loss": 0.8809, "step": 2937 }, { "epoch": 0.2, "learning_rate": 1.8519214366952564e-05, "loss": 0.8311, "step": 2938 }, { "epoch": 0.2, "learning_rate": 1.8518058284625225e-05, "loss": 0.8262, "step": 2939 }, { "epoch": 0.2, "learning_rate": 1.85169017872985e-05, "loss": 0.8574, "step": 2940 }, { "epoch": 0.2, "learning_rate": 1.8515744875028735e-05, "loss": 0.8574, "step": 2941 }, { "epoch": 0.2, "learning_rate": 1.85145875478723e-05, "loss": 0.9307, "step": 2942 }, { "epoch": 0.2, "learning_rate": 1.851342980588557e-05, "loss": 0.7695, "step": 2943 }, { "epoch": 0.2, "learning_rate": 1.8512271649124956e-05, "loss": 0.8428, "step": 2944 }, { "epoch": 0.2, "learning_rate": 1.8511113077646882e-05, "loss": 0.876, "step": 2945 }, { "epoch": 0.2, "learning_rate": 1.8509954091507793e-05, "loss": 0.8457, "step": 2946 }, { "epoch": 0.2, "learning_rate": 1.8508794690764156e-05, "loss": 0.8398, "step": 2947 }, { "epoch": 0.2, "learning_rate": 1.850763487547246e-05, "loss": 0.9082, "step": 2948 }, { "epoch": 0.2, "learning_rate": 1.8506474645689203e-05, "loss": 0.916, "step": 2949 }, { "epoch": 0.2, "learning_rate": 1.850531400147092e-05, "loss": 0.9229, "step": 2950 }, { "epoch": 0.2, "learning_rate": 1.8504152942874153e-05, "loss": 0.9678, "step": 2951 }, { "epoch": 0.2, "learning_rate": 1.8502991469955466e-05, "loss": 0.8438, "step": 2952 }, { "epoch": 0.2, "learning_rate": 1.850182958277145e-05, "loss": 0.8525, "step": 2953 }, { "epoch": 0.2, "learning_rate": 1.8500667281378714e-05, "loss": 0.8867, "step": 2954 }, { "epoch": 0.2, "learning_rate": 1.8499504565833884e-05, "loss": 0.8301, "step": 2955 }, { "epoch": 0.2, "learning_rate": 1.84983414361936e-05, "loss": 0.8838, "step": 2956 }, { "epoch": 0.2, "learning_rate": 1.849717789251454e-05, "loss": 0.8213, "step": 2957 }, { "epoch": 0.2, "learning_rate": 1.849601393485339e-05, "loss": 0.8398, "step": 2958 }, { "epoch": 0.2, "learning_rate": 1.849484956326685e-05, "loss": 0.875, "step": 2959 }, { "epoch": 0.2, "learning_rate": 1.8493684777811655e-05, "loss": 0.8789, "step": 2960 }, { "epoch": 0.2, "learning_rate": 1.849251957854455e-05, "loss": 0.8164, "step": 2961 }, { "epoch": 0.2, "learning_rate": 1.849135396552231e-05, "loss": 0.9404, "step": 2962 }, { "epoch": 0.2, "learning_rate": 1.849018793880172e-05, "loss": 0.7979, "step": 2963 }, { "epoch": 0.2, "learning_rate": 1.848902149843958e-05, "loss": 0.8408, "step": 2964 }, { "epoch": 0.2, "learning_rate": 1.8487854644492733e-05, "loss": 0.9014, "step": 2965 }, { "epoch": 0.2, "learning_rate": 1.848668737701802e-05, "loss": 0.916, "step": 2966 }, { "epoch": 0.2, "learning_rate": 1.8485519696072313e-05, "loss": 0.8945, "step": 2967 }, { "epoch": 0.2, "learning_rate": 1.8484351601712495e-05, "loss": 0.875, "step": 2968 }, { "epoch": 0.2, "learning_rate": 1.8483183093995486e-05, "loss": 0.9453, "step": 2969 }, { "epoch": 0.2, "learning_rate": 1.8482014172978207e-05, "loss": 0.9707, "step": 2970 }, { "epoch": 0.2, "learning_rate": 1.8480844838717616e-05, "loss": 0.9785, "step": 2971 }, { "epoch": 0.2, "learning_rate": 1.8479675091270673e-05, "loss": 0.7861, "step": 2972 }, { "epoch": 0.2, "learning_rate": 1.8478504930694375e-05, "loss": 0.8906, "step": 2973 }, { "epoch": 0.2, "learning_rate": 1.847733435704573e-05, "loss": 0.8574, "step": 2974 }, { "epoch": 0.2, "learning_rate": 1.847616337038177e-05, "loss": 0.8506, "step": 2975 }, { "epoch": 0.2, "learning_rate": 1.847499197075954e-05, "loss": 0.918, "step": 2976 }, { "epoch": 0.2, "learning_rate": 1.847382015823612e-05, "loss": 0.8838, "step": 2977 }, { "epoch": 0.2, "learning_rate": 1.847264793286859e-05, "loss": 0.8828, "step": 2978 }, { "epoch": 0.2, "learning_rate": 1.847147529471407e-05, "loss": 0.9092, "step": 2979 }, { "epoch": 0.2, "learning_rate": 1.8470302243829686e-05, "loss": 0.8945, "step": 2980 }, { "epoch": 0.2, "learning_rate": 1.8469128780272588e-05, "loss": 0.9053, "step": 2981 }, { "epoch": 0.2, "learning_rate": 1.8467954904099946e-05, "loss": 0.8525, "step": 2982 }, { "epoch": 0.2, "learning_rate": 1.846678061536896e-05, "loss": 0.8975, "step": 2983 }, { "epoch": 0.2, "learning_rate": 1.8465605914136834e-05, "loss": 0.8223, "step": 2984 }, { "epoch": 0.2, "learning_rate": 1.84644308004608e-05, "loss": 0.8779, "step": 2985 }, { "epoch": 0.2, "learning_rate": 1.846325527439811e-05, "loss": 0.8896, "step": 2986 }, { "epoch": 0.2, "learning_rate": 1.8462079336006034e-05, "loss": 0.8691, "step": 2987 }, { "epoch": 0.2, "learning_rate": 1.8460902985341867e-05, "loss": 0.7764, "step": 2988 }, { "epoch": 0.2, "learning_rate": 1.8459726222462917e-05, "loss": 0.9131, "step": 2989 }, { "epoch": 0.2, "learning_rate": 1.845854904742652e-05, "loss": 0.8867, "step": 2990 }, { "epoch": 0.2, "learning_rate": 1.8457371460290024e-05, "loss": 0.9014, "step": 2991 }, { "epoch": 0.2, "learning_rate": 1.845619346111081e-05, "loss": 0.875, "step": 2992 }, { "epoch": 0.2, "learning_rate": 1.8455015049946253e-05, "loss": 0.8369, "step": 2993 }, { "epoch": 0.2, "learning_rate": 1.845383622685378e-05, "loss": 0.9727, "step": 2994 }, { "epoch": 0.2, "learning_rate": 1.845265699189082e-05, "loss": 0.9502, "step": 2995 }, { "epoch": 0.2, "learning_rate": 1.8451477345114824e-05, "loss": 0.8701, "step": 2996 }, { "epoch": 0.2, "learning_rate": 1.845029728658326e-05, "loss": 0.9688, "step": 2997 }, { "epoch": 0.2, "learning_rate": 1.8449116816353627e-05, "loss": 0.8037, "step": 2998 }, { "epoch": 0.2, "learning_rate": 1.8447935934483433e-05, "loss": 0.7959, "step": 2999 }, { "epoch": 0.2, "learning_rate": 1.844675464103021e-05, "loss": 0.9189, "step": 3000 }, { "epoch": 0.2, "learning_rate": 1.8445572936051518e-05, "loss": 0.7852, "step": 3001 }, { "epoch": 0.2, "learning_rate": 1.844439081960492e-05, "loss": 0.8232, "step": 3002 }, { "epoch": 0.2, "learning_rate": 1.844320829174802e-05, "loss": 0.8037, "step": 3003 }, { "epoch": 0.2, "learning_rate": 1.8442025352538415e-05, "loss": 0.7637, "step": 3004 }, { "epoch": 0.2, "learning_rate": 1.8440842002033753e-05, "loss": 0.8926, "step": 3005 }, { "epoch": 0.2, "learning_rate": 1.8439658240291677e-05, "loss": 0.793, "step": 3006 }, { "epoch": 0.2, "learning_rate": 1.8438474067369865e-05, "loss": 0.8809, "step": 3007 }, { "epoch": 0.2, "learning_rate": 1.8437289483326006e-05, "loss": 0.8115, "step": 3008 }, { "epoch": 0.21, "learning_rate": 1.8436104488217816e-05, "loss": 0.8379, "step": 3009 }, { "epoch": 0.21, "learning_rate": 1.8434919082103026e-05, "loss": 0.8027, "step": 3010 }, { "epoch": 0.21, "learning_rate": 1.8433733265039387e-05, "loss": 0.8516, "step": 3011 }, { "epoch": 0.21, "learning_rate": 1.843254703708468e-05, "loss": 0.8867, "step": 3012 }, { "epoch": 0.21, "learning_rate": 1.8431360398296693e-05, "loss": 0.7578, "step": 3013 }, { "epoch": 0.21, "learning_rate": 1.8430173348733237e-05, "loss": 0.8457, "step": 3014 }, { "epoch": 0.21, "learning_rate": 1.8428985888452145e-05, "loss": 0.8486, "step": 3015 }, { "epoch": 0.21, "learning_rate": 1.842779801751127e-05, "loss": 0.8564, "step": 3016 }, { "epoch": 0.21, "learning_rate": 1.842660973596849e-05, "loss": 0.8223, "step": 3017 }, { "epoch": 0.21, "learning_rate": 1.8425421043881693e-05, "loss": 0.8975, "step": 3018 }, { "epoch": 0.21, "learning_rate": 1.8424231941308792e-05, "loss": 0.7861, "step": 3019 }, { "epoch": 0.21, "learning_rate": 1.8423042428307723e-05, "loss": 0.8711, "step": 3020 }, { "epoch": 0.21, "learning_rate": 1.842185250493644e-05, "loss": 0.8789, "step": 3021 }, { "epoch": 0.21, "learning_rate": 1.842066217125291e-05, "loss": 0.8877, "step": 3022 }, { "epoch": 0.21, "learning_rate": 1.841947142731513e-05, "loss": 0.8828, "step": 3023 }, { "epoch": 0.21, "learning_rate": 1.8418280273181114e-05, "loss": 0.8574, "step": 3024 }, { "epoch": 0.21, "learning_rate": 1.8417088708908895e-05, "loss": 0.877, "step": 3025 }, { "epoch": 0.21, "learning_rate": 1.8415896734556523e-05, "loss": 0.9062, "step": 3026 }, { "epoch": 0.21, "learning_rate": 1.8414704350182075e-05, "loss": 0.8379, "step": 3027 }, { "epoch": 0.21, "learning_rate": 1.8413511555843636e-05, "loss": 0.8467, "step": 3028 }, { "epoch": 0.21, "learning_rate": 1.841231835159933e-05, "loss": 0.8135, "step": 3029 }, { "epoch": 0.21, "learning_rate": 1.841112473750728e-05, "loss": 0.8867, "step": 3030 }, { "epoch": 0.21, "learning_rate": 1.8409930713625644e-05, "loss": 0.9102, "step": 3031 }, { "epoch": 0.21, "learning_rate": 1.8408736280012596e-05, "loss": 0.8232, "step": 3032 }, { "epoch": 0.21, "learning_rate": 1.8407541436726327e-05, "loss": 0.835, "step": 3033 }, { "epoch": 0.21, "learning_rate": 1.8406346183825045e-05, "loss": 0.9238, "step": 3034 }, { "epoch": 0.21, "learning_rate": 1.8405150521366988e-05, "loss": 0.8926, "step": 3035 }, { "epoch": 0.21, "learning_rate": 1.840395444941041e-05, "loss": 0.8672, "step": 3036 }, { "epoch": 0.21, "learning_rate": 1.840275796801358e-05, "loss": 0.875, "step": 3037 }, { "epoch": 0.21, "learning_rate": 1.8401561077234792e-05, "loss": 0.8838, "step": 3038 }, { "epoch": 0.21, "learning_rate": 1.8400363777132356e-05, "loss": 0.8887, "step": 3039 }, { "epoch": 0.21, "learning_rate": 1.8399166067764603e-05, "loss": 0.8477, "step": 3040 }, { "epoch": 0.21, "learning_rate": 1.8397967949189897e-05, "loss": 0.7754, "step": 3041 }, { "epoch": 0.21, "learning_rate": 1.8396769421466598e-05, "loss": 0.8906, "step": 3042 }, { "epoch": 0.21, "learning_rate": 1.83955704846531e-05, "loss": 0.7705, "step": 3043 }, { "epoch": 0.21, "learning_rate": 1.8394371138807824e-05, "loss": 0.8584, "step": 3044 }, { "epoch": 0.21, "learning_rate": 1.839317138398919e-05, "loss": 0.8428, "step": 3045 }, { "epoch": 0.21, "learning_rate": 1.8391971220255658e-05, "loss": 0.9277, "step": 3046 }, { "epoch": 0.21, "learning_rate": 1.8390770647665696e-05, "loss": 0.8252, "step": 3047 }, { "epoch": 0.21, "learning_rate": 1.8389569666277796e-05, "loss": 0.8242, "step": 3048 }, { "epoch": 0.21, "learning_rate": 1.8388368276150475e-05, "loss": 0.7852, "step": 3049 }, { "epoch": 0.21, "learning_rate": 1.838716647734226e-05, "loss": 0.9043, "step": 3050 }, { "epoch": 0.21, "learning_rate": 1.83859642699117e-05, "loss": 0.7461, "step": 3051 }, { "epoch": 0.21, "learning_rate": 1.8384761653917367e-05, "loss": 0.8301, "step": 3052 }, { "epoch": 0.21, "learning_rate": 1.838355862941786e-05, "loss": 0.9004, "step": 3053 }, { "epoch": 0.21, "learning_rate": 1.8382355196471788e-05, "loss": 0.9141, "step": 3054 }, { "epoch": 0.21, "learning_rate": 1.8381151355137776e-05, "loss": 0.8564, "step": 3055 }, { "epoch": 0.21, "learning_rate": 1.837994710547448e-05, "loss": 0.8242, "step": 3056 }, { "epoch": 0.21, "learning_rate": 1.8378742447540567e-05, "loss": 0.8447, "step": 3057 }, { "epoch": 0.21, "learning_rate": 1.837753738139473e-05, "loss": 0.8916, "step": 3058 }, { "epoch": 0.21, "learning_rate": 1.8376331907095685e-05, "loss": 0.8301, "step": 3059 }, { "epoch": 0.21, "learning_rate": 1.8375126024702155e-05, "loss": 0.8857, "step": 3060 }, { "epoch": 0.21, "learning_rate": 1.8373919734272895e-05, "loss": 0.834, "step": 3061 }, { "epoch": 0.21, "learning_rate": 1.8372713035866675e-05, "loss": 0.8711, "step": 3062 }, { "epoch": 0.21, "learning_rate": 1.837150592954228e-05, "loss": 0.834, "step": 3063 }, { "epoch": 0.21, "learning_rate": 1.8370298415358527e-05, "loss": 0.8545, "step": 3064 }, { "epoch": 0.21, "learning_rate": 1.8369090493374245e-05, "loss": 0.8623, "step": 3065 }, { "epoch": 0.21, "learning_rate": 1.8367882163648278e-05, "loss": 0.9629, "step": 3066 }, { "epoch": 0.21, "learning_rate": 1.8366673426239503e-05, "loss": 0.9102, "step": 3067 }, { "epoch": 0.21, "learning_rate": 1.8365464281206807e-05, "loss": 0.8799, "step": 3068 }, { "epoch": 0.21, "learning_rate": 1.8364254728609095e-05, "loss": 0.8965, "step": 3069 }, { "epoch": 0.21, "learning_rate": 1.8363044768505306e-05, "loss": 0.8291, "step": 3070 }, { "epoch": 0.21, "learning_rate": 1.8361834400954383e-05, "loss": 0.874, "step": 3071 }, { "epoch": 0.21, "learning_rate": 1.8360623626015293e-05, "loss": 0.9033, "step": 3072 }, { "epoch": 0.21, "learning_rate": 1.8359412443747027e-05, "loss": 0.9258, "step": 3073 }, { "epoch": 0.21, "learning_rate": 1.83582008542086e-05, "loss": 0.8623, "step": 3074 }, { "epoch": 0.21, "learning_rate": 1.835698885745903e-05, "loss": 0.8164, "step": 3075 }, { "epoch": 0.21, "learning_rate": 1.835577645355737e-05, "loss": 0.9199, "step": 3076 }, { "epoch": 0.21, "learning_rate": 1.835456364256269e-05, "loss": 1.0225, "step": 3077 }, { "epoch": 0.21, "learning_rate": 1.8353350424534078e-05, "loss": 0.873, "step": 3078 }, { "epoch": 0.21, "learning_rate": 1.835213679953064e-05, "loss": 0.9893, "step": 3079 }, { "epoch": 0.21, "learning_rate": 1.8350922767611504e-05, "loss": 0.7627, "step": 3080 }, { "epoch": 0.21, "learning_rate": 1.834970832883582e-05, "loss": 0.8906, "step": 3081 }, { "epoch": 0.21, "learning_rate": 1.834849348326275e-05, "loss": 0.8525, "step": 3082 }, { "epoch": 0.21, "learning_rate": 1.8347278230951488e-05, "loss": 0.8711, "step": 3083 }, { "epoch": 0.21, "learning_rate": 1.834606257196123e-05, "loss": 0.8887, "step": 3084 }, { "epoch": 0.21, "learning_rate": 1.834484650635122e-05, "loss": 0.8945, "step": 3085 }, { "epoch": 0.21, "learning_rate": 1.8343630034180694e-05, "loss": 0.8779, "step": 3086 }, { "epoch": 0.21, "learning_rate": 1.8342413155508915e-05, "loss": 0.8291, "step": 3087 }, { "epoch": 0.21, "learning_rate": 1.8341195870395176e-05, "loss": 0.8779, "step": 3088 }, { "epoch": 0.21, "learning_rate": 1.833997817889878e-05, "loss": 0.873, "step": 3089 }, { "epoch": 0.21, "learning_rate": 1.8338760081079056e-05, "loss": 0.9092, "step": 3090 }, { "epoch": 0.21, "learning_rate": 1.8337541576995348e-05, "loss": 0.9229, "step": 3091 }, { "epoch": 0.21, "learning_rate": 1.833632266670702e-05, "loss": 0.8125, "step": 3092 }, { "epoch": 0.21, "learning_rate": 1.8335103350273455e-05, "loss": 0.8389, "step": 3093 }, { "epoch": 0.21, "learning_rate": 1.8333883627754065e-05, "loss": 0.8213, "step": 3094 }, { "epoch": 0.21, "learning_rate": 1.833266349920827e-05, "loss": 0.9053, "step": 3095 }, { "epoch": 0.21, "learning_rate": 1.8331442964695514e-05, "loss": 0.9072, "step": 3096 }, { "epoch": 0.21, "learning_rate": 1.8330222024275266e-05, "loss": 0.8447, "step": 3097 }, { "epoch": 0.21, "learning_rate": 1.8329000678007004e-05, "loss": 0.7979, "step": 3098 }, { "epoch": 0.21, "learning_rate": 1.832777892595024e-05, "loss": 0.8857, "step": 3099 }, { "epoch": 0.21, "learning_rate": 1.8326556768164488e-05, "loss": 0.8438, "step": 3100 }, { "epoch": 0.21, "learning_rate": 1.8325334204709298e-05, "loss": 0.9307, "step": 3101 }, { "epoch": 0.21, "learning_rate": 1.832411123564423e-05, "loss": 0.834, "step": 3102 }, { "epoch": 0.21, "learning_rate": 1.832288786102887e-05, "loss": 0.8799, "step": 3103 }, { "epoch": 0.21, "learning_rate": 1.8321664080922823e-05, "loss": 0.832, "step": 3104 }, { "epoch": 0.21, "learning_rate": 1.8320439895385703e-05, "loss": 0.8545, "step": 3105 }, { "epoch": 0.21, "learning_rate": 1.8319215304477157e-05, "loss": 0.8174, "step": 3106 }, { "epoch": 0.21, "learning_rate": 1.831799030825685e-05, "loss": 0.8301, "step": 3107 }, { "epoch": 0.21, "learning_rate": 1.831676490678446e-05, "loss": 0.8789, "step": 3108 }, { "epoch": 0.21, "learning_rate": 1.8315539100119685e-05, "loss": 0.7979, "step": 3109 }, { "epoch": 0.21, "learning_rate": 1.8314312888322257e-05, "loss": 0.9443, "step": 3110 }, { "epoch": 0.21, "learning_rate": 1.8313086271451906e-05, "loss": 0.9297, "step": 3111 }, { "epoch": 0.21, "learning_rate": 1.83118592495684e-05, "loss": 0.875, "step": 3112 }, { "epoch": 0.21, "learning_rate": 1.8310631822731516e-05, "loss": 0.8594, "step": 3113 }, { "epoch": 0.21, "learning_rate": 1.8309403991001056e-05, "loss": 0.8701, "step": 3114 }, { "epoch": 0.21, "learning_rate": 1.8308175754436837e-05, "loss": 0.8828, "step": 3115 }, { "epoch": 0.21, "learning_rate": 1.83069471130987e-05, "loss": 0.9111, "step": 3116 }, { "epoch": 0.21, "learning_rate": 1.8305718067046506e-05, "loss": 0.8291, "step": 3117 }, { "epoch": 0.21, "learning_rate": 1.830448861634013e-05, "loss": 0.7822, "step": 3118 }, { "epoch": 0.21, "learning_rate": 1.8303258761039476e-05, "loss": 0.917, "step": 3119 }, { "epoch": 0.21, "learning_rate": 1.830202850120446e-05, "loss": 0.8301, "step": 3120 }, { "epoch": 0.21, "learning_rate": 1.830079783689502e-05, "loss": 0.9697, "step": 3121 }, { "epoch": 0.21, "learning_rate": 1.8299566768171114e-05, "loss": 0.8418, "step": 3122 }, { "epoch": 0.21, "learning_rate": 1.8298335295092723e-05, "loss": 0.8838, "step": 3123 }, { "epoch": 0.21, "learning_rate": 1.8297103417719837e-05, "loss": 0.915, "step": 3124 }, { "epoch": 0.21, "learning_rate": 1.8295871136112478e-05, "loss": 0.8262, "step": 3125 }, { "epoch": 0.21, "learning_rate": 1.829463845033068e-05, "loss": 0.8584, "step": 3126 }, { "epoch": 0.21, "learning_rate": 1.8293405360434505e-05, "loss": 0.9482, "step": 3127 }, { "epoch": 0.21, "learning_rate": 1.8292171866484027e-05, "loss": 0.8252, "step": 3128 }, { "epoch": 0.21, "learning_rate": 1.8290937968539335e-05, "loss": 0.874, "step": 3129 }, { "epoch": 0.21, "learning_rate": 1.828970366666055e-05, "loss": 0.8682, "step": 3130 }, { "epoch": 0.21, "learning_rate": 1.8288468960907808e-05, "loss": 0.9795, "step": 3131 }, { "epoch": 0.21, "learning_rate": 1.8287233851341262e-05, "loss": 0.9277, "step": 3132 }, { "epoch": 0.21, "learning_rate": 1.828599833802109e-05, "loss": 0.96, "step": 3133 }, { "epoch": 0.21, "learning_rate": 1.8284762421007478e-05, "loss": 0.8223, "step": 3134 }, { "epoch": 0.21, "learning_rate": 1.8283526100360648e-05, "loss": 0.8721, "step": 3135 }, { "epoch": 0.21, "learning_rate": 1.828228937614083e-05, "loss": 0.8643, "step": 3136 }, { "epoch": 0.21, "learning_rate": 1.8281052248408277e-05, "loss": 0.8779, "step": 3137 }, { "epoch": 0.21, "learning_rate": 1.827981471722326e-05, "loss": 0.8955, "step": 3138 }, { "epoch": 0.21, "learning_rate": 1.8278576782646076e-05, "loss": 0.8633, "step": 3139 }, { "epoch": 0.21, "learning_rate": 1.8277338444737037e-05, "loss": 0.8379, "step": 3140 }, { "epoch": 0.21, "learning_rate": 1.827609970355647e-05, "loss": 0.832, "step": 3141 }, { "epoch": 0.21, "learning_rate": 1.827486055916473e-05, "loss": 0.9326, "step": 3142 }, { "epoch": 0.21, "learning_rate": 1.8273621011622188e-05, "loss": 0.8037, "step": 3143 }, { "epoch": 0.21, "learning_rate": 1.827238106098923e-05, "loss": 0.9502, "step": 3144 }, { "epoch": 0.21, "learning_rate": 1.8271140707326275e-05, "loss": 0.8965, "step": 3145 }, { "epoch": 0.21, "learning_rate": 1.8269899950693744e-05, "loss": 0.8691, "step": 3146 }, { "epoch": 0.21, "learning_rate": 1.8268658791152092e-05, "loss": 0.8301, "step": 3147 }, { "epoch": 0.21, "learning_rate": 1.8267417228761787e-05, "loss": 0.833, "step": 3148 }, { "epoch": 0.21, "learning_rate": 1.826617526358332e-05, "loss": 0.9219, "step": 3149 }, { "epoch": 0.21, "learning_rate": 1.8264932895677195e-05, "loss": 0.8711, "step": 3150 }, { "epoch": 0.21, "learning_rate": 1.8263690125103943e-05, "loss": 0.9453, "step": 3151 }, { "epoch": 0.21, "learning_rate": 1.826244695192411e-05, "loss": 0.8447, "step": 3152 }, { "epoch": 0.21, "learning_rate": 1.8261203376198264e-05, "loss": 0.7666, "step": 3153 }, { "epoch": 0.21, "learning_rate": 1.825995939798699e-05, "loss": 0.8584, "step": 3154 }, { "epoch": 0.22, "learning_rate": 1.8258715017350904e-05, "loss": 0.8955, "step": 3155 }, { "epoch": 0.22, "learning_rate": 1.8257470234350622e-05, "loss": 0.876, "step": 3156 }, { "epoch": 0.22, "learning_rate": 1.825622504904679e-05, "loss": 0.8457, "step": 3157 }, { "epoch": 0.22, "learning_rate": 1.825497946150008e-05, "loss": 0.8877, "step": 3158 }, { "epoch": 0.22, "learning_rate": 1.8253733471771173e-05, "loss": 0.8623, "step": 3159 }, { "epoch": 0.22, "learning_rate": 1.8252487079920773e-05, "loss": 0.9365, "step": 3160 }, { "epoch": 0.22, "learning_rate": 1.8251240286009608e-05, "loss": 0.8799, "step": 3161 }, { "epoch": 0.22, "learning_rate": 1.8249993090098414e-05, "loss": 0.8613, "step": 3162 }, { "epoch": 0.22, "learning_rate": 1.824874549224796e-05, "loss": 0.9873, "step": 3163 }, { "epoch": 0.22, "learning_rate": 1.8247497492519026e-05, "loss": 0.875, "step": 3164 }, { "epoch": 0.22, "learning_rate": 1.824624909097242e-05, "loss": 0.8555, "step": 3165 }, { "epoch": 0.22, "learning_rate": 1.824500028766896e-05, "loss": 0.8672, "step": 3166 }, { "epoch": 0.22, "learning_rate": 1.8243751082669486e-05, "loss": 0.8848, "step": 3167 }, { "epoch": 0.22, "learning_rate": 1.824250147603486e-05, "loss": 0.8994, "step": 3168 }, { "epoch": 0.22, "learning_rate": 1.824125146782597e-05, "loss": 0.9092, "step": 3169 }, { "epoch": 0.22, "learning_rate": 1.8240001058103707e-05, "loss": 0.9072, "step": 3170 }, { "epoch": 0.22, "learning_rate": 1.8238750246928992e-05, "loss": 0.8711, "step": 3171 }, { "epoch": 0.22, "learning_rate": 1.8237499034362768e-05, "loss": 0.8711, "step": 3172 }, { "epoch": 0.22, "learning_rate": 1.8236247420465995e-05, "loss": 0.8877, "step": 3173 }, { "epoch": 0.22, "learning_rate": 1.8234995405299648e-05, "loss": 0.793, "step": 3174 }, { "epoch": 0.22, "learning_rate": 1.8233742988924725e-05, "loss": 0.8828, "step": 3175 }, { "epoch": 0.22, "learning_rate": 1.8232490171402248e-05, "loss": 0.8086, "step": 3176 }, { "epoch": 0.22, "learning_rate": 1.8231236952793248e-05, "loss": 0.8721, "step": 3177 }, { "epoch": 0.22, "learning_rate": 1.8229983333158787e-05, "loss": 0.8525, "step": 3178 }, { "epoch": 0.22, "learning_rate": 1.822872931255994e-05, "loss": 0.9238, "step": 3179 }, { "epoch": 0.22, "learning_rate": 1.82274748910578e-05, "loss": 0.9219, "step": 3180 }, { "epoch": 0.22, "learning_rate": 1.8226220068713488e-05, "loss": 0.8916, "step": 3181 }, { "epoch": 0.22, "learning_rate": 1.8224964845588133e-05, "loss": 0.8047, "step": 3182 }, { "epoch": 0.22, "learning_rate": 1.8223709221742893e-05, "loss": 0.8184, "step": 3183 }, { "epoch": 0.22, "learning_rate": 1.822245319723894e-05, "loss": 0.8252, "step": 3184 }, { "epoch": 0.22, "learning_rate": 1.8221196772137467e-05, "loss": 0.9102, "step": 3185 }, { "epoch": 0.22, "learning_rate": 1.821993994649969e-05, "loss": 0.748, "step": 3186 }, { "epoch": 0.22, "learning_rate": 1.821868272038684e-05, "loss": 0.8242, "step": 3187 }, { "epoch": 0.22, "learning_rate": 1.8217425093860166e-05, "loss": 0.9355, "step": 3188 }, { "epoch": 0.22, "learning_rate": 1.8216167066980946e-05, "loss": 0.8135, "step": 3189 }, { "epoch": 0.22, "learning_rate": 1.8214908639810463e-05, "loss": 0.9424, "step": 3190 }, { "epoch": 0.22, "learning_rate": 1.8213649812410034e-05, "loss": 0.8271, "step": 3191 }, { "epoch": 0.22, "learning_rate": 1.8212390584840984e-05, "loss": 0.8896, "step": 3192 }, { "epoch": 0.22, "learning_rate": 1.821113095716467e-05, "loss": 0.9199, "step": 3193 }, { "epoch": 0.22, "learning_rate": 1.820987092944245e-05, "loss": 0.8574, "step": 3194 }, { "epoch": 0.22, "learning_rate": 1.8208610501735726e-05, "loss": 0.8887, "step": 3195 }, { "epoch": 0.22, "learning_rate": 1.8207349674105894e-05, "loss": 0.8467, "step": 3196 }, { "epoch": 0.22, "learning_rate": 1.8206088446614387e-05, "loss": 0.9092, "step": 3197 }, { "epoch": 0.22, "learning_rate": 1.820482681932265e-05, "loss": 0.8857, "step": 3198 }, { "epoch": 0.22, "learning_rate": 1.8203564792292153e-05, "loss": 0.9258, "step": 3199 }, { "epoch": 0.22, "learning_rate": 1.820230236558438e-05, "loss": 0.8086, "step": 3200 }, { "epoch": 0.22, "learning_rate": 1.8201039539260833e-05, "loss": 0.9023, "step": 3201 }, { "epoch": 0.22, "learning_rate": 1.819977631338304e-05, "loss": 0.917, "step": 3202 }, { "epoch": 0.22, "learning_rate": 1.8198512688012545e-05, "loss": 0.9121, "step": 3203 }, { "epoch": 0.22, "learning_rate": 1.8197248663210915e-05, "loss": 0.7998, "step": 3204 }, { "epoch": 0.22, "learning_rate": 1.8195984239039724e-05, "loss": 0.8955, "step": 3205 }, { "epoch": 0.22, "learning_rate": 1.8194719415560584e-05, "loss": 0.8662, "step": 3206 }, { "epoch": 0.22, "learning_rate": 1.8193454192835113e-05, "loss": 0.9346, "step": 3207 }, { "epoch": 0.22, "learning_rate": 1.8192188570924952e-05, "loss": 0.8545, "step": 3208 }, { "epoch": 0.22, "learning_rate": 1.8190922549891766e-05, "loss": 0.9395, "step": 3209 }, { "epoch": 0.22, "learning_rate": 1.818965612979723e-05, "loss": 0.8643, "step": 3210 }, { "epoch": 0.22, "learning_rate": 1.818838931070305e-05, "loss": 0.8369, "step": 3211 }, { "epoch": 0.22, "learning_rate": 1.818712209267094e-05, "loss": 0.8867, "step": 3212 }, { "epoch": 0.22, "learning_rate": 1.818585447576264e-05, "loss": 0.8857, "step": 3213 }, { "epoch": 0.22, "learning_rate": 1.818458646003991e-05, "loss": 0.8105, "step": 3214 }, { "epoch": 0.22, "learning_rate": 1.818331804556453e-05, "loss": 0.8594, "step": 3215 }, { "epoch": 0.22, "learning_rate": 1.8182049232398292e-05, "loss": 0.833, "step": 3216 }, { "epoch": 0.22, "learning_rate": 1.818078002060301e-05, "loss": 0.8838, "step": 3217 }, { "epoch": 0.22, "learning_rate": 1.817951041024053e-05, "loss": 0.8506, "step": 3218 }, { "epoch": 0.22, "learning_rate": 1.81782404013727e-05, "loss": 0.8926, "step": 3219 }, { "epoch": 0.22, "learning_rate": 1.8176969994061395e-05, "loss": 0.9053, "step": 3220 }, { "epoch": 0.22, "learning_rate": 1.8175699188368513e-05, "loss": 0.874, "step": 3221 }, { "epoch": 0.22, "learning_rate": 1.8174427984355962e-05, "loss": 0.9131, "step": 3222 }, { "epoch": 0.22, "learning_rate": 1.817315638208568e-05, "loss": 0.8311, "step": 3223 }, { "epoch": 0.22, "learning_rate": 1.817188438161962e-05, "loss": 0.8662, "step": 3224 }, { "epoch": 0.22, "learning_rate": 1.817061198301975e-05, "loss": 0.7754, "step": 3225 }, { "epoch": 0.22, "learning_rate": 1.816933918634806e-05, "loss": 0.8154, "step": 3226 }, { "epoch": 0.22, "learning_rate": 1.8168065991666565e-05, "loss": 0.8311, "step": 3227 }, { "epoch": 0.22, "learning_rate": 1.8166792399037294e-05, "loss": 0.877, "step": 3228 }, { "epoch": 0.22, "learning_rate": 1.8165518408522293e-05, "loss": 0.8984, "step": 3229 }, { "epoch": 0.22, "learning_rate": 1.8164244020183638e-05, "loss": 0.8584, "step": 3230 }, { "epoch": 0.22, "learning_rate": 1.816296923408341e-05, "loss": 0.8799, "step": 3231 }, { "epoch": 0.22, "learning_rate": 1.8161694050283717e-05, "loss": 0.8125, "step": 3232 }, { "epoch": 0.22, "learning_rate": 1.816041846884669e-05, "loss": 0.8311, "step": 3233 }, { "epoch": 0.22, "learning_rate": 1.8159142489834473e-05, "loss": 0.8154, "step": 3234 }, { "epoch": 0.22, "learning_rate": 1.8157866113309232e-05, "loss": 0.874, "step": 3235 }, { "epoch": 0.22, "learning_rate": 1.8156589339333154e-05, "loss": 0.9102, "step": 3236 }, { "epoch": 0.22, "learning_rate": 1.8155312167968438e-05, "loss": 0.8242, "step": 3237 }, { "epoch": 0.22, "learning_rate": 1.815403459927731e-05, "loss": 0.8223, "step": 3238 }, { "epoch": 0.22, "learning_rate": 1.8152756633322015e-05, "loss": 0.835, "step": 3239 }, { "epoch": 0.22, "learning_rate": 1.8151478270164815e-05, "loss": 0.8438, "step": 3240 }, { "epoch": 0.22, "learning_rate": 1.815019950986799e-05, "loss": 0.8389, "step": 3241 }, { "epoch": 0.22, "learning_rate": 1.8148920352493845e-05, "loss": 0.8271, "step": 3242 }, { "epoch": 0.22, "learning_rate": 1.8147640798104694e-05, "loss": 0.9814, "step": 3243 }, { "epoch": 0.22, "learning_rate": 1.8146360846762886e-05, "loss": 0.9492, "step": 3244 }, { "epoch": 0.22, "learning_rate": 1.814508049853077e-05, "loss": 0.8477, "step": 3245 }, { "epoch": 0.22, "learning_rate": 1.8143799753470733e-05, "loss": 0.8809, "step": 3246 }, { "epoch": 0.22, "learning_rate": 1.8142518611645165e-05, "loss": 0.8584, "step": 3247 }, { "epoch": 0.22, "learning_rate": 1.814123707311649e-05, "loss": 0.8975, "step": 3248 }, { "epoch": 0.22, "learning_rate": 1.813995513794714e-05, "loss": 0.8262, "step": 3249 }, { "epoch": 0.22, "learning_rate": 1.8138672806199576e-05, "loss": 0.9082, "step": 3250 }, { "epoch": 0.22, "learning_rate": 1.8137390077936267e-05, "loss": 0.9014, "step": 3251 }, { "epoch": 0.22, "learning_rate": 1.813610695321971e-05, "loss": 0.9033, "step": 3252 }, { "epoch": 0.22, "learning_rate": 1.813482343211242e-05, "loss": 0.8037, "step": 3253 }, { "epoch": 0.22, "learning_rate": 1.813353951467693e-05, "loss": 0.9121, "step": 3254 }, { "epoch": 0.22, "learning_rate": 1.813225520097579e-05, "loss": 0.9043, "step": 3255 }, { "epoch": 0.22, "learning_rate": 1.8130970491071574e-05, "loss": 0.9141, "step": 3256 }, { "epoch": 0.22, "learning_rate": 1.8129685385026872e-05, "loss": 0.8193, "step": 3257 }, { "epoch": 0.22, "learning_rate": 1.8128399882904296e-05, "loss": 0.8164, "step": 3258 }, { "epoch": 0.22, "learning_rate": 1.812711398476647e-05, "loss": 0.8613, "step": 3259 }, { "epoch": 0.22, "learning_rate": 1.812582769067605e-05, "loss": 0.8809, "step": 3260 }, { "epoch": 0.22, "learning_rate": 1.81245410006957e-05, "loss": 0.9307, "step": 3261 }, { "epoch": 0.22, "learning_rate": 1.8123253914888107e-05, "loss": 0.8691, "step": 3262 }, { "epoch": 0.22, "learning_rate": 1.8121966433315985e-05, "loss": 0.8516, "step": 3263 }, { "epoch": 0.22, "learning_rate": 1.812067855604205e-05, "loss": 0.8359, "step": 3264 }, { "epoch": 0.22, "learning_rate": 1.8119390283129054e-05, "loss": 0.8936, "step": 3265 }, { "epoch": 0.22, "learning_rate": 1.811810161463976e-05, "loss": 0.8232, "step": 3266 }, { "epoch": 0.22, "learning_rate": 1.8116812550636948e-05, "loss": 0.6445, "step": 3267 }, { "epoch": 0.22, "learning_rate": 1.8115523091183425e-05, "loss": 0.833, "step": 3268 }, { "epoch": 0.22, "learning_rate": 1.8114233236342013e-05, "loss": 0.8633, "step": 3269 }, { "epoch": 0.22, "learning_rate": 1.8112942986175553e-05, "loss": 0.8076, "step": 3270 }, { "epoch": 0.22, "learning_rate": 1.8111652340746908e-05, "loss": 0.8887, "step": 3271 }, { "epoch": 0.22, "learning_rate": 1.8110361300118957e-05, "loss": 0.8701, "step": 3272 }, { "epoch": 0.22, "learning_rate": 1.81090698643546e-05, "loss": 0.9346, "step": 3273 }, { "epoch": 0.22, "learning_rate": 1.810777803351675e-05, "loss": 0.8633, "step": 3274 }, { "epoch": 0.22, "learning_rate": 1.8106485807668354e-05, "loss": 0.8721, "step": 3275 }, { "epoch": 0.22, "learning_rate": 1.8105193186872363e-05, "loss": 0.8232, "step": 3276 }, { "epoch": 0.22, "learning_rate": 1.8103900171191757e-05, "loss": 0.8643, "step": 3277 }, { "epoch": 0.22, "learning_rate": 1.8102606760689524e-05, "loss": 0.8623, "step": 3278 }, { "epoch": 0.22, "learning_rate": 1.810131295542869e-05, "loss": 0.8223, "step": 3279 }, { "epoch": 0.22, "learning_rate": 1.8100018755472283e-05, "loss": 0.876, "step": 3280 }, { "epoch": 0.22, "learning_rate": 1.809872416088336e-05, "loss": 0.8457, "step": 3281 }, { "epoch": 0.22, "learning_rate": 1.8097429171724986e-05, "loss": 0.8457, "step": 3282 }, { "epoch": 0.22, "learning_rate": 1.809613378806026e-05, "loss": 0.8682, "step": 3283 }, { "epoch": 0.22, "learning_rate": 1.8094838009952287e-05, "loss": 0.9668, "step": 3284 }, { "epoch": 0.22, "learning_rate": 1.8093541837464207e-05, "loss": 0.8242, "step": 3285 }, { "epoch": 0.22, "learning_rate": 1.809224527065916e-05, "loss": 0.8535, "step": 3286 }, { "epoch": 0.22, "learning_rate": 1.8090948309600315e-05, "loss": 0.9346, "step": 3287 }, { "epoch": 0.22, "learning_rate": 1.8089650954350867e-05, "loss": 0.874, "step": 3288 }, { "epoch": 0.22, "learning_rate": 1.8088353204974017e-05, "loss": 0.9111, "step": 3289 }, { "epoch": 0.22, "learning_rate": 1.8087055061532995e-05, "loss": 0.8564, "step": 3290 }, { "epoch": 0.22, "learning_rate": 1.8085756524091047e-05, "loss": 0.8125, "step": 3291 }, { "epoch": 0.22, "learning_rate": 1.8084457592711432e-05, "loss": 0.8828, "step": 3292 }, { "epoch": 0.22, "learning_rate": 1.8083158267457438e-05, "loss": 0.8857, "step": 3293 }, { "epoch": 0.22, "learning_rate": 1.8081858548392368e-05, "loss": 0.8574, "step": 3294 }, { "epoch": 0.22, "learning_rate": 1.8080558435579544e-05, "loss": 0.9053, "step": 3295 }, { "epoch": 0.22, "learning_rate": 1.807925792908231e-05, "loss": 0.8604, "step": 3296 }, { "epoch": 0.22, "learning_rate": 1.8077957028964018e-05, "loss": 0.7969, "step": 3297 }, { "epoch": 0.22, "learning_rate": 1.8076655735288054e-05, "loss": 0.7939, "step": 3298 }, { "epoch": 0.22, "learning_rate": 1.8075354048117818e-05, "loss": 0.8789, "step": 3299 }, { "epoch": 0.22, "learning_rate": 1.8074051967516726e-05, "loss": 0.8877, "step": 3300 }, { "epoch": 0.22, "learning_rate": 1.8072749493548217e-05, "loss": 0.8223, "step": 3301 }, { "epoch": 0.23, "learning_rate": 1.8071446626275745e-05, "loss": 0.9014, "step": 3302 }, { "epoch": 0.23, "learning_rate": 1.807014336576279e-05, "loss": 0.9238, "step": 3303 }, { "epoch": 0.23, "learning_rate": 1.8068839712072842e-05, "loss": 0.9521, "step": 3304 }, { "epoch": 0.23, "learning_rate": 1.8067535665269416e-05, "loss": 0.8125, "step": 3305 }, { "epoch": 0.23, "learning_rate": 1.806623122541604e-05, "loss": 0.8848, "step": 3306 }, { "epoch": 0.23, "learning_rate": 1.8064926392576283e-05, "loss": 0.9102, "step": 3307 }, { "epoch": 0.23, "learning_rate": 1.80636211668137e-05, "loss": 0.9043, "step": 3308 }, { "epoch": 0.23, "learning_rate": 1.806231554819189e-05, "loss": 0.79, "step": 3309 }, { "epoch": 0.23, "learning_rate": 1.8061009536774455e-05, "loss": 0.9639, "step": 3310 }, { "epoch": 0.23, "learning_rate": 1.805970313262503e-05, "loss": 0.834, "step": 3311 }, { "epoch": 0.23, "learning_rate": 1.805839633580726e-05, "loss": 0.916, "step": 3312 }, { "epoch": 0.23, "learning_rate": 1.8057089146384817e-05, "loss": 0.8359, "step": 3313 }, { "epoch": 0.23, "learning_rate": 1.8055781564421382e-05, "loss": 0.8984, "step": 3314 }, { "epoch": 0.23, "learning_rate": 1.8054473589980665e-05, "loss": 0.9512, "step": 3315 }, { "epoch": 0.23, "learning_rate": 1.8053165223126384e-05, "loss": 0.8125, "step": 3316 }, { "epoch": 0.23, "learning_rate": 1.8051856463922285e-05, "loss": 0.7676, "step": 3317 }, { "epoch": 0.23, "learning_rate": 1.8050547312432132e-05, "loss": 0.9229, "step": 3318 }, { "epoch": 0.23, "learning_rate": 1.804923776871971e-05, "loss": 0.915, "step": 3319 }, { "epoch": 0.23, "learning_rate": 1.8047927832848816e-05, "loss": 0.8779, "step": 3320 }, { "epoch": 0.23, "learning_rate": 1.804661750488327e-05, "loss": 0.8711, "step": 3321 }, { "epoch": 0.23, "learning_rate": 1.804530678488691e-05, "loss": 0.876, "step": 3322 }, { "epoch": 0.23, "learning_rate": 1.8043995672923595e-05, "loss": 0.8965, "step": 3323 }, { "epoch": 0.23, "learning_rate": 1.8042684169057204e-05, "loss": 0.792, "step": 3324 }, { "epoch": 0.23, "learning_rate": 1.8041372273351637e-05, "loss": 0.8848, "step": 3325 }, { "epoch": 0.23, "learning_rate": 1.80400599858708e-05, "loss": 0.8945, "step": 3326 }, { "epoch": 0.23, "learning_rate": 1.8038747306678632e-05, "loss": 0.8965, "step": 3327 }, { "epoch": 0.23, "learning_rate": 1.803743423583909e-05, "loss": 0.9209, "step": 3328 }, { "epoch": 0.23, "learning_rate": 1.8036120773416145e-05, "loss": 0.8232, "step": 3329 }, { "epoch": 0.23, "learning_rate": 1.8034806919473782e-05, "loss": 0.7891, "step": 3330 }, { "epoch": 0.23, "learning_rate": 1.8033492674076023e-05, "loss": 0.7949, "step": 3331 }, { "epoch": 0.23, "learning_rate": 1.803217803728689e-05, "loss": 0.9189, "step": 3332 }, { "epoch": 0.23, "learning_rate": 1.8030863009170435e-05, "loss": 0.8828, "step": 3333 }, { "epoch": 0.23, "learning_rate": 1.8029547589790728e-05, "loss": 0.7959, "step": 3334 }, { "epoch": 0.23, "learning_rate": 1.8028231779211852e-05, "loss": 0.9053, "step": 3335 }, { "epoch": 0.23, "learning_rate": 1.8026915577497915e-05, "loss": 0.8301, "step": 3336 }, { "epoch": 0.23, "learning_rate": 1.8025598984713044e-05, "loss": 0.875, "step": 3337 }, { "epoch": 0.23, "learning_rate": 1.802428200092138e-05, "loss": 0.9707, "step": 3338 }, { "epoch": 0.23, "learning_rate": 1.8022964626187092e-05, "loss": 0.873, "step": 3339 }, { "epoch": 0.23, "learning_rate": 1.8021646860574354e-05, "loss": 0.8301, "step": 3340 }, { "epoch": 0.23, "learning_rate": 1.8020328704147377e-05, "loss": 0.8887, "step": 3341 }, { "epoch": 0.23, "learning_rate": 1.8019010156970373e-05, "loss": 0.9238, "step": 3342 }, { "epoch": 0.23, "learning_rate": 1.8017691219107587e-05, "loss": 0.8105, "step": 3343 }, { "epoch": 0.23, "learning_rate": 1.8016371890623272e-05, "loss": 0.8643, "step": 3344 }, { "epoch": 0.23, "learning_rate": 1.8015052171581714e-05, "loss": 0.8555, "step": 3345 }, { "epoch": 0.23, "learning_rate": 1.8013732062047204e-05, "loss": 0.9014, "step": 3346 }, { "epoch": 0.23, "learning_rate": 1.8012411562084054e-05, "loss": 0.8955, "step": 3347 }, { "epoch": 0.23, "learning_rate": 1.801109067175661e-05, "loss": 0.8809, "step": 3348 }, { "epoch": 0.23, "learning_rate": 1.8009769391129217e-05, "loss": 0.7812, "step": 3349 }, { "epoch": 0.23, "learning_rate": 1.800844772026625e-05, "loss": 0.8975, "step": 3350 }, { "epoch": 0.23, "learning_rate": 1.80071256592321e-05, "loss": 0.9268, "step": 3351 }, { "epoch": 0.23, "learning_rate": 1.8005803208091178e-05, "loss": 0.8584, "step": 3352 }, { "epoch": 0.23, "learning_rate": 1.8004480366907915e-05, "loss": 0.7803, "step": 3353 }, { "epoch": 0.23, "learning_rate": 1.8003157135746757e-05, "loss": 0.8994, "step": 3354 }, { "epoch": 0.23, "learning_rate": 1.800183351467218e-05, "loss": 0.9043, "step": 3355 }, { "epoch": 0.23, "learning_rate": 1.8000509503748657e-05, "loss": 0.7744, "step": 3356 }, { "epoch": 0.23, "learning_rate": 1.7999185103040705e-05, "loss": 0.8369, "step": 3357 }, { "epoch": 0.23, "learning_rate": 1.7997860312612844e-05, "loss": 0.877, "step": 3358 }, { "epoch": 0.23, "learning_rate": 1.7996535132529616e-05, "loss": 0.8008, "step": 3359 }, { "epoch": 0.23, "learning_rate": 1.799520956285559e-05, "loss": 0.8623, "step": 3360 }, { "epoch": 0.23, "learning_rate": 1.799388360365534e-05, "loss": 0.834, "step": 3361 }, { "epoch": 0.23, "learning_rate": 1.7992557254993475e-05, "loss": 0.8496, "step": 3362 }, { "epoch": 0.23, "learning_rate": 1.799123051693461e-05, "loss": 0.8486, "step": 3363 }, { "epoch": 0.23, "learning_rate": 1.7989903389543378e-05, "loss": 0.8213, "step": 3364 }, { "epoch": 0.23, "learning_rate": 1.798857587288445e-05, "loss": 0.8652, "step": 3365 }, { "epoch": 0.23, "learning_rate": 1.798724796702249e-05, "loss": 0.9199, "step": 3366 }, { "epoch": 0.23, "learning_rate": 1.7985919672022204e-05, "loss": 0.8438, "step": 3367 }, { "epoch": 0.23, "learning_rate": 1.7984590987948296e-05, "loss": 0.9004, "step": 3368 }, { "epoch": 0.23, "learning_rate": 1.7983261914865505e-05, "loss": 0.8369, "step": 3369 }, { "epoch": 0.23, "learning_rate": 1.7981932452838585e-05, "loss": 0.8721, "step": 3370 }, { "epoch": 0.23, "learning_rate": 1.7980602601932303e-05, "loss": 0.8652, "step": 3371 }, { "epoch": 0.23, "learning_rate": 1.797927236221145e-05, "loss": 0.8877, "step": 3372 }, { "epoch": 0.23, "learning_rate": 1.7977941733740842e-05, "loss": 0.8301, "step": 3373 }, { "epoch": 0.23, "learning_rate": 1.7976610716585297e-05, "loss": 0.8564, "step": 3374 }, { "epoch": 0.23, "learning_rate": 1.797527931080967e-05, "loss": 0.8682, "step": 3375 }, { "epoch": 0.23, "learning_rate": 1.7973947516478823e-05, "loss": 0.7529, "step": 3376 }, { "epoch": 0.23, "learning_rate": 1.797261533365764e-05, "loss": 0.8984, "step": 3377 }, { "epoch": 0.23, "learning_rate": 1.7971282762411028e-05, "loss": 0.7705, "step": 3378 }, { "epoch": 0.23, "learning_rate": 1.796994980280391e-05, "loss": 0.9102, "step": 3379 }, { "epoch": 0.23, "learning_rate": 1.7968616454901223e-05, "loss": 0.8467, "step": 3380 }, { "epoch": 0.23, "learning_rate": 1.7967282718767935e-05, "loss": 0.8701, "step": 3381 }, { "epoch": 0.23, "learning_rate": 1.796594859446902e-05, "loss": 0.8008, "step": 3382 }, { "epoch": 0.23, "learning_rate": 1.7964614082069475e-05, "loss": 0.915, "step": 3383 }, { "epoch": 0.23, "learning_rate": 1.7963279181634324e-05, "loss": 0.8252, "step": 3384 }, { "epoch": 0.23, "learning_rate": 1.79619438932286e-05, "loss": 0.8672, "step": 3385 }, { "epoch": 0.23, "learning_rate": 1.7960608216917356e-05, "loss": 0.8447, "step": 3386 }, { "epoch": 0.23, "learning_rate": 1.7959272152765668e-05, "loss": 0.8486, "step": 3387 }, { "epoch": 0.23, "learning_rate": 1.7957935700838627e-05, "loss": 0.8945, "step": 3388 }, { "epoch": 0.23, "learning_rate": 1.795659886120135e-05, "loss": 0.9453, "step": 3389 }, { "epoch": 0.23, "learning_rate": 1.7955261633918964e-05, "loss": 0.96, "step": 3390 }, { "epoch": 0.23, "learning_rate": 1.7953924019056615e-05, "loss": 0.874, "step": 3391 }, { "epoch": 0.23, "learning_rate": 1.795258601667948e-05, "loss": 0.8281, "step": 3392 }, { "epoch": 0.23, "learning_rate": 1.795124762685274e-05, "loss": 0.9033, "step": 3393 }, { "epoch": 0.23, "learning_rate": 1.7949908849641606e-05, "loss": 0.918, "step": 3394 }, { "epoch": 0.23, "learning_rate": 1.7948569685111298e-05, "loss": 0.8525, "step": 3395 }, { "epoch": 0.23, "learning_rate": 1.7947230133327064e-05, "loss": 0.9355, "step": 3396 }, { "epoch": 0.23, "learning_rate": 1.7945890194354162e-05, "loss": 0.8477, "step": 3397 }, { "epoch": 0.23, "learning_rate": 1.7944549868257883e-05, "loss": 0.7842, "step": 3398 }, { "epoch": 0.23, "learning_rate": 1.794320915510352e-05, "loss": 0.7676, "step": 3399 }, { "epoch": 0.23, "learning_rate": 1.794186805495639e-05, "loss": 0.8301, "step": 3400 }, { "epoch": 0.23, "learning_rate": 1.794052656788184e-05, "loss": 0.793, "step": 3401 }, { "epoch": 0.23, "learning_rate": 1.7939184693945222e-05, "loss": 0.8965, "step": 3402 }, { "epoch": 0.23, "learning_rate": 1.7937842433211915e-05, "loss": 0.9277, "step": 3403 }, { "epoch": 0.23, "learning_rate": 1.793649978574731e-05, "loss": 0.8701, "step": 3404 }, { "epoch": 0.23, "learning_rate": 1.793515675161682e-05, "loss": 0.8965, "step": 3405 }, { "epoch": 0.23, "learning_rate": 1.7933813330885882e-05, "loss": 0.8994, "step": 3406 }, { "epoch": 0.23, "learning_rate": 1.7932469523619945e-05, "loss": 0.8018, "step": 3407 }, { "epoch": 0.23, "learning_rate": 1.793112532988448e-05, "loss": 0.792, "step": 3408 }, { "epoch": 0.23, "learning_rate": 1.7929780749744977e-05, "loss": 0.8682, "step": 3409 }, { "epoch": 0.23, "learning_rate": 1.792843578326694e-05, "loss": 0.874, "step": 3410 }, { "epoch": 0.23, "learning_rate": 1.79270904305159e-05, "loss": 0.8672, "step": 3411 }, { "epoch": 0.23, "learning_rate": 1.79257446915574e-05, "loss": 0.7949, "step": 3412 }, { "epoch": 0.23, "learning_rate": 1.7924398566457006e-05, "loss": 0.877, "step": 3413 }, { "epoch": 0.23, "learning_rate": 1.79230520552803e-05, "loss": 0.8486, "step": 3414 }, { "epoch": 0.23, "learning_rate": 1.7921705158092884e-05, "loss": 0.7744, "step": 3415 }, { "epoch": 0.23, "learning_rate": 1.792035787496038e-05, "loss": 0.8574, "step": 3416 }, { "epoch": 0.23, "learning_rate": 1.7919010205948424e-05, "loss": 0.9199, "step": 3417 }, { "epoch": 0.23, "learning_rate": 1.791766215112268e-05, "loss": 0.9014, "step": 3418 }, { "epoch": 0.23, "learning_rate": 1.791631371054882e-05, "loss": 0.8057, "step": 3419 }, { "epoch": 0.23, "learning_rate": 1.7914964884292543e-05, "loss": 0.8447, "step": 3420 }, { "epoch": 0.23, "learning_rate": 1.7913615672419563e-05, "loss": 0.8975, "step": 3421 }, { "epoch": 0.23, "learning_rate": 1.791226607499561e-05, "loss": 0.8975, "step": 3422 }, { "epoch": 0.23, "learning_rate": 1.7910916092086443e-05, "loss": 0.8369, "step": 3423 }, { "epoch": 0.23, "learning_rate": 1.7909565723757832e-05, "loss": 0.8809, "step": 3424 }, { "epoch": 0.23, "learning_rate": 1.7908214970075563e-05, "loss": 0.7598, "step": 3425 }, { "epoch": 0.23, "learning_rate": 1.7906863831105443e-05, "loss": 0.8525, "step": 3426 }, { "epoch": 0.23, "learning_rate": 1.7905512306913308e-05, "loss": 0.876, "step": 3427 }, { "epoch": 0.23, "learning_rate": 1.7904160397564995e-05, "loss": 0.8701, "step": 3428 }, { "epoch": 0.23, "learning_rate": 1.7902808103126372e-05, "loss": 0.8896, "step": 3429 }, { "epoch": 0.23, "learning_rate": 1.7901455423663327e-05, "loss": 0.8691, "step": 3430 }, { "epoch": 0.23, "learning_rate": 1.7900102359241757e-05, "loss": 0.8926, "step": 3431 }, { "epoch": 0.23, "learning_rate": 1.7898748909927586e-05, "loss": 0.8975, "step": 3432 }, { "epoch": 0.23, "learning_rate": 1.7897395075786754e-05, "loss": 0.9072, "step": 3433 }, { "epoch": 0.23, "learning_rate": 1.789604085688522e-05, "loss": 0.876, "step": 3434 }, { "epoch": 0.23, "learning_rate": 1.789468625328896e-05, "loss": 0.8115, "step": 3435 }, { "epoch": 0.23, "learning_rate": 1.7893331265063967e-05, "loss": 0.8633, "step": 3436 }, { "epoch": 0.23, "learning_rate": 1.7891975892276263e-05, "loss": 0.8496, "step": 3437 }, { "epoch": 0.23, "learning_rate": 1.7890620134991877e-05, "loss": 0.8379, "step": 3438 }, { "epoch": 0.23, "learning_rate": 1.7889263993276862e-05, "loss": 0.9473, "step": 3439 }, { "epoch": 0.23, "learning_rate": 1.7887907467197293e-05, "loss": 0.8838, "step": 3440 }, { "epoch": 0.23, "learning_rate": 1.7886550556819255e-05, "loss": 0.9736, "step": 3441 }, { "epoch": 0.23, "learning_rate": 1.788519326220886e-05, "loss": 0.8945, "step": 3442 }, { "epoch": 0.23, "learning_rate": 1.788383558343223e-05, "loss": 0.875, "step": 3443 }, { "epoch": 0.23, "learning_rate": 1.788247752055552e-05, "loss": 0.8193, "step": 3444 }, { "epoch": 0.23, "learning_rate": 1.788111907364489e-05, "loss": 0.876, "step": 3445 }, { "epoch": 0.23, "learning_rate": 1.7879760242766516e-05, "loss": 0.8379, "step": 3446 }, { "epoch": 0.23, "learning_rate": 1.7878401027986613e-05, "loss": 0.793, "step": 3447 }, { "epoch": 0.23, "learning_rate": 1.7877041429371393e-05, "loss": 0.8828, "step": 3448 }, { "epoch": 0.24, "learning_rate": 1.78756814469871e-05, "loss": 0.8369, "step": 3449 }, { "epoch": 0.24, "learning_rate": 1.787432108089999e-05, "loss": 0.8525, "step": 3450 }, { "epoch": 0.24, "learning_rate": 1.7872960331176347e-05, "loss": 0.8818, "step": 3451 }, { "epoch": 0.24, "learning_rate": 1.7871599197882452e-05, "loss": 0.8594, "step": 3452 }, { "epoch": 0.24, "learning_rate": 1.7870237681084632e-05, "loss": 0.8955, "step": 3453 }, { "epoch": 0.24, "learning_rate": 1.7868875780849214e-05, "loss": 0.8652, "step": 3454 }, { "epoch": 0.24, "learning_rate": 1.7867513497242557e-05, "loss": 0.9053, "step": 3455 }, { "epoch": 0.24, "learning_rate": 1.786615083033102e-05, "loss": 0.8896, "step": 3456 }, { "epoch": 0.24, "learning_rate": 1.7864787780181e-05, "loss": 0.792, "step": 3457 }, { "epoch": 0.24, "learning_rate": 1.7863424346858906e-05, "loss": 0.8779, "step": 3458 }, { "epoch": 0.24, "learning_rate": 1.7862060530431158e-05, "loss": 0.8408, "step": 3459 }, { "epoch": 0.24, "learning_rate": 1.7860696330964205e-05, "loss": 0.832, "step": 3460 }, { "epoch": 0.24, "learning_rate": 1.7859331748524508e-05, "loss": 0.8271, "step": 3461 }, { "epoch": 0.24, "learning_rate": 1.7857966783178557e-05, "loss": 0.8828, "step": 3462 }, { "epoch": 0.24, "learning_rate": 1.7856601434992842e-05, "loss": 0.8535, "step": 3463 }, { "epoch": 0.24, "learning_rate": 1.785523570403389e-05, "loss": 0.832, "step": 3464 }, { "epoch": 0.24, "learning_rate": 1.785386959036824e-05, "loss": 0.8818, "step": 3465 }, { "epoch": 0.24, "learning_rate": 1.7852503094062443e-05, "loss": 0.8418, "step": 3466 }, { "epoch": 0.24, "learning_rate": 1.785113621518308e-05, "loss": 0.8789, "step": 3467 }, { "epoch": 0.24, "learning_rate": 1.7849768953796743e-05, "loss": 0.8457, "step": 3468 }, { "epoch": 0.24, "learning_rate": 1.7848401309970046e-05, "loss": 0.8164, "step": 3469 }, { "epoch": 0.24, "learning_rate": 1.784703328376962e-05, "loss": 0.8623, "step": 3470 }, { "epoch": 0.24, "learning_rate": 1.7845664875262115e-05, "loss": 0.9092, "step": 3471 }, { "epoch": 0.24, "learning_rate": 1.78442960845142e-05, "loss": 0.9023, "step": 3472 }, { "epoch": 0.24, "learning_rate": 1.784292691159256e-05, "loss": 0.9209, "step": 3473 }, { "epoch": 0.24, "learning_rate": 1.7841557356563907e-05, "loss": 0.8701, "step": 3474 }, { "epoch": 0.24, "learning_rate": 1.7840187419494958e-05, "loss": 0.8428, "step": 3475 }, { "epoch": 0.24, "learning_rate": 1.7838817100452462e-05, "loss": 0.9336, "step": 3476 }, { "epoch": 0.24, "learning_rate": 1.7837446399503183e-05, "loss": 0.8438, "step": 3477 }, { "epoch": 0.24, "learning_rate": 1.783607531671389e-05, "loss": 0.8721, "step": 3478 }, { "epoch": 0.24, "learning_rate": 1.7834703852151397e-05, "loss": 0.748, "step": 3479 }, { "epoch": 0.24, "learning_rate": 1.7833332005882513e-05, "loss": 0.9111, "step": 3480 }, { "epoch": 0.24, "learning_rate": 1.7831959777974072e-05, "loss": 0.8604, "step": 3481 }, { "epoch": 0.24, "learning_rate": 1.7830587168492935e-05, "loss": 0.917, "step": 3482 }, { "epoch": 0.24, "learning_rate": 1.7829214177505973e-05, "loss": 0.8721, "step": 3483 }, { "epoch": 0.24, "learning_rate": 1.7827840805080078e-05, "loss": 0.8438, "step": 3484 }, { "epoch": 0.24, "learning_rate": 1.7826467051282162e-05, "loss": 0.9033, "step": 3485 }, { "epoch": 0.24, "learning_rate": 1.7825092916179148e-05, "loss": 0.8652, "step": 3486 }, { "epoch": 0.24, "learning_rate": 1.7823718399837992e-05, "loss": 0.8516, "step": 3487 }, { "epoch": 0.24, "learning_rate": 1.7822343502325657e-05, "loss": 0.8936, "step": 3488 }, { "epoch": 0.24, "learning_rate": 1.782096822370913e-05, "loss": 0.9326, "step": 3489 }, { "epoch": 0.24, "learning_rate": 1.781959256405541e-05, "loss": 0.8477, "step": 3490 }, { "epoch": 0.24, "learning_rate": 1.7818216523431523e-05, "loss": 0.9453, "step": 3491 }, { "epoch": 0.24, "learning_rate": 1.7816840101904506e-05, "loss": 0.8281, "step": 3492 }, { "epoch": 0.24, "learning_rate": 1.7815463299541423e-05, "loss": 0.9053, "step": 3493 }, { "epoch": 0.24, "learning_rate": 1.781408611640935e-05, "loss": 0.8711, "step": 3494 }, { "epoch": 0.24, "learning_rate": 1.781270855257538e-05, "loss": 0.8008, "step": 3495 }, { "epoch": 0.24, "learning_rate": 1.781133060810663e-05, "loss": 0.8887, "step": 3496 }, { "epoch": 0.24, "learning_rate": 1.7809952283070235e-05, "loss": 0.8115, "step": 3497 }, { "epoch": 0.24, "learning_rate": 1.7808573577533342e-05, "loss": 0.8857, "step": 3498 }, { "epoch": 0.24, "learning_rate": 1.780719449156313e-05, "loss": 0.8916, "step": 3499 }, { "epoch": 0.24, "learning_rate": 1.780581502522678e-05, "loss": 0.791, "step": 3500 }, { "epoch": 0.24, "learning_rate": 1.7804435178591507e-05, "loss": 0.8564, "step": 3501 }, { "epoch": 0.24, "learning_rate": 1.780305495172453e-05, "loss": 0.9199, "step": 3502 }, { "epoch": 0.24, "learning_rate": 1.7801674344693097e-05, "loss": 0.9766, "step": 3503 }, { "epoch": 0.24, "learning_rate": 1.7800293357564466e-05, "loss": 0.9053, "step": 3504 }, { "epoch": 0.24, "learning_rate": 1.7798911990405928e-05, "loss": 0.8164, "step": 3505 }, { "epoch": 0.24, "learning_rate": 1.779753024328478e-05, "loss": 0.8652, "step": 3506 }, { "epoch": 0.24, "learning_rate": 1.7796148116268332e-05, "loss": 0.8662, "step": 3507 }, { "epoch": 0.24, "learning_rate": 1.779476560942393e-05, "loss": 0.8115, "step": 3508 }, { "epoch": 0.24, "learning_rate": 1.7793382722818932e-05, "loss": 0.9072, "step": 3509 }, { "epoch": 0.24, "learning_rate": 1.7791999456520705e-05, "loss": 0.8896, "step": 3510 }, { "epoch": 0.24, "learning_rate": 1.7790615810596642e-05, "loss": 0.8604, "step": 3511 }, { "epoch": 0.24, "learning_rate": 1.778923178511416e-05, "loss": 0.9121, "step": 3512 }, { "epoch": 0.24, "learning_rate": 1.7787847380140687e-05, "loss": 0.8252, "step": 3513 }, { "epoch": 0.24, "learning_rate": 1.7786462595743662e-05, "loss": 0.9229, "step": 3514 }, { "epoch": 0.24, "learning_rate": 1.7785077431990565e-05, "loss": 0.8906, "step": 3515 }, { "epoch": 0.24, "learning_rate": 1.7783691888948877e-05, "loss": 0.8613, "step": 3516 }, { "epoch": 0.24, "learning_rate": 1.7782305966686097e-05, "loss": 0.8701, "step": 3517 }, { "epoch": 0.24, "learning_rate": 1.7780919665269746e-05, "loss": 0.8652, "step": 3518 }, { "epoch": 0.24, "learning_rate": 1.7779532984767375e-05, "loss": 0.835, "step": 3519 }, { "epoch": 0.24, "learning_rate": 1.777814592524653e-05, "loss": 0.915, "step": 3520 }, { "epoch": 0.24, "learning_rate": 1.77767584867748e-05, "loss": 0.8506, "step": 3521 }, { "epoch": 0.24, "learning_rate": 1.7775370669419775e-05, "loss": 0.8984, "step": 3522 }, { "epoch": 0.24, "learning_rate": 1.7773982473249068e-05, "loss": 0.8584, "step": 3523 }, { "epoch": 0.24, "learning_rate": 1.7772593898330314e-05, "loss": 0.9561, "step": 3524 }, { "epoch": 0.24, "learning_rate": 1.7771204944731165e-05, "loss": 0.8486, "step": 3525 }, { "epoch": 0.24, "learning_rate": 1.7769815612519294e-05, "loss": 0.8613, "step": 3526 }, { "epoch": 0.24, "learning_rate": 1.7768425901762378e-05, "loss": 0.8701, "step": 3527 }, { "epoch": 0.24, "learning_rate": 1.7767035812528135e-05, "loss": 0.9062, "step": 3528 }, { "epoch": 0.24, "learning_rate": 1.7765645344884285e-05, "loss": 0.8369, "step": 3529 }, { "epoch": 0.24, "learning_rate": 1.7764254498898573e-05, "loss": 0.8379, "step": 3530 }, { "epoch": 0.24, "learning_rate": 1.776286327463876e-05, "loss": 0.8232, "step": 3531 }, { "epoch": 0.24, "learning_rate": 1.7761471672172628e-05, "loss": 0.9258, "step": 3532 }, { "epoch": 0.24, "learning_rate": 1.7760079691567977e-05, "loss": 0.876, "step": 3533 }, { "epoch": 0.24, "learning_rate": 1.7758687332892616e-05, "loss": 0.8818, "step": 3534 }, { "epoch": 0.24, "learning_rate": 1.775729459621439e-05, "loss": 0.9238, "step": 3535 }, { "epoch": 0.24, "learning_rate": 1.7755901481601148e-05, "loss": 0.8994, "step": 3536 }, { "epoch": 0.24, "learning_rate": 1.7754507989120762e-05, "loss": 0.7871, "step": 3537 }, { "epoch": 0.24, "learning_rate": 1.775311411884113e-05, "loss": 0.8516, "step": 3538 }, { "epoch": 0.24, "learning_rate": 1.7751719870830155e-05, "loss": 0.8145, "step": 3539 }, { "epoch": 0.24, "learning_rate": 1.7750325245155764e-05, "loss": 0.8545, "step": 3540 }, { "epoch": 0.24, "learning_rate": 1.7748930241885905e-05, "loss": 0.8535, "step": 3541 }, { "epoch": 0.24, "learning_rate": 1.7747534861088546e-05, "loss": 0.8945, "step": 3542 }, { "epoch": 0.24, "learning_rate": 1.7746139102831663e-05, "loss": 0.8047, "step": 3543 }, { "epoch": 0.24, "learning_rate": 1.774474296718326e-05, "loss": 0.8574, "step": 3544 }, { "epoch": 0.24, "learning_rate": 1.774334645421136e-05, "loss": 0.7705, "step": 3545 }, { "epoch": 0.24, "learning_rate": 1.7741949563983997e-05, "loss": 0.8516, "step": 3546 }, { "epoch": 0.24, "learning_rate": 1.774055229656923e-05, "loss": 0.8662, "step": 3547 }, { "epoch": 0.24, "learning_rate": 1.7739154652035133e-05, "loss": 0.8984, "step": 3548 }, { "epoch": 0.24, "learning_rate": 1.7737756630449795e-05, "loss": 0.7998, "step": 3549 }, { "epoch": 0.24, "learning_rate": 1.7736358231881334e-05, "loss": 0.8223, "step": 3550 }, { "epoch": 0.24, "learning_rate": 1.773495945639788e-05, "loss": 0.8623, "step": 3551 }, { "epoch": 0.24, "learning_rate": 1.7733560304067575e-05, "loss": 0.8584, "step": 3552 }, { "epoch": 0.24, "learning_rate": 1.773216077495859e-05, "loss": 0.8672, "step": 3553 }, { "epoch": 0.24, "learning_rate": 1.7730760869139105e-05, "loss": 0.916, "step": 3554 }, { "epoch": 0.24, "learning_rate": 1.7729360586677334e-05, "loss": 0.8965, "step": 3555 }, { "epoch": 0.24, "learning_rate": 1.7727959927641486e-05, "loss": 0.8984, "step": 3556 }, { "epoch": 0.24, "learning_rate": 1.7726558892099812e-05, "loss": 0.8848, "step": 3557 }, { "epoch": 0.24, "learning_rate": 1.7725157480120565e-05, "loss": 0.9355, "step": 3558 }, { "epoch": 0.24, "learning_rate": 1.7723755691772023e-05, "loss": 0.9238, "step": 3559 }, { "epoch": 0.24, "learning_rate": 1.7722353527122477e-05, "loss": 0.875, "step": 3560 }, { "epoch": 0.24, "learning_rate": 1.7720950986240242e-05, "loss": 0.8984, "step": 3561 }, { "epoch": 0.24, "learning_rate": 1.7719548069193657e-05, "loss": 0.8525, "step": 3562 }, { "epoch": 0.24, "learning_rate": 1.7718144776051064e-05, "loss": 0.9014, "step": 3563 }, { "epoch": 0.24, "learning_rate": 1.7716741106880838e-05, "loss": 0.8779, "step": 3564 }, { "epoch": 0.24, "learning_rate": 1.7715337061751356e-05, "loss": 0.8896, "step": 3565 }, { "epoch": 0.24, "learning_rate": 1.771393264073103e-05, "loss": 0.877, "step": 3566 }, { "epoch": 0.24, "learning_rate": 1.7712527843888284e-05, "loss": 0.9189, "step": 3567 }, { "epoch": 0.24, "learning_rate": 1.7711122671291555e-05, "loss": 0.8486, "step": 3568 }, { "epoch": 0.24, "learning_rate": 1.7709717123009307e-05, "loss": 0.8545, "step": 3569 }, { "epoch": 0.24, "learning_rate": 1.7708311199110017e-05, "loss": 0.8926, "step": 3570 }, { "epoch": 0.24, "learning_rate": 1.770690489966218e-05, "loss": 0.8809, "step": 3571 }, { "epoch": 0.24, "learning_rate": 1.7705498224734314e-05, "loss": 0.8633, "step": 3572 }, { "epoch": 0.24, "learning_rate": 1.7704091174394947e-05, "loss": 0.7871, "step": 3573 }, { "epoch": 0.24, "learning_rate": 1.770268374871264e-05, "loss": 0.7959, "step": 3574 }, { "epoch": 0.24, "learning_rate": 1.7701275947755947e-05, "loss": 0.8281, "step": 3575 }, { "epoch": 0.24, "learning_rate": 1.7699867771593472e-05, "loss": 0.8838, "step": 3576 }, { "epoch": 0.24, "learning_rate": 1.769845922029381e-05, "loss": 0.8809, "step": 3577 }, { "epoch": 0.24, "learning_rate": 1.7697050293925596e-05, "loss": 0.8965, "step": 3578 }, { "epoch": 0.24, "learning_rate": 1.7695640992557463e-05, "loss": 0.7979, "step": 3579 }, { "epoch": 0.24, "learning_rate": 1.769423131625808e-05, "loss": 0.9141, "step": 3580 }, { "epoch": 0.24, "learning_rate": 1.7692821265096117e-05, "loss": 0.8115, "step": 3581 }, { "epoch": 0.24, "learning_rate": 1.7691410839140283e-05, "loss": 0.8467, "step": 3582 }, { "epoch": 0.24, "learning_rate": 1.7690000038459282e-05, "loss": 0.8525, "step": 3583 }, { "epoch": 0.24, "learning_rate": 1.768858886312186e-05, "loss": 0.9648, "step": 3584 }, { "epoch": 0.24, "learning_rate": 1.768717731319676e-05, "loss": 0.8779, "step": 3585 }, { "epoch": 0.24, "learning_rate": 1.7685765388752754e-05, "loss": 0.7676, "step": 3586 }, { "epoch": 0.24, "learning_rate": 1.768435308985864e-05, "loss": 0.877, "step": 3587 }, { "epoch": 0.24, "learning_rate": 1.7682940416583213e-05, "loss": 0.8252, "step": 3588 }, { "epoch": 0.24, "learning_rate": 1.7681527368995305e-05, "loss": 0.9658, "step": 3589 }, { "epoch": 0.24, "learning_rate": 1.7680113947163757e-05, "loss": 0.8027, "step": 3590 }, { "epoch": 0.24, "learning_rate": 1.7678700151157435e-05, "loss": 0.8506, "step": 3591 }, { "epoch": 0.24, "learning_rate": 1.7677285981045215e-05, "loss": 0.8916, "step": 3592 }, { "epoch": 0.24, "learning_rate": 1.767587143689599e-05, "loss": 0.8096, "step": 3593 }, { "epoch": 0.24, "learning_rate": 1.7674456518778693e-05, "loss": 0.8838, "step": 3594 }, { "epoch": 0.24, "learning_rate": 1.7673041226762244e-05, "loss": 0.8027, "step": 3595 }, { "epoch": 0.25, "learning_rate": 1.76716255609156e-05, "loss": 0.8779, "step": 3596 }, { "epoch": 0.25, "learning_rate": 1.7670209521307732e-05, "loss": 0.8662, "step": 3597 }, { "epoch": 0.25, "learning_rate": 1.7668793108007634e-05, "loss": 0.8965, "step": 3598 }, { "epoch": 0.25, "learning_rate": 1.7667376321084306e-05, "loss": 0.8486, "step": 3599 }, { "epoch": 0.25, "learning_rate": 1.766595916060678e-05, "loss": 0.8555, "step": 3600 }, { "epoch": 0.25, "learning_rate": 1.7664541626644097e-05, "loss": 0.8506, "step": 3601 }, { "epoch": 0.25, "learning_rate": 1.766312371926532e-05, "loss": 0.8652, "step": 3602 }, { "epoch": 0.25, "learning_rate": 1.7661705438539526e-05, "loss": 0.9014, "step": 3603 }, { "epoch": 0.25, "learning_rate": 1.766028678453582e-05, "loss": 0.8867, "step": 3604 }, { "epoch": 0.25, "learning_rate": 1.7658867757323316e-05, "loss": 0.9219, "step": 3605 }, { "epoch": 0.25, "learning_rate": 1.7657448356971145e-05, "loss": 0.9189, "step": 3606 }, { "epoch": 0.25, "learning_rate": 1.7656028583548463e-05, "loss": 0.8262, "step": 3607 }, { "epoch": 0.25, "learning_rate": 1.7654608437124445e-05, "loss": 0.8564, "step": 3608 }, { "epoch": 0.25, "learning_rate": 1.765318791776828e-05, "loss": 0.8594, "step": 3609 }, { "epoch": 0.25, "learning_rate": 1.7651767025549166e-05, "loss": 0.8535, "step": 3610 }, { "epoch": 0.25, "learning_rate": 1.7650345760536337e-05, "loss": 0.8379, "step": 3611 }, { "epoch": 0.25, "learning_rate": 1.7648924122799037e-05, "loss": 0.8906, "step": 3612 }, { "epoch": 0.25, "learning_rate": 1.764750211240653e-05, "loss": 0.8652, "step": 3613 }, { "epoch": 0.25, "learning_rate": 1.764607972942809e-05, "loss": 0.7959, "step": 3614 }, { "epoch": 0.25, "learning_rate": 1.7644656973933018e-05, "loss": 0.873, "step": 3615 }, { "epoch": 0.25, "learning_rate": 1.7643233845990634e-05, "loss": 0.875, "step": 3616 }, { "epoch": 0.25, "learning_rate": 1.7641810345670265e-05, "loss": 0.9902, "step": 3617 }, { "epoch": 0.25, "learning_rate": 1.764038647304127e-05, "loss": 0.8955, "step": 3618 }, { "epoch": 0.25, "learning_rate": 1.763896222817302e-05, "loss": 0.8643, "step": 3619 }, { "epoch": 0.25, "learning_rate": 1.7637537611134905e-05, "loss": 0.8799, "step": 3620 }, { "epoch": 0.25, "learning_rate": 1.7636112621996325e-05, "loss": 0.8213, "step": 3621 }, { "epoch": 0.25, "learning_rate": 1.7634687260826713e-05, "loss": 0.8955, "step": 3622 }, { "epoch": 0.25, "learning_rate": 1.763326152769551e-05, "loss": 0.875, "step": 3623 }, { "epoch": 0.25, "learning_rate": 1.763183542267218e-05, "loss": 0.8408, "step": 3624 }, { "epoch": 0.25, "learning_rate": 1.76304089458262e-05, "loss": 0.8779, "step": 3625 }, { "epoch": 0.25, "learning_rate": 1.7628982097227064e-05, "loss": 0.8066, "step": 3626 }, { "epoch": 0.25, "learning_rate": 1.7627554876944294e-05, "loss": 0.8965, "step": 3627 }, { "epoch": 0.25, "learning_rate": 1.762612728504742e-05, "loss": 0.958, "step": 3628 }, { "epoch": 0.25, "learning_rate": 1.7624699321606004e-05, "loss": 0.8867, "step": 3629 }, { "epoch": 0.25, "learning_rate": 1.76232709866896e-05, "loss": 0.8633, "step": 3630 }, { "epoch": 0.25, "learning_rate": 1.762184228036781e-05, "loss": 0.8418, "step": 3631 }, { "epoch": 0.25, "learning_rate": 1.7620413202710238e-05, "loss": 0.8379, "step": 3632 }, { "epoch": 0.25, "learning_rate": 1.7618983753786504e-05, "loss": 0.9141, "step": 3633 }, { "epoch": 0.25, "learning_rate": 1.761755393366625e-05, "loss": 0.8857, "step": 3634 }, { "epoch": 0.25, "learning_rate": 1.7616123742419145e-05, "loss": 0.8633, "step": 3635 }, { "epoch": 0.25, "learning_rate": 1.761469318011486e-05, "loss": 0.873, "step": 3636 }, { "epoch": 0.25, "learning_rate": 1.7613262246823096e-05, "loss": 0.8867, "step": 3637 }, { "epoch": 0.25, "learning_rate": 1.7611830942613566e-05, "loss": 0.916, "step": 3638 }, { "epoch": 0.25, "learning_rate": 1.7610399267556e-05, "loss": 0.7676, "step": 3639 }, { "epoch": 0.25, "learning_rate": 1.7608967221720157e-05, "loss": 0.873, "step": 3640 }, { "epoch": 0.25, "learning_rate": 1.7607534805175805e-05, "loss": 0.8242, "step": 3641 }, { "epoch": 0.25, "learning_rate": 1.760610201799272e-05, "loss": 0.998, "step": 3642 }, { "epoch": 0.25, "learning_rate": 1.7604668860240722e-05, "loss": 0.8779, "step": 3643 }, { "epoch": 0.25, "learning_rate": 1.7603235331989624e-05, "loss": 0.8203, "step": 3644 }, { "epoch": 0.25, "learning_rate": 1.7601801433309273e-05, "loss": 0.9512, "step": 3645 }, { "epoch": 0.25, "learning_rate": 1.760036716426953e-05, "loss": 0.8174, "step": 3646 }, { "epoch": 0.25, "learning_rate": 1.7598932524940266e-05, "loss": 0.8926, "step": 3647 }, { "epoch": 0.25, "learning_rate": 1.759749751539138e-05, "loss": 0.9336, "step": 3648 }, { "epoch": 0.25, "learning_rate": 1.7596062135692786e-05, "loss": 0.9209, "step": 3649 }, { "epoch": 0.25, "learning_rate": 1.7594626385914418e-05, "loss": 0.916, "step": 3650 }, { "epoch": 0.25, "learning_rate": 1.7593190266126218e-05, "loss": 0.9766, "step": 3651 }, { "epoch": 0.25, "learning_rate": 1.7591753776398163e-05, "loss": 0.8447, "step": 3652 }, { "epoch": 0.25, "learning_rate": 1.759031691680023e-05, "loss": 0.832, "step": 3653 }, { "epoch": 0.25, "learning_rate": 1.758887968740243e-05, "loss": 0.8809, "step": 3654 }, { "epoch": 0.25, "learning_rate": 1.7587442088274777e-05, "loss": 0.8115, "step": 3655 }, { "epoch": 0.25, "learning_rate": 1.758600411948732e-05, "loss": 0.8164, "step": 3656 }, { "epoch": 0.25, "learning_rate": 1.7584565781110113e-05, "loss": 0.9189, "step": 3657 }, { "epoch": 0.25, "learning_rate": 1.758312707321323e-05, "loss": 0.8271, "step": 3658 }, { "epoch": 0.25, "learning_rate": 1.7581687995866766e-05, "loss": 0.7998, "step": 3659 }, { "epoch": 0.25, "learning_rate": 1.758024854914083e-05, "loss": 0.9082, "step": 3660 }, { "epoch": 0.25, "learning_rate": 1.7578808733105556e-05, "loss": 0.8555, "step": 3661 }, { "epoch": 0.25, "learning_rate": 1.757736854783109e-05, "loss": 0.8428, "step": 3662 }, { "epoch": 0.25, "learning_rate": 1.75759279933876e-05, "loss": 0.7959, "step": 3663 }, { "epoch": 0.25, "learning_rate": 1.7574487069845263e-05, "loss": 0.917, "step": 3664 }, { "epoch": 0.25, "learning_rate": 1.7573045777274288e-05, "loss": 0.877, "step": 3665 }, { "epoch": 0.25, "learning_rate": 1.7571604115744895e-05, "loss": 0.8721, "step": 3666 }, { "epoch": 0.25, "learning_rate": 1.7570162085327313e-05, "loss": 0.9189, "step": 3667 }, { "epoch": 0.25, "learning_rate": 1.7568719686091807e-05, "loss": 0.8008, "step": 3668 }, { "epoch": 0.25, "learning_rate": 1.7567276918108645e-05, "loss": 0.7891, "step": 3669 }, { "epoch": 0.25, "learning_rate": 1.7565833781448125e-05, "loss": 0.8164, "step": 3670 }, { "epoch": 0.25, "learning_rate": 1.756439027618055e-05, "loss": 0.873, "step": 3671 }, { "epoch": 0.25, "learning_rate": 1.7562946402376246e-05, "loss": 0.873, "step": 3672 }, { "epoch": 0.25, "learning_rate": 1.7561502160105565e-05, "loss": 0.8652, "step": 3673 }, { "epoch": 0.25, "learning_rate": 1.7560057549438865e-05, "loss": 0.8496, "step": 3674 }, { "epoch": 0.25, "learning_rate": 1.7558612570446533e-05, "loss": 0.9219, "step": 3675 }, { "epoch": 0.25, "learning_rate": 1.7557167223198967e-05, "loss": 0.7363, "step": 3676 }, { "epoch": 0.25, "learning_rate": 1.7555721507766578e-05, "loss": 0.8496, "step": 3677 }, { "epoch": 0.25, "learning_rate": 1.7554275424219806e-05, "loss": 0.835, "step": 3678 }, { "epoch": 0.25, "learning_rate": 1.7552828972629104e-05, "loss": 0.8262, "step": 3679 }, { "epoch": 0.25, "learning_rate": 1.7551382153064946e-05, "loss": 0.8604, "step": 3680 }, { "epoch": 0.25, "learning_rate": 1.7549934965597813e-05, "loss": 0.8838, "step": 3681 }, { "epoch": 0.25, "learning_rate": 1.754848741029822e-05, "loss": 0.8721, "step": 3682 }, { "epoch": 0.25, "learning_rate": 1.754703948723669e-05, "loss": 0.8535, "step": 3683 }, { "epoch": 0.25, "learning_rate": 1.7545591196483762e-05, "loss": 0.792, "step": 3684 }, { "epoch": 0.25, "learning_rate": 1.7544142538109998e-05, "loss": 0.8877, "step": 3685 }, { "epoch": 0.25, "learning_rate": 1.7542693512185978e-05, "loss": 0.7988, "step": 3686 }, { "epoch": 0.25, "learning_rate": 1.7541244118782298e-05, "loss": 0.8887, "step": 3687 }, { "epoch": 0.25, "learning_rate": 1.7539794357969572e-05, "loss": 0.791, "step": 3688 }, { "epoch": 0.25, "learning_rate": 1.7538344229818434e-05, "loss": 0.8877, "step": 3689 }, { "epoch": 0.25, "learning_rate": 1.753689373439953e-05, "loss": 0.8506, "step": 3690 }, { "epoch": 0.25, "learning_rate": 1.753544287178353e-05, "loss": 0.8418, "step": 3691 }, { "epoch": 0.25, "learning_rate": 1.7533991642041125e-05, "loss": 0.8799, "step": 3692 }, { "epoch": 0.25, "learning_rate": 1.7532540045243016e-05, "loss": 0.9365, "step": 3693 }, { "epoch": 0.25, "learning_rate": 1.7531088081459917e-05, "loss": 0.876, "step": 3694 }, { "epoch": 0.25, "learning_rate": 1.752963575076258e-05, "loss": 0.8359, "step": 3695 }, { "epoch": 0.25, "learning_rate": 1.7528183053221753e-05, "loss": 0.916, "step": 3696 }, { "epoch": 0.25, "learning_rate": 1.7526729988908213e-05, "loss": 0.8867, "step": 3697 }, { "epoch": 0.25, "learning_rate": 1.752527655789276e-05, "loss": 0.8652, "step": 3698 }, { "epoch": 0.25, "learning_rate": 1.7523822760246195e-05, "loss": 0.8262, "step": 3699 }, { "epoch": 0.25, "learning_rate": 1.7522368596039358e-05, "loss": 0.8535, "step": 3700 }, { "epoch": 0.25, "learning_rate": 1.7520914065343085e-05, "loss": 0.8711, "step": 3701 }, { "epoch": 0.25, "learning_rate": 1.7519459168228246e-05, "loss": 0.7871, "step": 3702 }, { "epoch": 0.25, "learning_rate": 1.7518003904765722e-05, "loss": 0.9688, "step": 3703 }, { "epoch": 0.25, "learning_rate": 1.7516548275026416e-05, "loss": 0.8008, "step": 3704 }, { "epoch": 0.25, "learning_rate": 1.7515092279081245e-05, "loss": 0.9004, "step": 3705 }, { "epoch": 0.25, "learning_rate": 1.7513635917001145e-05, "loss": 0.9111, "step": 3706 }, { "epoch": 0.25, "learning_rate": 1.751217918885707e-05, "loss": 0.9238, "step": 3707 }, { "epoch": 0.25, "learning_rate": 1.7510722094719993e-05, "loss": 0.9551, "step": 3708 }, { "epoch": 0.25, "learning_rate": 1.7509264634660896e-05, "loss": 0.8223, "step": 3709 }, { "epoch": 0.25, "learning_rate": 1.7507806808750797e-05, "loss": 0.834, "step": 3710 }, { "epoch": 0.25, "learning_rate": 1.7506348617060714e-05, "loss": 0.8057, "step": 3711 }, { "epoch": 0.25, "learning_rate": 1.7504890059661692e-05, "loss": 0.8867, "step": 3712 }, { "epoch": 0.25, "learning_rate": 1.7503431136624792e-05, "loss": 0.8809, "step": 3713 }, { "epoch": 0.25, "learning_rate": 1.7501971848021096e-05, "loss": 0.9062, "step": 3714 }, { "epoch": 0.25, "learning_rate": 1.7500512193921694e-05, "loss": 0.8301, "step": 3715 }, { "epoch": 0.25, "learning_rate": 1.749905217439771e-05, "loss": 0.8584, "step": 3716 }, { "epoch": 0.25, "learning_rate": 1.7497591789520263e-05, "loss": 0.9551, "step": 3717 }, { "epoch": 0.25, "learning_rate": 1.749613103936051e-05, "loss": 0.834, "step": 3718 }, { "epoch": 0.25, "learning_rate": 1.7494669923989623e-05, "loss": 0.8027, "step": 3719 }, { "epoch": 0.25, "learning_rate": 1.749320844347878e-05, "loss": 0.8633, "step": 3720 }, { "epoch": 0.25, "learning_rate": 1.7491746597899185e-05, "loss": 0.8643, "step": 3721 }, { "epoch": 0.25, "learning_rate": 1.7490284387322062e-05, "loss": 0.834, "step": 3722 }, { "epoch": 0.25, "learning_rate": 1.7488821811818652e-05, "loss": 0.7969, "step": 3723 }, { "epoch": 0.25, "learning_rate": 1.7487358871460208e-05, "loss": 0.9131, "step": 3724 }, { "epoch": 0.25, "learning_rate": 1.7485895566318003e-05, "loss": 0.7686, "step": 3725 }, { "epoch": 0.25, "learning_rate": 1.748443189646333e-05, "loss": 0.8789, "step": 3726 }, { "epoch": 0.25, "learning_rate": 1.7482967861967502e-05, "loss": 0.8848, "step": 3727 }, { "epoch": 0.25, "learning_rate": 1.7481503462901846e-05, "loss": 0.8262, "step": 3728 }, { "epoch": 0.25, "learning_rate": 1.7480038699337702e-05, "loss": 0.8486, "step": 3729 }, { "epoch": 0.25, "learning_rate": 1.747857357134644e-05, "loss": 0.8945, "step": 3730 }, { "epoch": 0.25, "learning_rate": 1.7477108078999437e-05, "loss": 0.8906, "step": 3731 }, { "epoch": 0.25, "learning_rate": 1.7475642222368098e-05, "loss": 0.8721, "step": 3732 }, { "epoch": 0.25, "learning_rate": 1.747417600152383e-05, "loss": 0.873, "step": 3733 }, { "epoch": 0.25, "learning_rate": 1.7472709416538068e-05, "loss": 0.833, "step": 3734 }, { "epoch": 0.25, "learning_rate": 1.7471242467482276e-05, "loss": 0.8398, "step": 3735 }, { "epoch": 0.25, "learning_rate": 1.746977515442791e-05, "loss": 0.8564, "step": 3736 }, { "epoch": 0.25, "learning_rate": 1.7468307477446464e-05, "loss": 0.9092, "step": 3737 }, { "epoch": 0.25, "learning_rate": 1.746683943660944e-05, "loss": 0.8174, "step": 3738 }, { "epoch": 0.25, "learning_rate": 1.7465371031988366e-05, "loss": 0.8145, "step": 3739 }, { "epoch": 0.25, "learning_rate": 1.7463902263654776e-05, "loss": 0.9629, "step": 3740 }, { "epoch": 0.25, "learning_rate": 1.7462433131680234e-05, "loss": 0.8994, "step": 3741 }, { "epoch": 0.26, "learning_rate": 1.7460963636136316e-05, "loss": 0.8838, "step": 3742 }, { "epoch": 0.26, "learning_rate": 1.7459493777094608e-05, "loss": 0.8271, "step": 3743 }, { "epoch": 0.26, "learning_rate": 1.745802355462673e-05, "loss": 0.8545, "step": 3744 }, { "epoch": 0.26, "learning_rate": 1.745655296880431e-05, "loss": 0.8584, "step": 3745 }, { "epoch": 0.26, "learning_rate": 1.7455082019698994e-05, "loss": 0.8291, "step": 3746 }, { "epoch": 0.26, "learning_rate": 1.745361070738244e-05, "loss": 0.8213, "step": 3747 }, { "epoch": 0.26, "learning_rate": 1.7452139031926337e-05, "loss": 0.9004, "step": 3748 }, { "epoch": 0.26, "learning_rate": 1.7450666993402384e-05, "loss": 0.8447, "step": 3749 }, { "epoch": 0.26, "learning_rate": 1.7449194591882303e-05, "loss": 0.8135, "step": 3750 }, { "epoch": 0.26, "learning_rate": 1.744772182743782e-05, "loss": 0.8965, "step": 3751 }, { "epoch": 0.26, "learning_rate": 1.7446248700140694e-05, "loss": 0.9004, "step": 3752 }, { "epoch": 0.26, "learning_rate": 1.7444775210062698e-05, "loss": 0.8594, "step": 3753 }, { "epoch": 0.26, "learning_rate": 1.744330135727561e-05, "loss": 0.9316, "step": 3754 }, { "epoch": 0.26, "learning_rate": 1.7441827141851246e-05, "loss": 0.8799, "step": 3755 }, { "epoch": 0.26, "learning_rate": 1.744035256386143e-05, "loss": 0.8623, "step": 3756 }, { "epoch": 0.26, "learning_rate": 1.7438877623377994e-05, "loss": 0.8828, "step": 3757 }, { "epoch": 0.26, "learning_rate": 1.7437402320472804e-05, "loss": 0.8486, "step": 3758 }, { "epoch": 0.26, "learning_rate": 1.743592665521774e-05, "loss": 0.8965, "step": 3759 }, { "epoch": 0.26, "learning_rate": 1.743445062768469e-05, "loss": 0.9375, "step": 3760 }, { "epoch": 0.26, "learning_rate": 1.7432974237945564e-05, "loss": 0.8291, "step": 3761 }, { "epoch": 0.26, "learning_rate": 1.74314974860723e-05, "loss": 0.8252, "step": 3762 }, { "epoch": 0.26, "learning_rate": 1.743002037213684e-05, "loss": 0.9121, "step": 3763 }, { "epoch": 0.26, "learning_rate": 1.742854289621115e-05, "loss": 0.8105, "step": 3764 }, { "epoch": 0.26, "learning_rate": 1.7427065058367213e-05, "loss": 0.8906, "step": 3765 }, { "epoch": 0.26, "learning_rate": 1.7425586858677028e-05, "loss": 0.9092, "step": 3766 }, { "epoch": 0.26, "learning_rate": 1.7424108297212613e-05, "loss": 0.9062, "step": 3767 }, { "epoch": 0.26, "learning_rate": 1.7422629374046003e-05, "loss": 0.8232, "step": 3768 }, { "epoch": 0.26, "learning_rate": 1.742115008924925e-05, "loss": 0.8037, "step": 3769 }, { "epoch": 0.26, "learning_rate": 1.7419670442894432e-05, "loss": 0.8262, "step": 3770 }, { "epoch": 0.26, "learning_rate": 1.741819043505363e-05, "loss": 0.8555, "step": 3771 }, { "epoch": 0.26, "learning_rate": 1.741671006579895e-05, "loss": 0.7959, "step": 3772 }, { "epoch": 0.26, "learning_rate": 1.7415229335202516e-05, "loss": 0.8506, "step": 3773 }, { "epoch": 0.26, "learning_rate": 1.7413748243336472e-05, "loss": 0.8389, "step": 3774 }, { "epoch": 0.26, "learning_rate": 1.7412266790272978e-05, "loss": 0.835, "step": 3775 }, { "epoch": 0.26, "learning_rate": 1.7410784976084203e-05, "loss": 0.8506, "step": 3776 }, { "epoch": 0.26, "learning_rate": 1.740930280084235e-05, "loss": 0.8652, "step": 3777 }, { "epoch": 0.26, "learning_rate": 1.7407820264619623e-05, "loss": 0.7041, "step": 3778 }, { "epoch": 0.26, "learning_rate": 1.7406337367488254e-05, "loss": 0.9355, "step": 3779 }, { "epoch": 0.26, "learning_rate": 1.7404854109520487e-05, "loss": 0.916, "step": 3780 }, { "epoch": 0.26, "learning_rate": 1.7403370490788594e-05, "loss": 0.8086, "step": 3781 }, { "epoch": 0.26, "learning_rate": 1.740188651136485e-05, "loss": 0.9053, "step": 3782 }, { "epoch": 0.26, "learning_rate": 1.7400402171321554e-05, "loss": 0.9082, "step": 3783 }, { "epoch": 0.26, "learning_rate": 1.7398917470731025e-05, "loss": 0.8721, "step": 3784 }, { "epoch": 0.26, "learning_rate": 1.7397432409665603e-05, "loss": 0.7969, "step": 3785 }, { "epoch": 0.26, "learning_rate": 1.739594698819763e-05, "loss": 0.9561, "step": 3786 }, { "epoch": 0.26, "learning_rate": 1.7394461206399484e-05, "loss": 0.9043, "step": 3787 }, { "epoch": 0.26, "learning_rate": 1.7392975064343543e-05, "loss": 0.8721, "step": 3788 }, { "epoch": 0.26, "learning_rate": 1.7391488562102223e-05, "loss": 0.9678, "step": 3789 }, { "epoch": 0.26, "learning_rate": 1.739000169974794e-05, "loss": 0.8711, "step": 3790 }, { "epoch": 0.26, "learning_rate": 1.738851447735313e-05, "loss": 0.7939, "step": 3791 }, { "epoch": 0.26, "learning_rate": 1.7387026894990258e-05, "loss": 0.8838, "step": 3792 }, { "epoch": 0.26, "learning_rate": 1.7385538952731795e-05, "loss": 0.9209, "step": 3793 }, { "epoch": 0.26, "learning_rate": 1.7384050650650234e-05, "loss": 0.8447, "step": 3794 }, { "epoch": 0.26, "learning_rate": 1.738256198881809e-05, "loss": 0.9795, "step": 3795 }, { "epoch": 0.26, "learning_rate": 1.738107296730788e-05, "loss": 0.9219, "step": 3796 }, { "epoch": 0.26, "learning_rate": 1.7379583586192155e-05, "loss": 0.8711, "step": 3797 }, { "epoch": 0.26, "learning_rate": 1.7378093845543484e-05, "loss": 0.8887, "step": 3798 }, { "epoch": 0.26, "learning_rate": 1.7376603745434436e-05, "loss": 0.8818, "step": 3799 }, { "epoch": 0.26, "learning_rate": 1.7375113285937613e-05, "loss": 0.8574, "step": 3800 }, { "epoch": 0.26, "learning_rate": 1.737362246712563e-05, "loss": 0.8828, "step": 3801 }, { "epoch": 0.26, "learning_rate": 1.7372131289071122e-05, "loss": 0.8789, "step": 3802 }, { "epoch": 0.26, "learning_rate": 1.7370639751846735e-05, "loss": 0.8125, "step": 3803 }, { "epoch": 0.26, "learning_rate": 1.7369147855525145e-05, "loss": 0.8008, "step": 3804 }, { "epoch": 0.26, "learning_rate": 1.7367655600179022e-05, "loss": 0.9141, "step": 3805 }, { "epoch": 0.26, "learning_rate": 1.7366162985881084e-05, "loss": 0.8887, "step": 3806 }, { "epoch": 0.26, "learning_rate": 1.7364670012704042e-05, "loss": 0.8955, "step": 3807 }, { "epoch": 0.26, "learning_rate": 1.7363176680720635e-05, "loss": 0.8613, "step": 3808 }, { "epoch": 0.26, "learning_rate": 1.7361682990003622e-05, "loss": 0.7744, "step": 3809 }, { "epoch": 0.26, "learning_rate": 1.736018894062577e-05, "loss": 0.8662, "step": 3810 }, { "epoch": 0.26, "learning_rate": 1.735869453265987e-05, "loss": 0.918, "step": 3811 }, { "epoch": 0.26, "learning_rate": 1.7357199766178734e-05, "loss": 0.8262, "step": 3812 }, { "epoch": 0.26, "learning_rate": 1.7355704641255188e-05, "loss": 0.8271, "step": 3813 }, { "epoch": 0.26, "learning_rate": 1.7354209157962065e-05, "loss": 0.8711, "step": 3814 }, { "epoch": 0.26, "learning_rate": 1.7352713316372233e-05, "loss": 0.9199, "step": 3815 }, { "epoch": 0.26, "learning_rate": 1.7351217116558565e-05, "loss": 0.8203, "step": 3816 }, { "epoch": 0.26, "learning_rate": 1.734972055859396e-05, "loss": 0.8633, "step": 3817 }, { "epoch": 0.26, "learning_rate": 1.7348223642551324e-05, "loss": 0.8604, "step": 3818 }, { "epoch": 0.26, "learning_rate": 1.7346726368503593e-05, "loss": 0.8867, "step": 3819 }, { "epoch": 0.26, "learning_rate": 1.734522873652371e-05, "loss": 0.7725, "step": 3820 }, { "epoch": 0.26, "learning_rate": 1.7343730746684642e-05, "loss": 0.8652, "step": 3821 }, { "epoch": 0.26, "learning_rate": 1.7342232399059372e-05, "loss": 0.8486, "step": 3822 }, { "epoch": 0.26, "learning_rate": 1.7340733693720897e-05, "loss": 0.8779, "step": 3823 }, { "epoch": 0.26, "learning_rate": 1.7339234630742235e-05, "loss": 0.8496, "step": 3824 }, { "epoch": 0.26, "learning_rate": 1.7337735210196417e-05, "loss": 0.792, "step": 3825 }, { "epoch": 0.26, "learning_rate": 1.7336235432156502e-05, "loss": 0.835, "step": 3826 }, { "epoch": 0.26, "learning_rate": 1.733473529669555e-05, "loss": 0.8789, "step": 3827 }, { "epoch": 0.26, "learning_rate": 1.7333234803886653e-05, "loss": 0.917, "step": 3828 }, { "epoch": 0.26, "learning_rate": 1.7331733953802913e-05, "loss": 0.8721, "step": 3829 }, { "epoch": 0.26, "learning_rate": 1.7330232746517458e-05, "loss": 0.791, "step": 3830 }, { "epoch": 0.26, "learning_rate": 1.7328731182103414e-05, "loss": 0.8174, "step": 3831 }, { "epoch": 0.26, "learning_rate": 1.7327229260633947e-05, "loss": 0.8164, "step": 3832 }, { "epoch": 0.26, "learning_rate": 1.7325726982182228e-05, "loss": 0.8818, "step": 3833 }, { "epoch": 0.26, "learning_rate": 1.7324224346821447e-05, "loss": 0.877, "step": 3834 }, { "epoch": 0.26, "learning_rate": 1.7322721354624814e-05, "loss": 0.8145, "step": 3835 }, { "epoch": 0.26, "learning_rate": 1.732121800566555e-05, "loss": 0.8213, "step": 3836 }, { "epoch": 0.26, "learning_rate": 1.7319714300016906e-05, "loss": 0.9395, "step": 3837 }, { "epoch": 0.26, "learning_rate": 1.7318210237752137e-05, "loss": 0.8252, "step": 3838 }, { "epoch": 0.26, "learning_rate": 1.7316705818944525e-05, "loss": 0.832, "step": 3839 }, { "epoch": 0.26, "learning_rate": 1.7315201043667356e-05, "loss": 0.9189, "step": 3840 }, { "epoch": 0.26, "learning_rate": 1.7313695911993953e-05, "loss": 0.8936, "step": 3841 }, { "epoch": 0.26, "learning_rate": 1.7312190423997642e-05, "loss": 0.8477, "step": 3842 }, { "epoch": 0.26, "learning_rate": 1.731068457975177e-05, "loss": 0.7959, "step": 3843 }, { "epoch": 0.26, "learning_rate": 1.7309178379329702e-05, "loss": 0.8789, "step": 3844 }, { "epoch": 0.26, "learning_rate": 1.7307671822804818e-05, "loss": 0.8789, "step": 3845 }, { "epoch": 0.26, "learning_rate": 1.730616491025052e-05, "loss": 0.9141, "step": 3846 }, { "epoch": 0.26, "learning_rate": 1.7304657641740224e-05, "loss": 0.8506, "step": 3847 }, { "epoch": 0.26, "learning_rate": 1.7303150017347364e-05, "loss": 0.8213, "step": 3848 }, { "epoch": 0.26, "learning_rate": 1.7301642037145392e-05, "loss": 0.9395, "step": 3849 }, { "epoch": 0.26, "learning_rate": 1.7300133701207776e-05, "loss": 0.8662, "step": 3850 }, { "epoch": 0.26, "learning_rate": 1.7298625009608002e-05, "loss": 0.8262, "step": 3851 }, { "epoch": 0.26, "learning_rate": 1.7297115962419572e-05, "loss": 0.9365, "step": 3852 }, { "epoch": 0.26, "learning_rate": 1.7295606559716008e-05, "loss": 0.8867, "step": 3853 }, { "epoch": 0.26, "learning_rate": 1.729409680157085e-05, "loss": 0.8477, "step": 3854 }, { "epoch": 0.26, "learning_rate": 1.729258668805765e-05, "loss": 0.8164, "step": 3855 }, { "epoch": 0.26, "learning_rate": 1.729107621924998e-05, "loss": 0.8525, "step": 3856 }, { "epoch": 0.26, "learning_rate": 1.728956539522144e-05, "loss": 0.876, "step": 3857 }, { "epoch": 0.26, "learning_rate": 1.7288054216045625e-05, "loss": 0.8721, "step": 3858 }, { "epoch": 0.26, "learning_rate": 1.728654268179616e-05, "loss": 0.7852, "step": 3859 }, { "epoch": 0.26, "learning_rate": 1.7285030792546696e-05, "loss": 0.9365, "step": 3860 }, { "epoch": 0.26, "learning_rate": 1.7283518548370886e-05, "loss": 0.8584, "step": 3861 }, { "epoch": 0.26, "learning_rate": 1.7282005949342406e-05, "loss": 0.7793, "step": 3862 }, { "epoch": 0.26, "learning_rate": 1.7280492995534953e-05, "loss": 0.8867, "step": 3863 }, { "epoch": 0.26, "learning_rate": 1.7278979687022234e-05, "loss": 0.8506, "step": 3864 }, { "epoch": 0.26, "learning_rate": 1.7277466023877983e-05, "loss": 0.833, "step": 3865 }, { "epoch": 0.26, "learning_rate": 1.727595200617594e-05, "loss": 0.875, "step": 3866 }, { "epoch": 0.26, "learning_rate": 1.727443763398987e-05, "loss": 0.9072, "step": 3867 }, { "epoch": 0.26, "learning_rate": 1.727292290739355e-05, "loss": 0.8662, "step": 3868 }, { "epoch": 0.26, "learning_rate": 1.7271407826460788e-05, "loss": 0.8643, "step": 3869 }, { "epoch": 0.26, "learning_rate": 1.726989239126539e-05, "loss": 0.7734, "step": 3870 }, { "epoch": 0.26, "learning_rate": 1.7268376601881185e-05, "loss": 0.8975, "step": 3871 }, { "epoch": 0.26, "learning_rate": 1.726686045838203e-05, "loss": 0.8047, "step": 3872 }, { "epoch": 0.26, "learning_rate": 1.7265343960841785e-05, "loss": 0.8984, "step": 3873 }, { "epoch": 0.26, "learning_rate": 1.7263827109334338e-05, "loss": 0.9023, "step": 3874 }, { "epoch": 0.26, "learning_rate": 1.726230990393359e-05, "loss": 0.8916, "step": 3875 }, { "epoch": 0.26, "learning_rate": 1.7260792344713452e-05, "loss": 0.8896, "step": 3876 }, { "epoch": 0.26, "learning_rate": 1.7259274431747867e-05, "loss": 0.8428, "step": 3877 }, { "epoch": 0.26, "learning_rate": 1.725775616511079e-05, "loss": 0.8027, "step": 3878 }, { "epoch": 0.26, "learning_rate": 1.7256237544876183e-05, "loss": 0.8135, "step": 3879 }, { "epoch": 0.26, "learning_rate": 1.7254718571118038e-05, "loss": 0.8594, "step": 3880 }, { "epoch": 0.26, "learning_rate": 1.7253199243910357e-05, "loss": 0.8955, "step": 3881 }, { "epoch": 0.26, "learning_rate": 1.7251679563327165e-05, "loss": 0.7998, "step": 3882 }, { "epoch": 0.26, "learning_rate": 1.7250159529442495e-05, "loss": 0.833, "step": 3883 }, { "epoch": 0.26, "learning_rate": 1.724863914233041e-05, "loss": 0.8535, "step": 3884 }, { "epoch": 0.26, "learning_rate": 1.7247118402064977e-05, "loss": 0.832, "step": 3885 }, { "epoch": 0.26, "learning_rate": 1.724559730872029e-05, "loss": 0.792, "step": 3886 }, { "epoch": 0.26, "learning_rate": 1.7244075862370455e-05, "loss": 0.9258, "step": 3887 }, { "epoch": 0.26, "learning_rate": 1.7242554063089596e-05, "loss": 0.7959, "step": 3888 }, { "epoch": 0.27, "learning_rate": 1.7241031910951854e-05, "loss": 0.8867, "step": 3889 }, { "epoch": 0.27, "learning_rate": 1.7239509406031397e-05, "loss": 0.8096, "step": 3890 }, { "epoch": 0.27, "learning_rate": 1.723798654840239e-05, "loss": 0.959, "step": 3891 }, { "epoch": 0.27, "learning_rate": 1.7236463338139034e-05, "loss": 0.8701, "step": 3892 }, { "epoch": 0.27, "learning_rate": 1.7234939775315535e-05, "loss": 0.8242, "step": 3893 }, { "epoch": 0.27, "learning_rate": 1.7233415860006125e-05, "loss": 0.9014, "step": 3894 }, { "epoch": 0.27, "learning_rate": 1.7231891592285043e-05, "loss": 0.8984, "step": 3895 }, { "epoch": 0.27, "learning_rate": 1.723036697222656e-05, "loss": 0.8535, "step": 3896 }, { "epoch": 0.27, "learning_rate": 1.722884199990495e-05, "loss": 0.9121, "step": 3897 }, { "epoch": 0.27, "learning_rate": 1.7227316675394508e-05, "loss": 0.8467, "step": 3898 }, { "epoch": 0.27, "learning_rate": 1.7225790998769548e-05, "loss": 0.8486, "step": 3899 }, { "epoch": 0.27, "learning_rate": 1.722426497010441e-05, "loss": 0.8379, "step": 3900 }, { "epoch": 0.27, "learning_rate": 1.722273858947343e-05, "loss": 0.8135, "step": 3901 }, { "epoch": 0.27, "learning_rate": 1.722121185695098e-05, "loss": 0.7793, "step": 3902 }, { "epoch": 0.27, "learning_rate": 1.721968477261144e-05, "loss": 0.8213, "step": 3903 }, { "epoch": 0.27, "learning_rate": 1.721815733652921e-05, "loss": 0.9043, "step": 3904 }, { "epoch": 0.27, "learning_rate": 1.7216629548778704e-05, "loss": 0.9033, "step": 3905 }, { "epoch": 0.27, "learning_rate": 1.721510140943436e-05, "loss": 0.8184, "step": 3906 }, { "epoch": 0.27, "learning_rate": 1.721357291857063e-05, "loss": 0.9141, "step": 3907 }, { "epoch": 0.27, "learning_rate": 1.7212044076261975e-05, "loss": 0.9072, "step": 3908 }, { "epoch": 0.27, "learning_rate": 1.721051488258289e-05, "loss": 0.8252, "step": 3909 }, { "epoch": 0.27, "learning_rate": 1.7208985337607864e-05, "loss": 0.9268, "step": 3910 }, { "epoch": 0.27, "learning_rate": 1.7207455441411428e-05, "loss": 0.8018, "step": 3911 }, { "epoch": 0.27, "learning_rate": 1.7205925194068115e-05, "loss": 0.917, "step": 3912 }, { "epoch": 0.27, "learning_rate": 1.7204394595652475e-05, "loss": 0.8535, "step": 3913 }, { "epoch": 0.27, "learning_rate": 1.7202863646239084e-05, "loss": 0.8428, "step": 3914 }, { "epoch": 0.27, "learning_rate": 1.7201332345902528e-05, "loss": 0.8457, "step": 3915 }, { "epoch": 0.27, "learning_rate": 1.719980069471741e-05, "loss": 0.8594, "step": 3916 }, { "epoch": 0.27, "learning_rate": 1.7198268692758354e-05, "loss": 0.8516, "step": 3917 }, { "epoch": 0.27, "learning_rate": 1.7196736340099997e-05, "loss": 0.7988, "step": 3918 }, { "epoch": 0.27, "learning_rate": 1.7195203636816997e-05, "loss": 0.8721, "step": 3919 }, { "epoch": 0.27, "learning_rate": 1.7193670582984028e-05, "loss": 0.873, "step": 3920 }, { "epoch": 0.27, "learning_rate": 1.7192137178675778e-05, "loss": 0.8408, "step": 3921 }, { "epoch": 0.27, "learning_rate": 1.7190603423966955e-05, "loss": 0.8965, "step": 3922 }, { "epoch": 0.27, "learning_rate": 1.7189069318932285e-05, "loss": 0.9111, "step": 3923 }, { "epoch": 0.27, "learning_rate": 1.718753486364651e-05, "loss": 0.8115, "step": 3924 }, { "epoch": 0.27, "learning_rate": 1.718600005818438e-05, "loss": 0.8545, "step": 3925 }, { "epoch": 0.27, "learning_rate": 1.7184464902620687e-05, "loss": 0.8613, "step": 3926 }, { "epoch": 0.27, "learning_rate": 1.7182929397030208e-05, "loss": 0.8779, "step": 3927 }, { "epoch": 0.27, "learning_rate": 1.7181393541487762e-05, "loss": 0.8896, "step": 3928 }, { "epoch": 0.27, "learning_rate": 1.717985733606817e-05, "loss": 0.833, "step": 3929 }, { "epoch": 0.27, "learning_rate": 1.717832078084628e-05, "loss": 0.9131, "step": 3930 }, { "epoch": 0.27, "learning_rate": 1.717678387589695e-05, "loss": 0.8086, "step": 3931 }, { "epoch": 0.27, "learning_rate": 1.7175246621295062e-05, "loss": 0.8945, "step": 3932 }, { "epoch": 0.27, "learning_rate": 1.717370901711551e-05, "loss": 0.8652, "step": 3933 }, { "epoch": 0.27, "learning_rate": 1.7172171063433202e-05, "loss": 0.9355, "step": 3934 }, { "epoch": 0.27, "learning_rate": 1.717063276032307e-05, "loss": 0.874, "step": 3935 }, { "epoch": 0.27, "learning_rate": 1.716909410786006e-05, "loss": 0.7646, "step": 3936 }, { "epoch": 0.27, "learning_rate": 1.7167555106119135e-05, "loss": 0.9033, "step": 3937 }, { "epoch": 0.27, "learning_rate": 1.7166015755175272e-05, "loss": 0.9473, "step": 3938 }, { "epoch": 0.27, "learning_rate": 1.7164476055103473e-05, "loss": 0.9209, "step": 3939 }, { "epoch": 0.27, "learning_rate": 1.716293600597875e-05, "loss": 0.8447, "step": 3940 }, { "epoch": 0.27, "learning_rate": 1.7161395607876133e-05, "loss": 0.8574, "step": 3941 }, { "epoch": 0.27, "learning_rate": 1.7159854860870673e-05, "loss": 0.8184, "step": 3942 }, { "epoch": 0.27, "learning_rate": 1.7158313765037434e-05, "loss": 0.8779, "step": 3943 }, { "epoch": 0.27, "learning_rate": 1.7156772320451495e-05, "loss": 0.8232, "step": 3944 }, { "epoch": 0.27, "learning_rate": 1.7155230527187957e-05, "loss": 0.8838, "step": 3945 }, { "epoch": 0.27, "learning_rate": 1.715368838532194e-05, "loss": 0.918, "step": 3946 }, { "epoch": 0.27, "learning_rate": 1.7152145894928572e-05, "loss": 0.9189, "step": 3947 }, { "epoch": 0.27, "learning_rate": 1.7150603056083003e-05, "loss": 0.8301, "step": 3948 }, { "epoch": 0.27, "learning_rate": 1.7149059868860406e-05, "loss": 0.8545, "step": 3949 }, { "epoch": 0.27, "learning_rate": 1.7147516333335957e-05, "loss": 0.7637, "step": 3950 }, { "epoch": 0.27, "learning_rate": 1.7145972449584863e-05, "loss": 0.8672, "step": 3951 }, { "epoch": 0.27, "learning_rate": 1.714442821768234e-05, "loss": 0.833, "step": 3952 }, { "epoch": 0.27, "learning_rate": 1.714288363770362e-05, "loss": 0.9053, "step": 3953 }, { "epoch": 0.27, "learning_rate": 1.7141338709723962e-05, "loss": 0.8965, "step": 3954 }, { "epoch": 0.27, "learning_rate": 1.7139793433818626e-05, "loss": 0.8525, "step": 3955 }, { "epoch": 0.27, "learning_rate": 1.7138247810062903e-05, "loss": 0.9297, "step": 3956 }, { "epoch": 0.27, "learning_rate": 1.713670183853209e-05, "loss": 0.8584, "step": 3957 }, { "epoch": 0.27, "learning_rate": 1.713515551930152e-05, "loss": 0.8643, "step": 3958 }, { "epoch": 0.27, "learning_rate": 1.7133608852446518e-05, "loss": 0.8789, "step": 3959 }, { "epoch": 0.27, "learning_rate": 1.713206183804244e-05, "loss": 0.8066, "step": 3960 }, { "epoch": 0.27, "learning_rate": 1.713051447616466e-05, "loss": 0.8438, "step": 3961 }, { "epoch": 0.27, "learning_rate": 1.712896676688856e-05, "loss": 0.8525, "step": 3962 }, { "epoch": 0.27, "learning_rate": 1.7127418710289545e-05, "loss": 0.8545, "step": 3963 }, { "epoch": 0.27, "learning_rate": 1.7125870306443042e-05, "loss": 0.957, "step": 3964 }, { "epoch": 0.27, "learning_rate": 1.712432155542448e-05, "loss": 0.917, "step": 3965 }, { "epoch": 0.27, "learning_rate": 1.7122772457309322e-05, "loss": 0.8691, "step": 3966 }, { "epoch": 0.27, "learning_rate": 1.7121223012173037e-05, "loss": 0.877, "step": 3967 }, { "epoch": 0.27, "learning_rate": 1.7119673220091114e-05, "loss": 0.8271, "step": 3968 }, { "epoch": 0.27, "learning_rate": 1.7118123081139062e-05, "loss": 0.9014, "step": 3969 }, { "epoch": 0.27, "learning_rate": 1.71165725953924e-05, "loss": 0.8564, "step": 3970 }, { "epoch": 0.27, "learning_rate": 1.7115021762926664e-05, "loss": 0.8838, "step": 3971 }, { "epoch": 0.27, "learning_rate": 1.7113470583817418e-05, "loss": 0.752, "step": 3972 }, { "epoch": 0.27, "learning_rate": 1.711191905814023e-05, "loss": 0.9238, "step": 3973 }, { "epoch": 0.27, "learning_rate": 1.7110367185970693e-05, "loss": 0.9014, "step": 3974 }, { "epoch": 0.27, "learning_rate": 1.7108814967384413e-05, "loss": 0.8867, "step": 3975 }, { "epoch": 0.27, "learning_rate": 1.7107262402457016e-05, "loss": 0.8359, "step": 3976 }, { "epoch": 0.27, "learning_rate": 1.7105709491264143e-05, "loss": 0.8154, "step": 3977 }, { "epoch": 0.27, "learning_rate": 1.7104156233881447e-05, "loss": 0.7871, "step": 3978 }, { "epoch": 0.27, "learning_rate": 1.7102602630384603e-05, "loss": 0.8311, "step": 3979 }, { "epoch": 0.27, "learning_rate": 1.710104868084931e-05, "loss": 0.8457, "step": 3980 }, { "epoch": 0.27, "learning_rate": 1.709949438535127e-05, "loss": 0.8525, "step": 3981 }, { "epoch": 0.27, "learning_rate": 1.709793974396621e-05, "loss": 0.9053, "step": 3982 }, { "epoch": 0.27, "learning_rate": 1.709638475676987e-05, "loss": 0.8359, "step": 3983 }, { "epoch": 0.27, "learning_rate": 1.7094829423838014e-05, "loss": 0.9277, "step": 3984 }, { "epoch": 0.27, "learning_rate": 1.709327374524641e-05, "loss": 0.8701, "step": 3985 }, { "epoch": 0.27, "learning_rate": 1.7091717721070858e-05, "loss": 0.8408, "step": 3986 }, { "epoch": 0.27, "learning_rate": 1.7090161351387167e-05, "loss": 0.8262, "step": 3987 }, { "epoch": 0.27, "learning_rate": 1.708860463627116e-05, "loss": 0.8271, "step": 3988 }, { "epoch": 0.27, "learning_rate": 1.708704757579868e-05, "loss": 0.8906, "step": 3989 }, { "epoch": 0.27, "learning_rate": 1.7085490170045585e-05, "loss": 0.8643, "step": 3990 }, { "epoch": 0.27, "learning_rate": 1.7083932419087753e-05, "loss": 0.8691, "step": 3991 }, { "epoch": 0.27, "learning_rate": 1.7082374323001083e-05, "loss": 0.8174, "step": 3992 }, { "epoch": 0.27, "learning_rate": 1.708081588186148e-05, "loss": 0.7842, "step": 3993 }, { "epoch": 0.27, "learning_rate": 1.7079257095744874e-05, "loss": 0.7881, "step": 3994 }, { "epoch": 0.27, "learning_rate": 1.7077697964727206e-05, "loss": 0.8037, "step": 3995 }, { "epoch": 0.27, "learning_rate": 1.707613848888444e-05, "loss": 0.8545, "step": 3996 }, { "epoch": 0.27, "learning_rate": 1.707457866829255e-05, "loss": 0.8945, "step": 3997 }, { "epoch": 0.27, "learning_rate": 1.7073018503027534e-05, "loss": 0.8809, "step": 3998 }, { "epoch": 0.27, "learning_rate": 1.70714579931654e-05, "loss": 0.8672, "step": 3999 }, { "epoch": 0.27, "learning_rate": 1.706989713878218e-05, "loss": 0.915, "step": 4000 }, { "epoch": 0.27, "learning_rate": 1.706833593995391e-05, "loss": 0.8818, "step": 4001 }, { "epoch": 0.27, "learning_rate": 1.7066774396756663e-05, "loss": 0.8652, "step": 4002 }, { "epoch": 0.27, "learning_rate": 1.706521250926651e-05, "loss": 0.8828, "step": 4003 }, { "epoch": 0.27, "learning_rate": 1.7063650277559548e-05, "loss": 0.8242, "step": 4004 }, { "epoch": 0.27, "learning_rate": 1.7062087701711894e-05, "loss": 0.8555, "step": 4005 }, { "epoch": 0.27, "learning_rate": 1.7060524781799666e-05, "loss": 0.8398, "step": 4006 }, { "epoch": 0.27, "learning_rate": 1.7058961517899018e-05, "loss": 0.8955, "step": 4007 }, { "epoch": 0.27, "learning_rate": 1.7057397910086106e-05, "loss": 0.8535, "step": 4008 }, { "epoch": 0.27, "learning_rate": 1.7055833958437116e-05, "loss": 0.8682, "step": 4009 }, { "epoch": 0.27, "learning_rate": 1.7054269663028232e-05, "loss": 0.7549, "step": 4010 }, { "epoch": 0.27, "learning_rate": 1.705270502393568e-05, "loss": 0.8174, "step": 4011 }, { "epoch": 0.27, "learning_rate": 1.7051140041235684e-05, "loss": 0.8389, "step": 4012 }, { "epoch": 0.27, "learning_rate": 1.7049574715004488e-05, "loss": 0.8467, "step": 4013 }, { "epoch": 0.27, "learning_rate": 1.7048009045318355e-05, "loss": 0.8076, "step": 4014 }, { "epoch": 0.27, "learning_rate": 1.7046443032253565e-05, "loss": 0.8467, "step": 4015 }, { "epoch": 0.27, "learning_rate": 1.704487667588641e-05, "loss": 0.8125, "step": 4016 }, { "epoch": 0.27, "learning_rate": 1.7043309976293215e-05, "loss": 0.8193, "step": 4017 }, { "epoch": 0.27, "learning_rate": 1.7041742933550297e-05, "loss": 0.916, "step": 4018 }, { "epoch": 0.27, "learning_rate": 1.7040175547734006e-05, "loss": 0.8594, "step": 4019 }, { "epoch": 0.27, "learning_rate": 1.703860781892071e-05, "loss": 0.8662, "step": 4020 }, { "epoch": 0.27, "learning_rate": 1.703703974718678e-05, "loss": 0.8428, "step": 4021 }, { "epoch": 0.27, "learning_rate": 1.703547133260862e-05, "loss": 0.9277, "step": 4022 }, { "epoch": 0.27, "learning_rate": 1.7033902575262635e-05, "loss": 0.8857, "step": 4023 }, { "epoch": 0.27, "learning_rate": 1.7032333475225263e-05, "loss": 0.8691, "step": 4024 }, { "epoch": 0.27, "learning_rate": 1.7030764032572945e-05, "loss": 0.9023, "step": 4025 }, { "epoch": 0.27, "learning_rate": 1.702919424738215e-05, "loss": 0.8779, "step": 4026 }, { "epoch": 0.27, "learning_rate": 1.702762411972935e-05, "loss": 0.8633, "step": 4027 }, { "epoch": 0.27, "learning_rate": 1.7026053649691046e-05, "loss": 0.8652, "step": 4028 }, { "epoch": 0.27, "learning_rate": 1.702448283734375e-05, "loss": 0.9043, "step": 4029 }, { "epoch": 0.27, "learning_rate": 1.7022911682763998e-05, "loss": 0.8311, "step": 4030 }, { "epoch": 0.27, "learning_rate": 1.7021340186028325e-05, "loss": 0.9355, "step": 4031 }, { "epoch": 0.27, "learning_rate": 1.7019768347213305e-05, "loss": 0.876, "step": 4032 }, { "epoch": 0.27, "learning_rate": 1.701819616639551e-05, "loss": 0.8936, "step": 4033 }, { "epoch": 0.27, "learning_rate": 1.7016623643651543e-05, "loss": 0.8643, "step": 4034 }, { "epoch": 0.27, "learning_rate": 1.7015050779058014e-05, "loss": 0.7754, "step": 4035 }, { "epoch": 0.28, "learning_rate": 1.7013477572691552e-05, "loss": 0.8438, "step": 4036 }, { "epoch": 0.28, "learning_rate": 1.7011904024628804e-05, "loss": 0.7998, "step": 4037 }, { "epoch": 0.28, "learning_rate": 1.7010330134946437e-05, "loss": 0.8135, "step": 4038 }, { "epoch": 0.28, "learning_rate": 1.7008755903721124e-05, "loss": 0.8125, "step": 4039 }, { "epoch": 0.28, "learning_rate": 1.7007181331029566e-05, "loss": 0.8379, "step": 4040 }, { "epoch": 0.28, "learning_rate": 1.7005606416948477e-05, "loss": 0.9014, "step": 4041 }, { "epoch": 0.28, "learning_rate": 1.7004031161554584e-05, "loss": 0.8525, "step": 4042 }, { "epoch": 0.28, "learning_rate": 1.7002455564924635e-05, "loss": 0.833, "step": 4043 }, { "epoch": 0.28, "learning_rate": 1.7000879627135392e-05, "loss": 0.8789, "step": 4044 }, { "epoch": 0.28, "learning_rate": 1.6999303348263634e-05, "loss": 0.9189, "step": 4045 }, { "epoch": 0.28, "learning_rate": 1.699772672838616e-05, "loss": 0.8545, "step": 4046 }, { "epoch": 0.28, "learning_rate": 1.699614976757978e-05, "loss": 0.8594, "step": 4047 }, { "epoch": 0.28, "learning_rate": 1.6994572465921323e-05, "loss": 0.8379, "step": 4048 }, { "epoch": 0.28, "learning_rate": 1.6992994823487635e-05, "loss": 0.8896, "step": 4049 }, { "epoch": 0.28, "learning_rate": 1.6991416840355585e-05, "loss": 0.8594, "step": 4050 }, { "epoch": 0.28, "learning_rate": 1.698983851660205e-05, "loss": 0.7822, "step": 4051 }, { "epoch": 0.28, "learning_rate": 1.6988259852303914e-05, "loss": 0.8447, "step": 4052 }, { "epoch": 0.28, "learning_rate": 1.6986680847538107e-05, "loss": 0.7871, "step": 4053 }, { "epoch": 0.28, "learning_rate": 1.6985101502381547e-05, "loss": 0.8135, "step": 4054 }, { "epoch": 0.28, "learning_rate": 1.698352181691118e-05, "loss": 0.8613, "step": 4055 }, { "epoch": 0.28, "learning_rate": 1.6981941791203972e-05, "loss": 0.8076, "step": 4056 }, { "epoch": 0.28, "learning_rate": 1.6980361425336904e-05, "loss": 0.8857, "step": 4057 }, { "epoch": 0.28, "learning_rate": 1.6978780719386962e-05, "loss": 0.8896, "step": 4058 }, { "epoch": 0.28, "learning_rate": 1.6977199673431168e-05, "loss": 0.9268, "step": 4059 }, { "epoch": 0.28, "learning_rate": 1.6975618287546543e-05, "loss": 0.917, "step": 4060 }, { "epoch": 0.28, "learning_rate": 1.697403656181014e-05, "loss": 0.873, "step": 4061 }, { "epoch": 0.28, "learning_rate": 1.697245449629901e-05, "loss": 0.8115, "step": 4062 }, { "epoch": 0.28, "learning_rate": 1.6970872091090242e-05, "loss": 0.7969, "step": 4063 }, { "epoch": 0.28, "learning_rate": 1.6969289346260923e-05, "loss": 0.9316, "step": 4064 }, { "epoch": 0.28, "learning_rate": 1.6967706261888167e-05, "loss": 0.8223, "step": 4065 }, { "epoch": 0.28, "learning_rate": 1.6966122838049103e-05, "loss": 0.8945, "step": 4066 }, { "epoch": 0.28, "learning_rate": 1.6964539074820873e-05, "loss": 0.9414, "step": 4067 }, { "epoch": 0.28, "learning_rate": 1.6962954972280637e-05, "loss": 0.8477, "step": 4068 }, { "epoch": 0.28, "learning_rate": 1.6961370530505576e-05, "loss": 0.8525, "step": 4069 }, { "epoch": 0.28, "learning_rate": 1.6959785749572884e-05, "loss": 0.9102, "step": 4070 }, { "epoch": 0.28, "learning_rate": 1.695820062955977e-05, "loss": 0.9053, "step": 4071 }, { "epoch": 0.28, "learning_rate": 1.6956615170543457e-05, "loss": 0.8594, "step": 4072 }, { "epoch": 0.28, "learning_rate": 1.6955029372601193e-05, "loss": 0.9346, "step": 4073 }, { "epoch": 0.28, "learning_rate": 1.695344323581024e-05, "loss": 0.7578, "step": 4074 }, { "epoch": 0.28, "learning_rate": 1.6951856760247868e-05, "loss": 0.8486, "step": 4075 }, { "epoch": 0.28, "learning_rate": 1.6950269945991377e-05, "loss": 0.791, "step": 4076 }, { "epoch": 0.28, "learning_rate": 1.6948682793118074e-05, "loss": 0.8467, "step": 4077 }, { "epoch": 0.28, "learning_rate": 1.694709530170528e-05, "loss": 0.8262, "step": 4078 }, { "epoch": 0.28, "learning_rate": 1.6945507471830343e-05, "loss": 0.749, "step": 4079 }, { "epoch": 0.28, "learning_rate": 1.6943919303570622e-05, "loss": 0.8906, "step": 4080 }, { "epoch": 0.28, "learning_rate": 1.694233079700349e-05, "loss": 0.8809, "step": 4081 }, { "epoch": 0.28, "learning_rate": 1.6940741952206342e-05, "loss": 0.9316, "step": 4082 }, { "epoch": 0.28, "learning_rate": 1.693915276925658e-05, "loss": 0.8584, "step": 4083 }, { "epoch": 0.28, "learning_rate": 1.693756324823164e-05, "loss": 0.8467, "step": 4084 }, { "epoch": 0.28, "learning_rate": 1.693597338920895e-05, "loss": 0.8262, "step": 4085 }, { "epoch": 0.28, "learning_rate": 1.693438319226598e-05, "loss": 0.9072, "step": 4086 }, { "epoch": 0.28, "learning_rate": 1.6932792657480197e-05, "loss": 0.9473, "step": 4087 }, { "epoch": 0.28, "learning_rate": 1.6931201784929096e-05, "loss": 0.8125, "step": 4088 }, { "epoch": 0.28, "learning_rate": 1.692961057469018e-05, "loss": 0.8037, "step": 4089 }, { "epoch": 0.28, "learning_rate": 1.6928019026840973e-05, "loss": 0.793, "step": 4090 }, { "epoch": 0.28, "learning_rate": 1.692642714145902e-05, "loss": 0.8896, "step": 4091 }, { "epoch": 0.28, "learning_rate": 1.6924834918621872e-05, "loss": 0.8125, "step": 4092 }, { "epoch": 0.28, "learning_rate": 1.6923242358407103e-05, "loss": 0.8438, "step": 4093 }, { "epoch": 0.28, "learning_rate": 1.6921649460892305e-05, "loss": 0.8125, "step": 4094 }, { "epoch": 0.28, "learning_rate": 1.6920056226155087e-05, "loss": 0.7793, "step": 4095 }, { "epoch": 0.28, "learning_rate": 1.6918462654273063e-05, "loss": 0.8594, "step": 4096 }, { "epoch": 0.28, "learning_rate": 1.6916868745323877e-05, "loss": 0.8438, "step": 4097 }, { "epoch": 0.28, "learning_rate": 1.6915274499385187e-05, "loss": 0.8799, "step": 4098 }, { "epoch": 0.28, "learning_rate": 1.6913679916534653e-05, "loss": 0.8135, "step": 4099 }, { "epoch": 0.28, "learning_rate": 1.691208499684998e-05, "loss": 0.7871, "step": 4100 }, { "epoch": 0.28, "learning_rate": 1.6910489740408857e-05, "loss": 0.917, "step": 4101 }, { "epoch": 0.28, "learning_rate": 1.690889414728901e-05, "loss": 0.8857, "step": 4102 }, { "epoch": 0.28, "learning_rate": 1.690729821756818e-05, "loss": 0.8711, "step": 4103 }, { "epoch": 0.28, "learning_rate": 1.6905701951324115e-05, "loss": 0.8428, "step": 4104 }, { "epoch": 0.28, "learning_rate": 1.6904105348634587e-05, "loss": 0.8652, "step": 4105 }, { "epoch": 0.28, "learning_rate": 1.6902508409577386e-05, "loss": 0.8789, "step": 4106 }, { "epoch": 0.28, "learning_rate": 1.690091113423031e-05, "loss": 0.7988, "step": 4107 }, { "epoch": 0.28, "learning_rate": 1.6899313522671182e-05, "loss": 0.7812, "step": 4108 }, { "epoch": 0.28, "learning_rate": 1.6897715574977837e-05, "loss": 0.8486, "step": 4109 }, { "epoch": 0.28, "learning_rate": 1.6896117291228124e-05, "loss": 0.8252, "step": 4110 }, { "epoch": 0.28, "learning_rate": 1.689451867149991e-05, "loss": 0.7881, "step": 4111 }, { "epoch": 0.28, "learning_rate": 1.6892919715871082e-05, "loss": 0.7266, "step": 4112 }, { "epoch": 0.28, "learning_rate": 1.6891320424419546e-05, "loss": 0.8379, "step": 4113 }, { "epoch": 0.28, "learning_rate": 1.6889720797223212e-05, "loss": 0.8604, "step": 4114 }, { "epoch": 0.28, "learning_rate": 1.6888120834360016e-05, "loss": 0.8154, "step": 4115 }, { "epoch": 0.28, "learning_rate": 1.6886520535907913e-05, "loss": 0.7812, "step": 4116 }, { "epoch": 0.28, "learning_rate": 1.6884919901944864e-05, "loss": 0.7686, "step": 4117 }, { "epoch": 0.28, "learning_rate": 1.6883318932548852e-05, "loss": 0.8887, "step": 4118 }, { "epoch": 0.28, "learning_rate": 1.688171762779788e-05, "loss": 0.9307, "step": 4119 }, { "epoch": 0.28, "learning_rate": 1.6880115987769957e-05, "loss": 0.8594, "step": 4120 }, { "epoch": 0.28, "learning_rate": 1.6878514012543117e-05, "loss": 0.8623, "step": 4121 }, { "epoch": 0.28, "learning_rate": 1.6876911702195413e-05, "loss": 0.8066, "step": 4122 }, { "epoch": 0.28, "learning_rate": 1.6875309056804908e-05, "loss": 0.7812, "step": 4123 }, { "epoch": 0.28, "learning_rate": 1.6873706076449677e-05, "loss": 0.7744, "step": 4124 }, { "epoch": 0.28, "learning_rate": 1.6872102761207825e-05, "loss": 0.8926, "step": 4125 }, { "epoch": 0.28, "learning_rate": 1.687049911115746e-05, "loss": 0.9072, "step": 4126 }, { "epoch": 0.28, "learning_rate": 1.6868895126376713e-05, "loss": 0.8262, "step": 4127 }, { "epoch": 0.28, "learning_rate": 1.686729080694373e-05, "loss": 0.8711, "step": 4128 }, { "epoch": 0.28, "learning_rate": 1.6865686152936673e-05, "loss": 0.8799, "step": 4129 }, { "epoch": 0.28, "learning_rate": 1.6864081164433725e-05, "loss": 0.8691, "step": 4130 }, { "epoch": 0.28, "learning_rate": 1.6862475841513072e-05, "loss": 0.8633, "step": 4131 }, { "epoch": 0.28, "learning_rate": 1.6860870184252937e-05, "loss": 0.7979, "step": 4132 }, { "epoch": 0.28, "learning_rate": 1.6859264192731537e-05, "loss": 0.8545, "step": 4133 }, { "epoch": 0.28, "learning_rate": 1.685765786702712e-05, "loss": 0.9111, "step": 4134 }, { "epoch": 0.28, "learning_rate": 1.6856051207217946e-05, "loss": 0.8721, "step": 4135 }, { "epoch": 0.28, "learning_rate": 1.6854444213382297e-05, "loss": 0.8789, "step": 4136 }, { "epoch": 0.28, "learning_rate": 1.6852836885598453e-05, "loss": 0.832, "step": 4137 }, { "epoch": 0.28, "learning_rate": 1.6851229223944732e-05, "loss": 0.9385, "step": 4138 }, { "epoch": 0.28, "learning_rate": 1.684962122849946e-05, "loss": 0.8936, "step": 4139 }, { "epoch": 0.28, "learning_rate": 1.6848012899340974e-05, "loss": 0.8164, "step": 4140 }, { "epoch": 0.28, "learning_rate": 1.6846404236547635e-05, "loss": 0.7256, "step": 4141 }, { "epoch": 0.28, "learning_rate": 1.684479524019781e-05, "loss": 0.8408, "step": 4142 }, { "epoch": 0.28, "learning_rate": 1.68431859103699e-05, "loss": 0.832, "step": 4143 }, { "epoch": 0.28, "learning_rate": 1.6841576247142306e-05, "loss": 0.8496, "step": 4144 }, { "epoch": 0.28, "learning_rate": 1.683996625059345e-05, "loss": 0.7949, "step": 4145 }, { "epoch": 0.28, "learning_rate": 1.6838355920801773e-05, "loss": 0.7969, "step": 4146 }, { "epoch": 0.28, "learning_rate": 1.6836745257845727e-05, "loss": 0.8809, "step": 4147 }, { "epoch": 0.28, "learning_rate": 1.6835134261803786e-05, "loss": 0.8613, "step": 4148 }, { "epoch": 0.28, "learning_rate": 1.6833522932754437e-05, "loss": 0.8145, "step": 4149 }, { "epoch": 0.28, "learning_rate": 1.6831911270776183e-05, "loss": 0.7656, "step": 4150 }, { "epoch": 0.28, "learning_rate": 1.6830299275947547e-05, "loss": 1.0459, "step": 4151 }, { "epoch": 0.28, "learning_rate": 1.6828686948347065e-05, "loss": 0.8291, "step": 4152 }, { "epoch": 0.28, "learning_rate": 1.6827074288053285e-05, "loss": 0.9072, "step": 4153 }, { "epoch": 0.28, "learning_rate": 1.6825461295144778e-05, "loss": 0.877, "step": 4154 }, { "epoch": 0.28, "learning_rate": 1.682384796970013e-05, "loss": 0.9316, "step": 4155 }, { "epoch": 0.28, "learning_rate": 1.6822234311797943e-05, "loss": 0.8984, "step": 4156 }, { "epoch": 0.28, "learning_rate": 1.6820620321516828e-05, "loss": 0.8838, "step": 4157 }, { "epoch": 0.28, "learning_rate": 1.681900599893543e-05, "loss": 0.9883, "step": 4158 }, { "epoch": 0.28, "learning_rate": 1.681739134413239e-05, "loss": 0.8896, "step": 4159 }, { "epoch": 0.28, "learning_rate": 1.6815776357186377e-05, "loss": 0.9043, "step": 4160 }, { "epoch": 0.28, "learning_rate": 1.6814161038176072e-05, "loss": 0.8057, "step": 4161 }, { "epoch": 0.28, "learning_rate": 1.6812545387180175e-05, "loss": 0.8203, "step": 4162 }, { "epoch": 0.28, "learning_rate": 1.6810929404277395e-05, "loss": 0.9512, "step": 4163 }, { "epoch": 0.28, "learning_rate": 1.680931308954647e-05, "loss": 0.8818, "step": 4164 }, { "epoch": 0.28, "learning_rate": 1.680769644306614e-05, "loss": 0.7734, "step": 4165 }, { "epoch": 0.28, "learning_rate": 1.6806079464915176e-05, "loss": 0.834, "step": 4166 }, { "epoch": 0.28, "learning_rate": 1.6804462155172347e-05, "loss": 0.8662, "step": 4167 }, { "epoch": 0.28, "learning_rate": 1.680284451391646e-05, "loss": 0.834, "step": 4168 }, { "epoch": 0.28, "learning_rate": 1.6801226541226313e-05, "loss": 0.8115, "step": 4169 }, { "epoch": 0.28, "learning_rate": 1.6799608237180748e-05, "loss": 0.8232, "step": 4170 }, { "epoch": 0.28, "learning_rate": 1.6797989601858594e-05, "loss": 0.8203, "step": 4171 }, { "epoch": 0.28, "learning_rate": 1.679637063533872e-05, "loss": 0.9043, "step": 4172 }, { "epoch": 0.28, "learning_rate": 1.6794751337700005e-05, "loss": 0.8105, "step": 4173 }, { "epoch": 0.28, "learning_rate": 1.679313170902133e-05, "loss": 0.8047, "step": 4174 }, { "epoch": 0.28, "learning_rate": 1.6791511749381612e-05, "loss": 0.835, "step": 4175 }, { "epoch": 0.28, "learning_rate": 1.6789891458859772e-05, "loss": 0.8691, "step": 4176 }, { "epoch": 0.28, "learning_rate": 1.6788270837534755e-05, "loss": 0.9297, "step": 4177 }, { "epoch": 0.28, "learning_rate": 1.6786649885485512e-05, "loss": 0.8926, "step": 4178 }, { "epoch": 0.28, "learning_rate": 1.6785028602791013e-05, "loss": 0.793, "step": 4179 }, { "epoch": 0.28, "learning_rate": 1.6783406989530254e-05, "loss": 0.75, "step": 4180 }, { "epoch": 0.28, "learning_rate": 1.678178504578224e-05, "loss": 0.9473, "step": 4181 }, { "epoch": 0.28, "learning_rate": 1.6780162771625987e-05, "loss": 0.8857, "step": 4182 }, { "epoch": 0.29, "learning_rate": 1.6778540167140534e-05, "loss": 0.8428, "step": 4183 }, { "epoch": 0.29, "learning_rate": 1.6776917232404938e-05, "loss": 0.8193, "step": 4184 }, { "epoch": 0.29, "learning_rate": 1.677529396749826e-05, "loss": 0.8359, "step": 4185 }, { "epoch": 0.29, "learning_rate": 1.677367037249959e-05, "loss": 0.8145, "step": 4186 }, { "epoch": 0.29, "learning_rate": 1.6772046447488035e-05, "loss": 0.8057, "step": 4187 }, { "epoch": 0.29, "learning_rate": 1.6770422192542706e-05, "loss": 0.9111, "step": 4188 }, { "epoch": 0.29, "learning_rate": 1.6768797607742734e-05, "loss": 0.8525, "step": 4189 }, { "epoch": 0.29, "learning_rate": 1.676717269316728e-05, "loss": 0.8545, "step": 4190 }, { "epoch": 0.29, "learning_rate": 1.6765547448895498e-05, "loss": 0.8096, "step": 4191 }, { "epoch": 0.29, "learning_rate": 1.676392187500657e-05, "loss": 0.7236, "step": 4192 }, { "epoch": 0.29, "learning_rate": 1.67622959715797e-05, "loss": 0.834, "step": 4193 }, { "epoch": 0.29, "learning_rate": 1.6760669738694105e-05, "loss": 0.8369, "step": 4194 }, { "epoch": 0.29, "learning_rate": 1.6759043176429005e-05, "loss": 0.8857, "step": 4195 }, { "epoch": 0.29, "learning_rate": 1.6757416284863655e-05, "loss": 0.8916, "step": 4196 }, { "epoch": 0.29, "learning_rate": 1.675578906407731e-05, "loss": 0.9209, "step": 4197 }, { "epoch": 0.29, "learning_rate": 1.6754161514149253e-05, "loss": 0.8203, "step": 4198 }, { "epoch": 0.29, "learning_rate": 1.6752533635158775e-05, "loss": 0.8662, "step": 4199 }, { "epoch": 0.29, "learning_rate": 1.675090542718519e-05, "loss": 0.8867, "step": 4200 }, { "epoch": 0.29, "learning_rate": 1.674927689030782e-05, "loss": 0.8174, "step": 4201 }, { "epoch": 0.29, "learning_rate": 1.674764802460601e-05, "loss": 0.8633, "step": 4202 }, { "epoch": 0.29, "learning_rate": 1.6746018830159117e-05, "loss": 0.8467, "step": 4203 }, { "epoch": 0.29, "learning_rate": 1.6744389307046514e-05, "loss": 0.9062, "step": 4204 }, { "epoch": 0.29, "learning_rate": 1.6742759455347595e-05, "loss": 0.877, "step": 4205 }, { "epoch": 0.29, "learning_rate": 1.6741129275141764e-05, "loss": 0.8281, "step": 4206 }, { "epoch": 0.29, "learning_rate": 1.673949876650844e-05, "loss": 0.9111, "step": 4207 }, { "epoch": 0.29, "learning_rate": 1.673786792952707e-05, "loss": 0.9473, "step": 4208 }, { "epoch": 0.29, "learning_rate": 1.67362367642771e-05, "loss": 0.8584, "step": 4209 }, { "epoch": 0.29, "learning_rate": 1.6734605270838003e-05, "loss": 0.8672, "step": 4210 }, { "epoch": 0.29, "learning_rate": 1.6732973449289267e-05, "loss": 0.9229, "step": 4211 }, { "epoch": 0.29, "learning_rate": 1.673134129971039e-05, "loss": 0.8652, "step": 4212 }, { "epoch": 0.29, "learning_rate": 1.6729708822180898e-05, "loss": 0.8721, "step": 4213 }, { "epoch": 0.29, "learning_rate": 1.672807601678032e-05, "loss": 0.8359, "step": 4214 }, { "epoch": 0.29, "learning_rate": 1.6726442883588204e-05, "loss": 0.7334, "step": 4215 }, { "epoch": 0.29, "learning_rate": 1.672480942268412e-05, "loss": 0.7959, "step": 4216 }, { "epoch": 0.29, "learning_rate": 1.672317563414765e-05, "loss": 0.8096, "step": 4217 }, { "epoch": 0.29, "learning_rate": 1.6721541518058386e-05, "loss": 0.9043, "step": 4218 }, { "epoch": 0.29, "learning_rate": 1.671990707449595e-05, "loss": 0.9111, "step": 4219 }, { "epoch": 0.29, "learning_rate": 1.6718272303539968e-05, "loss": 0.8525, "step": 4220 }, { "epoch": 0.29, "learning_rate": 1.671663720527009e-05, "loss": 0.9092, "step": 4221 }, { "epoch": 0.29, "learning_rate": 1.6715001779765973e-05, "loss": 0.8525, "step": 4222 }, { "epoch": 0.29, "learning_rate": 1.6713366027107296e-05, "loss": 0.9102, "step": 4223 }, { "epoch": 0.29, "learning_rate": 1.6711729947373755e-05, "loss": 0.8467, "step": 4224 }, { "epoch": 0.29, "learning_rate": 1.6710093540645056e-05, "loss": 0.8008, "step": 4225 }, { "epoch": 0.29, "learning_rate": 1.670845680700093e-05, "loss": 0.792, "step": 4226 }, { "epoch": 0.29, "learning_rate": 1.6706819746521113e-05, "loss": 0.8154, "step": 4227 }, { "epoch": 0.29, "learning_rate": 1.6705182359285367e-05, "loss": 0.8389, "step": 4228 }, { "epoch": 0.29, "learning_rate": 1.670354464537346e-05, "loss": 0.8213, "step": 4229 }, { "epoch": 0.29, "learning_rate": 1.6701906604865187e-05, "loss": 0.8994, "step": 4230 }, { "epoch": 0.29, "learning_rate": 1.6700268237840352e-05, "loss": 0.8008, "step": 4231 }, { "epoch": 0.29, "learning_rate": 1.6698629544378774e-05, "loss": 0.8809, "step": 4232 }, { "epoch": 0.29, "learning_rate": 1.6696990524560293e-05, "loss": 0.8955, "step": 4233 }, { "epoch": 0.29, "learning_rate": 1.6695351178464762e-05, "loss": 0.8066, "step": 4234 }, { "epoch": 0.29, "learning_rate": 1.6693711506172045e-05, "loss": 0.8926, "step": 4235 }, { "epoch": 0.29, "learning_rate": 1.6692071507762028e-05, "loss": 0.8574, "step": 4236 }, { "epoch": 0.29, "learning_rate": 1.6690431183314616e-05, "loss": 0.8418, "step": 4237 }, { "epoch": 0.29, "learning_rate": 1.6688790532909723e-05, "loss": 0.8389, "step": 4238 }, { "epoch": 0.29, "learning_rate": 1.668714955662728e-05, "loss": 0.8291, "step": 4239 }, { "epoch": 0.29, "learning_rate": 1.6685508254547238e-05, "loss": 0.832, "step": 4240 }, { "epoch": 0.29, "learning_rate": 1.668386662674956e-05, "loss": 0.8408, "step": 4241 }, { "epoch": 0.29, "learning_rate": 1.6682224673314225e-05, "loss": 0.7852, "step": 4242 }, { "epoch": 0.29, "learning_rate": 1.6680582394321228e-05, "loss": 0.8545, "step": 4243 }, { "epoch": 0.29, "learning_rate": 1.6678939789850587e-05, "loss": 0.7578, "step": 4244 }, { "epoch": 0.29, "learning_rate": 1.6677296859982322e-05, "loss": 0.7227, "step": 4245 }, { "epoch": 0.29, "learning_rate": 1.667565360479648e-05, "loss": 0.9287, "step": 4246 }, { "epoch": 0.29, "learning_rate": 1.6674010024373123e-05, "loss": 0.8418, "step": 4247 }, { "epoch": 0.29, "learning_rate": 1.667236611879232e-05, "loss": 0.9209, "step": 4248 }, { "epoch": 0.29, "learning_rate": 1.6670721888134164e-05, "loss": 0.8662, "step": 4249 }, { "epoch": 0.29, "learning_rate": 1.6669077332478765e-05, "loss": 0.8398, "step": 4250 }, { "epoch": 0.29, "learning_rate": 1.6667432451906243e-05, "loss": 0.9033, "step": 4251 }, { "epoch": 0.29, "learning_rate": 1.666578724649674e-05, "loss": 0.793, "step": 4252 }, { "epoch": 0.29, "learning_rate": 1.6664141716330404e-05, "loss": 0.8408, "step": 4253 }, { "epoch": 0.29, "learning_rate": 1.6662495861487407e-05, "loss": 0.8418, "step": 4254 }, { "epoch": 0.29, "learning_rate": 1.666084968204794e-05, "loss": 0.8223, "step": 4255 }, { "epoch": 0.29, "learning_rate": 1.66592031780922e-05, "loss": 0.8379, "step": 4256 }, { "epoch": 0.29, "learning_rate": 1.6657556349700406e-05, "loss": 0.835, "step": 4257 }, { "epoch": 0.29, "learning_rate": 1.665590919695279e-05, "loss": 0.8662, "step": 4258 }, { "epoch": 0.29, "learning_rate": 1.6654261719929606e-05, "loss": 0.8145, "step": 4259 }, { "epoch": 0.29, "learning_rate": 1.665261391871111e-05, "loss": 0.8047, "step": 4260 }, { "epoch": 0.29, "learning_rate": 1.6650965793377592e-05, "loss": 0.8213, "step": 4261 }, { "epoch": 0.29, "learning_rate": 1.6649317344009346e-05, "loss": 0.7871, "step": 4262 }, { "epoch": 0.29, "learning_rate": 1.664766857068668e-05, "loss": 0.8701, "step": 4263 }, { "epoch": 0.29, "learning_rate": 1.6646019473489928e-05, "loss": 0.8037, "step": 4264 }, { "epoch": 0.29, "learning_rate": 1.664437005249943e-05, "loss": 0.7793, "step": 4265 }, { "epoch": 0.29, "learning_rate": 1.6642720307795548e-05, "loss": 0.8389, "step": 4266 }, { "epoch": 0.29, "learning_rate": 1.6641070239458657e-05, "loss": 0.7588, "step": 4267 }, { "epoch": 0.29, "learning_rate": 1.6639419847569147e-05, "loss": 0.8926, "step": 4268 }, { "epoch": 0.29, "learning_rate": 1.6637769132207427e-05, "loss": 0.8535, "step": 4269 }, { "epoch": 0.29, "learning_rate": 1.663611809345392e-05, "loss": 0.9219, "step": 4270 }, { "epoch": 0.29, "learning_rate": 1.6634466731389055e-05, "loss": 0.7363, "step": 4271 }, { "epoch": 0.29, "learning_rate": 1.66328150460933e-05, "loss": 0.8232, "step": 4272 }, { "epoch": 0.29, "learning_rate": 1.663116303764712e-05, "loss": 0.8301, "step": 4273 }, { "epoch": 0.29, "learning_rate": 1.6629510706131e-05, "loss": 0.8945, "step": 4274 }, { "epoch": 0.29, "learning_rate": 1.662785805162544e-05, "loss": 0.8438, "step": 4275 }, { "epoch": 0.29, "learning_rate": 1.662620507421096e-05, "loss": 0.791, "step": 4276 }, { "epoch": 0.29, "learning_rate": 1.6624551773968095e-05, "loss": 0.79, "step": 4277 }, { "epoch": 0.29, "learning_rate": 1.6622898150977386e-05, "loss": 0.8223, "step": 4278 }, { "epoch": 0.29, "learning_rate": 1.6621244205319404e-05, "loss": 0.9092, "step": 4279 }, { "epoch": 0.29, "learning_rate": 1.6619589937074727e-05, "loss": 0.8975, "step": 4280 }, { "epoch": 0.29, "learning_rate": 1.6617935346323947e-05, "loss": 0.8936, "step": 4281 }, { "epoch": 0.29, "learning_rate": 1.6616280433147686e-05, "loss": 0.8057, "step": 4282 }, { "epoch": 0.29, "learning_rate": 1.6614625197626563e-05, "loss": 0.8789, "step": 4283 }, { "epoch": 0.29, "learning_rate": 1.661296963984122e-05, "loss": 0.8848, "step": 4284 }, { "epoch": 0.29, "learning_rate": 1.6611313759872322e-05, "loss": 0.8252, "step": 4285 }, { "epoch": 0.29, "learning_rate": 1.6609657557800544e-05, "loss": 0.8135, "step": 4286 }, { "epoch": 0.29, "learning_rate": 1.6608001033706565e-05, "loss": 0.7949, "step": 4287 }, { "epoch": 0.29, "learning_rate": 1.66063441876711e-05, "loss": 0.9033, "step": 4288 }, { "epoch": 0.29, "learning_rate": 1.6604687019774867e-05, "loss": 0.7998, "step": 4289 }, { "epoch": 0.29, "learning_rate": 1.6603029530098605e-05, "loss": 0.835, "step": 4290 }, { "epoch": 0.29, "learning_rate": 1.660137171872307e-05, "loss": 0.835, "step": 4291 }, { "epoch": 0.29, "learning_rate": 1.6599713585729024e-05, "loss": 0.7842, "step": 4292 }, { "epoch": 0.29, "learning_rate": 1.6598055131197255e-05, "loss": 0.8545, "step": 4293 }, { "epoch": 0.29, "learning_rate": 1.659639635520856e-05, "loss": 0.8721, "step": 4294 }, { "epoch": 0.29, "learning_rate": 1.6594737257843755e-05, "loss": 0.9121, "step": 4295 }, { "epoch": 0.29, "learning_rate": 1.6593077839183675e-05, "loss": 0.8359, "step": 4296 }, { "epoch": 0.29, "learning_rate": 1.6591418099309166e-05, "loss": 0.8203, "step": 4297 }, { "epoch": 0.29, "learning_rate": 1.658975803830109e-05, "loss": 0.8916, "step": 4298 }, { "epoch": 0.29, "learning_rate": 1.6588097656240314e-05, "loss": 0.8535, "step": 4299 }, { "epoch": 0.29, "learning_rate": 1.658643695320775e-05, "loss": 0.8281, "step": 4300 }, { "epoch": 0.29, "learning_rate": 1.6584775929284294e-05, "loss": 0.8037, "step": 4301 }, { "epoch": 0.29, "learning_rate": 1.658311458455088e-05, "loss": 0.8545, "step": 4302 }, { "epoch": 0.29, "learning_rate": 1.658145291908844e-05, "loss": 0.9365, "step": 4303 }, { "epoch": 0.29, "learning_rate": 1.657979093297794e-05, "loss": 0.8018, "step": 4304 }, { "epoch": 0.29, "learning_rate": 1.6578128626300345e-05, "loss": 0.9268, "step": 4305 }, { "epoch": 0.29, "learning_rate": 1.6576465999136643e-05, "loss": 0.9316, "step": 4306 }, { "epoch": 0.29, "learning_rate": 1.6574803051567838e-05, "loss": 0.8857, "step": 4307 }, { "epoch": 0.29, "learning_rate": 1.657313978367495e-05, "loss": 0.8447, "step": 4308 }, { "epoch": 0.29, "learning_rate": 1.657147619553901e-05, "loss": 0.8965, "step": 4309 }, { "epoch": 0.29, "learning_rate": 1.6569812287241074e-05, "loss": 0.9395, "step": 4310 }, { "epoch": 0.29, "learning_rate": 1.65681480588622e-05, "loss": 0.8281, "step": 4311 }, { "epoch": 0.29, "learning_rate": 1.6566483510483476e-05, "loss": 0.8506, "step": 4312 }, { "epoch": 0.29, "learning_rate": 1.6564818642185995e-05, "loss": 0.7109, "step": 4313 }, { "epoch": 0.29, "learning_rate": 1.6563153454050865e-05, "loss": 0.7266, "step": 4314 }, { "epoch": 0.29, "learning_rate": 1.6561487946159226e-05, "loss": 0.8057, "step": 4315 }, { "epoch": 0.29, "learning_rate": 1.655982211859221e-05, "loss": 0.9092, "step": 4316 }, { "epoch": 0.29, "learning_rate": 1.655815597143098e-05, "loss": 0.8105, "step": 4317 }, { "epoch": 0.29, "learning_rate": 1.6556489504756715e-05, "loss": 0.8965, "step": 4318 }, { "epoch": 0.29, "learning_rate": 1.6554822718650596e-05, "loss": 0.7871, "step": 4319 }, { "epoch": 0.29, "learning_rate": 1.6553155613193835e-05, "loss": 0.8906, "step": 4320 }, { "epoch": 0.29, "learning_rate": 1.6551488188467653e-05, "loss": 0.8916, "step": 4321 }, { "epoch": 0.29, "learning_rate": 1.654982044455329e-05, "loss": 0.8164, "step": 4322 }, { "epoch": 0.29, "learning_rate": 1.654815238153199e-05, "loss": 0.8701, "step": 4323 }, { "epoch": 0.29, "learning_rate": 1.6546483999485022e-05, "loss": 0.8789, "step": 4324 }, { "epoch": 0.29, "learning_rate": 1.6544815298493678e-05, "loss": 0.8486, "step": 4325 }, { "epoch": 0.29, "learning_rate": 1.654314627863925e-05, "loss": 0.8672, "step": 4326 }, { "epoch": 0.29, "learning_rate": 1.6541476940003055e-05, "loss": 0.9131, "step": 4327 }, { "epoch": 0.29, "learning_rate": 1.6539807282666424e-05, "loss": 0.8145, "step": 4328 }, { "epoch": 0.3, "learning_rate": 1.65381373067107e-05, "loss": 0.8506, "step": 4329 }, { "epoch": 0.3, "learning_rate": 1.653646701221724e-05, "loss": 0.8408, "step": 4330 }, { "epoch": 0.3, "learning_rate": 1.6534796399267434e-05, "loss": 0.8047, "step": 4331 }, { "epoch": 0.3, "learning_rate": 1.653312546794266e-05, "loss": 0.8896, "step": 4332 }, { "epoch": 0.3, "learning_rate": 1.6531454218324338e-05, "loss": 0.832, "step": 4333 }, { "epoch": 0.3, "learning_rate": 1.652978265049388e-05, "loss": 0.9072, "step": 4334 }, { "epoch": 0.3, "learning_rate": 1.652811076453273e-05, "loss": 0.9434, "step": 4335 }, { "epoch": 0.3, "learning_rate": 1.6526438560522344e-05, "loss": 0.7969, "step": 4336 }, { "epoch": 0.3, "learning_rate": 1.6524766038544185e-05, "loss": 0.875, "step": 4337 }, { "epoch": 0.3, "learning_rate": 1.652309319867975e-05, "loss": 0.8535, "step": 4338 }, { "epoch": 0.3, "learning_rate": 1.652142004101053e-05, "loss": 0.8359, "step": 4339 }, { "epoch": 0.3, "learning_rate": 1.651974656561804e-05, "loss": 0.8164, "step": 4340 }, { "epoch": 0.3, "learning_rate": 1.651807277258382e-05, "loss": 0.8838, "step": 4341 }, { "epoch": 0.3, "learning_rate": 1.651639866198941e-05, "loss": 0.8613, "step": 4342 }, { "epoch": 0.3, "learning_rate": 1.6514724233916373e-05, "loss": 0.8896, "step": 4343 }, { "epoch": 0.3, "learning_rate": 1.6513049488446292e-05, "loss": 0.8115, "step": 4344 }, { "epoch": 0.3, "learning_rate": 1.651137442566076e-05, "loss": 0.875, "step": 4345 }, { "epoch": 0.3, "learning_rate": 1.6509699045641377e-05, "loss": 0.8066, "step": 4346 }, { "epoch": 0.3, "learning_rate": 1.650802334846978e-05, "loss": 0.8203, "step": 4347 }, { "epoch": 0.3, "learning_rate": 1.65063473342276e-05, "loss": 0.8457, "step": 4348 }, { "epoch": 0.3, "learning_rate": 1.6504671002996496e-05, "loss": 0.8262, "step": 4349 }, { "epoch": 0.3, "learning_rate": 1.6502994354858136e-05, "loss": 0.8389, "step": 4350 }, { "epoch": 0.3, "learning_rate": 1.650131738989421e-05, "loss": 0.874, "step": 4351 }, { "epoch": 0.3, "learning_rate": 1.6499640108186416e-05, "loss": 0.8613, "step": 4352 }, { "epoch": 0.3, "learning_rate": 1.6497962509816473e-05, "loss": 0.8496, "step": 4353 }, { "epoch": 0.3, "learning_rate": 1.6496284594866115e-05, "loss": 0.8984, "step": 4354 }, { "epoch": 0.3, "learning_rate": 1.6494606363417087e-05, "loss": 0.8164, "step": 4355 }, { "epoch": 0.3, "learning_rate": 1.6492927815551155e-05, "loss": 0.8447, "step": 4356 }, { "epoch": 0.3, "learning_rate": 1.6491248951350096e-05, "loss": 0.8096, "step": 4357 }, { "epoch": 0.3, "learning_rate": 1.6489569770895704e-05, "loss": 0.8027, "step": 4358 }, { "epoch": 0.3, "learning_rate": 1.648789027426979e-05, "loss": 0.8545, "step": 4359 }, { "epoch": 0.3, "learning_rate": 1.648621046155418e-05, "loss": 0.8359, "step": 4360 }, { "epoch": 0.3, "learning_rate": 1.648453033283071e-05, "loss": 0.875, "step": 4361 }, { "epoch": 0.3, "learning_rate": 1.6482849888181237e-05, "loss": 0.8809, "step": 4362 }, { "epoch": 0.3, "learning_rate": 1.6481169127687638e-05, "loss": 0.832, "step": 4363 }, { "epoch": 0.3, "learning_rate": 1.6479488051431794e-05, "loss": 0.8643, "step": 4364 }, { "epoch": 0.3, "learning_rate": 1.6477806659495604e-05, "loss": 0.8096, "step": 4365 }, { "epoch": 0.3, "learning_rate": 1.6476124951960995e-05, "loss": 0.8506, "step": 4366 }, { "epoch": 0.3, "learning_rate": 1.647444292890989e-05, "loss": 0.8252, "step": 4367 }, { "epoch": 0.3, "learning_rate": 1.6472760590424245e-05, "loss": 0.7783, "step": 4368 }, { "epoch": 0.3, "learning_rate": 1.6471077936586017e-05, "loss": 0.8242, "step": 4369 }, { "epoch": 0.3, "learning_rate": 1.646939496747719e-05, "loss": 0.8945, "step": 4370 }, { "epoch": 0.3, "learning_rate": 1.646771168317975e-05, "loss": 0.8613, "step": 4371 }, { "epoch": 0.3, "learning_rate": 1.6466028083775717e-05, "loss": 0.751, "step": 4372 }, { "epoch": 0.3, "learning_rate": 1.6464344169347112e-05, "loss": 0.8594, "step": 4373 }, { "epoch": 0.3, "learning_rate": 1.646265993997597e-05, "loss": 0.9102, "step": 4374 }, { "epoch": 0.3, "learning_rate": 1.6460975395744352e-05, "loss": 0.8584, "step": 4375 }, { "epoch": 0.3, "learning_rate": 1.6459290536734332e-05, "loss": 0.8232, "step": 4376 }, { "epoch": 0.3, "learning_rate": 1.6457605363027988e-05, "loss": 0.8652, "step": 4377 }, { "epoch": 0.3, "learning_rate": 1.6455919874707426e-05, "loss": 0.834, "step": 4378 }, { "epoch": 0.3, "learning_rate": 1.6454234071854763e-05, "loss": 0.9033, "step": 4379 }, { "epoch": 0.3, "learning_rate": 1.6452547954552132e-05, "loss": 0.8203, "step": 4380 }, { "epoch": 0.3, "learning_rate": 1.6450861522881677e-05, "loss": 0.9297, "step": 4381 }, { "epoch": 0.3, "learning_rate": 1.6449174776925562e-05, "loss": 0.8965, "step": 4382 }, { "epoch": 0.3, "learning_rate": 1.6447487716765974e-05, "loss": 0.8926, "step": 4383 }, { "epoch": 0.3, "learning_rate": 1.644580034248509e-05, "loss": 0.8574, "step": 4384 }, { "epoch": 0.3, "learning_rate": 1.644411265416513e-05, "loss": 0.9004, "step": 4385 }, { "epoch": 0.3, "learning_rate": 1.644242465188832e-05, "loss": 0.876, "step": 4386 }, { "epoch": 0.3, "learning_rate": 1.6440736335736893e-05, "loss": 0.957, "step": 4387 }, { "epoch": 0.3, "learning_rate": 1.6439047705793102e-05, "loss": 0.8828, "step": 4388 }, { "epoch": 0.3, "learning_rate": 1.6437358762139227e-05, "loss": 0.873, "step": 4389 }, { "epoch": 0.3, "learning_rate": 1.6435669504857547e-05, "loss": 0.8838, "step": 4390 }, { "epoch": 0.3, "learning_rate": 1.6433979934030354e-05, "loss": 0.8945, "step": 4391 }, { "epoch": 0.3, "learning_rate": 1.643229004973998e-05, "loss": 0.8633, "step": 4392 }, { "epoch": 0.3, "learning_rate": 1.6430599852068743e-05, "loss": 0.79, "step": 4393 }, { "epoch": 0.3, "learning_rate": 1.6428909341099e-05, "loss": 0.8564, "step": 4394 }, { "epoch": 0.3, "learning_rate": 1.6427218516913108e-05, "loss": 0.9434, "step": 4395 }, { "epoch": 0.3, "learning_rate": 1.642552737959344e-05, "loss": 0.8936, "step": 4396 }, { "epoch": 0.3, "learning_rate": 1.6423835929222393e-05, "loss": 0.8574, "step": 4397 }, { "epoch": 0.3, "learning_rate": 1.642214416588237e-05, "loss": 0.9297, "step": 4398 }, { "epoch": 0.3, "learning_rate": 1.64204520896558e-05, "loss": 0.8008, "step": 4399 }, { "epoch": 0.3, "learning_rate": 1.6418759700625116e-05, "loss": 0.8174, "step": 4400 }, { "epoch": 0.3, "learning_rate": 1.6417066998872774e-05, "loss": 0.8623, "step": 4401 }, { "epoch": 0.3, "learning_rate": 1.6415373984481236e-05, "loss": 0.8828, "step": 4402 }, { "epoch": 0.3, "learning_rate": 1.6413680657532992e-05, "loss": 0.8252, "step": 4403 }, { "epoch": 0.3, "learning_rate": 1.6411987018110543e-05, "loss": 0.9229, "step": 4404 }, { "epoch": 0.3, "learning_rate": 1.6410293066296397e-05, "loss": 0.8232, "step": 4405 }, { "epoch": 0.3, "learning_rate": 1.6408598802173085e-05, "loss": 0.8525, "step": 4406 }, { "epoch": 0.3, "learning_rate": 1.640690422582315e-05, "loss": 0.9453, "step": 4407 }, { "epoch": 0.3, "learning_rate": 1.6405209337329155e-05, "loss": 0.8613, "step": 4408 }, { "epoch": 0.3, "learning_rate": 1.6403514136773674e-05, "loss": 0.875, "step": 4409 }, { "epoch": 0.3, "learning_rate": 1.6401818624239296e-05, "loss": 0.8047, "step": 4410 }, { "epoch": 0.3, "learning_rate": 1.640012279980863e-05, "loss": 0.8262, "step": 4411 }, { "epoch": 0.3, "learning_rate": 1.639842666356429e-05, "loss": 0.8135, "step": 4412 }, { "epoch": 0.3, "learning_rate": 1.6396730215588913e-05, "loss": 0.8789, "step": 4413 }, { "epoch": 0.3, "learning_rate": 1.6395033455965156e-05, "loss": 0.8008, "step": 4414 }, { "epoch": 0.3, "learning_rate": 1.639333638477568e-05, "loss": 0.7842, "step": 4415 }, { "epoch": 0.3, "learning_rate": 1.6391639002103167e-05, "loss": 0.833, "step": 4416 }, { "epoch": 0.3, "learning_rate": 1.638994130803031e-05, "loss": 0.8643, "step": 4417 }, { "epoch": 0.3, "learning_rate": 1.6388243302639828e-05, "loss": 0.8115, "step": 4418 }, { "epoch": 0.3, "learning_rate": 1.6386544986014442e-05, "loss": 0.8379, "step": 4419 }, { "epoch": 0.3, "learning_rate": 1.63848463582369e-05, "loss": 0.8496, "step": 4420 }, { "epoch": 0.3, "learning_rate": 1.638314741938995e-05, "loss": 0.8281, "step": 4421 }, { "epoch": 0.3, "learning_rate": 1.638144816955637e-05, "loss": 0.9062, "step": 4422 }, { "epoch": 0.3, "learning_rate": 1.6379748608818947e-05, "loss": 0.8613, "step": 4423 }, { "epoch": 0.3, "learning_rate": 1.6378048737260482e-05, "loss": 0.8604, "step": 4424 }, { "epoch": 0.3, "learning_rate": 1.6376348554963796e-05, "loss": 0.9336, "step": 4425 }, { "epoch": 0.3, "learning_rate": 1.6374648062011718e-05, "loss": 0.8467, "step": 4426 }, { "epoch": 0.3, "learning_rate": 1.6372947258487092e-05, "loss": 0.9199, "step": 4427 }, { "epoch": 0.3, "learning_rate": 1.6371246144472795e-05, "loss": 0.8574, "step": 4428 }, { "epoch": 0.3, "learning_rate": 1.636954472005169e-05, "loss": 0.8359, "step": 4429 }, { "epoch": 0.3, "learning_rate": 1.636784298530668e-05, "loss": 0.9238, "step": 4430 }, { "epoch": 0.3, "learning_rate": 1.636614094032067e-05, "loss": 0.8701, "step": 4431 }, { "epoch": 0.3, "learning_rate": 1.6364438585176584e-05, "loss": 0.874, "step": 4432 }, { "epoch": 0.3, "learning_rate": 1.636273591995736e-05, "loss": 0.873, "step": 4433 }, { "epoch": 0.3, "learning_rate": 1.6361032944745952e-05, "loss": 0.8057, "step": 4434 }, { "epoch": 0.3, "learning_rate": 1.6359329659625333e-05, "loss": 0.9424, "step": 4435 }, { "epoch": 0.3, "learning_rate": 1.635762606467848e-05, "loss": 0.9414, "step": 4436 }, { "epoch": 0.3, "learning_rate": 1.6355922159988393e-05, "loss": 0.8193, "step": 4437 }, { "epoch": 0.3, "learning_rate": 1.6354217945638092e-05, "loss": 0.8125, "step": 4438 }, { "epoch": 0.3, "learning_rate": 1.6352513421710598e-05, "loss": 0.9531, "step": 4439 }, { "epoch": 0.3, "learning_rate": 1.6350808588288964e-05, "loss": 0.8467, "step": 4440 }, { "epoch": 0.3, "learning_rate": 1.6349103445456244e-05, "loss": 0.833, "step": 4441 }, { "epoch": 0.3, "learning_rate": 1.6347397993295514e-05, "loss": 0.834, "step": 4442 }, { "epoch": 0.3, "learning_rate": 1.6345692231889862e-05, "loss": 0.8877, "step": 4443 }, { "epoch": 0.3, "learning_rate": 1.6343986161322395e-05, "loss": 0.916, "step": 4444 }, { "epoch": 0.3, "learning_rate": 1.634227978167623e-05, "loss": 0.8496, "step": 4445 }, { "epoch": 0.3, "learning_rate": 1.6340573093034504e-05, "loss": 0.8066, "step": 4446 }, { "epoch": 0.3, "learning_rate": 1.633886609548037e-05, "loss": 0.749, "step": 4447 }, { "epoch": 0.3, "learning_rate": 1.6337158789096986e-05, "loss": 0.8906, "step": 4448 }, { "epoch": 0.3, "learning_rate": 1.6335451173967532e-05, "loss": 0.8467, "step": 4449 }, { "epoch": 0.3, "learning_rate": 1.633374325017521e-05, "loss": 0.8945, "step": 4450 }, { "epoch": 0.3, "learning_rate": 1.6332035017803224e-05, "loss": 0.9072, "step": 4451 }, { "epoch": 0.3, "learning_rate": 1.6330326476934803e-05, "loss": 0.8691, "step": 4452 }, { "epoch": 0.3, "learning_rate": 1.632861762765318e-05, "loss": 0.8037, "step": 4453 }, { "epoch": 0.3, "learning_rate": 1.6326908470041618e-05, "loss": 0.8057, "step": 4454 }, { "epoch": 0.3, "learning_rate": 1.6325199004183385e-05, "loss": 0.7803, "step": 4455 }, { "epoch": 0.3, "learning_rate": 1.6323489230161763e-05, "loss": 0.8633, "step": 4456 }, { "epoch": 0.3, "learning_rate": 1.6321779148060054e-05, "loss": 0.7627, "step": 4457 }, { "epoch": 0.3, "learning_rate": 1.6320068757961574e-05, "loss": 0.8936, "step": 4458 }, { "epoch": 0.3, "learning_rate": 1.6318358059949653e-05, "loss": 0.8086, "step": 4459 }, { "epoch": 0.3, "learning_rate": 1.6316647054107632e-05, "loss": 0.7871, "step": 4460 }, { "epoch": 0.3, "learning_rate": 1.6314935740518877e-05, "loss": 0.7705, "step": 4461 }, { "epoch": 0.3, "learning_rate": 1.631322411926676e-05, "loss": 0.8682, "step": 4462 }, { "epoch": 0.3, "learning_rate": 1.6311512190434674e-05, "loss": 0.8408, "step": 4463 }, { "epoch": 0.3, "learning_rate": 1.630979995410602e-05, "loss": 0.874, "step": 4464 }, { "epoch": 0.3, "learning_rate": 1.6308087410364222e-05, "loss": 0.9209, "step": 4465 }, { "epoch": 0.3, "learning_rate": 1.630637455929271e-05, "loss": 0.9141, "step": 4466 }, { "epoch": 0.3, "learning_rate": 1.6304661400974938e-05, "loss": 0.8066, "step": 4467 }, { "epoch": 0.3, "learning_rate": 1.6302947935494373e-05, "loss": 0.9238, "step": 4468 }, { "epoch": 0.3, "learning_rate": 1.6301234162934487e-05, "loss": 0.8906, "step": 4469 }, { "epoch": 0.3, "learning_rate": 1.6299520083378783e-05, "loss": 0.8809, "step": 4470 }, { "epoch": 0.3, "learning_rate": 1.6297805696910766e-05, "loss": 0.8604, "step": 4471 }, { "epoch": 0.3, "learning_rate": 1.6296091003613964e-05, "loss": 0.8154, "step": 4472 }, { "epoch": 0.3, "learning_rate": 1.6294376003571913e-05, "loss": 0.874, "step": 4473 }, { "epoch": 0.3, "learning_rate": 1.6292660696868173e-05, "loss": 0.8672, "step": 4474 }, { "epoch": 0.3, "learning_rate": 1.629094508358631e-05, "loss": 0.8438, "step": 4475 }, { "epoch": 0.31, "learning_rate": 1.628922916380991e-05, "loss": 0.8418, "step": 4476 }, { "epoch": 0.31, "learning_rate": 1.6287512937622568e-05, "loss": 0.8682, "step": 4477 }, { "epoch": 0.31, "learning_rate": 1.6285796405107905e-05, "loss": 0.8906, "step": 4478 }, { "epoch": 0.31, "learning_rate": 1.628407956634955e-05, "loss": 0.8486, "step": 4479 }, { "epoch": 0.31, "learning_rate": 1.628236242143114e-05, "loss": 0.8184, "step": 4480 }, { "epoch": 0.31, "learning_rate": 1.6280644970436342e-05, "loss": 0.9414, "step": 4481 }, { "epoch": 0.31, "learning_rate": 1.6278927213448828e-05, "loss": 0.9375, "step": 4482 }, { "epoch": 0.31, "learning_rate": 1.6277209150552285e-05, "loss": 0.8984, "step": 4483 }, { "epoch": 0.31, "learning_rate": 1.627549078183042e-05, "loss": 0.915, "step": 4484 }, { "epoch": 0.31, "learning_rate": 1.627377210736695e-05, "loss": 0.8809, "step": 4485 }, { "epoch": 0.31, "learning_rate": 1.6272053127245607e-05, "loss": 0.8379, "step": 4486 }, { "epoch": 0.31, "learning_rate": 1.6270333841550143e-05, "loss": 0.8047, "step": 4487 }, { "epoch": 0.31, "learning_rate": 1.626861425036432e-05, "loss": 0.8994, "step": 4488 }, { "epoch": 0.31, "learning_rate": 1.6266894353771915e-05, "loss": 0.8545, "step": 4489 }, { "epoch": 0.31, "learning_rate": 1.6265174151856724e-05, "loss": 0.8154, "step": 4490 }, { "epoch": 0.31, "learning_rate": 1.6263453644702552e-05, "loss": 0.8271, "step": 4491 }, { "epoch": 0.31, "learning_rate": 1.6261732832393224e-05, "loss": 0.8174, "step": 4492 }, { "epoch": 0.31, "learning_rate": 1.6260011715012583e-05, "loss": 0.9287, "step": 4493 }, { "epoch": 0.31, "learning_rate": 1.6258290292644468e-05, "loss": 0.9141, "step": 4494 }, { "epoch": 0.31, "learning_rate": 1.6256568565372763e-05, "loss": 0.8789, "step": 4495 }, { "epoch": 0.31, "learning_rate": 1.625484653328134e-05, "loss": 0.8506, "step": 4496 }, { "epoch": 0.31, "learning_rate": 1.6253124196454097e-05, "loss": 0.9453, "step": 4497 }, { "epoch": 0.31, "learning_rate": 1.6251401554974948e-05, "loss": 0.875, "step": 4498 }, { "epoch": 0.31, "learning_rate": 1.6249678608927823e-05, "loss": 0.9102, "step": 4499 }, { "epoch": 0.31, "learning_rate": 1.624795535839666e-05, "loss": 0.833, "step": 4500 }, { "epoch": 0.31, "learning_rate": 1.6246231803465416e-05, "loss": 0.8369, "step": 4501 }, { "epoch": 0.31, "learning_rate": 1.624450794421806e-05, "loss": 0.8652, "step": 4502 }, { "epoch": 0.31, "learning_rate": 1.6242783780738585e-05, "loss": 0.8906, "step": 4503 }, { "epoch": 0.31, "learning_rate": 1.624105931311099e-05, "loss": 0.8945, "step": 4504 }, { "epoch": 0.31, "learning_rate": 1.6239334541419288e-05, "loss": 0.8184, "step": 4505 }, { "epoch": 0.31, "learning_rate": 1.6237609465747513e-05, "loss": 0.7988, "step": 4506 }, { "epoch": 0.31, "learning_rate": 1.6235884086179705e-05, "loss": 0.917, "step": 4507 }, { "epoch": 0.31, "learning_rate": 1.6234158402799935e-05, "loss": 0.9209, "step": 4508 }, { "epoch": 0.31, "learning_rate": 1.6232432415692266e-05, "loss": 0.7881, "step": 4509 }, { "epoch": 0.31, "learning_rate": 1.6230706124940795e-05, "loss": 0.8838, "step": 4510 }, { "epoch": 0.31, "learning_rate": 1.6228979530629623e-05, "loss": 0.7236, "step": 4511 }, { "epoch": 0.31, "learning_rate": 1.6227252632842877e-05, "loss": 0.8867, "step": 4512 }, { "epoch": 0.31, "learning_rate": 1.622552543166468e-05, "loss": 0.9512, "step": 4513 }, { "epoch": 0.31, "learning_rate": 1.6223797927179195e-05, "loss": 0.8018, "step": 4514 }, { "epoch": 0.31, "learning_rate": 1.6222070119470575e-05, "loss": 0.8877, "step": 4515 }, { "epoch": 0.31, "learning_rate": 1.6220342008623e-05, "loss": 0.8203, "step": 4516 }, { "epoch": 0.31, "learning_rate": 1.621861359472067e-05, "loss": 0.8818, "step": 4517 }, { "epoch": 0.31, "learning_rate": 1.6216884877847786e-05, "loss": 0.8447, "step": 4518 }, { "epoch": 0.31, "learning_rate": 1.6215155858088574e-05, "loss": 0.9004, "step": 4519 }, { "epoch": 0.31, "learning_rate": 1.621342653552727e-05, "loss": 0.8457, "step": 4520 }, { "epoch": 0.31, "learning_rate": 1.6211696910248133e-05, "loss": 0.8271, "step": 4521 }, { "epoch": 0.31, "learning_rate": 1.6209966982335425e-05, "loss": 0.7627, "step": 4522 }, { "epoch": 0.31, "learning_rate": 1.6208236751873424e-05, "loss": 0.8838, "step": 4523 }, { "epoch": 0.31, "learning_rate": 1.6206506218946434e-05, "loss": 0.8213, "step": 4524 }, { "epoch": 0.31, "learning_rate": 1.6204775383638765e-05, "loss": 0.8389, "step": 4525 }, { "epoch": 0.31, "learning_rate": 1.620304424603474e-05, "loss": 0.835, "step": 4526 }, { "epoch": 0.31, "learning_rate": 1.62013128062187e-05, "loss": 0.9219, "step": 4527 }, { "epoch": 0.31, "learning_rate": 1.6199581064275006e-05, "loss": 0.8525, "step": 4528 }, { "epoch": 0.31, "learning_rate": 1.6197849020288025e-05, "loss": 0.915, "step": 4529 }, { "epoch": 0.31, "learning_rate": 1.619611667434214e-05, "loss": 0.8691, "step": 4530 }, { "epoch": 0.31, "learning_rate": 1.6194384026521752e-05, "loss": 0.8896, "step": 4531 }, { "epoch": 0.31, "learning_rate": 1.619265107691128e-05, "loss": 0.9473, "step": 4532 }, { "epoch": 0.31, "learning_rate": 1.6190917825595147e-05, "loss": 0.7822, "step": 4533 }, { "epoch": 0.31, "learning_rate": 1.61891842726578e-05, "loss": 0.8223, "step": 4534 }, { "epoch": 0.31, "learning_rate": 1.6187450418183693e-05, "loss": 0.8945, "step": 4535 }, { "epoch": 0.31, "learning_rate": 1.6185716262257308e-05, "loss": 0.8369, "step": 4536 }, { "epoch": 0.31, "learning_rate": 1.6183981804963126e-05, "loss": 0.8115, "step": 4537 }, { "epoch": 0.31, "learning_rate": 1.6182247046385656e-05, "loss": 0.7627, "step": 4538 }, { "epoch": 0.31, "learning_rate": 1.618051198660941e-05, "loss": 0.7832, "step": 4539 }, { "epoch": 0.31, "learning_rate": 1.6178776625718918e-05, "loss": 0.8164, "step": 4540 }, { "epoch": 0.31, "learning_rate": 1.6177040963798733e-05, "loss": 0.8809, "step": 4541 }, { "epoch": 0.31, "learning_rate": 1.6175305000933415e-05, "loss": 0.8027, "step": 4542 }, { "epoch": 0.31, "learning_rate": 1.6173568737207536e-05, "loss": 0.8154, "step": 4543 }, { "epoch": 0.31, "learning_rate": 1.617183217270569e-05, "loss": 0.8682, "step": 4544 }, { "epoch": 0.31, "learning_rate": 1.6170095307512478e-05, "loss": 0.8408, "step": 4545 }, { "epoch": 0.31, "learning_rate": 1.6168358141712526e-05, "loss": 0.8281, "step": 4546 }, { "epoch": 0.31, "learning_rate": 1.616662067539047e-05, "loss": 0.7646, "step": 4547 }, { "epoch": 0.31, "learning_rate": 1.616488290863095e-05, "loss": 0.9395, "step": 4548 }, { "epoch": 0.31, "learning_rate": 1.6163144841518636e-05, "loss": 0.8291, "step": 4549 }, { "epoch": 0.31, "learning_rate": 1.616140647413821e-05, "loss": 0.8701, "step": 4550 }, { "epoch": 0.31, "learning_rate": 1.6159667806574358e-05, "loss": 0.9082, "step": 4551 }, { "epoch": 0.31, "learning_rate": 1.615792883891179e-05, "loss": 0.8418, "step": 4552 }, { "epoch": 0.31, "learning_rate": 1.615618957123523e-05, "loss": 0.8896, "step": 4553 }, { "epoch": 0.31, "learning_rate": 1.6154450003629417e-05, "loss": 0.8086, "step": 4554 }, { "epoch": 0.31, "learning_rate": 1.6152710136179096e-05, "loss": 0.9043, "step": 4555 }, { "epoch": 0.31, "learning_rate": 1.615096996896904e-05, "loss": 0.8672, "step": 4556 }, { "epoch": 0.31, "learning_rate": 1.6149229502084025e-05, "loss": 0.8418, "step": 4557 }, { "epoch": 0.31, "learning_rate": 1.614748873560885e-05, "loss": 0.9873, "step": 4558 }, { "epoch": 0.31, "learning_rate": 1.6145747669628323e-05, "loss": 0.8496, "step": 4559 }, { "epoch": 0.31, "learning_rate": 1.6144006304227268e-05, "loss": 0.8125, "step": 4560 }, { "epoch": 0.31, "learning_rate": 1.6142264639490527e-05, "loss": 0.8428, "step": 4561 }, { "epoch": 0.31, "learning_rate": 1.6140522675502954e-05, "loss": 0.8428, "step": 4562 }, { "epoch": 0.31, "learning_rate": 1.6138780412349416e-05, "loss": 0.8809, "step": 4563 }, { "epoch": 0.31, "learning_rate": 1.613703785011479e-05, "loss": 0.8691, "step": 4564 }, { "epoch": 0.31, "learning_rate": 1.6135294988883984e-05, "loss": 0.8877, "step": 4565 }, { "epoch": 0.31, "learning_rate": 1.6133551828741904e-05, "loss": 0.8496, "step": 4566 }, { "epoch": 0.31, "learning_rate": 1.613180836977348e-05, "loss": 0.8389, "step": 4567 }, { "epoch": 0.31, "learning_rate": 1.6130064612063648e-05, "loss": 0.8857, "step": 4568 }, { "epoch": 0.31, "learning_rate": 1.6128320555697365e-05, "loss": 0.7676, "step": 4569 }, { "epoch": 0.31, "learning_rate": 1.612657620075961e-05, "loss": 0.8652, "step": 4570 }, { "epoch": 0.31, "learning_rate": 1.6124831547335357e-05, "loss": 0.877, "step": 4571 }, { "epoch": 0.31, "learning_rate": 1.612308659550961e-05, "loss": 0.8193, "step": 4572 }, { "epoch": 0.31, "learning_rate": 1.6121341345367384e-05, "loss": 0.7568, "step": 4573 }, { "epoch": 0.31, "learning_rate": 1.6119595796993707e-05, "loss": 0.8369, "step": 4574 }, { "epoch": 0.31, "learning_rate": 1.6117849950473618e-05, "loss": 0.9248, "step": 4575 }, { "epoch": 0.31, "learning_rate": 1.611610380589218e-05, "loss": 0.8057, "step": 4576 }, { "epoch": 0.31, "learning_rate": 1.6114357363334466e-05, "loss": 0.96, "step": 4577 }, { "epoch": 0.31, "learning_rate": 1.6112610622885552e-05, "loss": 0.9004, "step": 4578 }, { "epoch": 0.31, "learning_rate": 1.611086358463055e-05, "loss": 0.7773, "step": 4579 }, { "epoch": 0.31, "learning_rate": 1.6109116248654574e-05, "loss": 0.8594, "step": 4580 }, { "epoch": 0.31, "learning_rate": 1.610736861504275e-05, "loss": 0.8408, "step": 4581 }, { "epoch": 0.31, "learning_rate": 1.6105620683880228e-05, "loss": 0.8115, "step": 4582 }, { "epoch": 0.31, "learning_rate": 1.6103872455252162e-05, "loss": 0.9072, "step": 4583 }, { "epoch": 0.31, "learning_rate": 1.6102123929243725e-05, "loss": 0.8516, "step": 4584 }, { "epoch": 0.31, "learning_rate": 1.6100375105940112e-05, "loss": 0.8389, "step": 4585 }, { "epoch": 0.31, "learning_rate": 1.609862598542652e-05, "loss": 0.8828, "step": 4586 }, { "epoch": 0.31, "learning_rate": 1.6096876567788166e-05, "loss": 0.8164, "step": 4587 }, { "epoch": 0.31, "learning_rate": 1.6095126853110286e-05, "loss": 0.8545, "step": 4588 }, { "epoch": 0.31, "learning_rate": 1.6093376841478117e-05, "loss": 0.8018, "step": 4589 }, { "epoch": 0.31, "learning_rate": 1.609162653297693e-05, "loss": 0.9053, "step": 4590 }, { "epoch": 0.31, "learning_rate": 1.6089875927691997e-05, "loss": 0.8008, "step": 4591 }, { "epoch": 0.31, "learning_rate": 1.60881250257086e-05, "loss": 0.7764, "step": 4592 }, { "epoch": 0.31, "learning_rate": 1.6086373827112056e-05, "loss": 0.8721, "step": 4593 }, { "epoch": 0.31, "learning_rate": 1.608462233198767e-05, "loss": 0.8037, "step": 4594 }, { "epoch": 0.31, "learning_rate": 1.6082870540420782e-05, "loss": 0.8906, "step": 4595 }, { "epoch": 0.31, "learning_rate": 1.608111845249674e-05, "loss": 0.8262, "step": 4596 }, { "epoch": 0.31, "learning_rate": 1.6079366068300902e-05, "loss": 0.8408, "step": 4597 }, { "epoch": 0.31, "learning_rate": 1.6077613387918646e-05, "loss": 0.8369, "step": 4598 }, { "epoch": 0.31, "learning_rate": 1.607586041143536e-05, "loss": 0.8555, "step": 4599 }, { "epoch": 0.31, "learning_rate": 1.6074107138936454e-05, "loss": 0.7744, "step": 4600 }, { "epoch": 0.31, "learning_rate": 1.6072353570507343e-05, "loss": 0.877, "step": 4601 }, { "epoch": 0.31, "learning_rate": 1.607059970623346e-05, "loss": 0.916, "step": 4602 }, { "epoch": 0.31, "learning_rate": 1.606884554620026e-05, "loss": 0.9111, "step": 4603 }, { "epoch": 0.31, "learning_rate": 1.60670910904932e-05, "loss": 0.7822, "step": 4604 }, { "epoch": 0.31, "learning_rate": 1.6065336339197758e-05, "loss": 0.834, "step": 4605 }, { "epoch": 0.31, "learning_rate": 1.6063581292399424e-05, "loss": 0.7559, "step": 4606 }, { "epoch": 0.31, "learning_rate": 1.6061825950183706e-05, "loss": 0.8398, "step": 4607 }, { "epoch": 0.31, "learning_rate": 1.606007031263612e-05, "loss": 0.8252, "step": 4608 }, { "epoch": 0.31, "learning_rate": 1.6058314379842208e-05, "loss": 0.9268, "step": 4609 }, { "epoch": 0.31, "learning_rate": 1.6056558151887512e-05, "loss": 0.8311, "step": 4610 }, { "epoch": 0.31, "learning_rate": 1.6054801628857603e-05, "loss": 0.8301, "step": 4611 }, { "epoch": 0.31, "learning_rate": 1.6053044810838048e-05, "loss": 0.8359, "step": 4612 }, { "epoch": 0.31, "learning_rate": 1.6051287697914448e-05, "loss": 0.8672, "step": 4613 }, { "epoch": 0.31, "learning_rate": 1.6049530290172405e-05, "loss": 0.835, "step": 4614 }, { "epoch": 0.31, "learning_rate": 1.6047772587697543e-05, "loss": 0.8428, "step": 4615 }, { "epoch": 0.31, "learning_rate": 1.6046014590575494e-05, "loss": 0.8516, "step": 4616 }, { "epoch": 0.31, "learning_rate": 1.604425629889191e-05, "loss": 0.8525, "step": 4617 }, { "epoch": 0.31, "learning_rate": 1.604249771273245e-05, "loss": 0.7773, "step": 4618 }, { "epoch": 0.31, "learning_rate": 1.6040738832182804e-05, "loss": 0.7793, "step": 4619 }, { "epoch": 0.31, "learning_rate": 1.6038979657328652e-05, "loss": 0.8281, "step": 4620 }, { "epoch": 0.31, "learning_rate": 1.6037220188255706e-05, "loss": 0.8115, "step": 4621 }, { "epoch": 0.31, "learning_rate": 1.6035460425049688e-05, "loss": 0.8076, "step": 4622 }, { "epoch": 0.32, "learning_rate": 1.603370036779633e-05, "loss": 0.8662, "step": 4623 }, { "epoch": 0.32, "learning_rate": 1.6031940016581386e-05, "loss": 0.9082, "step": 4624 }, { "epoch": 0.32, "learning_rate": 1.603017937149062e-05, "loss": 0.8916, "step": 4625 }, { "epoch": 0.32, "learning_rate": 1.6028418432609806e-05, "loss": 0.8926, "step": 4626 }, { "epoch": 0.32, "learning_rate": 1.602665720002474e-05, "loss": 0.8896, "step": 4627 }, { "epoch": 0.32, "learning_rate": 1.602489567382123e-05, "loss": 0.8252, "step": 4628 }, { "epoch": 0.32, "learning_rate": 1.60231338540851e-05, "loss": 0.8418, "step": 4629 }, { "epoch": 0.32, "learning_rate": 1.6021371740902175e-05, "loss": 0.8164, "step": 4630 }, { "epoch": 0.32, "learning_rate": 1.601960933435832e-05, "loss": 0.9004, "step": 4631 }, { "epoch": 0.32, "learning_rate": 1.6017846634539384e-05, "loss": 0.875, "step": 4632 }, { "epoch": 0.32, "learning_rate": 1.6016083641531263e-05, "loss": 0.8828, "step": 4633 }, { "epoch": 0.32, "learning_rate": 1.6014320355419834e-05, "loss": 0.792, "step": 4634 }, { "epoch": 0.32, "learning_rate": 1.601255677629101e-05, "loss": 0.876, "step": 4635 }, { "epoch": 0.32, "learning_rate": 1.6010792904230715e-05, "loss": 0.8369, "step": 4636 }, { "epoch": 0.32, "learning_rate": 1.6009028739324883e-05, "loss": 0.9062, "step": 4637 }, { "epoch": 0.32, "learning_rate": 1.600726428165946e-05, "loss": 0.8096, "step": 4638 }, { "epoch": 0.32, "learning_rate": 1.6005499531320422e-05, "loss": 0.8096, "step": 4639 }, { "epoch": 0.32, "learning_rate": 1.6003734488393733e-05, "loss": 0.8613, "step": 4640 }, { "epoch": 0.32, "learning_rate": 1.6001969152965394e-05, "loss": 0.9277, "step": 4641 }, { "epoch": 0.32, "learning_rate": 1.6000203525121414e-05, "loss": 0.8799, "step": 4642 }, { "epoch": 0.32, "learning_rate": 1.599843760494781e-05, "loss": 0.8848, "step": 4643 }, { "epoch": 0.32, "learning_rate": 1.5996671392530615e-05, "loss": 0.8516, "step": 4644 }, { "epoch": 0.32, "learning_rate": 1.5994904887955883e-05, "loss": 0.8359, "step": 4645 }, { "epoch": 0.32, "learning_rate": 1.599313809130968e-05, "loss": 0.8984, "step": 4646 }, { "epoch": 0.32, "learning_rate": 1.599137100267808e-05, "loss": 0.8428, "step": 4647 }, { "epoch": 0.32, "learning_rate": 1.5989603622147175e-05, "loss": 0.875, "step": 4648 }, { "epoch": 0.32, "learning_rate": 1.5987835949803074e-05, "loss": 0.832, "step": 4649 }, { "epoch": 0.32, "learning_rate": 1.5986067985731898e-05, "loss": 0.8613, "step": 4650 }, { "epoch": 0.32, "learning_rate": 1.5984299730019787e-05, "loss": 0.833, "step": 4651 }, { "epoch": 0.32, "learning_rate": 1.5982531182752877e-05, "loss": 0.8535, "step": 4652 }, { "epoch": 0.32, "learning_rate": 1.5980762344017343e-05, "loss": 0.7979, "step": 4653 }, { "epoch": 0.32, "learning_rate": 1.5978993213899358e-05, "loss": 0.8457, "step": 4654 }, { "epoch": 0.32, "learning_rate": 1.597722379248512e-05, "loss": 0.8809, "step": 4655 }, { "epoch": 0.32, "learning_rate": 1.5975454079860825e-05, "loss": 0.7773, "step": 4656 }, { "epoch": 0.32, "learning_rate": 1.5973684076112702e-05, "loss": 0.9033, "step": 4657 }, { "epoch": 0.32, "learning_rate": 1.5971913781326976e-05, "loss": 0.8877, "step": 4658 }, { "epoch": 0.32, "learning_rate": 1.597014319558991e-05, "loss": 0.79, "step": 4659 }, { "epoch": 0.32, "learning_rate": 1.5968372318987754e-05, "loss": 0.8535, "step": 4660 }, { "epoch": 0.32, "learning_rate": 1.596660115160679e-05, "loss": 0.8809, "step": 4661 }, { "epoch": 0.32, "learning_rate": 1.5964829693533307e-05, "loss": 0.8135, "step": 4662 }, { "epoch": 0.32, "learning_rate": 1.5963057944853617e-05, "loss": 0.793, "step": 4663 }, { "epoch": 0.32, "learning_rate": 1.5961285905654032e-05, "loss": 0.9189, "step": 4664 }, { "epoch": 0.32, "learning_rate": 1.5959513576020887e-05, "loss": 0.7803, "step": 4665 }, { "epoch": 0.32, "learning_rate": 1.5957740956040532e-05, "loss": 0.874, "step": 4666 }, { "epoch": 0.32, "learning_rate": 1.595596804579933e-05, "loss": 0.8779, "step": 4667 }, { "epoch": 0.32, "learning_rate": 1.5954194845383656e-05, "loss": 0.8613, "step": 4668 }, { "epoch": 0.32, "learning_rate": 1.5952421354879897e-05, "loss": 0.7881, "step": 4669 }, { "epoch": 0.32, "learning_rate": 1.595064757437446e-05, "loss": 0.8633, "step": 4670 }, { "epoch": 0.32, "learning_rate": 1.5948873503953763e-05, "loss": 0.8379, "step": 4671 }, { "epoch": 0.32, "learning_rate": 1.5947099143704245e-05, "loss": 0.8809, "step": 4672 }, { "epoch": 0.32, "learning_rate": 1.594532449371234e-05, "loss": 0.8545, "step": 4673 }, { "epoch": 0.32, "learning_rate": 1.5943549554064513e-05, "loss": 0.8105, "step": 4674 }, { "epoch": 0.32, "learning_rate": 1.594177432484725e-05, "loss": 0.8828, "step": 4675 }, { "epoch": 0.32, "learning_rate": 1.5939998806147027e-05, "loss": 0.8252, "step": 4676 }, { "epoch": 0.32, "learning_rate": 1.5938222998050353e-05, "loss": 0.873, "step": 4677 }, { "epoch": 0.32, "learning_rate": 1.5936446900643744e-05, "loss": 0.7832, "step": 4678 }, { "epoch": 0.32, "learning_rate": 1.593467051401373e-05, "loss": 0.7959, "step": 4679 }, { "epoch": 0.32, "learning_rate": 1.593289383824686e-05, "loss": 0.8555, "step": 4680 }, { "epoch": 0.32, "learning_rate": 1.593111687342969e-05, "loss": 0.9561, "step": 4681 }, { "epoch": 0.32, "learning_rate": 1.59293396196488e-05, "loss": 0.8857, "step": 4682 }, { "epoch": 0.32, "learning_rate": 1.5927562076990764e-05, "loss": 0.8428, "step": 4683 }, { "epoch": 0.32, "learning_rate": 1.59257842455422e-05, "loss": 0.8945, "step": 4684 }, { "epoch": 0.32, "learning_rate": 1.5924006125389714e-05, "loss": 0.8545, "step": 4685 }, { "epoch": 0.32, "learning_rate": 1.5922227716619935e-05, "loss": 0.8633, "step": 4686 }, { "epoch": 0.32, "learning_rate": 1.5920449019319515e-05, "loss": 0.7393, "step": 4687 }, { "epoch": 0.32, "learning_rate": 1.5918670033575104e-05, "loss": 0.877, "step": 4688 }, { "epoch": 0.32, "learning_rate": 1.591689075947338e-05, "loss": 0.8203, "step": 4689 }, { "epoch": 0.32, "learning_rate": 1.591511119710103e-05, "loss": 0.8291, "step": 4690 }, { "epoch": 0.32, "learning_rate": 1.5913331346544744e-05, "loss": 0.8994, "step": 4691 }, { "epoch": 0.32, "learning_rate": 1.5911551207891248e-05, "loss": 0.8271, "step": 4692 }, { "epoch": 0.32, "learning_rate": 1.5909770781227265e-05, "loss": 0.8936, "step": 4693 }, { "epoch": 0.32, "learning_rate": 1.5907990066639535e-05, "loss": 0.9131, "step": 4694 }, { "epoch": 0.32, "learning_rate": 1.5906209064214823e-05, "loss": 0.9219, "step": 4695 }, { "epoch": 0.32, "learning_rate": 1.5904427774039887e-05, "loss": 0.8164, "step": 4696 }, { "epoch": 0.32, "learning_rate": 1.590264619620152e-05, "loss": 0.8516, "step": 4697 }, { "epoch": 0.32, "learning_rate": 1.590086433078652e-05, "loss": 0.8643, "step": 4698 }, { "epoch": 0.32, "learning_rate": 1.5899082177881695e-05, "loss": 0.7881, "step": 4699 }, { "epoch": 0.32, "learning_rate": 1.5897299737573876e-05, "loss": 0.917, "step": 4700 }, { "epoch": 0.32, "learning_rate": 1.58955170099499e-05, "loss": 0.7988, "step": 4701 }, { "epoch": 0.32, "learning_rate": 1.589373399509662e-05, "loss": 0.8506, "step": 4702 }, { "epoch": 0.32, "learning_rate": 1.5891950693100914e-05, "loss": 0.7529, "step": 4703 }, { "epoch": 0.32, "learning_rate": 1.589016710404965e-05, "loss": 0.8428, "step": 4704 }, { "epoch": 0.32, "learning_rate": 1.588838322802974e-05, "loss": 0.9316, "step": 4705 }, { "epoch": 0.32, "learning_rate": 1.5886599065128077e-05, "loss": 0.8281, "step": 4706 }, { "epoch": 0.32, "learning_rate": 1.58848146154316e-05, "loss": 0.8242, "step": 4707 }, { "epoch": 0.32, "learning_rate": 1.5883029879027245e-05, "loss": 0.8271, "step": 4708 }, { "epoch": 0.32, "learning_rate": 1.5881244856001956e-05, "loss": 0.8184, "step": 4709 }, { "epoch": 0.32, "learning_rate": 1.5879459546442707e-05, "loss": 0.7998, "step": 4710 }, { "epoch": 0.32, "learning_rate": 1.5877673950436478e-05, "loss": 0.8428, "step": 4711 }, { "epoch": 0.32, "learning_rate": 1.5875888068070257e-05, "loss": 0.9141, "step": 4712 }, { "epoch": 0.32, "learning_rate": 1.5874101899431053e-05, "loss": 0.8936, "step": 4713 }, { "epoch": 0.32, "learning_rate": 1.5872315444605898e-05, "loss": 0.8447, "step": 4714 }, { "epoch": 0.32, "learning_rate": 1.5870528703681813e-05, "loss": 0.8906, "step": 4715 }, { "epoch": 0.32, "learning_rate": 1.5868741676745862e-05, "loss": 0.8359, "step": 4716 }, { "epoch": 0.32, "learning_rate": 1.58669543638851e-05, "loss": 0.8301, "step": 4717 }, { "epoch": 0.32, "learning_rate": 1.586516676518661e-05, "loss": 0.8115, "step": 4718 }, { "epoch": 0.32, "learning_rate": 1.586337888073748e-05, "loss": 0.8232, "step": 4719 }, { "epoch": 0.32, "learning_rate": 1.5861590710624813e-05, "loss": 0.8252, "step": 4720 }, { "epoch": 0.32, "learning_rate": 1.5859802254935737e-05, "loss": 0.8945, "step": 4721 }, { "epoch": 0.32, "learning_rate": 1.585801351375738e-05, "loss": 0.8379, "step": 4722 }, { "epoch": 0.32, "learning_rate": 1.585622448717689e-05, "loss": 0.8896, "step": 4723 }, { "epoch": 0.32, "learning_rate": 1.5854435175281428e-05, "loss": 0.9365, "step": 4724 }, { "epoch": 0.32, "learning_rate": 1.5852645578158172e-05, "loss": 0.9189, "step": 4725 }, { "epoch": 0.32, "learning_rate": 1.585085569589431e-05, "loss": 0.7383, "step": 4726 }, { "epoch": 0.32, "learning_rate": 1.5849065528577038e-05, "loss": 0.7852, "step": 4727 }, { "epoch": 0.32, "learning_rate": 1.584727507629358e-05, "loss": 0.7969, "step": 4728 }, { "epoch": 0.32, "learning_rate": 1.584548433913117e-05, "loss": 0.8213, "step": 4729 }, { "epoch": 0.32, "learning_rate": 1.5843693317177043e-05, "loss": 0.7988, "step": 4730 }, { "epoch": 0.32, "learning_rate": 1.5841902010518466e-05, "loss": 0.8662, "step": 4731 }, { "epoch": 0.32, "learning_rate": 1.5840110419242706e-05, "loss": 0.8643, "step": 4732 }, { "epoch": 0.32, "learning_rate": 1.583831854343705e-05, "loss": 0.7852, "step": 4733 }, { "epoch": 0.32, "learning_rate": 1.5836526383188802e-05, "loss": 0.8135, "step": 4734 }, { "epoch": 0.32, "learning_rate": 1.5834733938585275e-05, "loss": 0.8447, "step": 4735 }, { "epoch": 0.32, "learning_rate": 1.583294120971379e-05, "loss": 0.835, "step": 4736 }, { "epoch": 0.32, "learning_rate": 1.5831148196661697e-05, "loss": 0.9902, "step": 4737 }, { "epoch": 0.32, "learning_rate": 1.5829354899516347e-05, "loss": 0.9033, "step": 4738 }, { "epoch": 0.32, "learning_rate": 1.582756131836511e-05, "loss": 0.8135, "step": 4739 }, { "epoch": 0.32, "learning_rate": 1.5825767453295374e-05, "loss": 0.8652, "step": 4740 }, { "epoch": 0.32, "learning_rate": 1.5823973304394526e-05, "loss": 0.7949, "step": 4741 }, { "epoch": 0.32, "learning_rate": 1.5822178871749984e-05, "loss": 0.8896, "step": 4742 }, { "epoch": 0.32, "learning_rate": 1.5820384155449175e-05, "loss": 0.8242, "step": 4743 }, { "epoch": 0.32, "learning_rate": 1.581858915557953e-05, "loss": 0.8984, "step": 4744 }, { "epoch": 0.32, "learning_rate": 1.5816793872228506e-05, "loss": 0.8945, "step": 4745 }, { "epoch": 0.32, "learning_rate": 1.581499830548357e-05, "loss": 0.8418, "step": 4746 }, { "epoch": 0.32, "learning_rate": 1.5813202455432196e-05, "loss": 0.7871, "step": 4747 }, { "epoch": 0.32, "learning_rate": 1.5811406322161886e-05, "loss": 0.8809, "step": 4748 }, { "epoch": 0.32, "learning_rate": 1.580960990576014e-05, "loss": 0.8184, "step": 4749 }, { "epoch": 0.32, "learning_rate": 1.5807813206314485e-05, "loss": 0.79, "step": 4750 }, { "epoch": 0.32, "learning_rate": 1.5806016223912456e-05, "loss": 0.8457, "step": 4751 }, { "epoch": 0.32, "learning_rate": 1.5804218958641596e-05, "loss": 0.8301, "step": 4752 }, { "epoch": 0.32, "learning_rate": 1.5802421410589474e-05, "loss": 0.8945, "step": 4753 }, { "epoch": 0.32, "learning_rate": 1.580062357984366e-05, "loss": 0.8291, "step": 4754 }, { "epoch": 0.32, "learning_rate": 1.579882546649175e-05, "loss": 0.8936, "step": 4755 }, { "epoch": 0.32, "learning_rate": 1.579702707062135e-05, "loss": 0.8398, "step": 4756 }, { "epoch": 0.32, "learning_rate": 1.5795228392320068e-05, "loss": 0.834, "step": 4757 }, { "epoch": 0.32, "learning_rate": 1.5793429431675545e-05, "loss": 0.8525, "step": 4758 }, { "epoch": 0.32, "learning_rate": 1.5791630188775423e-05, "loss": 0.7969, "step": 4759 }, { "epoch": 0.32, "learning_rate": 1.5789830663707358e-05, "loss": 0.8936, "step": 4760 }, { "epoch": 0.32, "learning_rate": 1.5788030856559026e-05, "loss": 0.8369, "step": 4761 }, { "epoch": 0.32, "learning_rate": 1.578623076741811e-05, "loss": 0.7969, "step": 4762 }, { "epoch": 0.32, "learning_rate": 1.578443039637232e-05, "loss": 0.8447, "step": 4763 }, { "epoch": 0.32, "learning_rate": 1.5782629743509356e-05, "loss": 0.876, "step": 4764 }, { "epoch": 0.32, "learning_rate": 1.578082880891696e-05, "loss": 0.8711, "step": 4765 }, { "epoch": 0.32, "learning_rate": 1.577902759268286e-05, "loss": 0.8311, "step": 4766 }, { "epoch": 0.32, "learning_rate": 1.5777226094894822e-05, "loss": 0.8242, "step": 4767 }, { "epoch": 0.32, "learning_rate": 1.5775424315640608e-05, "loss": 0.8613, "step": 4768 }, { "epoch": 0.32, "learning_rate": 1.5773622255008004e-05, "loss": 0.9043, "step": 4769 }, { "epoch": 0.33, "learning_rate": 1.5771819913084806e-05, "loss": 0.8613, "step": 4770 }, { "epoch": 0.33, "learning_rate": 1.5770017289958822e-05, "loss": 0.7744, "step": 4771 }, { "epoch": 0.33, "learning_rate": 1.5768214385717877e-05, "loss": 0.8584, "step": 4772 }, { "epoch": 0.33, "learning_rate": 1.5766411200449807e-05, "loss": 0.8447, "step": 4773 }, { "epoch": 0.33, "learning_rate": 1.5764607734242468e-05, "loss": 0.832, "step": 4774 }, { "epoch": 0.33, "learning_rate": 1.576280398718372e-05, "loss": 0.8691, "step": 4775 }, { "epoch": 0.33, "learning_rate": 1.576099995936144e-05, "loss": 0.9199, "step": 4776 }, { "epoch": 0.33, "learning_rate": 1.5759195650863528e-05, "loss": 0.8848, "step": 4777 }, { "epoch": 0.33, "learning_rate": 1.5757391061777882e-05, "loss": 0.7939, "step": 4778 }, { "epoch": 0.33, "learning_rate": 1.5755586192192423e-05, "loss": 0.8291, "step": 4779 }, { "epoch": 0.33, "learning_rate": 1.5753781042195088e-05, "loss": 0.7598, "step": 4780 }, { "epoch": 0.33, "learning_rate": 1.575197561187382e-05, "loss": 0.8447, "step": 4781 }, { "epoch": 0.33, "learning_rate": 1.5750169901316577e-05, "loss": 0.7734, "step": 4782 }, { "epoch": 0.33, "learning_rate": 1.574836391061134e-05, "loss": 0.8623, "step": 4783 }, { "epoch": 0.33, "learning_rate": 1.5746557639846095e-05, "loss": 0.8154, "step": 4784 }, { "epoch": 0.33, "learning_rate": 1.5744751089108843e-05, "loss": 0.8936, "step": 4785 }, { "epoch": 0.33, "learning_rate": 1.5742944258487596e-05, "loss": 0.8877, "step": 4786 }, { "epoch": 0.33, "learning_rate": 1.5741137148070387e-05, "loss": 0.793, "step": 4787 }, { "epoch": 0.33, "learning_rate": 1.5739329757945254e-05, "loss": 0.7705, "step": 4788 }, { "epoch": 0.33, "learning_rate": 1.5737522088200253e-05, "loss": 0.8379, "step": 4789 }, { "epoch": 0.33, "learning_rate": 1.5735714138923457e-05, "loss": 0.8398, "step": 4790 }, { "epoch": 0.33, "learning_rate": 1.573390591020295e-05, "loss": 0.7988, "step": 4791 }, { "epoch": 0.33, "learning_rate": 1.5732097402126828e-05, "loss": 0.8389, "step": 4792 }, { "epoch": 0.33, "learning_rate": 1.5730288614783192e-05, "loss": 0.8457, "step": 4793 }, { "epoch": 0.33, "learning_rate": 1.5728479548260184e-05, "loss": 0.8555, "step": 4794 }, { "epoch": 0.33, "learning_rate": 1.5726670202645925e-05, "loss": 0.8672, "step": 4795 }, { "epoch": 0.33, "learning_rate": 1.5724860578028575e-05, "loss": 0.8564, "step": 4796 }, { "epoch": 0.33, "learning_rate": 1.57230506744963e-05, "loss": 0.8662, "step": 4797 }, { "epoch": 0.33, "learning_rate": 1.572124049213727e-05, "loss": 0.8252, "step": 4798 }, { "epoch": 0.33, "learning_rate": 1.5719430031039684e-05, "loss": 0.876, "step": 4799 }, { "epoch": 0.33, "learning_rate": 1.571761929129175e-05, "loss": 0.8369, "step": 4800 }, { "epoch": 0.33, "learning_rate": 1.5715808272981678e-05, "loss": 0.8076, "step": 4801 }, { "epoch": 0.33, "learning_rate": 1.5713996976197704e-05, "loss": 0.8467, "step": 4802 }, { "epoch": 0.33, "learning_rate": 1.571218540102808e-05, "loss": 0.8701, "step": 4803 }, { "epoch": 0.33, "learning_rate": 1.5710373547561065e-05, "loss": 0.832, "step": 4804 }, { "epoch": 0.33, "learning_rate": 1.570856141588492e-05, "loss": 0.7979, "step": 4805 }, { "epoch": 0.33, "learning_rate": 1.5706749006087948e-05, "loss": 0.9033, "step": 4806 }, { "epoch": 0.33, "learning_rate": 1.570493631825844e-05, "loss": 0.7744, "step": 4807 }, { "epoch": 0.33, "learning_rate": 1.5703123352484716e-05, "loss": 0.8281, "step": 4808 }, { "epoch": 0.33, "learning_rate": 1.57013101088551e-05, "loss": 0.8594, "step": 4809 }, { "epoch": 0.33, "learning_rate": 1.569949658745793e-05, "loss": 0.8018, "step": 4810 }, { "epoch": 0.33, "learning_rate": 1.5697682788381565e-05, "loss": 0.7754, "step": 4811 }, { "epoch": 0.33, "learning_rate": 1.5695868711714375e-05, "loss": 0.7891, "step": 4812 }, { "epoch": 0.33, "learning_rate": 1.5694054357544737e-05, "loss": 0.8018, "step": 4813 }, { "epoch": 0.33, "learning_rate": 1.5692239725961048e-05, "loss": 0.8271, "step": 4814 }, { "epoch": 0.33, "learning_rate": 1.569042481705172e-05, "loss": 0.875, "step": 4815 }, { "epoch": 0.33, "learning_rate": 1.5688609630905168e-05, "loss": 0.7715, "step": 4816 }, { "epoch": 0.33, "learning_rate": 1.5686794167609837e-05, "loss": 0.7666, "step": 4817 }, { "epoch": 0.33, "learning_rate": 1.568497842725417e-05, "loss": 0.8271, "step": 4818 }, { "epoch": 0.33, "learning_rate": 1.5683162409926628e-05, "loss": 0.8486, "step": 4819 }, { "epoch": 0.33, "learning_rate": 1.5681346115715693e-05, "loss": 0.9082, "step": 4820 }, { "epoch": 0.33, "learning_rate": 1.567952954470985e-05, "loss": 0.8174, "step": 4821 }, { "epoch": 0.33, "learning_rate": 1.567771269699761e-05, "loss": 0.7471, "step": 4822 }, { "epoch": 0.33, "learning_rate": 1.567589557266748e-05, "loss": 0.8389, "step": 4823 }, { "epoch": 0.33, "learning_rate": 1.5674078171807995e-05, "loss": 0.8447, "step": 4824 }, { "epoch": 0.33, "learning_rate": 1.5672260494507697e-05, "loss": 0.8125, "step": 4825 }, { "epoch": 0.33, "learning_rate": 1.5670442540855148e-05, "loss": 0.7598, "step": 4826 }, { "epoch": 0.33, "learning_rate": 1.5668624310938914e-05, "loss": 0.8818, "step": 4827 }, { "epoch": 0.33, "learning_rate": 1.5666805804847577e-05, "loss": 0.9004, "step": 4828 }, { "epoch": 0.33, "learning_rate": 1.566498702266974e-05, "loss": 0.8027, "step": 4829 }, { "epoch": 0.33, "learning_rate": 1.5663167964494014e-05, "loss": 0.7744, "step": 4830 }, { "epoch": 0.33, "learning_rate": 1.5661348630409014e-05, "loss": 0.8877, "step": 4831 }, { "epoch": 0.33, "learning_rate": 1.565952902050339e-05, "loss": 0.916, "step": 4832 }, { "epoch": 0.33, "learning_rate": 1.5657709134865787e-05, "loss": 0.8457, "step": 4833 }, { "epoch": 0.33, "learning_rate": 1.565588897358487e-05, "loss": 0.8818, "step": 4834 }, { "epoch": 0.33, "learning_rate": 1.565406853674932e-05, "loss": 0.7568, "step": 4835 }, { "epoch": 0.33, "learning_rate": 1.5652247824447824e-05, "loss": 0.958, "step": 4836 }, { "epoch": 0.33, "learning_rate": 1.565042683676909e-05, "loss": 0.7695, "step": 4837 }, { "epoch": 0.33, "learning_rate": 1.5648605573801838e-05, "loss": 0.8018, "step": 4838 }, { "epoch": 0.33, "learning_rate": 1.56467840356348e-05, "loss": 0.8721, "step": 4839 }, { "epoch": 0.33, "learning_rate": 1.5644962222356716e-05, "loss": 0.8604, "step": 4840 }, { "epoch": 0.33, "learning_rate": 1.5643140134056346e-05, "loss": 0.8438, "step": 4841 }, { "epoch": 0.33, "learning_rate": 1.5641317770822468e-05, "loss": 0.8828, "step": 4842 }, { "epoch": 0.33, "learning_rate": 1.5639495132743857e-05, "loss": 0.875, "step": 4843 }, { "epoch": 0.33, "learning_rate": 1.5637672219909324e-05, "loss": 0.8262, "step": 4844 }, { "epoch": 0.33, "learning_rate": 1.563584903240767e-05, "loss": 0.8135, "step": 4845 }, { "epoch": 0.33, "learning_rate": 1.5634025570327732e-05, "loss": 0.8359, "step": 4846 }, { "epoch": 0.33, "learning_rate": 1.5632201833758344e-05, "loss": 0.8848, "step": 4847 }, { "epoch": 0.33, "learning_rate": 1.5630377822788353e-05, "loss": 0.8389, "step": 4848 }, { "epoch": 0.33, "learning_rate": 1.562855353750663e-05, "loss": 0.8604, "step": 4849 }, { "epoch": 0.33, "learning_rate": 1.5626728978002056e-05, "loss": 0.8389, "step": 4850 }, { "epoch": 0.33, "learning_rate": 1.5624904144363516e-05, "loss": 0.8574, "step": 4851 }, { "epoch": 0.33, "learning_rate": 1.562307903667992e-05, "loss": 0.8789, "step": 4852 }, { "epoch": 0.33, "learning_rate": 1.562125365504019e-05, "loss": 0.8066, "step": 4853 }, { "epoch": 0.33, "learning_rate": 1.5619427999533256e-05, "loss": 0.8564, "step": 4854 }, { "epoch": 0.33, "learning_rate": 1.5617602070248064e-05, "loss": 0.8145, "step": 4855 }, { "epoch": 0.33, "learning_rate": 1.5615775867273574e-05, "loss": 0.8525, "step": 4856 }, { "epoch": 0.33, "learning_rate": 1.5613949390698755e-05, "loss": 0.8281, "step": 4857 }, { "epoch": 0.33, "learning_rate": 1.5612122640612596e-05, "loss": 0.7881, "step": 4858 }, { "epoch": 0.33, "learning_rate": 1.56102956171041e-05, "loss": 0.8604, "step": 4859 }, { "epoch": 0.33, "learning_rate": 1.560846832026227e-05, "loss": 0.835, "step": 4860 }, { "epoch": 0.33, "learning_rate": 1.5606640750176136e-05, "loss": 0.8252, "step": 4861 }, { "epoch": 0.33, "learning_rate": 1.560481290693474e-05, "loss": 0.7725, "step": 4862 }, { "epoch": 0.33, "learning_rate": 1.5602984790627135e-05, "loss": 0.7852, "step": 4863 }, { "epoch": 0.33, "learning_rate": 1.5601156401342383e-05, "loss": 0.8213, "step": 4864 }, { "epoch": 0.33, "learning_rate": 1.559932773916956e-05, "loss": 0.8047, "step": 4865 }, { "epoch": 0.33, "learning_rate": 1.5597498804197768e-05, "loss": 0.8623, "step": 4866 }, { "epoch": 0.33, "learning_rate": 1.5595669596516105e-05, "loss": 0.9053, "step": 4867 }, { "epoch": 0.33, "learning_rate": 1.5593840116213695e-05, "loss": 0.8828, "step": 4868 }, { "epoch": 0.33, "learning_rate": 1.5592010363379665e-05, "loss": 0.7637, "step": 4869 }, { "epoch": 0.33, "learning_rate": 1.559018033810316e-05, "loss": 0.8701, "step": 4870 }, { "epoch": 0.33, "learning_rate": 1.5588350040473346e-05, "loss": 0.9053, "step": 4871 }, { "epoch": 0.33, "learning_rate": 1.558651947057939e-05, "loss": 0.8193, "step": 4872 }, { "epoch": 0.33, "learning_rate": 1.5584688628510475e-05, "loss": 0.8564, "step": 4873 }, { "epoch": 0.33, "learning_rate": 1.5582857514355806e-05, "loss": 0.876, "step": 4874 }, { "epoch": 0.33, "learning_rate": 1.558102612820459e-05, "loss": 0.8135, "step": 4875 }, { "epoch": 0.33, "learning_rate": 1.557919447014605e-05, "loss": 0.793, "step": 4876 }, { "epoch": 0.33, "learning_rate": 1.557736254026943e-05, "loss": 0.7803, "step": 4877 }, { "epoch": 0.33, "learning_rate": 1.557553033866398e-05, "loss": 0.8438, "step": 4878 }, { "epoch": 0.33, "learning_rate": 1.557369786541896e-05, "loss": 0.8877, "step": 4879 }, { "epoch": 0.33, "learning_rate": 1.5571865120623658e-05, "loss": 0.9111, "step": 4880 }, { "epoch": 0.33, "learning_rate": 1.5570032104367354e-05, "loss": 0.8662, "step": 4881 }, { "epoch": 0.33, "learning_rate": 1.556819881673936e-05, "loss": 0.791, "step": 4882 }, { "epoch": 0.33, "learning_rate": 1.5566365257828987e-05, "loss": 0.8213, "step": 4883 }, { "epoch": 0.33, "learning_rate": 1.5564531427725575e-05, "loss": 0.7754, "step": 4884 }, { "epoch": 0.33, "learning_rate": 1.5562697326518463e-05, "loss": 0.8633, "step": 4885 }, { "epoch": 0.33, "learning_rate": 1.5560862954297003e-05, "loss": 0.8701, "step": 4886 }, { "epoch": 0.33, "learning_rate": 1.5559028311150578e-05, "loss": 0.9111, "step": 4887 }, { "epoch": 0.33, "learning_rate": 1.555719339716856e-05, "loss": 0.9277, "step": 4888 }, { "epoch": 0.33, "learning_rate": 1.5555358212440354e-05, "loss": 0.8311, "step": 4889 }, { "epoch": 0.33, "learning_rate": 1.5553522757055368e-05, "loss": 0.8594, "step": 4890 }, { "epoch": 0.33, "learning_rate": 1.555168703110302e-05, "loss": 0.7197, "step": 4891 }, { "epoch": 0.33, "learning_rate": 1.5549851034672753e-05, "loss": 0.9492, "step": 4892 }, { "epoch": 0.33, "learning_rate": 1.554801476785401e-05, "loss": 0.7441, "step": 4893 }, { "epoch": 0.33, "learning_rate": 1.554617823073626e-05, "loss": 0.8398, "step": 4894 }, { "epoch": 0.33, "learning_rate": 1.554434142340898e-05, "loss": 0.8838, "step": 4895 }, { "epoch": 0.33, "learning_rate": 1.5542504345961656e-05, "loss": 0.8818, "step": 4896 }, { "epoch": 0.33, "learning_rate": 1.554066699848379e-05, "loss": 0.8291, "step": 4897 }, { "epoch": 0.33, "learning_rate": 1.5538829381064897e-05, "loss": 0.8643, "step": 4898 }, { "epoch": 0.33, "learning_rate": 1.5536991493794505e-05, "loss": 0.8076, "step": 4899 }, { "epoch": 0.33, "learning_rate": 1.553515333676216e-05, "loss": 0.9004, "step": 4900 }, { "epoch": 0.33, "learning_rate": 1.5533314910057417e-05, "loss": 0.8438, "step": 4901 }, { "epoch": 0.33, "learning_rate": 1.5531476213769835e-05, "loss": 0.7871, "step": 4902 }, { "epoch": 0.33, "learning_rate": 1.5529637247989006e-05, "loss": 0.8047, "step": 4903 }, { "epoch": 0.33, "learning_rate": 1.552779801280452e-05, "loss": 0.7881, "step": 4904 }, { "epoch": 0.33, "learning_rate": 1.552595850830598e-05, "loss": 0.8232, "step": 4905 }, { "epoch": 0.33, "learning_rate": 1.5524118734583017e-05, "loss": 0.8281, "step": 4906 }, { "epoch": 0.33, "learning_rate": 1.5522278691725254e-05, "loss": 0.7891, "step": 4907 }, { "epoch": 0.33, "learning_rate": 1.5520438379822345e-05, "loss": 0.9053, "step": 4908 }, { "epoch": 0.33, "learning_rate": 1.5518597798963945e-05, "loss": 0.8828, "step": 4909 }, { "epoch": 0.33, "learning_rate": 1.551675694923973e-05, "loss": 0.8535, "step": 4910 }, { "epoch": 0.33, "learning_rate": 1.551491583073939e-05, "loss": 0.7988, "step": 4911 }, { "epoch": 0.33, "learning_rate": 1.5513074443552612e-05, "loss": 0.7588, "step": 4912 }, { "epoch": 0.33, "learning_rate": 1.5511232787769124e-05, "loss": 0.9336, "step": 4913 }, { "epoch": 0.33, "learning_rate": 1.5509390863478638e-05, "loss": 0.7686, "step": 4914 }, { "epoch": 0.33, "learning_rate": 1.5507548670770898e-05, "loss": 0.8672, "step": 4915 }, { "epoch": 0.34, "learning_rate": 1.5505706209735657e-05, "loss": 0.8633, "step": 4916 }, { "epoch": 0.34, "learning_rate": 1.550386348046268e-05, "loss": 0.8652, "step": 4917 }, { "epoch": 0.34, "learning_rate": 1.5502020483041737e-05, "loss": 0.8574, "step": 4918 }, { "epoch": 0.34, "learning_rate": 1.550017721756263e-05, "loss": 0.9199, "step": 4919 }, { "epoch": 0.34, "learning_rate": 1.5498333684115153e-05, "loss": 0.8066, "step": 4920 }, { "epoch": 0.34, "learning_rate": 1.5496489882789128e-05, "loss": 0.874, "step": 4921 }, { "epoch": 0.34, "learning_rate": 1.5494645813674386e-05, "loss": 0.8311, "step": 4922 }, { "epoch": 0.34, "learning_rate": 1.5492801476860767e-05, "loss": 0.7939, "step": 4923 }, { "epoch": 0.34, "learning_rate": 1.5490956872438126e-05, "loss": 0.832, "step": 4924 }, { "epoch": 0.34, "learning_rate": 1.5489112000496334e-05, "loss": 0.8203, "step": 4925 }, { "epoch": 0.34, "learning_rate": 1.5487266861125275e-05, "loss": 0.7598, "step": 4926 }, { "epoch": 0.34, "learning_rate": 1.5485421454414843e-05, "loss": 0.8008, "step": 4927 }, { "epoch": 0.34, "learning_rate": 1.548357578045494e-05, "loss": 0.8877, "step": 4928 }, { "epoch": 0.34, "learning_rate": 1.54817298393355e-05, "loss": 0.8896, "step": 4929 }, { "epoch": 0.34, "learning_rate": 1.5479883631146445e-05, "loss": 0.8574, "step": 4930 }, { "epoch": 0.34, "learning_rate": 1.5478037155977727e-05, "loss": 0.8799, "step": 4931 }, { "epoch": 0.34, "learning_rate": 1.5476190413919304e-05, "loss": 0.8418, "step": 4932 }, { "epoch": 0.34, "learning_rate": 1.5474343405061153e-05, "loss": 0.8398, "step": 4933 }, { "epoch": 0.34, "learning_rate": 1.5472496129493262e-05, "loss": 0.8115, "step": 4934 }, { "epoch": 0.34, "learning_rate": 1.547064858730562e-05, "loss": 0.8945, "step": 4935 }, { "epoch": 0.34, "learning_rate": 1.546880077858825e-05, "loss": 0.8096, "step": 4936 }, { "epoch": 0.34, "learning_rate": 1.5466952703431174e-05, "loss": 0.8467, "step": 4937 }, { "epoch": 0.34, "learning_rate": 1.5465104361924425e-05, "loss": 0.7793, "step": 4938 }, { "epoch": 0.34, "learning_rate": 1.546325575415806e-05, "loss": 0.8555, "step": 4939 }, { "epoch": 0.34, "learning_rate": 1.546140688022214e-05, "loss": 0.8154, "step": 4940 }, { "epoch": 0.34, "learning_rate": 1.5459557740206744e-05, "loss": 0.8418, "step": 4941 }, { "epoch": 0.34, "learning_rate": 1.545770833420196e-05, "loss": 0.7725, "step": 4942 }, { "epoch": 0.34, "learning_rate": 1.5455858662297895e-05, "loss": 0.8291, "step": 4943 }, { "epoch": 0.34, "learning_rate": 1.5454008724584658e-05, "loss": 0.8574, "step": 4944 }, { "epoch": 0.34, "learning_rate": 1.5452158521152382e-05, "loss": 0.9023, "step": 4945 }, { "epoch": 0.34, "learning_rate": 1.5450308052091214e-05, "loss": 0.8926, "step": 4946 }, { "epoch": 0.34, "learning_rate": 1.5448457317491298e-05, "loss": 0.8242, "step": 4947 }, { "epoch": 0.34, "learning_rate": 1.544660631744281e-05, "loss": 0.8633, "step": 4948 }, { "epoch": 0.34, "learning_rate": 1.5444755052035926e-05, "loss": 0.7939, "step": 4949 }, { "epoch": 0.34, "learning_rate": 1.544290352136084e-05, "loss": 0.9336, "step": 4950 }, { "epoch": 0.34, "learning_rate": 1.5441051725507764e-05, "loss": 0.8096, "step": 4951 }, { "epoch": 0.34, "learning_rate": 1.5439199664566916e-05, "loss": 0.8486, "step": 4952 }, { "epoch": 0.34, "learning_rate": 1.5437347338628516e-05, "loss": 0.8789, "step": 4953 }, { "epoch": 0.34, "learning_rate": 1.5435494747782826e-05, "loss": 0.7598, "step": 4954 }, { "epoch": 0.34, "learning_rate": 1.5433641892120097e-05, "loss": 0.7461, "step": 4955 }, { "epoch": 0.34, "learning_rate": 1.5431788771730597e-05, "loss": 0.833, "step": 4956 }, { "epoch": 0.34, "learning_rate": 1.5429935386704613e-05, "loss": 0.7588, "step": 4957 }, { "epoch": 0.34, "learning_rate": 1.5428081737132442e-05, "loss": 0.8477, "step": 4958 }, { "epoch": 0.34, "learning_rate": 1.5426227823104394e-05, "loss": 0.8574, "step": 4959 }, { "epoch": 0.34, "learning_rate": 1.5424373644710793e-05, "loss": 0.8232, "step": 4960 }, { "epoch": 0.34, "learning_rate": 1.542251920204197e-05, "loss": 0.8936, "step": 4961 }, { "epoch": 0.34, "learning_rate": 1.542066449518828e-05, "loss": 0.8242, "step": 4962 }, { "epoch": 0.34, "learning_rate": 1.5418809524240072e-05, "loss": 0.8496, "step": 4963 }, { "epoch": 0.34, "learning_rate": 1.5416954289287734e-05, "loss": 0.8486, "step": 4964 }, { "epoch": 0.34, "learning_rate": 1.5415098790421648e-05, "loss": 0.7822, "step": 4965 }, { "epoch": 0.34, "learning_rate": 1.5413243027732212e-05, "loss": 0.7949, "step": 4966 }, { "epoch": 0.34, "learning_rate": 1.541138700130984e-05, "loss": 0.8193, "step": 4967 }, { "epoch": 0.34, "learning_rate": 1.5409530711244954e-05, "loss": 0.9111, "step": 4968 }, { "epoch": 0.34, "learning_rate": 1.5407674157627997e-05, "loss": 0.8115, "step": 4969 }, { "epoch": 0.34, "learning_rate": 1.5405817340549424e-05, "loss": 0.7471, "step": 4970 }, { "epoch": 0.34, "learning_rate": 1.5403960260099685e-05, "loss": 0.8613, "step": 4971 }, { "epoch": 0.34, "learning_rate": 1.5402102916369274e-05, "loss": 0.9258, "step": 4972 }, { "epoch": 0.34, "learning_rate": 1.5400245309448666e-05, "loss": 0.8057, "step": 4973 }, { "epoch": 0.34, "learning_rate": 1.539838743942837e-05, "loss": 0.8486, "step": 4974 }, { "epoch": 0.34, "learning_rate": 1.5396529306398905e-05, "loss": 0.835, "step": 4975 }, { "epoch": 0.34, "learning_rate": 1.5394670910450793e-05, "loss": 0.8506, "step": 4976 }, { "epoch": 0.34, "learning_rate": 1.539281225167458e-05, "loss": 0.8623, "step": 4977 }, { "epoch": 0.34, "learning_rate": 1.5390953330160812e-05, "loss": 0.8633, "step": 4978 }, { "epoch": 0.34, "learning_rate": 1.5389094146000066e-05, "loss": 0.8594, "step": 4979 }, { "epoch": 0.34, "learning_rate": 1.538723469928291e-05, "loss": 0.8555, "step": 4980 }, { "epoch": 0.34, "learning_rate": 1.538537499009995e-05, "loss": 0.8027, "step": 4981 }, { "epoch": 0.34, "learning_rate": 1.538351501854178e-05, "loss": 0.8496, "step": 4982 }, { "epoch": 0.34, "learning_rate": 1.5381654784699016e-05, "loss": 0.8398, "step": 4983 }, { "epoch": 0.34, "learning_rate": 1.5379794288662298e-05, "loss": 0.8525, "step": 4984 }, { "epoch": 0.34, "learning_rate": 1.5377933530522265e-05, "loss": 0.8145, "step": 4985 }, { "epoch": 0.34, "learning_rate": 1.5376072510369572e-05, "loss": 0.8057, "step": 4986 }, { "epoch": 0.34, "learning_rate": 1.5374211228294888e-05, "loss": 0.7715, "step": 4987 }, { "epoch": 0.34, "learning_rate": 1.5372349684388895e-05, "loss": 0.8838, "step": 4988 }, { "epoch": 0.34, "learning_rate": 1.5370487878742285e-05, "loss": 0.8916, "step": 4989 }, { "epoch": 0.34, "learning_rate": 1.536862581144577e-05, "loss": 0.7998, "step": 4990 }, { "epoch": 0.34, "learning_rate": 1.536676348259007e-05, "loss": 0.8721, "step": 4991 }, { "epoch": 0.34, "learning_rate": 1.5364900892265912e-05, "loss": 0.8301, "step": 4992 }, { "epoch": 0.34, "learning_rate": 1.536303804056404e-05, "loss": 0.8262, "step": 4993 }, { "epoch": 0.34, "learning_rate": 1.5361174927575223e-05, "loss": 0.9287, "step": 4994 }, { "epoch": 0.34, "learning_rate": 1.5359311553390223e-05, "loss": 0.8379, "step": 4995 }, { "epoch": 0.34, "learning_rate": 1.5357447918099823e-05, "loss": 0.8477, "step": 4996 }, { "epoch": 0.34, "learning_rate": 1.5355584021794824e-05, "loss": 0.7734, "step": 4997 }, { "epoch": 0.34, "learning_rate": 1.535371986456603e-05, "loss": 0.8066, "step": 4998 }, { "epoch": 0.34, "learning_rate": 1.5351855446504268e-05, "loss": 0.874, "step": 4999 }, { "epoch": 0.34, "learning_rate": 1.534999076770037e-05, "loss": 0.8066, "step": 5000 }, { "epoch": 0.34, "learning_rate": 1.5348125828245182e-05, "loss": 0.7842, "step": 5001 }, { "epoch": 0.34, "learning_rate": 1.5346260628229564e-05, "loss": 0.7725, "step": 5002 }, { "epoch": 0.34, "learning_rate": 1.5344395167744394e-05, "loss": 0.8584, "step": 5003 }, { "epoch": 0.34, "learning_rate": 1.534252944688054e-05, "loss": 0.7803, "step": 5004 }, { "epoch": 0.34, "learning_rate": 1.5340663465728922e-05, "loss": 0.8008, "step": 5005 }, { "epoch": 0.34, "learning_rate": 1.533879722438044e-05, "loss": 0.7529, "step": 5006 }, { "epoch": 0.34, "learning_rate": 1.5336930722926013e-05, "loss": 0.8545, "step": 5007 }, { "epoch": 0.34, "learning_rate": 1.5335063961456582e-05, "loss": 0.8105, "step": 5008 }, { "epoch": 0.34, "learning_rate": 1.5333196940063098e-05, "loss": 0.8379, "step": 5009 }, { "epoch": 0.34, "learning_rate": 1.5331329658836517e-05, "loss": 0.9092, "step": 5010 }, { "epoch": 0.34, "learning_rate": 1.5329462117867815e-05, "loss": 0.7871, "step": 5011 }, { "epoch": 0.34, "learning_rate": 1.532759431724798e-05, "loss": 0.9512, "step": 5012 }, { "epoch": 0.34, "learning_rate": 1.5325726257068007e-05, "loss": 0.9092, "step": 5013 }, { "epoch": 0.34, "learning_rate": 1.5323857937418915e-05, "loss": 0.7939, "step": 5014 }, { "epoch": 0.34, "learning_rate": 1.5321989358391722e-05, "loss": 0.8916, "step": 5015 }, { "epoch": 0.34, "learning_rate": 1.5320120520077465e-05, "loss": 0.8311, "step": 5016 }, { "epoch": 0.34, "learning_rate": 1.5318251422567195e-05, "loss": 0.8486, "step": 5017 }, { "epoch": 0.34, "learning_rate": 1.531638206595198e-05, "loss": 0.7451, "step": 5018 }, { "epoch": 0.34, "learning_rate": 1.5314512450322884e-05, "loss": 0.8096, "step": 5019 }, { "epoch": 0.34, "learning_rate": 1.5312642575771003e-05, "loss": 0.833, "step": 5020 }, { "epoch": 0.34, "learning_rate": 1.531077244238744e-05, "loss": 0.8457, "step": 5021 }, { "epoch": 0.34, "learning_rate": 1.530890205026329e-05, "loss": 0.8145, "step": 5022 }, { "epoch": 0.34, "learning_rate": 1.5307031399489702e-05, "loss": 0.8867, "step": 5023 }, { "epoch": 0.34, "learning_rate": 1.53051604901578e-05, "loss": 0.8477, "step": 5024 }, { "epoch": 0.34, "learning_rate": 1.530328932235874e-05, "loss": 0.8359, "step": 5025 }, { "epoch": 0.34, "learning_rate": 1.5301417896183683e-05, "loss": 0.8379, "step": 5026 }, { "epoch": 0.34, "learning_rate": 1.52995462117238e-05, "loss": 0.8828, "step": 5027 }, { "epoch": 0.34, "learning_rate": 1.5297674269070285e-05, "loss": 0.8008, "step": 5028 }, { "epoch": 0.34, "learning_rate": 1.529580206831434e-05, "loss": 0.833, "step": 5029 }, { "epoch": 0.34, "learning_rate": 1.5293929609547174e-05, "loss": 0.7715, "step": 5030 }, { "epoch": 0.34, "learning_rate": 1.5292056892860017e-05, "loss": 0.7529, "step": 5031 }, { "epoch": 0.34, "learning_rate": 1.5290183918344107e-05, "loss": 0.8213, "step": 5032 }, { "epoch": 0.34, "learning_rate": 1.5288310686090695e-05, "loss": 0.8135, "step": 5033 }, { "epoch": 0.34, "learning_rate": 1.5286437196191043e-05, "loss": 0.8877, "step": 5034 }, { "epoch": 0.34, "learning_rate": 1.5284563448736427e-05, "loss": 0.873, "step": 5035 }, { "epoch": 0.34, "learning_rate": 1.528268944381814e-05, "loss": 0.8086, "step": 5036 }, { "epoch": 0.34, "learning_rate": 1.5280815181527477e-05, "loss": 0.8086, "step": 5037 }, { "epoch": 0.34, "learning_rate": 1.527894066195576e-05, "loss": 0.8081, "step": 5038 }, { "epoch": 0.34, "learning_rate": 1.5277065885194313e-05, "loss": 0.8828, "step": 5039 }, { "epoch": 0.34, "learning_rate": 1.527519085133447e-05, "loss": 0.8418, "step": 5040 }, { "epoch": 0.34, "learning_rate": 1.527331556046759e-05, "loss": 0.8486, "step": 5041 }, { "epoch": 0.34, "learning_rate": 1.5271440012685027e-05, "loss": 0.8887, "step": 5042 }, { "epoch": 0.34, "learning_rate": 1.5269564208078165e-05, "loss": 0.8291, "step": 5043 }, { "epoch": 0.34, "learning_rate": 1.5267688146738392e-05, "loss": 0.9053, "step": 5044 }, { "epoch": 0.34, "learning_rate": 1.5265811828757113e-05, "loss": 0.7607, "step": 5045 }, { "epoch": 0.34, "learning_rate": 1.5263935254225735e-05, "loss": 0.8037, "step": 5046 }, { "epoch": 0.34, "learning_rate": 1.526205842323569e-05, "loss": 0.8643, "step": 5047 }, { "epoch": 0.34, "learning_rate": 1.526018133587841e-05, "loss": 0.7949, "step": 5048 }, { "epoch": 0.34, "learning_rate": 1.525830399224536e-05, "loss": 0.8516, "step": 5049 }, { "epoch": 0.34, "learning_rate": 1.5256426392427992e-05, "loss": 0.9141, "step": 5050 }, { "epoch": 0.34, "learning_rate": 1.5254548536517786e-05, "loss": 0.916, "step": 5051 }, { "epoch": 0.34, "learning_rate": 1.5252670424606236e-05, "loss": 0.8535, "step": 5052 }, { "epoch": 0.34, "learning_rate": 1.525079205678483e-05, "loss": 0.8223, "step": 5053 }, { "epoch": 0.34, "learning_rate": 1.5248913433145098e-05, "loss": 0.874, "step": 5054 }, { "epoch": 0.34, "learning_rate": 1.5247034553778556e-05, "loss": 0.8115, "step": 5055 }, { "epoch": 0.34, "learning_rate": 1.5245155418776751e-05, "loss": 0.917, "step": 5056 }, { "epoch": 0.34, "learning_rate": 1.5243276028231227e-05, "loss": 0.917, "step": 5057 }, { "epoch": 0.34, "learning_rate": 1.5241396382233552e-05, "loss": 0.7852, "step": 5058 }, { "epoch": 0.34, "learning_rate": 1.5239516480875298e-05, "loss": 0.8281, "step": 5059 }, { "epoch": 0.34, "learning_rate": 1.5237636324248057e-05, "loss": 0.7832, "step": 5060 }, { "epoch": 0.34, "learning_rate": 1.5235755912443431e-05, "loss": 0.9004, "step": 5061 }, { "epoch": 0.34, "learning_rate": 1.5233875245553034e-05, "loss": 0.9229, "step": 5062 }, { "epoch": 0.35, "learning_rate": 1.5231994323668487e-05, "loss": 0.8457, "step": 5063 }, { "epoch": 0.35, "learning_rate": 1.5230113146881436e-05, "loss": 0.7803, "step": 5064 }, { "epoch": 0.35, "learning_rate": 1.5228231715283524e-05, "loss": 0.8359, "step": 5065 }, { "epoch": 0.35, "learning_rate": 1.5226350028966415e-05, "loss": 0.8613, "step": 5066 }, { "epoch": 0.35, "learning_rate": 1.5224468088021792e-05, "loss": 0.8271, "step": 5067 }, { "epoch": 0.35, "learning_rate": 1.522258589254134e-05, "loss": 0.8311, "step": 5068 }, { "epoch": 0.35, "learning_rate": 1.5220703442616753e-05, "loss": 0.8242, "step": 5069 }, { "epoch": 0.35, "learning_rate": 1.5218820738339752e-05, "loss": 0.7861, "step": 5070 }, { "epoch": 0.35, "learning_rate": 1.521693777980206e-05, "loss": 0.7334, "step": 5071 }, { "epoch": 0.35, "learning_rate": 1.5215054567095411e-05, "loss": 0.8936, "step": 5072 }, { "epoch": 0.35, "learning_rate": 1.5213171100311562e-05, "loss": 0.8643, "step": 5073 }, { "epoch": 0.35, "learning_rate": 1.5211287379542266e-05, "loss": 0.7803, "step": 5074 }, { "epoch": 0.35, "learning_rate": 1.5209403404879305e-05, "loss": 0.7969, "step": 5075 }, { "epoch": 0.35, "learning_rate": 1.5207519176414462e-05, "loss": 0.8096, "step": 5076 }, { "epoch": 0.35, "learning_rate": 1.5205634694239544e-05, "loss": 0.9004, "step": 5077 }, { "epoch": 0.35, "learning_rate": 1.5203749958446352e-05, "loss": 0.8857, "step": 5078 }, { "epoch": 0.35, "learning_rate": 1.5201864969126718e-05, "loss": 0.835, "step": 5079 }, { "epoch": 0.35, "learning_rate": 1.519997972637248e-05, "loss": 0.8838, "step": 5080 }, { "epoch": 0.35, "learning_rate": 1.5198094230275478e-05, "loss": 0.9092, "step": 5081 }, { "epoch": 0.35, "learning_rate": 1.5196208480927581e-05, "loss": 0.8984, "step": 5082 }, { "epoch": 0.35, "learning_rate": 1.5194322478420663e-05, "loss": 0.9258, "step": 5083 }, { "epoch": 0.35, "learning_rate": 1.51924362228466e-05, "loss": 0.7979, "step": 5084 }, { "epoch": 0.35, "learning_rate": 1.5190549714297303e-05, "loss": 0.8379, "step": 5085 }, { "epoch": 0.35, "learning_rate": 1.5188662952864674e-05, "loss": 0.8477, "step": 5086 }, { "epoch": 0.35, "learning_rate": 1.5186775938640641e-05, "loss": 0.8369, "step": 5087 }, { "epoch": 0.35, "learning_rate": 1.5184888671717137e-05, "loss": 0.8408, "step": 5088 }, { "epoch": 0.35, "learning_rate": 1.5183001152186113e-05, "loss": 0.8184, "step": 5089 }, { "epoch": 0.35, "learning_rate": 1.5181113380139518e-05, "loss": 0.8506, "step": 5090 }, { "epoch": 0.35, "learning_rate": 1.5179225355669338e-05, "loss": 0.8096, "step": 5091 }, { "epoch": 0.35, "learning_rate": 1.5177337078867548e-05, "loss": 0.8799, "step": 5092 }, { "epoch": 0.35, "learning_rate": 1.517544854982615e-05, "loss": 0.8311, "step": 5093 }, { "epoch": 0.35, "learning_rate": 1.5173559768637149e-05, "loss": 0.8379, "step": 5094 }, { "epoch": 0.35, "learning_rate": 1.5171670735392572e-05, "loss": 0.8594, "step": 5095 }, { "epoch": 0.35, "learning_rate": 1.5169781450184445e-05, "loss": 0.8379, "step": 5096 }, { "epoch": 0.35, "learning_rate": 1.516789191310482e-05, "loss": 0.8379, "step": 5097 }, { "epoch": 0.35, "learning_rate": 1.5166002124245753e-05, "loss": 0.8564, "step": 5098 }, { "epoch": 0.35, "learning_rate": 1.5164112083699314e-05, "loss": 0.8604, "step": 5099 }, { "epoch": 0.35, "learning_rate": 1.5162221791557586e-05, "loss": 0.833, "step": 5100 }, { "epoch": 0.35, "learning_rate": 1.5160331247912665e-05, "loss": 0.7959, "step": 5101 }, { "epoch": 0.35, "learning_rate": 1.5158440452856653e-05, "loss": 0.7139, "step": 5102 }, { "epoch": 0.35, "learning_rate": 1.515654940648168e-05, "loss": 0.8643, "step": 5103 }, { "epoch": 0.35, "learning_rate": 1.5154658108879866e-05, "loss": 0.7246, "step": 5104 }, { "epoch": 0.35, "learning_rate": 1.5152766560143364e-05, "loss": 0.8203, "step": 5105 }, { "epoch": 0.35, "learning_rate": 1.5150874760364324e-05, "loss": 0.8262, "step": 5106 }, { "epoch": 0.35, "learning_rate": 1.5148982709634919e-05, "loss": 0.873, "step": 5107 }, { "epoch": 0.35, "learning_rate": 1.5147090408047325e-05, "loss": 0.874, "step": 5108 }, { "epoch": 0.35, "learning_rate": 1.5145197855693741e-05, "loss": 0.7754, "step": 5109 }, { "epoch": 0.35, "learning_rate": 1.5143305052666366e-05, "loss": 0.876, "step": 5110 }, { "epoch": 0.35, "learning_rate": 1.5141411999057418e-05, "loss": 0.751, "step": 5111 }, { "epoch": 0.35, "learning_rate": 1.5139518694959133e-05, "loss": 0.8896, "step": 5112 }, { "epoch": 0.35, "learning_rate": 1.5137625140463744e-05, "loss": 0.8467, "step": 5113 }, { "epoch": 0.35, "learning_rate": 1.513573133566351e-05, "loss": 0.8965, "step": 5114 }, { "epoch": 0.35, "learning_rate": 1.5133837280650694e-05, "loss": 0.7979, "step": 5115 }, { "epoch": 0.35, "learning_rate": 1.5131942975517579e-05, "loss": 0.875, "step": 5116 }, { "epoch": 0.35, "learning_rate": 1.5130048420356448e-05, "loss": 0.8398, "step": 5117 }, { "epoch": 0.35, "learning_rate": 1.5128153615259612e-05, "loss": 0.9033, "step": 5118 }, { "epoch": 0.35, "learning_rate": 1.5126258560319382e-05, "loss": 0.835, "step": 5119 }, { "epoch": 0.35, "learning_rate": 1.512436325562808e-05, "loss": 0.7715, "step": 5120 }, { "epoch": 0.35, "learning_rate": 1.5122467701278058e-05, "loss": 0.8369, "step": 5121 }, { "epoch": 0.35, "learning_rate": 1.5120571897361656e-05, "loss": 0.7988, "step": 5122 }, { "epoch": 0.35, "learning_rate": 1.5118675843971238e-05, "loss": 0.8174, "step": 5123 }, { "epoch": 0.35, "learning_rate": 1.5116779541199184e-05, "loss": 0.8906, "step": 5124 }, { "epoch": 0.35, "learning_rate": 1.5114882989137882e-05, "loss": 0.7881, "step": 5125 }, { "epoch": 0.35, "learning_rate": 1.511298618787973e-05, "loss": 0.8926, "step": 5126 }, { "epoch": 0.35, "learning_rate": 1.511108913751714e-05, "loss": 0.8652, "step": 5127 }, { "epoch": 0.35, "learning_rate": 1.5109191838142537e-05, "loss": 0.875, "step": 5128 }, { "epoch": 0.35, "learning_rate": 1.5107294289848353e-05, "loss": 0.8203, "step": 5129 }, { "epoch": 0.35, "learning_rate": 1.5105396492727043e-05, "loss": 0.7314, "step": 5130 }, { "epoch": 0.35, "learning_rate": 1.5103498446871067e-05, "loss": 0.8096, "step": 5131 }, { "epoch": 0.35, "learning_rate": 1.5101600152372892e-05, "loss": 0.8701, "step": 5132 }, { "epoch": 0.35, "learning_rate": 1.5099701609325009e-05, "loss": 0.8506, "step": 5133 }, { "epoch": 0.35, "learning_rate": 1.5097802817819911e-05, "loss": 0.8105, "step": 5134 }, { "epoch": 0.35, "learning_rate": 1.5095903777950108e-05, "loss": 0.9248, "step": 5135 }, { "epoch": 0.35, "learning_rate": 1.509400448980812e-05, "loss": 0.9004, "step": 5136 }, { "epoch": 0.35, "learning_rate": 1.5092104953486486e-05, "loss": 0.7695, "step": 5137 }, { "epoch": 0.35, "learning_rate": 1.5090205169077743e-05, "loss": 0.8213, "step": 5138 }, { "epoch": 0.35, "learning_rate": 1.5088305136674454e-05, "loss": 0.8154, "step": 5139 }, { "epoch": 0.35, "learning_rate": 1.5086404856369186e-05, "loss": 0.79, "step": 5140 }, { "epoch": 0.35, "learning_rate": 1.5084504328254524e-05, "loss": 0.8105, "step": 5141 }, { "epoch": 0.35, "learning_rate": 1.5082603552423059e-05, "loss": 0.8281, "step": 5142 }, { "epoch": 0.35, "learning_rate": 1.5080702528967393e-05, "loss": 0.7666, "step": 5143 }, { "epoch": 0.35, "learning_rate": 1.5078801257980149e-05, "loss": 0.8125, "step": 5144 }, { "epoch": 0.35, "learning_rate": 1.5076899739553957e-05, "loss": 0.7529, "step": 5145 }, { "epoch": 0.35, "learning_rate": 1.5074997973781455e-05, "loss": 0.7852, "step": 5146 }, { "epoch": 0.35, "learning_rate": 1.5073095960755302e-05, "loss": 0.8789, "step": 5147 }, { "epoch": 0.35, "learning_rate": 1.5071193700568159e-05, "loss": 0.7354, "step": 5148 }, { "epoch": 0.35, "learning_rate": 1.5069291193312707e-05, "loss": 0.8135, "step": 5149 }, { "epoch": 0.35, "learning_rate": 1.5067388439081634e-05, "loss": 0.7744, "step": 5150 }, { "epoch": 0.35, "learning_rate": 1.5065485437967646e-05, "loss": 0.8877, "step": 5151 }, { "epoch": 0.35, "learning_rate": 1.5063582190063453e-05, "loss": 0.875, "step": 5152 }, { "epoch": 0.35, "learning_rate": 1.5061678695461783e-05, "loss": 0.7354, "step": 5153 }, { "epoch": 0.35, "learning_rate": 1.5059774954255373e-05, "loss": 0.8506, "step": 5154 }, { "epoch": 0.35, "learning_rate": 1.5057870966536977e-05, "loss": 0.8398, "step": 5155 }, { "epoch": 0.35, "learning_rate": 1.5055966732399347e-05, "loss": 0.8467, "step": 5156 }, { "epoch": 0.35, "learning_rate": 1.5054062251935273e-05, "loss": 0.8643, "step": 5157 }, { "epoch": 0.35, "learning_rate": 1.5052157525237525e-05, "loss": 0.8027, "step": 5158 }, { "epoch": 0.35, "learning_rate": 1.5050252552398914e-05, "loss": 0.8887, "step": 5159 }, { "epoch": 0.35, "learning_rate": 1.5048347333512245e-05, "loss": 0.7666, "step": 5160 }, { "epoch": 0.35, "learning_rate": 1.5046441868670339e-05, "loss": 0.8311, "step": 5161 }, { "epoch": 0.35, "learning_rate": 1.5044536157966027e-05, "loss": 0.873, "step": 5162 }, { "epoch": 0.35, "learning_rate": 1.5042630201492165e-05, "loss": 0.8115, "step": 5163 }, { "epoch": 0.35, "learning_rate": 1.5040723999341603e-05, "loss": 0.8174, "step": 5164 }, { "epoch": 0.35, "learning_rate": 1.5038817551607214e-05, "loss": 0.8574, "step": 5165 }, { "epoch": 0.35, "learning_rate": 1.5036910858381878e-05, "loss": 0.8408, "step": 5166 }, { "epoch": 0.35, "learning_rate": 1.5035003919758492e-05, "loss": 0.8613, "step": 5167 }, { "epoch": 0.35, "learning_rate": 1.5033096735829963e-05, "loss": 0.8838, "step": 5168 }, { "epoch": 0.35, "learning_rate": 1.5031189306689205e-05, "loss": 0.9307, "step": 5169 }, { "epoch": 0.35, "learning_rate": 1.5029281632429147e-05, "loss": 0.9092, "step": 5170 }, { "epoch": 0.35, "learning_rate": 1.5027373713142735e-05, "loss": 0.8418, "step": 5171 }, { "epoch": 0.35, "learning_rate": 1.502546554892292e-05, "loss": 0.7969, "step": 5172 }, { "epoch": 0.35, "learning_rate": 1.502355713986267e-05, "loss": 0.7832, "step": 5173 }, { "epoch": 0.35, "learning_rate": 1.5021648486054959e-05, "loss": 0.9053, "step": 5174 }, { "epoch": 0.35, "learning_rate": 1.5019739587592783e-05, "loss": 0.8184, "step": 5175 }, { "epoch": 0.35, "learning_rate": 1.5017830444569134e-05, "loss": 0.9014, "step": 5176 }, { "epoch": 0.35, "learning_rate": 1.5015921057077033e-05, "loss": 0.8105, "step": 5177 }, { "epoch": 0.35, "learning_rate": 1.5014011425209503e-05, "loss": 0.8848, "step": 5178 }, { "epoch": 0.35, "learning_rate": 1.501210154905958e-05, "loss": 0.7793, "step": 5179 }, { "epoch": 0.35, "learning_rate": 1.5010191428720313e-05, "loss": 0.8574, "step": 5180 }, { "epoch": 0.35, "learning_rate": 1.5008281064284767e-05, "loss": 0.877, "step": 5181 }, { "epoch": 0.35, "learning_rate": 1.5006370455846007e-05, "loss": 0.8301, "step": 5182 }, { "epoch": 0.35, "learning_rate": 1.5004459603497126e-05, "loss": 0.8096, "step": 5183 }, { "epoch": 0.35, "learning_rate": 1.5002548507331216e-05, "loss": 0.8721, "step": 5184 }, { "epoch": 0.35, "learning_rate": 1.5000637167441388e-05, "loss": 0.7803, "step": 5185 }, { "epoch": 0.35, "learning_rate": 1.499872558392076e-05, "loss": 0.9385, "step": 5186 }, { "epoch": 0.35, "learning_rate": 1.4996813756862466e-05, "loss": 0.877, "step": 5187 }, { "epoch": 0.35, "learning_rate": 1.4994901686359646e-05, "loss": 0.8369, "step": 5188 }, { "epoch": 0.35, "learning_rate": 1.4992989372505466e-05, "loss": 0.8584, "step": 5189 }, { "epoch": 0.35, "learning_rate": 1.4991076815393082e-05, "loss": 0.7793, "step": 5190 }, { "epoch": 0.35, "learning_rate": 1.4989164015115681e-05, "loss": 0.8945, "step": 5191 }, { "epoch": 0.35, "learning_rate": 1.4987250971766451e-05, "loss": 0.9053, "step": 5192 }, { "epoch": 0.35, "learning_rate": 1.4985337685438598e-05, "loss": 0.918, "step": 5193 }, { "epoch": 0.35, "learning_rate": 1.4983424156225337e-05, "loss": 0.8018, "step": 5194 }, { "epoch": 0.35, "learning_rate": 1.4981510384219892e-05, "loss": 0.7451, "step": 5195 }, { "epoch": 0.35, "learning_rate": 1.4979596369515508e-05, "loss": 0.8105, "step": 5196 }, { "epoch": 0.35, "learning_rate": 1.4977682112205428e-05, "loss": 0.7217, "step": 5197 }, { "epoch": 0.35, "learning_rate": 1.497576761238292e-05, "loss": 0.833, "step": 5198 }, { "epoch": 0.35, "learning_rate": 1.4973852870141254e-05, "loss": 0.7998, "step": 5199 }, { "epoch": 0.35, "learning_rate": 1.497193788557372e-05, "loss": 0.8164, "step": 5200 }, { "epoch": 0.35, "learning_rate": 1.4970022658773616e-05, "loss": 0.876, "step": 5201 }, { "epoch": 0.35, "learning_rate": 1.4968107189834248e-05, "loss": 0.8125, "step": 5202 }, { "epoch": 0.35, "learning_rate": 1.4966191478848941e-05, "loss": 0.7988, "step": 5203 }, { "epoch": 0.35, "learning_rate": 1.4964275525911029e-05, "loss": 0.7705, "step": 5204 }, { "epoch": 0.35, "learning_rate": 1.4962359331113853e-05, "loss": 0.7598, "step": 5205 }, { "epoch": 0.35, "learning_rate": 1.4960442894550775e-05, "loss": 0.7832, "step": 5206 }, { "epoch": 0.35, "learning_rate": 1.4958526216315161e-05, "loss": 0.8584, "step": 5207 }, { "epoch": 0.35, "learning_rate": 1.4956609296500388e-05, "loss": 0.8975, "step": 5208 }, { "epoch": 0.35, "learning_rate": 1.4954692135199856e-05, "loss": 0.8418, "step": 5209 }, { "epoch": 0.36, "learning_rate": 1.4952774732506963e-05, "loss": 0.7539, "step": 5210 }, { "epoch": 0.36, "learning_rate": 1.4950857088515128e-05, "loss": 0.8076, "step": 5211 }, { "epoch": 0.36, "learning_rate": 1.4948939203317774e-05, "loss": 0.8447, "step": 5212 }, { "epoch": 0.36, "learning_rate": 1.4947021077008343e-05, "loss": 0.8525, "step": 5213 }, { "epoch": 0.36, "learning_rate": 1.4945102709680291e-05, "loss": 0.8408, "step": 5214 }, { "epoch": 0.36, "learning_rate": 1.4943184101427073e-05, "loss": 0.9297, "step": 5215 }, { "epoch": 0.36, "learning_rate": 1.4941265252342167e-05, "loss": 0.7949, "step": 5216 }, { "epoch": 0.36, "learning_rate": 1.493934616251906e-05, "loss": 0.8301, "step": 5217 }, { "epoch": 0.36, "learning_rate": 1.4937426832051245e-05, "loss": 0.8398, "step": 5218 }, { "epoch": 0.36, "learning_rate": 1.4935507261032241e-05, "loss": 0.8301, "step": 5219 }, { "epoch": 0.36, "learning_rate": 1.4933587449555562e-05, "loss": 0.8223, "step": 5220 }, { "epoch": 0.36, "learning_rate": 1.493166739771474e-05, "loss": 0.8047, "step": 5221 }, { "epoch": 0.36, "learning_rate": 1.4929747105603327e-05, "loss": 0.8154, "step": 5222 }, { "epoch": 0.36, "learning_rate": 1.4927826573314871e-05, "loss": 0.877, "step": 5223 }, { "epoch": 0.36, "learning_rate": 1.4925905800942948e-05, "loss": 0.835, "step": 5224 }, { "epoch": 0.36, "learning_rate": 1.4923984788581134e-05, "loss": 0.8555, "step": 5225 }, { "epoch": 0.36, "learning_rate": 1.4922063536323022e-05, "loss": 0.8574, "step": 5226 }, { "epoch": 0.36, "learning_rate": 1.4920142044262213e-05, "loss": 0.8242, "step": 5227 }, { "epoch": 0.36, "learning_rate": 1.4918220312492325e-05, "loss": 0.8389, "step": 5228 }, { "epoch": 0.36, "learning_rate": 1.4916298341106982e-05, "loss": 0.7412, "step": 5229 }, { "epoch": 0.36, "learning_rate": 1.4914376130199823e-05, "loss": 0.8252, "step": 5230 }, { "epoch": 0.36, "learning_rate": 1.49124536798645e-05, "loss": 0.8311, "step": 5231 }, { "epoch": 0.36, "learning_rate": 1.4910530990194674e-05, "loss": 0.8613, "step": 5232 }, { "epoch": 0.36, "learning_rate": 1.4908608061284016e-05, "loss": 0.8906, "step": 5233 }, { "epoch": 0.36, "learning_rate": 1.4906684893226213e-05, "loss": 0.8545, "step": 5234 }, { "epoch": 0.36, "learning_rate": 1.4904761486114963e-05, "loss": 0.7783, "step": 5235 }, { "epoch": 0.36, "learning_rate": 1.4902837840043969e-05, "loss": 0.7607, "step": 5236 }, { "epoch": 0.36, "learning_rate": 1.4900913955106957e-05, "loss": 0.8535, "step": 5237 }, { "epoch": 0.36, "learning_rate": 1.4898989831397657e-05, "loss": 0.8125, "step": 5238 }, { "epoch": 0.36, "learning_rate": 1.4897065469009808e-05, "loss": 0.8232, "step": 5239 }, { "epoch": 0.36, "learning_rate": 1.489514086803717e-05, "loss": 0.8428, "step": 5240 }, { "epoch": 0.36, "learning_rate": 1.4893216028573507e-05, "loss": 0.8271, "step": 5241 }, { "epoch": 0.36, "learning_rate": 1.48912909507126e-05, "loss": 0.8447, "step": 5242 }, { "epoch": 0.36, "learning_rate": 1.4889365634548237e-05, "loss": 0.8203, "step": 5243 }, { "epoch": 0.36, "learning_rate": 1.4887440080174217e-05, "loss": 0.9219, "step": 5244 }, { "epoch": 0.36, "learning_rate": 1.488551428768435e-05, "loss": 0.8506, "step": 5245 }, { "epoch": 0.36, "learning_rate": 1.488358825717247e-05, "loss": 0.8125, "step": 5246 }, { "epoch": 0.36, "learning_rate": 1.488166198873241e-05, "loss": 0.8633, "step": 5247 }, { "epoch": 0.36, "learning_rate": 1.4879735482458012e-05, "loss": 0.7861, "step": 5248 }, { "epoch": 0.36, "learning_rate": 1.487780873844314e-05, "loss": 0.8818, "step": 5249 }, { "epoch": 0.36, "learning_rate": 1.4875881756781667e-05, "loss": 0.832, "step": 5250 }, { "epoch": 0.36, "learning_rate": 1.487395453756747e-05, "loss": 0.7246, "step": 5251 }, { "epoch": 0.36, "learning_rate": 1.4872027080894445e-05, "loss": 0.8086, "step": 5252 }, { "epoch": 0.36, "learning_rate": 1.4870099386856502e-05, "loss": 0.917, "step": 5253 }, { "epoch": 0.36, "learning_rate": 1.4868171455547548e-05, "loss": 0.8193, "step": 5254 }, { "epoch": 0.36, "learning_rate": 1.4866243287061523e-05, "loss": 0.8965, "step": 5255 }, { "epoch": 0.36, "learning_rate": 1.4864314881492363e-05, "loss": 0.8594, "step": 5256 }, { "epoch": 0.36, "learning_rate": 1.4862386238934017e-05, "loss": 0.8652, "step": 5257 }, { "epoch": 0.36, "learning_rate": 1.4860457359480451e-05, "loss": 0.8262, "step": 5258 }, { "epoch": 0.36, "learning_rate": 1.4858528243225641e-05, "loss": 0.8545, "step": 5259 }, { "epoch": 0.36, "learning_rate": 1.4856598890263566e-05, "loss": 0.8047, "step": 5260 }, { "epoch": 0.36, "learning_rate": 1.4854669300688238e-05, "loss": 0.8027, "step": 5261 }, { "epoch": 0.36, "learning_rate": 1.4852739474593654e-05, "loss": 0.8203, "step": 5262 }, { "epoch": 0.36, "learning_rate": 1.4850809412073841e-05, "loss": 0.7959, "step": 5263 }, { "epoch": 0.36, "learning_rate": 1.484887911322283e-05, "loss": 0.7646, "step": 5264 }, { "epoch": 0.36, "learning_rate": 1.4846948578134664e-05, "loss": 0.8506, "step": 5265 }, { "epoch": 0.36, "learning_rate": 1.4845017806903399e-05, "loss": 0.8779, "step": 5266 }, { "epoch": 0.36, "learning_rate": 1.4843086799623104e-05, "loss": 0.8867, "step": 5267 }, { "epoch": 0.36, "learning_rate": 1.4841155556387857e-05, "loss": 0.8398, "step": 5268 }, { "epoch": 0.36, "learning_rate": 1.4839224077291745e-05, "loss": 0.8154, "step": 5269 }, { "epoch": 0.36, "learning_rate": 1.4837292362428872e-05, "loss": 0.7861, "step": 5270 }, { "epoch": 0.36, "learning_rate": 1.4835360411893353e-05, "loss": 0.8174, "step": 5271 }, { "epoch": 0.36, "learning_rate": 1.4833428225779308e-05, "loss": 0.8389, "step": 5272 }, { "epoch": 0.36, "learning_rate": 1.483149580418088e-05, "loss": 0.8535, "step": 5273 }, { "epoch": 0.36, "learning_rate": 1.482956314719221e-05, "loss": 0.8623, "step": 5274 }, { "epoch": 0.36, "learning_rate": 1.4827630254907454e-05, "loss": 0.8408, "step": 5275 }, { "epoch": 0.36, "learning_rate": 1.4825697127420795e-05, "loss": 0.7334, "step": 5276 }, { "epoch": 0.36, "learning_rate": 1.4823763764826401e-05, "loss": 0.8555, "step": 5277 }, { "epoch": 0.36, "learning_rate": 1.4821830167218476e-05, "loss": 0.8682, "step": 5278 }, { "epoch": 0.36, "learning_rate": 1.4819896334691221e-05, "loss": 0.833, "step": 5279 }, { "epoch": 0.36, "learning_rate": 1.481796226733885e-05, "loss": 0.8271, "step": 5280 }, { "epoch": 0.36, "learning_rate": 1.4816027965255591e-05, "loss": 0.833, "step": 5281 }, { "epoch": 0.36, "learning_rate": 1.4814093428535684e-05, "loss": 0.8545, "step": 5282 }, { "epoch": 0.36, "learning_rate": 1.4812158657273383e-05, "loss": 0.8691, "step": 5283 }, { "epoch": 0.36, "learning_rate": 1.4810223651562944e-05, "loss": 0.8555, "step": 5284 }, { "epoch": 0.36, "learning_rate": 1.4808288411498644e-05, "loss": 0.8164, "step": 5285 }, { "epoch": 0.36, "learning_rate": 1.4806352937174768e-05, "loss": 0.8242, "step": 5286 }, { "epoch": 0.36, "learning_rate": 1.4804417228685613e-05, "loss": 0.8057, "step": 5287 }, { "epoch": 0.36, "learning_rate": 1.480248128612548e-05, "loss": 0.8994, "step": 5288 }, { "epoch": 0.36, "learning_rate": 1.4800545109588696e-05, "loss": 0.833, "step": 5289 }, { "epoch": 0.36, "learning_rate": 1.479860869916959e-05, "loss": 0.8916, "step": 5290 }, { "epoch": 0.36, "learning_rate": 1.47966720549625e-05, "loss": 0.7861, "step": 5291 }, { "epoch": 0.36, "learning_rate": 1.479473517706178e-05, "loss": 0.8389, "step": 5292 }, { "epoch": 0.36, "learning_rate": 1.4792798065561798e-05, "loss": 0.8555, "step": 5293 }, { "epoch": 0.36, "learning_rate": 1.479086072055693e-05, "loss": 0.8506, "step": 5294 }, { "epoch": 0.36, "learning_rate": 1.4788923142141557e-05, "loss": 0.8164, "step": 5295 }, { "epoch": 0.36, "learning_rate": 1.4786985330410083e-05, "loss": 0.8203, "step": 5296 }, { "epoch": 0.36, "learning_rate": 1.4785047285456919e-05, "loss": 0.8662, "step": 5297 }, { "epoch": 0.36, "learning_rate": 1.4783109007376482e-05, "loss": 0.8789, "step": 5298 }, { "epoch": 0.36, "learning_rate": 1.478117049626321e-05, "loss": 0.8867, "step": 5299 }, { "epoch": 0.36, "learning_rate": 1.4779231752211546e-05, "loss": 0.8525, "step": 5300 }, { "epoch": 0.36, "learning_rate": 1.477729277531594e-05, "loss": 0.7988, "step": 5301 }, { "epoch": 0.36, "learning_rate": 1.4775353565670866e-05, "loss": 0.9023, "step": 5302 }, { "epoch": 0.36, "learning_rate": 1.4773414123370798e-05, "loss": 0.7861, "step": 5303 }, { "epoch": 0.36, "learning_rate": 1.4771474448510225e-05, "loss": 0.8809, "step": 5304 }, { "epoch": 0.36, "learning_rate": 1.4769534541183652e-05, "loss": 0.8398, "step": 5305 }, { "epoch": 0.36, "learning_rate": 1.476759440148559e-05, "loss": 0.8164, "step": 5306 }, { "epoch": 0.36, "learning_rate": 1.4765654029510556e-05, "loss": 0.8506, "step": 5307 }, { "epoch": 0.36, "learning_rate": 1.4763713425353096e-05, "loss": 0.8555, "step": 5308 }, { "epoch": 0.36, "learning_rate": 1.4761772589107747e-05, "loss": 0.8057, "step": 5309 }, { "epoch": 0.36, "learning_rate": 1.475983152086907e-05, "loss": 0.8369, "step": 5310 }, { "epoch": 0.36, "learning_rate": 1.4757890220731632e-05, "loss": 0.8594, "step": 5311 }, { "epoch": 0.36, "learning_rate": 1.4755948688790018e-05, "loss": 0.8857, "step": 5312 }, { "epoch": 0.36, "learning_rate": 1.4754006925138815e-05, "loss": 0.833, "step": 5313 }, { "epoch": 0.36, "learning_rate": 1.4752064929872623e-05, "loss": 0.8994, "step": 5314 }, { "epoch": 0.36, "learning_rate": 1.4750122703086062e-05, "loss": 0.8066, "step": 5315 }, { "epoch": 0.36, "learning_rate": 1.4748180244873753e-05, "loss": 0.8193, "step": 5316 }, { "epoch": 0.36, "learning_rate": 1.4746237555330339e-05, "loss": 0.9229, "step": 5317 }, { "epoch": 0.36, "learning_rate": 1.4744294634550457e-05, "loss": 0.873, "step": 5318 }, { "epoch": 0.36, "learning_rate": 1.4742351482628774e-05, "loss": 0.8936, "step": 5319 }, { "epoch": 0.36, "learning_rate": 1.4740408099659957e-05, "loss": 0.9053, "step": 5320 }, { "epoch": 0.36, "learning_rate": 1.473846448573869e-05, "loss": 0.8662, "step": 5321 }, { "epoch": 0.36, "learning_rate": 1.4736520640959664e-05, "loss": 0.8242, "step": 5322 }, { "epoch": 0.36, "learning_rate": 1.4734576565417585e-05, "loss": 0.8857, "step": 5323 }, { "epoch": 0.36, "learning_rate": 1.4732632259207162e-05, "loss": 0.748, "step": 5324 }, { "epoch": 0.36, "learning_rate": 1.4730687722423129e-05, "loss": 0.8145, "step": 5325 }, { "epoch": 0.36, "learning_rate": 1.4728742955160222e-05, "loss": 0.8262, "step": 5326 }, { "epoch": 0.36, "learning_rate": 1.4726797957513189e-05, "loss": 0.8496, "step": 5327 }, { "epoch": 0.36, "learning_rate": 1.4724852729576786e-05, "loss": 0.876, "step": 5328 }, { "epoch": 0.36, "learning_rate": 1.4722907271445792e-05, "loss": 0.8584, "step": 5329 }, { "epoch": 0.36, "learning_rate": 1.4720961583214985e-05, "loss": 0.8887, "step": 5330 }, { "epoch": 0.36, "learning_rate": 1.4719015664979162e-05, "loss": 0.8877, "step": 5331 }, { "epoch": 0.36, "learning_rate": 1.4717069516833123e-05, "loss": 0.877, "step": 5332 }, { "epoch": 0.36, "learning_rate": 1.4715123138871687e-05, "loss": 0.9062, "step": 5333 }, { "epoch": 0.36, "learning_rate": 1.4713176531189683e-05, "loss": 0.7666, "step": 5334 }, { "epoch": 0.36, "learning_rate": 1.4711229693881948e-05, "loss": 0.7998, "step": 5335 }, { "epoch": 0.36, "learning_rate": 1.4709282627043333e-05, "loss": 0.792, "step": 5336 }, { "epoch": 0.36, "learning_rate": 1.4707335330768695e-05, "loss": 0.8672, "step": 5337 }, { "epoch": 0.36, "learning_rate": 1.4705387805152914e-05, "loss": 0.79, "step": 5338 }, { "epoch": 0.36, "learning_rate": 1.4703440050290865e-05, "loss": 0.7822, "step": 5339 }, { "epoch": 0.36, "learning_rate": 1.4701492066277444e-05, "loss": 0.8623, "step": 5340 }, { "epoch": 0.36, "learning_rate": 1.4699543853207565e-05, "loss": 0.7734, "step": 5341 }, { "epoch": 0.36, "learning_rate": 1.4697595411176135e-05, "loss": 0.8691, "step": 5342 }, { "epoch": 0.36, "learning_rate": 1.4695646740278084e-05, "loss": 0.8164, "step": 5343 }, { "epoch": 0.36, "learning_rate": 1.4693697840608358e-05, "loss": 0.8857, "step": 5344 }, { "epoch": 0.36, "learning_rate": 1.4691748712261897e-05, "loss": 0.8535, "step": 5345 }, { "epoch": 0.36, "learning_rate": 1.4689799355333669e-05, "loss": 0.8809, "step": 5346 }, { "epoch": 0.36, "learning_rate": 1.4687849769918647e-05, "loss": 0.8623, "step": 5347 }, { "epoch": 0.36, "learning_rate": 1.4685899956111814e-05, "loss": 0.8184, "step": 5348 }, { "epoch": 0.36, "learning_rate": 1.4683949914008158e-05, "loss": 0.8662, "step": 5349 }, { "epoch": 0.36, "learning_rate": 1.4681999643702693e-05, "loss": 0.8721, "step": 5350 }, { "epoch": 0.36, "learning_rate": 1.4680049145290437e-05, "loss": 0.8535, "step": 5351 }, { "epoch": 0.36, "learning_rate": 1.467809841886641e-05, "loss": 0.8682, "step": 5352 }, { "epoch": 0.36, "learning_rate": 1.4676147464525659e-05, "loss": 0.8447, "step": 5353 }, { "epoch": 0.36, "learning_rate": 1.4674196282363234e-05, "loss": 0.832, "step": 5354 }, { "epoch": 0.36, "learning_rate": 1.4672244872474189e-05, "loss": 0.8223, "step": 5355 }, { "epoch": 0.36, "learning_rate": 1.4670293234953606e-05, "loss": 0.9082, "step": 5356 }, { "epoch": 0.37, "learning_rate": 1.466834136989656e-05, "loss": 0.8359, "step": 5357 }, { "epoch": 0.37, "learning_rate": 1.4666389277398153e-05, "loss": 0.8633, "step": 5358 }, { "epoch": 0.37, "learning_rate": 1.4664436957553488e-05, "loss": 0.8408, "step": 5359 }, { "epoch": 0.37, "learning_rate": 1.466248441045768e-05, "loss": 0.7939, "step": 5360 }, { "epoch": 0.37, "learning_rate": 1.466053163620586e-05, "loss": 0.8955, "step": 5361 }, { "epoch": 0.37, "learning_rate": 1.4658578634893168e-05, "loss": 0.8643, "step": 5362 }, { "epoch": 0.37, "learning_rate": 1.4656625406614749e-05, "loss": 0.8018, "step": 5363 }, { "epoch": 0.37, "learning_rate": 1.4654671951465767e-05, "loss": 0.8555, "step": 5364 }, { "epoch": 0.37, "learning_rate": 1.4652718269541395e-05, "loss": 0.8633, "step": 5365 }, { "epoch": 0.37, "learning_rate": 1.4650764360936817e-05, "loss": 0.8916, "step": 5366 }, { "epoch": 0.37, "learning_rate": 1.4648810225747228e-05, "loss": 0.8096, "step": 5367 }, { "epoch": 0.37, "learning_rate": 1.4646855864067829e-05, "loss": 0.7998, "step": 5368 }, { "epoch": 0.37, "learning_rate": 1.464490127599384e-05, "loss": 0.7363, "step": 5369 }, { "epoch": 0.37, "learning_rate": 1.4642946461620487e-05, "loss": 0.7627, "step": 5370 }, { "epoch": 0.37, "learning_rate": 1.4640991421043005e-05, "loss": 0.876, "step": 5371 }, { "epoch": 0.37, "learning_rate": 1.4639036154356654e-05, "loss": 0.7979, "step": 5372 }, { "epoch": 0.37, "learning_rate": 1.4637080661656683e-05, "loss": 0.8086, "step": 5373 }, { "epoch": 0.37, "learning_rate": 1.463512494303837e-05, "loss": 0.8506, "step": 5374 }, { "epoch": 0.37, "learning_rate": 1.4633168998596994e-05, "loss": 0.7803, "step": 5375 }, { "epoch": 0.37, "learning_rate": 1.4631212828427853e-05, "loss": 0.7969, "step": 5376 }, { "epoch": 0.37, "learning_rate": 1.4629256432626249e-05, "loss": 0.8125, "step": 5377 }, { "epoch": 0.37, "learning_rate": 1.4627299811287495e-05, "loss": 0.8926, "step": 5378 }, { "epoch": 0.37, "learning_rate": 1.4625342964506919e-05, "loss": 0.833, "step": 5379 }, { "epoch": 0.37, "learning_rate": 1.4623385892379864e-05, "loss": 0.8662, "step": 5380 }, { "epoch": 0.37, "learning_rate": 1.462142859500167e-05, "loss": 0.8594, "step": 5381 }, { "epoch": 0.37, "learning_rate": 1.46194710724677e-05, "loss": 0.876, "step": 5382 }, { "epoch": 0.37, "learning_rate": 1.4617513324873326e-05, "loss": 0.8359, "step": 5383 }, { "epoch": 0.37, "learning_rate": 1.461555535231393e-05, "loss": 0.834, "step": 5384 }, { "epoch": 0.37, "learning_rate": 1.46135971548849e-05, "loss": 0.8447, "step": 5385 }, { "epoch": 0.37, "learning_rate": 1.461163873268164e-05, "loss": 0.8818, "step": 5386 }, { "epoch": 0.37, "learning_rate": 1.4609680085799571e-05, "loss": 0.8574, "step": 5387 }, { "epoch": 0.37, "learning_rate": 1.460772121433411e-05, "loss": 0.7949, "step": 5388 }, { "epoch": 0.37, "learning_rate": 1.4605762118380696e-05, "loss": 0.8008, "step": 5389 }, { "epoch": 0.37, "learning_rate": 1.4603802798034776e-05, "loss": 0.873, "step": 5390 }, { "epoch": 0.37, "learning_rate": 1.4601843253391806e-05, "loss": 0.8789, "step": 5391 }, { "epoch": 0.37, "learning_rate": 1.459988348454726e-05, "loss": 0.8115, "step": 5392 }, { "epoch": 0.37, "learning_rate": 1.4597923491596616e-05, "loss": 0.8477, "step": 5393 }, { "epoch": 0.37, "learning_rate": 1.4595963274635359e-05, "loss": 0.7832, "step": 5394 }, { "epoch": 0.37, "learning_rate": 1.4594002833759e-05, "loss": 0.833, "step": 5395 }, { "epoch": 0.37, "learning_rate": 1.4592042169063045e-05, "loss": 0.8838, "step": 5396 }, { "epoch": 0.37, "learning_rate": 1.4590081280643018e-05, "loss": 0.8027, "step": 5397 }, { "epoch": 0.37, "learning_rate": 1.458812016859446e-05, "loss": 0.8662, "step": 5398 }, { "epoch": 0.37, "learning_rate": 1.4586158833012907e-05, "loss": 0.79, "step": 5399 }, { "epoch": 0.37, "learning_rate": 1.458419727399392e-05, "loss": 0.9033, "step": 5400 }, { "epoch": 0.37, "learning_rate": 1.4582235491633064e-05, "loss": 0.834, "step": 5401 }, { "epoch": 0.37, "learning_rate": 1.4580273486025922e-05, "loss": 0.9131, "step": 5402 }, { "epoch": 0.37, "learning_rate": 1.4578311257268076e-05, "loss": 0.8125, "step": 5403 }, { "epoch": 0.37, "learning_rate": 1.457634880545513e-05, "loss": 0.8379, "step": 5404 }, { "epoch": 0.37, "learning_rate": 1.4574386130682692e-05, "loss": 0.9121, "step": 5405 }, { "epoch": 0.37, "learning_rate": 1.4572423233046386e-05, "loss": 0.8428, "step": 5406 }, { "epoch": 0.37, "learning_rate": 1.4570460112641844e-05, "loss": 0.8594, "step": 5407 }, { "epoch": 0.37, "learning_rate": 1.4568496769564707e-05, "loss": 0.8301, "step": 5408 }, { "epoch": 0.37, "learning_rate": 1.456653320391063e-05, "loss": 0.8564, "step": 5409 }, { "epoch": 0.37, "learning_rate": 1.4564569415775278e-05, "loss": 0.8066, "step": 5410 }, { "epoch": 0.37, "learning_rate": 1.4562605405254329e-05, "loss": 0.79, "step": 5411 }, { "epoch": 0.37, "learning_rate": 1.4560641172443463e-05, "loss": 0.8789, "step": 5412 }, { "epoch": 0.37, "learning_rate": 1.4558676717438385e-05, "loss": 0.8291, "step": 5413 }, { "epoch": 0.37, "learning_rate": 1.4556712040334798e-05, "loss": 0.9043, "step": 5414 }, { "epoch": 0.37, "learning_rate": 1.4554747141228422e-05, "loss": 0.8711, "step": 5415 }, { "epoch": 0.37, "learning_rate": 1.455278202021499e-05, "loss": 0.8584, "step": 5416 }, { "epoch": 0.37, "learning_rate": 1.4550816677390236e-05, "loss": 0.874, "step": 5417 }, { "epoch": 0.37, "learning_rate": 1.454885111284992e-05, "loss": 0.7256, "step": 5418 }, { "epoch": 0.37, "learning_rate": 1.4546885326689796e-05, "loss": 0.7949, "step": 5419 }, { "epoch": 0.37, "learning_rate": 1.4544919319005641e-05, "loss": 0.8799, "step": 5420 }, { "epoch": 0.37, "learning_rate": 1.4542953089893241e-05, "loss": 0.8711, "step": 5421 }, { "epoch": 0.37, "learning_rate": 1.4540986639448386e-05, "loss": 0.8408, "step": 5422 }, { "epoch": 0.37, "learning_rate": 1.4539019967766883e-05, "loss": 0.8008, "step": 5423 }, { "epoch": 0.37, "learning_rate": 1.4537053074944552e-05, "loss": 0.8516, "step": 5424 }, { "epoch": 0.37, "learning_rate": 1.4535085961077214e-05, "loss": 0.8799, "step": 5425 }, { "epoch": 0.37, "learning_rate": 1.4533118626260707e-05, "loss": 0.8027, "step": 5426 }, { "epoch": 0.37, "learning_rate": 1.4531151070590884e-05, "loss": 0.8496, "step": 5427 }, { "epoch": 0.37, "learning_rate": 1.45291832941636e-05, "loss": 0.8252, "step": 5428 }, { "epoch": 0.37, "learning_rate": 1.4527215297074729e-05, "loss": 0.7266, "step": 5429 }, { "epoch": 0.37, "learning_rate": 1.4525247079420148e-05, "loss": 0.8027, "step": 5430 }, { "epoch": 0.37, "learning_rate": 1.4523278641295753e-05, "loss": 0.8906, "step": 5431 }, { "epoch": 0.37, "learning_rate": 1.4521309982797439e-05, "loss": 0.832, "step": 5432 }, { "epoch": 0.37, "learning_rate": 1.4519341104021125e-05, "loss": 0.8916, "step": 5433 }, { "epoch": 0.37, "learning_rate": 1.4517372005062734e-05, "loss": 0.832, "step": 5434 }, { "epoch": 0.37, "learning_rate": 1.4515402686018193e-05, "loss": 0.8281, "step": 5435 }, { "epoch": 0.37, "learning_rate": 1.4513433146983462e-05, "loss": 0.8652, "step": 5436 }, { "epoch": 0.37, "learning_rate": 1.4511463388054482e-05, "loss": 0.8281, "step": 5437 }, { "epoch": 0.37, "learning_rate": 1.4509493409327228e-05, "loss": 0.876, "step": 5438 }, { "epoch": 0.37, "learning_rate": 1.4507523210897678e-05, "loss": 0.7607, "step": 5439 }, { "epoch": 0.37, "learning_rate": 1.4505552792861811e-05, "loss": 0.8096, "step": 5440 }, { "epoch": 0.37, "learning_rate": 1.4503582155315636e-05, "loss": 0.9189, "step": 5441 }, { "epoch": 0.37, "learning_rate": 1.4501611298355159e-05, "loss": 0.791, "step": 5442 }, { "epoch": 0.37, "learning_rate": 1.4499640222076396e-05, "loss": 0.8496, "step": 5443 }, { "epoch": 0.37, "learning_rate": 1.4497668926575381e-05, "loss": 0.7197, "step": 5444 }, { "epoch": 0.37, "learning_rate": 1.4495697411948156e-05, "loss": 0.8125, "step": 5445 }, { "epoch": 0.37, "learning_rate": 1.4493725678290774e-05, "loss": 0.8906, "step": 5446 }, { "epoch": 0.37, "learning_rate": 1.4491753725699293e-05, "loss": 0.792, "step": 5447 }, { "epoch": 0.37, "learning_rate": 1.4489781554269791e-05, "loss": 0.7432, "step": 5448 }, { "epoch": 0.37, "learning_rate": 1.448780916409835e-05, "loss": 0.8086, "step": 5449 }, { "epoch": 0.37, "learning_rate": 1.4485836555281068e-05, "loss": 0.8252, "step": 5450 }, { "epoch": 0.37, "learning_rate": 1.4483863727914042e-05, "loss": 0.873, "step": 5451 }, { "epoch": 0.37, "learning_rate": 1.44818906820934e-05, "loss": 0.8447, "step": 5452 }, { "epoch": 0.37, "learning_rate": 1.4479917417915256e-05, "loss": 0.7422, "step": 5453 }, { "epoch": 0.37, "learning_rate": 1.447794393547576e-05, "loss": 0.8379, "step": 5454 }, { "epoch": 0.37, "learning_rate": 1.4475970234871055e-05, "loss": 0.8477, "step": 5455 }, { "epoch": 0.37, "learning_rate": 1.4473996316197292e-05, "loss": 0.7832, "step": 5456 }, { "epoch": 0.37, "learning_rate": 1.447202217955065e-05, "loss": 0.8428, "step": 5457 }, { "epoch": 0.37, "learning_rate": 1.4470047825027306e-05, "loss": 0.7793, "step": 5458 }, { "epoch": 0.37, "learning_rate": 1.446807325272345e-05, "loss": 0.8252, "step": 5459 }, { "epoch": 0.37, "learning_rate": 1.4466098462735283e-05, "loss": 0.7734, "step": 5460 }, { "epoch": 0.37, "learning_rate": 1.4464123455159015e-05, "loss": 0.8789, "step": 5461 }, { "epoch": 0.37, "learning_rate": 1.446214823009087e-05, "loss": 0.8594, "step": 5462 }, { "epoch": 0.37, "learning_rate": 1.4460172787627082e-05, "loss": 0.8047, "step": 5463 }, { "epoch": 0.37, "learning_rate": 1.4458197127863892e-05, "loss": 0.8779, "step": 5464 }, { "epoch": 0.37, "learning_rate": 1.4456221250897557e-05, "loss": 0.7861, "step": 5465 }, { "epoch": 0.37, "learning_rate": 1.445424515682434e-05, "loss": 0.834, "step": 5466 }, { "epoch": 0.37, "learning_rate": 1.4452268845740519e-05, "loss": 0.7646, "step": 5467 }, { "epoch": 0.37, "learning_rate": 1.4450292317742371e-05, "loss": 0.7715, "step": 5468 }, { "epoch": 0.37, "learning_rate": 1.4448315572926199e-05, "loss": 0.8086, "step": 5469 }, { "epoch": 0.37, "learning_rate": 1.4446338611388313e-05, "loss": 0.8428, "step": 5470 }, { "epoch": 0.37, "learning_rate": 1.4444361433225023e-05, "loss": 0.9014, "step": 5471 }, { "epoch": 0.37, "learning_rate": 1.4442384038532664e-05, "loss": 0.8291, "step": 5472 }, { "epoch": 0.37, "learning_rate": 1.4440406427407571e-05, "loss": 0.833, "step": 5473 }, { "epoch": 0.37, "learning_rate": 1.443842859994609e-05, "loss": 0.8643, "step": 5474 }, { "epoch": 0.37, "learning_rate": 1.4436450556244588e-05, "loss": 0.7969, "step": 5475 }, { "epoch": 0.37, "learning_rate": 1.443447229639943e-05, "loss": 0.7617, "step": 5476 }, { "epoch": 0.37, "learning_rate": 1.4432493820506994e-05, "loss": 0.8301, "step": 5477 }, { "epoch": 0.37, "learning_rate": 1.4430515128663682e-05, "loss": 0.8086, "step": 5478 }, { "epoch": 0.37, "learning_rate": 1.4428536220965886e-05, "loss": 0.8086, "step": 5479 }, { "epoch": 0.37, "learning_rate": 1.4426557097510019e-05, "loss": 0.8896, "step": 5480 }, { "epoch": 0.37, "learning_rate": 1.4424577758392509e-05, "loss": 0.8633, "step": 5481 }, { "epoch": 0.37, "learning_rate": 1.4422598203709785e-05, "loss": 0.918, "step": 5482 }, { "epoch": 0.37, "learning_rate": 1.4420618433558291e-05, "loss": 0.7441, "step": 5483 }, { "epoch": 0.37, "learning_rate": 1.4418638448034483e-05, "loss": 0.8799, "step": 5484 }, { "epoch": 0.37, "learning_rate": 1.441665824723483e-05, "loss": 0.7588, "step": 5485 }, { "epoch": 0.37, "learning_rate": 1.44146778312558e-05, "loss": 0.7969, "step": 5486 }, { "epoch": 0.37, "learning_rate": 1.4412697200193877e-05, "loss": 0.7822, "step": 5487 }, { "epoch": 0.37, "learning_rate": 1.4410716354145566e-05, "loss": 0.8398, "step": 5488 }, { "epoch": 0.37, "learning_rate": 1.4408735293207365e-05, "loss": 0.8584, "step": 5489 }, { "epoch": 0.37, "learning_rate": 1.44067540174758e-05, "loss": 0.8564, "step": 5490 }, { "epoch": 0.37, "learning_rate": 1.4404772527047395e-05, "loss": 0.8076, "step": 5491 }, { "epoch": 0.37, "learning_rate": 1.4402790822018683e-05, "loss": 0.8477, "step": 5492 }, { "epoch": 0.37, "learning_rate": 1.440080890248622e-05, "loss": 0.8506, "step": 5493 }, { "epoch": 0.37, "learning_rate": 1.439882676854656e-05, "loss": 0.8262, "step": 5494 }, { "epoch": 0.37, "learning_rate": 1.4396844420296276e-05, "loss": 0.8311, "step": 5495 }, { "epoch": 0.37, "learning_rate": 1.4394861857831948e-05, "loss": 0.8838, "step": 5496 }, { "epoch": 0.37, "learning_rate": 1.439287908125016e-05, "loss": 0.8516, "step": 5497 }, { "epoch": 0.37, "learning_rate": 1.439089609064752e-05, "loss": 0.8525, "step": 5498 }, { "epoch": 0.37, "learning_rate": 1.4388912886120636e-05, "loss": 0.9121, "step": 5499 }, { "epoch": 0.37, "learning_rate": 1.438692946776613e-05, "loss": 0.7852, "step": 5500 }, { "epoch": 0.37, "learning_rate": 1.4384945835680635e-05, "loss": 0.7461, "step": 5501 }, { "epoch": 0.37, "learning_rate": 1.4382961989960791e-05, "loss": 0.9238, "step": 5502 }, { "epoch": 0.38, "learning_rate": 1.4380977930703257e-05, "loss": 0.8711, "step": 5503 }, { "epoch": 0.38, "learning_rate": 1.4378993658004687e-05, "loss": 0.8564, "step": 5504 }, { "epoch": 0.38, "learning_rate": 1.4377009171961762e-05, "loss": 0.876, "step": 5505 }, { "epoch": 0.38, "learning_rate": 1.4375024472671164e-05, "loss": 0.8086, "step": 5506 }, { "epoch": 0.38, "learning_rate": 1.4373039560229583e-05, "loss": 0.8789, "step": 5507 }, { "epoch": 0.38, "learning_rate": 1.4371054434733734e-05, "loss": 0.8125, "step": 5508 }, { "epoch": 0.38, "learning_rate": 1.4369069096280324e-05, "loss": 0.8721, "step": 5509 }, { "epoch": 0.38, "learning_rate": 1.4367083544966075e-05, "loss": 0.9297, "step": 5510 }, { "epoch": 0.38, "learning_rate": 1.4365097780887735e-05, "loss": 0.8232, "step": 5511 }, { "epoch": 0.38, "learning_rate": 1.4363111804142043e-05, "loss": 0.8574, "step": 5512 }, { "epoch": 0.38, "learning_rate": 1.4361125614825755e-05, "loss": 0.8203, "step": 5513 }, { "epoch": 0.38, "learning_rate": 1.4359139213035642e-05, "loss": 0.7744, "step": 5514 }, { "epoch": 0.38, "learning_rate": 1.4357152598868478e-05, "loss": 0.8564, "step": 5515 }, { "epoch": 0.38, "learning_rate": 1.4355165772421051e-05, "loss": 0.8984, "step": 5516 }, { "epoch": 0.38, "learning_rate": 1.4353178733790163e-05, "loss": 0.8291, "step": 5517 }, { "epoch": 0.38, "learning_rate": 1.4351191483072615e-05, "loss": 0.7656, "step": 5518 }, { "epoch": 0.38, "learning_rate": 1.4349204020365233e-05, "loss": 0.8076, "step": 5519 }, { "epoch": 0.38, "learning_rate": 1.434721634576484e-05, "loss": 0.8086, "step": 5520 }, { "epoch": 0.38, "learning_rate": 1.4345228459368283e-05, "loss": 0.8877, "step": 5521 }, { "epoch": 0.38, "learning_rate": 1.4343240361272406e-05, "loss": 0.8369, "step": 5522 }, { "epoch": 0.38, "learning_rate": 1.4341252051574069e-05, "loss": 0.8193, "step": 5523 }, { "epoch": 0.38, "learning_rate": 1.4339263530370145e-05, "loss": 0.7598, "step": 5524 }, { "epoch": 0.38, "learning_rate": 1.4337274797757512e-05, "loss": 0.9082, "step": 5525 }, { "epoch": 0.38, "learning_rate": 1.4335285853833064e-05, "loss": 0.8838, "step": 5526 }, { "epoch": 0.38, "learning_rate": 1.43332966986937e-05, "loss": 0.8428, "step": 5527 }, { "epoch": 0.38, "learning_rate": 1.433130733243633e-05, "loss": 0.8496, "step": 5528 }, { "epoch": 0.38, "learning_rate": 1.432931775515788e-05, "loss": 0.8271, "step": 5529 }, { "epoch": 0.38, "learning_rate": 1.432732796695528e-05, "loss": 0.7607, "step": 5530 }, { "epoch": 0.38, "learning_rate": 1.4325337967925475e-05, "loss": 0.8486, "step": 5531 }, { "epoch": 0.38, "learning_rate": 1.4323347758165414e-05, "loss": 0.748, "step": 5532 }, { "epoch": 0.38, "learning_rate": 1.4321357337772056e-05, "loss": 0.8525, "step": 5533 }, { "epoch": 0.38, "learning_rate": 1.4319366706842383e-05, "loss": 0.748, "step": 5534 }, { "epoch": 0.38, "learning_rate": 1.4317375865473377e-05, "loss": 0.8408, "step": 5535 }, { "epoch": 0.38, "learning_rate": 1.4315384813762025e-05, "loss": 0.8467, "step": 5536 }, { "epoch": 0.38, "learning_rate": 1.431339355180534e-05, "loss": 0.8213, "step": 5537 }, { "epoch": 0.38, "learning_rate": 1.4311402079700327e-05, "loss": 0.7939, "step": 5538 }, { "epoch": 0.38, "learning_rate": 1.4309410397544017e-05, "loss": 0.7988, "step": 5539 }, { "epoch": 0.38, "learning_rate": 1.4307418505433444e-05, "loss": 0.8359, "step": 5540 }, { "epoch": 0.38, "learning_rate": 1.430542640346565e-05, "loss": 0.79, "step": 5541 }, { "epoch": 0.38, "learning_rate": 1.4303434091737689e-05, "loss": 0.8096, "step": 5542 }, { "epoch": 0.38, "learning_rate": 1.4301441570346635e-05, "loss": 0.9062, "step": 5543 }, { "epoch": 0.38, "learning_rate": 1.4299448839389554e-05, "loss": 0.7793, "step": 5544 }, { "epoch": 0.38, "learning_rate": 1.4297455898963533e-05, "loss": 0.8623, "step": 5545 }, { "epoch": 0.38, "learning_rate": 1.4295462749165671e-05, "loss": 0.8408, "step": 5546 }, { "epoch": 0.38, "learning_rate": 1.4293469390093075e-05, "loss": 0.8496, "step": 5547 }, { "epoch": 0.38, "learning_rate": 1.4291475821842862e-05, "loss": 0.7559, "step": 5548 }, { "epoch": 0.38, "learning_rate": 1.4289482044512152e-05, "loss": 0.8506, "step": 5549 }, { "epoch": 0.38, "learning_rate": 1.428748805819809e-05, "loss": 0.8604, "step": 5550 }, { "epoch": 0.38, "learning_rate": 1.4285493862997814e-05, "loss": 0.8203, "step": 5551 }, { "epoch": 0.38, "learning_rate": 1.4283499459008488e-05, "loss": 0.8662, "step": 5552 }, { "epoch": 0.38, "learning_rate": 1.4281504846327279e-05, "loss": 0.8086, "step": 5553 }, { "epoch": 0.38, "learning_rate": 1.427951002505136e-05, "loss": 0.793, "step": 5554 }, { "epoch": 0.38, "learning_rate": 1.4277514995277923e-05, "loss": 0.8555, "step": 5555 }, { "epoch": 0.38, "learning_rate": 1.4275519757104163e-05, "loss": 0.8086, "step": 5556 }, { "epoch": 0.38, "learning_rate": 1.4273524310627289e-05, "loss": 0.791, "step": 5557 }, { "epoch": 0.38, "learning_rate": 1.4271528655944522e-05, "loss": 0.7441, "step": 5558 }, { "epoch": 0.38, "learning_rate": 1.4269532793153085e-05, "loss": 0.7676, "step": 5559 }, { "epoch": 0.38, "learning_rate": 1.4267536722350218e-05, "loss": 0.8428, "step": 5560 }, { "epoch": 0.38, "learning_rate": 1.426554044363317e-05, "loss": 0.8994, "step": 5561 }, { "epoch": 0.38, "learning_rate": 1.42635439570992e-05, "loss": 0.8311, "step": 5562 }, { "epoch": 0.38, "learning_rate": 1.4261547262845575e-05, "loss": 0.8867, "step": 5563 }, { "epoch": 0.38, "learning_rate": 1.4259550360969577e-05, "loss": 0.8652, "step": 5564 }, { "epoch": 0.38, "learning_rate": 1.4257553251568493e-05, "loss": 0.8105, "step": 5565 }, { "epoch": 0.38, "learning_rate": 1.4255555934739622e-05, "loss": 0.8613, "step": 5566 }, { "epoch": 0.38, "learning_rate": 1.4253558410580273e-05, "loss": 0.8096, "step": 5567 }, { "epoch": 0.38, "learning_rate": 1.4251560679187766e-05, "loss": 0.8174, "step": 5568 }, { "epoch": 0.38, "learning_rate": 1.4249562740659429e-05, "loss": 0.8125, "step": 5569 }, { "epoch": 0.38, "learning_rate": 1.4247564595092605e-05, "loss": 0.8262, "step": 5570 }, { "epoch": 0.38, "learning_rate": 1.424556624258464e-05, "loss": 0.7529, "step": 5571 }, { "epoch": 0.38, "learning_rate": 1.4243567683232891e-05, "loss": 0.8369, "step": 5572 }, { "epoch": 0.38, "learning_rate": 1.4241568917134736e-05, "loss": 0.749, "step": 5573 }, { "epoch": 0.38, "learning_rate": 1.4239569944387548e-05, "loss": 0.8242, "step": 5574 }, { "epoch": 0.38, "learning_rate": 1.423757076508872e-05, "loss": 0.8428, "step": 5575 }, { "epoch": 0.38, "learning_rate": 1.4235571379335654e-05, "loss": 0.8105, "step": 5576 }, { "epoch": 0.38, "learning_rate": 1.4233571787225751e-05, "loss": 0.834, "step": 5577 }, { "epoch": 0.38, "learning_rate": 1.4231571988856439e-05, "loss": 0.7959, "step": 5578 }, { "epoch": 0.38, "learning_rate": 1.4229571984325147e-05, "loss": 0.7637, "step": 5579 }, { "epoch": 0.38, "learning_rate": 1.4227571773729315e-05, "loss": 0.918, "step": 5580 }, { "epoch": 0.38, "learning_rate": 1.422557135716639e-05, "loss": 0.835, "step": 5581 }, { "epoch": 0.38, "learning_rate": 1.4223570734733836e-05, "loss": 0.8633, "step": 5582 }, { "epoch": 0.38, "learning_rate": 1.4221569906529122e-05, "loss": 0.8916, "step": 5583 }, { "epoch": 0.38, "learning_rate": 1.421956887264973e-05, "loss": 0.8096, "step": 5584 }, { "epoch": 0.38, "learning_rate": 1.4217567633193143e-05, "loss": 0.8281, "step": 5585 }, { "epoch": 0.38, "learning_rate": 1.4215566188256871e-05, "loss": 0.8799, "step": 5586 }, { "epoch": 0.38, "learning_rate": 1.4213564537938418e-05, "loss": 0.8418, "step": 5587 }, { "epoch": 0.38, "learning_rate": 1.4211562682335308e-05, "loss": 0.7607, "step": 5588 }, { "epoch": 0.38, "learning_rate": 1.420956062154507e-05, "loss": 0.8086, "step": 5589 }, { "epoch": 0.38, "learning_rate": 1.420755835566524e-05, "loss": 0.7412, "step": 5590 }, { "epoch": 0.38, "learning_rate": 1.4205555884793375e-05, "loss": 0.8711, "step": 5591 }, { "epoch": 0.38, "learning_rate": 1.420355320902703e-05, "loss": 0.835, "step": 5592 }, { "epoch": 0.38, "learning_rate": 1.4201550328463778e-05, "loss": 0.7764, "step": 5593 }, { "epoch": 0.38, "learning_rate": 1.4199547243201201e-05, "loss": 0.7588, "step": 5594 }, { "epoch": 0.38, "learning_rate": 1.4197543953336885e-05, "loss": 0.8682, "step": 5595 }, { "epoch": 0.38, "learning_rate": 1.4195540458968434e-05, "loss": 0.7627, "step": 5596 }, { "epoch": 0.38, "learning_rate": 1.4193536760193456e-05, "loss": 0.8379, "step": 5597 }, { "epoch": 0.38, "learning_rate": 1.4191532857109572e-05, "loss": 0.8066, "step": 5598 }, { "epoch": 0.38, "learning_rate": 1.4189528749814409e-05, "loss": 0.8164, "step": 5599 }, { "epoch": 0.38, "learning_rate": 1.4187524438405614e-05, "loss": 0.9014, "step": 5600 }, { "epoch": 0.38, "learning_rate": 1.418551992298083e-05, "loss": 0.7988, "step": 5601 }, { "epoch": 0.38, "learning_rate": 1.4183515203637718e-05, "loss": 0.8047, "step": 5602 }, { "epoch": 0.38, "learning_rate": 1.4181510280473951e-05, "loss": 0.793, "step": 5603 }, { "epoch": 0.38, "learning_rate": 1.417950515358721e-05, "loss": 0.876, "step": 5604 }, { "epoch": 0.38, "learning_rate": 1.4177499823075176e-05, "loss": 0.8887, "step": 5605 }, { "epoch": 0.38, "learning_rate": 1.4175494289035557e-05, "loss": 0.835, "step": 5606 }, { "epoch": 0.38, "learning_rate": 1.417348855156606e-05, "loss": 0.793, "step": 5607 }, { "epoch": 0.38, "learning_rate": 1.4171482610764401e-05, "loss": 0.8789, "step": 5608 }, { "epoch": 0.38, "learning_rate": 1.416947646672832e-05, "loss": 0.7441, "step": 5609 }, { "epoch": 0.38, "learning_rate": 1.4167470119555544e-05, "loss": 0.7617, "step": 5610 }, { "epoch": 0.38, "learning_rate": 1.4165463569343826e-05, "loss": 0.9062, "step": 5611 }, { "epoch": 0.38, "learning_rate": 1.416345681619093e-05, "loss": 0.8398, "step": 5612 }, { "epoch": 0.38, "learning_rate": 1.4161449860194618e-05, "loss": 0.7998, "step": 5613 }, { "epoch": 0.38, "learning_rate": 1.4159442701452673e-05, "loss": 0.7695, "step": 5614 }, { "epoch": 0.38, "learning_rate": 1.4157435340062881e-05, "loss": 0.8818, "step": 5615 }, { "epoch": 0.38, "learning_rate": 1.4155427776123043e-05, "loss": 0.8154, "step": 5616 }, { "epoch": 0.38, "learning_rate": 1.4153420009730967e-05, "loss": 0.7998, "step": 5617 }, { "epoch": 0.38, "learning_rate": 1.415141204098447e-05, "loss": 0.8145, "step": 5618 }, { "epoch": 0.38, "learning_rate": 1.4149403869981382e-05, "loss": 0.7725, "step": 5619 }, { "epoch": 0.38, "learning_rate": 1.4147395496819537e-05, "loss": 0.917, "step": 5620 }, { "epoch": 0.38, "learning_rate": 1.4145386921596787e-05, "loss": 0.8652, "step": 5621 }, { "epoch": 0.38, "learning_rate": 1.414337814441099e-05, "loss": 0.8584, "step": 5622 }, { "epoch": 0.38, "learning_rate": 1.414136916536001e-05, "loss": 0.8193, "step": 5623 }, { "epoch": 0.38, "learning_rate": 1.4139359984541728e-05, "loss": 0.8057, "step": 5624 }, { "epoch": 0.38, "learning_rate": 1.4137350602054027e-05, "loss": 0.8535, "step": 5625 }, { "epoch": 0.38, "learning_rate": 1.4135341017994805e-05, "loss": 0.8623, "step": 5626 }, { "epoch": 0.38, "learning_rate": 1.4133331232461976e-05, "loss": 0.8379, "step": 5627 }, { "epoch": 0.38, "learning_rate": 1.413132124555345e-05, "loss": 0.8809, "step": 5628 }, { "epoch": 0.38, "learning_rate": 1.4129311057367148e-05, "loss": 0.8457, "step": 5629 }, { "epoch": 0.38, "learning_rate": 1.4127300668001019e-05, "loss": 0.8818, "step": 5630 }, { "epoch": 0.38, "learning_rate": 1.4125290077552998e-05, "loss": 0.8838, "step": 5631 }, { "epoch": 0.38, "learning_rate": 1.4123279286121048e-05, "loss": 0.8408, "step": 5632 }, { "epoch": 0.38, "learning_rate": 1.4121268293803134e-05, "loss": 0.8994, "step": 5633 }, { "epoch": 0.38, "learning_rate": 1.4119257100697228e-05, "loss": 0.7812, "step": 5634 }, { "epoch": 0.38, "learning_rate": 1.4117245706901316e-05, "loss": 0.8057, "step": 5635 }, { "epoch": 0.38, "learning_rate": 1.4115234112513393e-05, "loss": 0.8408, "step": 5636 }, { "epoch": 0.38, "learning_rate": 1.411322231763147e-05, "loss": 0.873, "step": 5637 }, { "epoch": 0.38, "learning_rate": 1.411121032235355e-05, "loss": 0.8223, "step": 5638 }, { "epoch": 0.38, "learning_rate": 1.4109198126777667e-05, "loss": 0.8174, "step": 5639 }, { "epoch": 0.38, "learning_rate": 1.4107185731001853e-05, "loss": 0.8711, "step": 5640 }, { "epoch": 0.38, "learning_rate": 1.4105173135124148e-05, "loss": 0.7441, "step": 5641 }, { "epoch": 0.38, "learning_rate": 1.4103160339242607e-05, "loss": 0.8584, "step": 5642 }, { "epoch": 0.38, "learning_rate": 1.4101147343455299e-05, "loss": 0.7236, "step": 5643 }, { "epoch": 0.38, "learning_rate": 1.4099134147860287e-05, "loss": 0.8711, "step": 5644 }, { "epoch": 0.38, "learning_rate": 1.4097120752555662e-05, "loss": 0.8105, "step": 5645 }, { "epoch": 0.38, "learning_rate": 1.4095107157639514e-05, "loss": 0.8643, "step": 5646 }, { "epoch": 0.38, "learning_rate": 1.4093093363209942e-05, "loss": 0.8477, "step": 5647 }, { "epoch": 0.38, "learning_rate": 1.4091079369365067e-05, "loss": 0.8154, "step": 5648 }, { "epoch": 0.38, "learning_rate": 1.4089065176203e-05, "loss": 0.8213, "step": 5649 }, { "epoch": 0.39, "learning_rate": 1.4087050783821878e-05, "loss": 0.8232, "step": 5650 }, { "epoch": 0.39, "learning_rate": 1.408503619231984e-05, "loss": 0.8408, "step": 5651 }, { "epoch": 0.39, "learning_rate": 1.4083021401795038e-05, "loss": 0.7969, "step": 5652 }, { "epoch": 0.39, "learning_rate": 1.4081006412345635e-05, "loss": 0.8164, "step": 5653 }, { "epoch": 0.39, "learning_rate": 1.4078991224069799e-05, "loss": 0.8057, "step": 5654 }, { "epoch": 0.39, "learning_rate": 1.4076975837065705e-05, "loss": 0.8652, "step": 5655 }, { "epoch": 0.39, "learning_rate": 1.4074960251431551e-05, "loss": 0.7529, "step": 5656 }, { "epoch": 0.39, "learning_rate": 1.407294446726553e-05, "loss": 0.8633, "step": 5657 }, { "epoch": 0.39, "learning_rate": 1.4070928484665853e-05, "loss": 0.7246, "step": 5658 }, { "epoch": 0.39, "learning_rate": 1.4068912303730742e-05, "loss": 0.8184, "step": 5659 }, { "epoch": 0.39, "learning_rate": 1.406689592455842e-05, "loss": 0.8447, "step": 5660 }, { "epoch": 0.39, "learning_rate": 1.4064879347247124e-05, "loss": 0.8691, "step": 5661 }, { "epoch": 0.39, "learning_rate": 1.406286257189511e-05, "loss": 0.8672, "step": 5662 }, { "epoch": 0.39, "learning_rate": 1.4060845598600626e-05, "loss": 0.8486, "step": 5663 }, { "epoch": 0.39, "learning_rate": 1.4058828427461943e-05, "loss": 0.8535, "step": 5664 }, { "epoch": 0.39, "learning_rate": 1.4056811058577338e-05, "loss": 0.7715, "step": 5665 }, { "epoch": 0.39, "learning_rate": 1.4054793492045095e-05, "loss": 0.8662, "step": 5666 }, { "epoch": 0.39, "learning_rate": 1.405277572796351e-05, "loss": 0.8867, "step": 5667 }, { "epoch": 0.39, "learning_rate": 1.4050757766430891e-05, "loss": 0.8174, "step": 5668 }, { "epoch": 0.39, "learning_rate": 1.4048739607545552e-05, "loss": 0.8379, "step": 5669 }, { "epoch": 0.39, "learning_rate": 1.4046721251405812e-05, "loss": 0.875, "step": 5670 }, { "epoch": 0.39, "learning_rate": 1.4044702698110015e-05, "loss": 0.8574, "step": 5671 }, { "epoch": 0.39, "learning_rate": 1.4042683947756498e-05, "loss": 0.8467, "step": 5672 }, { "epoch": 0.39, "learning_rate": 1.4040665000443613e-05, "loss": 0.8359, "step": 5673 }, { "epoch": 0.39, "learning_rate": 1.4038645856269733e-05, "loss": 0.8369, "step": 5674 }, { "epoch": 0.39, "learning_rate": 1.4036626515333219e-05, "loss": 0.7441, "step": 5675 }, { "epoch": 0.39, "learning_rate": 1.403460697773246e-05, "loss": 0.791, "step": 5676 }, { "epoch": 0.39, "learning_rate": 1.4032587243565845e-05, "loss": 0.8223, "step": 5677 }, { "epoch": 0.39, "learning_rate": 1.4030567312931776e-05, "loss": 0.8047, "step": 5678 }, { "epoch": 0.39, "learning_rate": 1.4028547185928663e-05, "loss": 0.8359, "step": 5679 }, { "epoch": 0.39, "learning_rate": 1.4026526862654928e-05, "loss": 0.8447, "step": 5680 }, { "epoch": 0.39, "learning_rate": 1.4024506343209003e-05, "loss": 0.8457, "step": 5681 }, { "epoch": 0.39, "learning_rate": 1.4022485627689321e-05, "loss": 0.8789, "step": 5682 }, { "epoch": 0.39, "learning_rate": 1.402046471619434e-05, "loss": 0.8359, "step": 5683 }, { "epoch": 0.39, "learning_rate": 1.4018443608822514e-05, "loss": 0.8037, "step": 5684 }, { "epoch": 0.39, "learning_rate": 1.4016422305672309e-05, "loss": 0.8545, "step": 5685 }, { "epoch": 0.39, "learning_rate": 1.4014400806842204e-05, "loss": 0.8828, "step": 5686 }, { "epoch": 0.39, "learning_rate": 1.4012379112430692e-05, "loss": 0.9062, "step": 5687 }, { "epoch": 0.39, "learning_rate": 1.4010357222536258e-05, "loss": 0.873, "step": 5688 }, { "epoch": 0.39, "learning_rate": 1.400833513725742e-05, "loss": 0.792, "step": 5689 }, { "epoch": 0.39, "learning_rate": 1.4006312856692692e-05, "loss": 0.8203, "step": 5690 }, { "epoch": 0.39, "learning_rate": 1.4004290380940593e-05, "loss": 0.8555, "step": 5691 }, { "epoch": 0.39, "learning_rate": 1.4002267710099666e-05, "loss": 0.7959, "step": 5692 }, { "epoch": 0.39, "learning_rate": 1.4000244844268447e-05, "loss": 0.873, "step": 5693 }, { "epoch": 0.39, "learning_rate": 1.3998221783545495e-05, "loss": 0.7744, "step": 5694 }, { "epoch": 0.39, "learning_rate": 1.3996198528029376e-05, "loss": 0.9082, "step": 5695 }, { "epoch": 0.39, "learning_rate": 1.3994175077818657e-05, "loss": 0.8066, "step": 5696 }, { "epoch": 0.39, "learning_rate": 1.3992151433011922e-05, "loss": 0.8467, "step": 5697 }, { "epoch": 0.39, "learning_rate": 1.3990127593707765e-05, "loss": 0.8271, "step": 5698 }, { "epoch": 0.39, "learning_rate": 1.3988103560004788e-05, "loss": 0.7832, "step": 5699 }, { "epoch": 0.39, "learning_rate": 1.3986079332001598e-05, "loss": 0.8008, "step": 5700 }, { "epoch": 0.39, "learning_rate": 1.3984054909796818e-05, "loss": 0.751, "step": 5701 }, { "epoch": 0.39, "learning_rate": 1.398203029348908e-05, "loss": 0.8252, "step": 5702 }, { "epoch": 0.39, "learning_rate": 1.3980005483177014e-05, "loss": 0.8281, "step": 5703 }, { "epoch": 0.39, "learning_rate": 1.3977980478959279e-05, "loss": 0.7686, "step": 5704 }, { "epoch": 0.39, "learning_rate": 1.397595528093453e-05, "loss": 0.8789, "step": 5705 }, { "epoch": 0.39, "learning_rate": 1.3973929889201428e-05, "loss": 0.8174, "step": 5706 }, { "epoch": 0.39, "learning_rate": 1.397190430385866e-05, "loss": 0.8008, "step": 5707 }, { "epoch": 0.39, "learning_rate": 1.396987852500491e-05, "loss": 0.8721, "step": 5708 }, { "epoch": 0.39, "learning_rate": 1.3967852552738867e-05, "loss": 0.8213, "step": 5709 }, { "epoch": 0.39, "learning_rate": 1.3965826387159245e-05, "loss": 0.8262, "step": 5710 }, { "epoch": 0.39, "learning_rate": 1.3963800028364753e-05, "loss": 0.8916, "step": 5711 }, { "epoch": 0.39, "learning_rate": 1.3961773476454117e-05, "loss": 0.918, "step": 5712 }, { "epoch": 0.39, "learning_rate": 1.3959746731526072e-05, "loss": 0.8096, "step": 5713 }, { "epoch": 0.39, "learning_rate": 1.3957719793679355e-05, "loss": 0.7793, "step": 5714 }, { "epoch": 0.39, "learning_rate": 1.3955692663012728e-05, "loss": 0.8682, "step": 5715 }, { "epoch": 0.39, "learning_rate": 1.3953665339624944e-05, "loss": 0.7686, "step": 5716 }, { "epoch": 0.39, "learning_rate": 1.3951637823614778e-05, "loss": 0.8877, "step": 5717 }, { "epoch": 0.39, "learning_rate": 1.3949610115081012e-05, "loss": 0.7998, "step": 5718 }, { "epoch": 0.39, "learning_rate": 1.394758221412243e-05, "loss": 0.8193, "step": 5719 }, { "epoch": 0.39, "learning_rate": 1.394555412083784e-05, "loss": 0.9268, "step": 5720 }, { "epoch": 0.39, "learning_rate": 1.3943525835326042e-05, "loss": 0.8223, "step": 5721 }, { "epoch": 0.39, "learning_rate": 1.3941497357685858e-05, "loss": 0.876, "step": 5722 }, { "epoch": 0.39, "learning_rate": 1.3939468688016118e-05, "loss": 0.7988, "step": 5723 }, { "epoch": 0.39, "learning_rate": 1.3937439826415648e-05, "loss": 0.8164, "step": 5724 }, { "epoch": 0.39, "learning_rate": 1.3935410772983309e-05, "loss": 0.875, "step": 5725 }, { "epoch": 0.39, "learning_rate": 1.3933381527817948e-05, "loss": 0.8535, "step": 5726 }, { "epoch": 0.39, "learning_rate": 1.3931352091018429e-05, "loss": 0.8877, "step": 5727 }, { "epoch": 0.39, "learning_rate": 1.3929322462683627e-05, "loss": 0.8613, "step": 5728 }, { "epoch": 0.39, "learning_rate": 1.392729264291243e-05, "loss": 0.7871, "step": 5729 }, { "epoch": 0.39, "learning_rate": 1.3925262631803722e-05, "loss": 0.792, "step": 5730 }, { "epoch": 0.39, "learning_rate": 1.3923232429456414e-05, "loss": 0.8848, "step": 5731 }, { "epoch": 0.39, "learning_rate": 1.3921202035969412e-05, "loss": 0.8428, "step": 5732 }, { "epoch": 0.39, "learning_rate": 1.3919171451441638e-05, "loss": 0.8457, "step": 5733 }, { "epoch": 0.39, "learning_rate": 1.3917140675972023e-05, "loss": 0.7012, "step": 5734 }, { "epoch": 0.39, "learning_rate": 1.3915109709659505e-05, "loss": 0.8369, "step": 5735 }, { "epoch": 0.39, "learning_rate": 1.391307855260303e-05, "loss": 0.8457, "step": 5736 }, { "epoch": 0.39, "learning_rate": 1.391104720490156e-05, "loss": 0.8096, "step": 5737 }, { "epoch": 0.39, "learning_rate": 1.3909015666654064e-05, "loss": 0.8477, "step": 5738 }, { "epoch": 0.39, "learning_rate": 1.3906983937959513e-05, "loss": 0.9199, "step": 5739 }, { "epoch": 0.39, "learning_rate": 1.3904952018916895e-05, "loss": 0.8594, "step": 5740 }, { "epoch": 0.39, "learning_rate": 1.3902919909625205e-05, "loss": 0.792, "step": 5741 }, { "epoch": 0.39, "learning_rate": 1.3900887610183449e-05, "loss": 0.8105, "step": 5742 }, { "epoch": 0.39, "learning_rate": 1.3898855120690637e-05, "loss": 0.8076, "step": 5743 }, { "epoch": 0.39, "learning_rate": 1.3896822441245794e-05, "loss": 0.9365, "step": 5744 }, { "epoch": 0.39, "learning_rate": 1.389478957194795e-05, "loss": 0.8955, "step": 5745 }, { "epoch": 0.39, "learning_rate": 1.3892756512896152e-05, "loss": 0.8477, "step": 5746 }, { "epoch": 0.39, "learning_rate": 1.3890723264189444e-05, "loss": 0.8262, "step": 5747 }, { "epoch": 0.39, "learning_rate": 1.3888689825926888e-05, "loss": 0.7529, "step": 5748 }, { "epoch": 0.39, "learning_rate": 1.3886656198207556e-05, "loss": 0.8838, "step": 5749 }, { "epoch": 0.39, "learning_rate": 1.388462238113052e-05, "loss": 0.834, "step": 5750 }, { "epoch": 0.39, "learning_rate": 1.3882588374794871e-05, "loss": 0.7842, "step": 5751 }, { "epoch": 0.39, "learning_rate": 1.388055417929971e-05, "loss": 0.832, "step": 5752 }, { "epoch": 0.39, "learning_rate": 1.3878519794744136e-05, "loss": 0.834, "step": 5753 }, { "epoch": 0.39, "learning_rate": 1.3876485221227265e-05, "loss": 0.8379, "step": 5754 }, { "epoch": 0.39, "learning_rate": 1.3874450458848226e-05, "loss": 0.8174, "step": 5755 }, { "epoch": 0.39, "learning_rate": 1.387241550770615e-05, "loss": 0.877, "step": 5756 }, { "epoch": 0.39, "learning_rate": 1.3870380367900176e-05, "loss": 0.8281, "step": 5757 }, { "epoch": 0.39, "learning_rate": 1.3868345039529461e-05, "loss": 0.8047, "step": 5758 }, { "epoch": 0.39, "learning_rate": 1.3866309522693167e-05, "loss": 0.751, "step": 5759 }, { "epoch": 0.39, "learning_rate": 1.3864273817490457e-05, "loss": 0.7578, "step": 5760 }, { "epoch": 0.39, "learning_rate": 1.3862237924020516e-05, "loss": 0.8105, "step": 5761 }, { "epoch": 0.39, "learning_rate": 1.3860201842382534e-05, "loss": 0.8037, "step": 5762 }, { "epoch": 0.39, "learning_rate": 1.38581655726757e-05, "loss": 0.8818, "step": 5763 }, { "epoch": 0.39, "learning_rate": 1.3856129114999238e-05, "loss": 0.8125, "step": 5764 }, { "epoch": 0.39, "learning_rate": 1.3854092469452348e-05, "loss": 0.8545, "step": 5765 }, { "epoch": 0.39, "learning_rate": 1.3852055636134258e-05, "loss": 0.9326, "step": 5766 }, { "epoch": 0.39, "learning_rate": 1.3850018615144209e-05, "loss": 0.8789, "step": 5767 }, { "epoch": 0.39, "learning_rate": 1.3847981406581439e-05, "loss": 0.7539, "step": 5768 }, { "epoch": 0.39, "learning_rate": 1.3845944010545206e-05, "loss": 0.7969, "step": 5769 }, { "epoch": 0.39, "learning_rate": 1.3843906427134766e-05, "loss": 0.7275, "step": 5770 }, { "epoch": 0.39, "learning_rate": 1.3841868656449388e-05, "loss": 0.8906, "step": 5771 }, { "epoch": 0.39, "learning_rate": 1.3839830698588363e-05, "loss": 0.7725, "step": 5772 }, { "epoch": 0.39, "learning_rate": 1.383779255365097e-05, "loss": 0.8623, "step": 5773 }, { "epoch": 0.39, "learning_rate": 1.3835754221736513e-05, "loss": 0.7451, "step": 5774 }, { "epoch": 0.39, "learning_rate": 1.3833715702944297e-05, "loss": 0.7197, "step": 5775 }, { "epoch": 0.39, "learning_rate": 1.383167699737364e-05, "loss": 0.7793, "step": 5776 }, { "epoch": 0.39, "learning_rate": 1.3829638105123864e-05, "loss": 0.8877, "step": 5777 }, { "epoch": 0.39, "learning_rate": 1.3827599026294307e-05, "loss": 0.8633, "step": 5778 }, { "epoch": 0.39, "learning_rate": 1.3825559760984313e-05, "loss": 0.8447, "step": 5779 }, { "epoch": 0.39, "learning_rate": 1.3823520309293232e-05, "loss": 0.8193, "step": 5780 }, { "epoch": 0.39, "learning_rate": 1.3821480671320428e-05, "loss": 0.8564, "step": 5781 }, { "epoch": 0.39, "learning_rate": 1.3819440847165275e-05, "loss": 0.8672, "step": 5782 }, { "epoch": 0.39, "learning_rate": 1.3817400836927149e-05, "loss": 0.8125, "step": 5783 }, { "epoch": 0.39, "learning_rate": 1.3815360640705439e-05, "loss": 0.8047, "step": 5784 }, { "epoch": 0.39, "learning_rate": 1.3813320258599547e-05, "loss": 0.7725, "step": 5785 }, { "epoch": 0.39, "learning_rate": 1.3811279690708877e-05, "loss": 0.8809, "step": 5786 }, { "epoch": 0.39, "learning_rate": 1.3809238937132845e-05, "loss": 0.8311, "step": 5787 }, { "epoch": 0.39, "learning_rate": 1.380719799797088e-05, "loss": 0.916, "step": 5788 }, { "epoch": 0.39, "learning_rate": 1.380515687332241e-05, "loss": 0.8623, "step": 5789 }, { "epoch": 0.39, "learning_rate": 1.3803115563286889e-05, "loss": 0.7773, "step": 5790 }, { "epoch": 0.39, "learning_rate": 1.3801074067963758e-05, "loss": 0.8379, "step": 5791 }, { "epoch": 0.39, "learning_rate": 1.3799032387452484e-05, "loss": 0.8652, "step": 5792 }, { "epoch": 0.39, "learning_rate": 1.3796990521852543e-05, "loss": 0.9102, "step": 5793 }, { "epoch": 0.39, "learning_rate": 1.3794948471263403e-05, "loss": 0.751, "step": 5794 }, { "epoch": 0.39, "learning_rate": 1.379290623578456e-05, "loss": 0.834, "step": 5795 }, { "epoch": 0.39, "learning_rate": 1.3790863815515511e-05, "loss": 0.7949, "step": 5796 }, { "epoch": 0.4, "learning_rate": 1.3788821210555763e-05, "loss": 0.8525, "step": 5797 }, { "epoch": 0.4, "learning_rate": 1.3786778421004827e-05, "loss": 0.9141, "step": 5798 }, { "epoch": 0.4, "learning_rate": 1.3784735446962232e-05, "loss": 0.873, "step": 5799 }, { "epoch": 0.4, "learning_rate": 1.3782692288527512e-05, "loss": 0.8086, "step": 5800 }, { "epoch": 0.4, "learning_rate": 1.3780648945800209e-05, "loss": 0.8555, "step": 5801 }, { "epoch": 0.4, "learning_rate": 1.3778605418879872e-05, "loss": 0.8281, "step": 5802 }, { "epoch": 0.4, "learning_rate": 1.3776561707866064e-05, "loss": 0.8818, "step": 5803 }, { "epoch": 0.4, "learning_rate": 1.3774517812858353e-05, "loss": 0.8848, "step": 5804 }, { "epoch": 0.4, "learning_rate": 1.3772473733956317e-05, "loss": 0.8584, "step": 5805 }, { "epoch": 0.4, "learning_rate": 1.3770429471259547e-05, "loss": 0.8096, "step": 5806 }, { "epoch": 0.4, "learning_rate": 1.3768385024867635e-05, "loss": 0.8555, "step": 5807 }, { "epoch": 0.4, "learning_rate": 1.376634039488019e-05, "loss": 0.7637, "step": 5808 }, { "epoch": 0.4, "learning_rate": 1.3764295581396824e-05, "loss": 0.8447, "step": 5809 }, { "epoch": 0.4, "learning_rate": 1.3762250584517161e-05, "loss": 0.8428, "step": 5810 }, { "epoch": 0.4, "learning_rate": 1.3760205404340835e-05, "loss": 0.8018, "step": 5811 }, { "epoch": 0.4, "learning_rate": 1.375816004096748e-05, "loss": 0.8311, "step": 5812 }, { "epoch": 0.4, "learning_rate": 1.3756114494496756e-05, "loss": 0.8018, "step": 5813 }, { "epoch": 0.4, "learning_rate": 1.3754068765028317e-05, "loss": 0.8564, "step": 5814 }, { "epoch": 0.4, "learning_rate": 1.3752022852661827e-05, "loss": 0.8682, "step": 5815 }, { "epoch": 0.4, "learning_rate": 1.3749976757496969e-05, "loss": 0.8535, "step": 5816 }, { "epoch": 0.4, "learning_rate": 1.3747930479633424e-05, "loss": 0.7246, "step": 5817 }, { "epoch": 0.4, "learning_rate": 1.3745884019170893e-05, "loss": 0.832, "step": 5818 }, { "epoch": 0.4, "learning_rate": 1.3743837376209072e-05, "loss": 0.752, "step": 5819 }, { "epoch": 0.4, "learning_rate": 1.3741790550847678e-05, "loss": 0.791, "step": 5820 }, { "epoch": 0.4, "learning_rate": 1.373974354318643e-05, "loss": 0.7627, "step": 5821 }, { "epoch": 0.4, "learning_rate": 1.373769635332506e-05, "loss": 0.8154, "step": 5822 }, { "epoch": 0.4, "learning_rate": 1.3735648981363303e-05, "loss": 0.7803, "step": 5823 }, { "epoch": 0.4, "learning_rate": 1.3733601427400915e-05, "loss": 0.8408, "step": 5824 }, { "epoch": 0.4, "learning_rate": 1.3731553691537643e-05, "loss": 0.8564, "step": 5825 }, { "epoch": 0.4, "learning_rate": 1.372950577387326e-05, "loss": 0.8145, "step": 5826 }, { "epoch": 0.4, "learning_rate": 1.3727457674507534e-05, "loss": 0.8291, "step": 5827 }, { "epoch": 0.4, "learning_rate": 1.3725409393540254e-05, "loss": 0.7354, "step": 5828 }, { "epoch": 0.4, "learning_rate": 1.3723360931071213e-05, "loss": 0.7637, "step": 5829 }, { "epoch": 0.4, "learning_rate": 1.3721312287200203e-05, "loss": 0.8213, "step": 5830 }, { "epoch": 0.4, "learning_rate": 1.3719263462027043e-05, "loss": 0.8369, "step": 5831 }, { "epoch": 0.4, "learning_rate": 1.3717214455651551e-05, "loss": 0.8994, "step": 5832 }, { "epoch": 0.4, "learning_rate": 1.371516526817355e-05, "loss": 0.8564, "step": 5833 }, { "epoch": 0.4, "learning_rate": 1.3713115899692877e-05, "loss": 0.8154, "step": 5834 }, { "epoch": 0.4, "learning_rate": 1.371106635030938e-05, "loss": 0.8623, "step": 5835 }, { "epoch": 0.4, "learning_rate": 1.370901662012291e-05, "loss": 0.8311, "step": 5836 }, { "epoch": 0.4, "learning_rate": 1.3706966709233331e-05, "loss": 0.8291, "step": 5837 }, { "epoch": 0.4, "learning_rate": 1.3704916617740515e-05, "loss": 0.7764, "step": 5838 }, { "epoch": 0.4, "learning_rate": 1.3702866345744345e-05, "loss": 0.8438, "step": 5839 }, { "epoch": 0.4, "learning_rate": 1.3700815893344703e-05, "loss": 0.9102, "step": 5840 }, { "epoch": 0.4, "learning_rate": 1.3698765260641493e-05, "loss": 0.8994, "step": 5841 }, { "epoch": 0.4, "learning_rate": 1.3696714447734623e-05, "loss": 0.7744, "step": 5842 }, { "epoch": 0.4, "learning_rate": 1.3694663454723998e-05, "loss": 0.8223, "step": 5843 }, { "epoch": 0.4, "learning_rate": 1.3692612281709556e-05, "loss": 0.7539, "step": 5844 }, { "epoch": 0.4, "learning_rate": 1.3690560928791222e-05, "loss": 0.835, "step": 5845 }, { "epoch": 0.4, "learning_rate": 1.368850939606894e-05, "loss": 0.7314, "step": 5846 }, { "epoch": 0.4, "learning_rate": 1.3686457683642658e-05, "loss": 0.8301, "step": 5847 }, { "epoch": 0.4, "learning_rate": 1.3684405791612338e-05, "loss": 0.8184, "step": 5848 }, { "epoch": 0.4, "learning_rate": 1.3682353720077948e-05, "loss": 0.7764, "step": 5849 }, { "epoch": 0.4, "learning_rate": 1.3680301469139465e-05, "loss": 0.8174, "step": 5850 }, { "epoch": 0.4, "learning_rate": 1.3678249038896874e-05, "loss": 0.749, "step": 5851 }, { "epoch": 0.4, "learning_rate": 1.3676196429450168e-05, "loss": 0.8164, "step": 5852 }, { "epoch": 0.4, "learning_rate": 1.367414364089935e-05, "loss": 0.8799, "step": 5853 }, { "epoch": 0.4, "learning_rate": 1.3672090673344439e-05, "loss": 0.7988, "step": 5854 }, { "epoch": 0.4, "learning_rate": 1.3670037526885443e-05, "loss": 0.7871, "step": 5855 }, { "epoch": 0.4, "learning_rate": 1.36679842016224e-05, "loss": 0.8643, "step": 5856 }, { "epoch": 0.4, "learning_rate": 1.3665930697655347e-05, "loss": 0.873, "step": 5857 }, { "epoch": 0.4, "learning_rate": 1.3663877015084325e-05, "loss": 0.8223, "step": 5858 }, { "epoch": 0.4, "learning_rate": 1.3661823154009397e-05, "loss": 0.8789, "step": 5859 }, { "epoch": 0.4, "learning_rate": 1.3659769114530623e-05, "loss": 0.876, "step": 5860 }, { "epoch": 0.4, "learning_rate": 1.3657714896748075e-05, "loss": 0.8115, "step": 5861 }, { "epoch": 0.4, "learning_rate": 1.3655660500761837e-05, "loss": 0.8184, "step": 5862 }, { "epoch": 0.4, "learning_rate": 1.3653605926672e-05, "loss": 0.79, "step": 5863 }, { "epoch": 0.4, "learning_rate": 1.3651551174578655e-05, "loss": 0.8398, "step": 5864 }, { "epoch": 0.4, "learning_rate": 1.3649496244581918e-05, "loss": 0.8477, "step": 5865 }, { "epoch": 0.4, "learning_rate": 1.36474411367819e-05, "loss": 0.8857, "step": 5866 }, { "epoch": 0.4, "learning_rate": 1.364538585127873e-05, "loss": 0.707, "step": 5867 }, { "epoch": 0.4, "learning_rate": 1.364333038817254e-05, "loss": 0.8135, "step": 5868 }, { "epoch": 0.4, "learning_rate": 1.364127474756347e-05, "loss": 0.8564, "step": 5869 }, { "epoch": 0.4, "learning_rate": 1.3639218929551667e-05, "loss": 0.8252, "step": 5870 }, { "epoch": 0.4, "learning_rate": 1.36371629342373e-05, "loss": 0.7656, "step": 5871 }, { "epoch": 0.4, "learning_rate": 1.3635106761720533e-05, "loss": 0.8604, "step": 5872 }, { "epoch": 0.4, "learning_rate": 1.363305041210154e-05, "loss": 0.8545, "step": 5873 }, { "epoch": 0.4, "learning_rate": 1.3630993885480508e-05, "loss": 0.8877, "step": 5874 }, { "epoch": 0.4, "learning_rate": 1.3628937181957633e-05, "loss": 0.875, "step": 5875 }, { "epoch": 0.4, "learning_rate": 1.3626880301633113e-05, "loss": 0.7178, "step": 5876 }, { "epoch": 0.4, "learning_rate": 1.3624823244607164e-05, "loss": 0.7734, "step": 5877 }, { "epoch": 0.4, "learning_rate": 1.3622766010980005e-05, "loss": 0.8154, "step": 5878 }, { "epoch": 0.4, "learning_rate": 1.3620708600851856e-05, "loss": 0.8174, "step": 5879 }, { "epoch": 0.4, "learning_rate": 1.3618651014322963e-05, "loss": 0.8936, "step": 5880 }, { "epoch": 0.4, "learning_rate": 1.3616593251493572e-05, "loss": 0.7979, "step": 5881 }, { "epoch": 0.4, "learning_rate": 1.361453531246393e-05, "loss": 0.7871, "step": 5882 }, { "epoch": 0.4, "learning_rate": 1.3612477197334309e-05, "loss": 0.8281, "step": 5883 }, { "epoch": 0.4, "learning_rate": 1.3610418906204972e-05, "loss": 0.8066, "step": 5884 }, { "epoch": 0.4, "learning_rate": 1.36083604391762e-05, "loss": 0.8877, "step": 5885 }, { "epoch": 0.4, "learning_rate": 1.360630179634829e-05, "loss": 0.7607, "step": 5886 }, { "epoch": 0.4, "learning_rate": 1.3604242977821522e-05, "loss": 0.9248, "step": 5887 }, { "epoch": 0.4, "learning_rate": 1.360218398369622e-05, "loss": 0.8174, "step": 5888 }, { "epoch": 0.4, "learning_rate": 1.360012481407269e-05, "loss": 0.8604, "step": 5889 }, { "epoch": 0.4, "learning_rate": 1.359806546905125e-05, "loss": 0.8164, "step": 5890 }, { "epoch": 0.4, "learning_rate": 1.3596005948732241e-05, "loss": 0.8242, "step": 5891 }, { "epoch": 0.4, "learning_rate": 1.3593946253215993e-05, "loss": 0.8281, "step": 5892 }, { "epoch": 0.4, "learning_rate": 1.3591886382602859e-05, "loss": 0.8154, "step": 5893 }, { "epoch": 0.4, "learning_rate": 1.35898263369932e-05, "loss": 0.6982, "step": 5894 }, { "epoch": 0.4, "learning_rate": 1.3587766116487374e-05, "loss": 0.8418, "step": 5895 }, { "epoch": 0.4, "learning_rate": 1.3585705721185755e-05, "loss": 0.7715, "step": 5896 }, { "epoch": 0.4, "learning_rate": 1.3583645151188731e-05, "loss": 0.8506, "step": 5897 }, { "epoch": 0.4, "learning_rate": 1.3581584406596692e-05, "loss": 0.8115, "step": 5898 }, { "epoch": 0.4, "learning_rate": 1.3579523487510034e-05, "loss": 0.8525, "step": 5899 }, { "epoch": 0.4, "learning_rate": 1.3577462394029164e-05, "loss": 0.8066, "step": 5900 }, { "epoch": 0.4, "learning_rate": 1.3575401126254504e-05, "loss": 0.8584, "step": 5901 }, { "epoch": 0.4, "learning_rate": 1.3573339684286472e-05, "loss": 0.8096, "step": 5902 }, { "epoch": 0.4, "learning_rate": 1.3571278068225507e-05, "loss": 0.8594, "step": 5903 }, { "epoch": 0.4, "learning_rate": 1.3569216278172048e-05, "loss": 0.8154, "step": 5904 }, { "epoch": 0.4, "learning_rate": 1.3567154314226545e-05, "loss": 0.8711, "step": 5905 }, { "epoch": 0.4, "learning_rate": 1.356509217648946e-05, "loss": 0.7695, "step": 5906 }, { "epoch": 0.4, "learning_rate": 1.3563029865061259e-05, "loss": 0.8301, "step": 5907 }, { "epoch": 0.4, "learning_rate": 1.3560967380042414e-05, "loss": 0.8037, "step": 5908 }, { "epoch": 0.4, "learning_rate": 1.3558904721533413e-05, "loss": 0.8701, "step": 5909 }, { "epoch": 0.4, "learning_rate": 1.3556841889634746e-05, "loss": 0.8447, "step": 5910 }, { "epoch": 0.4, "learning_rate": 1.3554778884446917e-05, "loss": 0.8848, "step": 5911 }, { "epoch": 0.4, "learning_rate": 1.3552715706070433e-05, "loss": 0.9111, "step": 5912 }, { "epoch": 0.4, "learning_rate": 1.3550652354605816e-05, "loss": 0.8525, "step": 5913 }, { "epoch": 0.4, "learning_rate": 1.3548588830153586e-05, "loss": 0.8271, "step": 5914 }, { "epoch": 0.4, "learning_rate": 1.3546525132814281e-05, "loss": 0.7295, "step": 5915 }, { "epoch": 0.4, "learning_rate": 1.3544461262688448e-05, "loss": 0.7715, "step": 5916 }, { "epoch": 0.4, "learning_rate": 1.3542397219876634e-05, "loss": 0.8115, "step": 5917 }, { "epoch": 0.4, "learning_rate": 1.3540333004479398e-05, "loss": 0.7969, "step": 5918 }, { "epoch": 0.4, "learning_rate": 1.3538268616597315e-05, "loss": 0.8223, "step": 5919 }, { "epoch": 0.4, "learning_rate": 1.3536204056330952e-05, "loss": 0.8887, "step": 5920 }, { "epoch": 0.4, "learning_rate": 1.3534139323780902e-05, "loss": 0.8154, "step": 5921 }, { "epoch": 0.4, "learning_rate": 1.3532074419047757e-05, "loss": 0.791, "step": 5922 }, { "epoch": 0.4, "learning_rate": 1.3530009342232118e-05, "loss": 0.7979, "step": 5923 }, { "epoch": 0.4, "learning_rate": 1.3527944093434597e-05, "loss": 0.8594, "step": 5924 }, { "epoch": 0.4, "learning_rate": 1.3525878672755815e-05, "loss": 0.8652, "step": 5925 }, { "epoch": 0.4, "learning_rate": 1.3523813080296389e-05, "loss": 0.8086, "step": 5926 }, { "epoch": 0.4, "learning_rate": 1.3521747316156965e-05, "loss": 0.709, "step": 5927 }, { "epoch": 0.4, "learning_rate": 1.3519681380438184e-05, "loss": 0.8398, "step": 5928 }, { "epoch": 0.4, "learning_rate": 1.3517615273240696e-05, "loss": 0.8369, "step": 5929 }, { "epoch": 0.4, "learning_rate": 1.3515548994665167e-05, "loss": 0.7549, "step": 5930 }, { "epoch": 0.4, "learning_rate": 1.3513482544812257e-05, "loss": 0.9287, "step": 5931 }, { "epoch": 0.4, "learning_rate": 1.3511415923782654e-05, "loss": 0.8457, "step": 5932 }, { "epoch": 0.4, "learning_rate": 1.3509349131677037e-05, "loss": 0.8057, "step": 5933 }, { "epoch": 0.4, "learning_rate": 1.35072821685961e-05, "loss": 0.8037, "step": 5934 }, { "epoch": 0.4, "learning_rate": 1.3505215034640546e-05, "loss": 0.8613, "step": 5935 }, { "epoch": 0.4, "learning_rate": 1.3503147729911087e-05, "loss": 0.7949, "step": 5936 }, { "epoch": 0.4, "learning_rate": 1.3501080254508446e-05, "loss": 0.8398, "step": 5937 }, { "epoch": 0.4, "learning_rate": 1.3499012608533342e-05, "loss": 0.8379, "step": 5938 }, { "epoch": 0.4, "learning_rate": 1.3496944792086513e-05, "loss": 0.8398, "step": 5939 }, { "epoch": 0.4, "learning_rate": 1.3494876805268707e-05, "loss": 0.8584, "step": 5940 }, { "epoch": 0.4, "learning_rate": 1.349280864818067e-05, "loss": 0.7998, "step": 5941 }, { "epoch": 0.4, "learning_rate": 1.3490740320923168e-05, "loss": 0.835, "step": 5942 }, { "epoch": 0.41, "learning_rate": 1.3488671823596971e-05, "loss": 0.8252, "step": 5943 }, { "epoch": 0.41, "learning_rate": 1.3486603156302846e-05, "loss": 0.7949, "step": 5944 }, { "epoch": 0.41, "learning_rate": 1.3484534319141592e-05, "loss": 0.8027, "step": 5945 }, { "epoch": 0.41, "learning_rate": 1.348246531221399e-05, "loss": 0.7295, "step": 5946 }, { "epoch": 0.41, "learning_rate": 1.3480396135620852e-05, "loss": 0.8164, "step": 5947 }, { "epoch": 0.41, "learning_rate": 1.3478326789462983e-05, "loss": 0.7637, "step": 5948 }, { "epoch": 0.41, "learning_rate": 1.3476257273841202e-05, "loss": 0.8037, "step": 5949 }, { "epoch": 0.41, "learning_rate": 1.3474187588856338e-05, "loss": 0.7705, "step": 5950 }, { "epoch": 0.41, "learning_rate": 1.3472117734609223e-05, "loss": 0.791, "step": 5951 }, { "epoch": 0.41, "learning_rate": 1.34700477112007e-05, "loss": 0.7871, "step": 5952 }, { "epoch": 0.41, "learning_rate": 1.3467977518731621e-05, "loss": 0.8408, "step": 5953 }, { "epoch": 0.41, "learning_rate": 1.346590715730285e-05, "loss": 0.8232, "step": 5954 }, { "epoch": 0.41, "learning_rate": 1.346383662701525e-05, "loss": 0.8672, "step": 5955 }, { "epoch": 0.41, "learning_rate": 1.3461765927969696e-05, "loss": 0.7588, "step": 5956 }, { "epoch": 0.41, "learning_rate": 1.3459695060267076e-05, "loss": 0.8477, "step": 5957 }, { "epoch": 0.41, "learning_rate": 1.3457624024008285e-05, "loss": 0.835, "step": 5958 }, { "epoch": 0.41, "learning_rate": 1.3455552819294213e-05, "loss": 0.8242, "step": 5959 }, { "epoch": 0.41, "learning_rate": 1.3453481446225782e-05, "loss": 0.7646, "step": 5960 }, { "epoch": 0.41, "learning_rate": 1.3451409904903903e-05, "loss": 0.8379, "step": 5961 }, { "epoch": 0.41, "learning_rate": 1.3449338195429497e-05, "loss": 0.832, "step": 5962 }, { "epoch": 0.41, "learning_rate": 1.344726631790351e-05, "loss": 0.8662, "step": 5963 }, { "epoch": 0.41, "learning_rate": 1.344519427242687e-05, "loss": 0.7549, "step": 5964 }, { "epoch": 0.41, "learning_rate": 1.3443122059100533e-05, "loss": 0.8379, "step": 5965 }, { "epoch": 0.41, "learning_rate": 1.3441049678025459e-05, "loss": 0.832, "step": 5966 }, { "epoch": 0.41, "learning_rate": 1.3438977129302613e-05, "loss": 0.8428, "step": 5967 }, { "epoch": 0.41, "learning_rate": 1.3436904413032968e-05, "loss": 0.8447, "step": 5968 }, { "epoch": 0.41, "learning_rate": 1.343483152931751e-05, "loss": 0.8086, "step": 5969 }, { "epoch": 0.41, "learning_rate": 1.3432758478257224e-05, "loss": 0.7168, "step": 5970 }, { "epoch": 0.41, "learning_rate": 1.3430685259953113e-05, "loss": 0.8164, "step": 5971 }, { "epoch": 0.41, "learning_rate": 1.3428611874506185e-05, "loss": 0.8262, "step": 5972 }, { "epoch": 0.41, "learning_rate": 1.3426538322017456e-05, "loss": 0.8047, "step": 5973 }, { "epoch": 0.41, "learning_rate": 1.3424464602587941e-05, "loss": 0.7617, "step": 5974 }, { "epoch": 0.41, "learning_rate": 1.342239071631868e-05, "loss": 0.8008, "step": 5975 }, { "epoch": 0.41, "learning_rate": 1.3420316663310713e-05, "loss": 0.8145, "step": 5976 }, { "epoch": 0.41, "learning_rate": 1.3418242443665081e-05, "loss": 0.8193, "step": 5977 }, { "epoch": 0.41, "learning_rate": 1.3416168057482845e-05, "loss": 0.7832, "step": 5978 }, { "epoch": 0.41, "learning_rate": 1.341409350486507e-05, "loss": 0.8398, "step": 5979 }, { "epoch": 0.41, "learning_rate": 1.3412018785912824e-05, "loss": 0.8193, "step": 5980 }, { "epoch": 0.41, "learning_rate": 1.3409943900727189e-05, "loss": 0.8438, "step": 5981 }, { "epoch": 0.41, "learning_rate": 1.3407868849409254e-05, "loss": 0.8682, "step": 5982 }, { "epoch": 0.41, "learning_rate": 1.3405793632060114e-05, "loss": 0.9561, "step": 5983 }, { "epoch": 0.41, "learning_rate": 1.3403718248780877e-05, "loss": 0.7656, "step": 5984 }, { "epoch": 0.41, "learning_rate": 1.340164269967265e-05, "loss": 0.8379, "step": 5985 }, { "epoch": 0.41, "learning_rate": 1.3399566984836558e-05, "loss": 0.8535, "step": 5986 }, { "epoch": 0.41, "learning_rate": 1.339749110437373e-05, "loss": 0.8232, "step": 5987 }, { "epoch": 0.41, "learning_rate": 1.3395415058385297e-05, "loss": 0.8721, "step": 5988 }, { "epoch": 0.41, "learning_rate": 1.3393338846972408e-05, "loss": 0.7783, "step": 5989 }, { "epoch": 0.41, "learning_rate": 1.3391262470236218e-05, "loss": 0.8311, "step": 5990 }, { "epoch": 0.41, "learning_rate": 1.3389185928277887e-05, "loss": 0.8252, "step": 5991 }, { "epoch": 0.41, "learning_rate": 1.3387109221198582e-05, "loss": 0.9033, "step": 5992 }, { "epoch": 0.41, "learning_rate": 1.3385032349099478e-05, "loss": 0.7959, "step": 5993 }, { "epoch": 0.41, "learning_rate": 1.3382955312081767e-05, "loss": 0.8008, "step": 5994 }, { "epoch": 0.41, "learning_rate": 1.3380878110246638e-05, "loss": 0.8623, "step": 5995 }, { "epoch": 0.41, "learning_rate": 1.337880074369529e-05, "loss": 0.832, "step": 5996 }, { "epoch": 0.41, "learning_rate": 1.3376723212528937e-05, "loss": 0.9004, "step": 5997 }, { "epoch": 0.41, "learning_rate": 1.337464551684879e-05, "loss": 0.7686, "step": 5998 }, { "epoch": 0.41, "learning_rate": 1.3372567656756079e-05, "loss": 0.8418, "step": 5999 }, { "epoch": 0.41, "learning_rate": 1.3370489632352037e-05, "loss": 0.8496, "step": 6000 }, { "epoch": 0.41, "learning_rate": 1.3368411443737905e-05, "loss": 0.8037, "step": 6001 }, { "epoch": 0.41, "learning_rate": 1.3366333091014933e-05, "loss": 0.7656, "step": 6002 }, { "epoch": 0.41, "learning_rate": 1.3364254574284377e-05, "loss": 0.9033, "step": 6003 }, { "epoch": 0.41, "learning_rate": 1.33621758936475e-05, "loss": 0.8096, "step": 6004 }, { "epoch": 0.41, "learning_rate": 1.3360097049205578e-05, "loss": 0.8232, "step": 6005 }, { "epoch": 0.41, "learning_rate": 1.335801804105989e-05, "loss": 0.7744, "step": 6006 }, { "epoch": 0.41, "learning_rate": 1.3355938869311729e-05, "loss": 0.8301, "step": 6007 }, { "epoch": 0.41, "learning_rate": 1.335385953406239e-05, "loss": 0.7969, "step": 6008 }, { "epoch": 0.41, "learning_rate": 1.3351780035413175e-05, "loss": 0.7832, "step": 6009 }, { "epoch": 0.41, "learning_rate": 1.3349700373465405e-05, "loss": 0.7734, "step": 6010 }, { "epoch": 0.41, "learning_rate": 1.3347620548320394e-05, "loss": 0.8369, "step": 6011 }, { "epoch": 0.41, "learning_rate": 1.3345540560079473e-05, "loss": 0.8389, "step": 6012 }, { "epoch": 0.41, "learning_rate": 1.334346040884398e-05, "loss": 0.9023, "step": 6013 }, { "epoch": 0.41, "learning_rate": 1.3341380094715257e-05, "loss": 0.9023, "step": 6014 }, { "epoch": 0.41, "learning_rate": 1.333929961779466e-05, "loss": 0.8652, "step": 6015 }, { "epoch": 0.41, "learning_rate": 1.3337218978183549e-05, "loss": 0.8252, "step": 6016 }, { "epoch": 0.41, "learning_rate": 1.3335138175983291e-05, "loss": 0.8584, "step": 6017 }, { "epoch": 0.41, "learning_rate": 1.3333057211295264e-05, "loss": 0.791, "step": 6018 }, { "epoch": 0.41, "learning_rate": 1.3330976084220853e-05, "loss": 0.7588, "step": 6019 }, { "epoch": 0.41, "learning_rate": 1.332889479486145e-05, "loss": 0.7637, "step": 6020 }, { "epoch": 0.41, "learning_rate": 1.3326813343318452e-05, "loss": 0.8555, "step": 6021 }, { "epoch": 0.41, "learning_rate": 1.3324731729693273e-05, "loss": 0.7568, "step": 6022 }, { "epoch": 0.41, "learning_rate": 1.3322649954087325e-05, "loss": 0.8467, "step": 6023 }, { "epoch": 0.41, "learning_rate": 1.3320568016602032e-05, "loss": 0.791, "step": 6024 }, { "epoch": 0.41, "learning_rate": 1.3318485917338829e-05, "loss": 0.7207, "step": 6025 }, { "epoch": 0.41, "learning_rate": 1.3316403656399153e-05, "loss": 0.8262, "step": 6026 }, { "epoch": 0.41, "learning_rate": 1.3314321233884453e-05, "loss": 0.9053, "step": 6027 }, { "epoch": 0.41, "learning_rate": 1.3312238649896185e-05, "loss": 0.8525, "step": 6028 }, { "epoch": 0.41, "learning_rate": 1.331015590453581e-05, "loss": 0.8076, "step": 6029 }, { "epoch": 0.41, "learning_rate": 1.3308072997904801e-05, "loss": 0.8076, "step": 6030 }, { "epoch": 0.41, "learning_rate": 1.3305989930104639e-05, "loss": 0.8477, "step": 6031 }, { "epoch": 0.41, "learning_rate": 1.3303906701236808e-05, "loss": 0.9062, "step": 6032 }, { "epoch": 0.41, "learning_rate": 1.3301823311402801e-05, "loss": 0.8242, "step": 6033 }, { "epoch": 0.41, "learning_rate": 1.3299739760704124e-05, "loss": 0.9326, "step": 6034 }, { "epoch": 0.41, "learning_rate": 1.3297656049242292e-05, "loss": 0.8496, "step": 6035 }, { "epoch": 0.41, "learning_rate": 1.3295572177118815e-05, "loss": 0.7969, "step": 6036 }, { "epoch": 0.41, "learning_rate": 1.3293488144435217e-05, "loss": 0.835, "step": 6037 }, { "epoch": 0.41, "learning_rate": 1.3291403951293045e-05, "loss": 0.7959, "step": 6038 }, { "epoch": 0.41, "learning_rate": 1.3289319597793828e-05, "loss": 0.7256, "step": 6039 }, { "epoch": 0.41, "learning_rate": 1.3287235084039122e-05, "loss": 0.7959, "step": 6040 }, { "epoch": 0.41, "learning_rate": 1.3285150410130484e-05, "loss": 0.8877, "step": 6041 }, { "epoch": 0.41, "learning_rate": 1.3283065576169476e-05, "loss": 0.7988, "step": 6042 }, { "epoch": 0.41, "learning_rate": 1.3280980582257677e-05, "loss": 0.8037, "step": 6043 }, { "epoch": 0.41, "learning_rate": 1.327889542849666e-05, "loss": 0.7998, "step": 6044 }, { "epoch": 0.41, "learning_rate": 1.327681011498802e-05, "loss": 0.8174, "step": 6045 }, { "epoch": 0.41, "learning_rate": 1.327472464183335e-05, "loss": 0.877, "step": 6046 }, { "epoch": 0.41, "learning_rate": 1.3272639009134257e-05, "loss": 0.7773, "step": 6047 }, { "epoch": 0.41, "learning_rate": 1.3270553216992346e-05, "loss": 0.8037, "step": 6048 }, { "epoch": 0.41, "learning_rate": 1.3268467265509248e-05, "loss": 0.8037, "step": 6049 }, { "epoch": 0.41, "learning_rate": 1.326638115478658e-05, "loss": 0.8203, "step": 6050 }, { "epoch": 0.41, "learning_rate": 1.3264294884925984e-05, "loss": 0.7744, "step": 6051 }, { "epoch": 0.41, "learning_rate": 1.3262208456029098e-05, "loss": 0.9082, "step": 6052 }, { "epoch": 0.41, "learning_rate": 1.3260121868197578e-05, "loss": 0.874, "step": 6053 }, { "epoch": 0.41, "learning_rate": 1.3258035121533077e-05, "loss": 0.752, "step": 6054 }, { "epoch": 0.41, "learning_rate": 1.3255948216137264e-05, "loss": 0.8184, "step": 6055 }, { "epoch": 0.41, "learning_rate": 1.3253861152111815e-05, "loss": 0.8369, "step": 6056 }, { "epoch": 0.41, "learning_rate": 1.3251773929558407e-05, "loss": 0.8232, "step": 6057 }, { "epoch": 0.41, "learning_rate": 1.3249686548578733e-05, "loss": 0.8574, "step": 6058 }, { "epoch": 0.41, "learning_rate": 1.324759900927449e-05, "loss": 0.7891, "step": 6059 }, { "epoch": 0.41, "learning_rate": 1.3245511311747377e-05, "loss": 0.8564, "step": 6060 }, { "epoch": 0.41, "learning_rate": 1.3243423456099116e-05, "loss": 0.8213, "step": 6061 }, { "epoch": 0.41, "learning_rate": 1.324133544243142e-05, "loss": 0.8125, "step": 6062 }, { "epoch": 0.41, "learning_rate": 1.3239247270846019e-05, "loss": 0.8193, "step": 6063 }, { "epoch": 0.41, "learning_rate": 1.323715894144465e-05, "loss": 0.8877, "step": 6064 }, { "epoch": 0.41, "learning_rate": 1.3235070454329055e-05, "loss": 0.8896, "step": 6065 }, { "epoch": 0.41, "learning_rate": 1.3232981809600984e-05, "loss": 0.8496, "step": 6066 }, { "epoch": 0.41, "learning_rate": 1.32308930073622e-05, "loss": 0.8066, "step": 6067 }, { "epoch": 0.41, "learning_rate": 1.3228804047714462e-05, "loss": 0.7432, "step": 6068 }, { "epoch": 0.41, "learning_rate": 1.3226714930759552e-05, "loss": 0.8408, "step": 6069 }, { "epoch": 0.41, "learning_rate": 1.3224625656599246e-05, "loss": 0.7949, "step": 6070 }, { "epoch": 0.41, "learning_rate": 1.3222536225335336e-05, "loss": 0.8203, "step": 6071 }, { "epoch": 0.41, "learning_rate": 1.322044663706962e-05, "loss": 0.8555, "step": 6072 }, { "epoch": 0.41, "learning_rate": 1.32183568919039e-05, "loss": 0.7998, "step": 6073 }, { "epoch": 0.41, "learning_rate": 1.3216266989939987e-05, "loss": 0.8184, "step": 6074 }, { "epoch": 0.41, "learning_rate": 1.3214176931279704e-05, "loss": 0.752, "step": 6075 }, { "epoch": 0.41, "learning_rate": 1.3212086716024877e-05, "loss": 0.8584, "step": 6076 }, { "epoch": 0.41, "learning_rate": 1.3209996344277346e-05, "loss": 0.875, "step": 6077 }, { "epoch": 0.41, "learning_rate": 1.3207905816138941e-05, "loss": 0.8604, "step": 6078 }, { "epoch": 0.41, "learning_rate": 1.3205815131711529e-05, "loss": 0.8477, "step": 6079 }, { "epoch": 0.41, "learning_rate": 1.3203724291096958e-05, "loss": 0.833, "step": 6080 }, { "epoch": 0.41, "learning_rate": 1.3201633294397093e-05, "loss": 0.8174, "step": 6081 }, { "epoch": 0.41, "learning_rate": 1.3199542141713814e-05, "loss": 0.8389, "step": 6082 }, { "epoch": 0.41, "learning_rate": 1.3197450833148997e-05, "loss": 0.8594, "step": 6083 }, { "epoch": 0.41, "learning_rate": 1.319535936880453e-05, "loss": 0.9385, "step": 6084 }, { "epoch": 0.41, "learning_rate": 1.3193267748782312e-05, "loss": 0.8008, "step": 6085 }, { "epoch": 0.41, "learning_rate": 1.3191175973184242e-05, "loss": 0.8691, "step": 6086 }, { "epoch": 0.41, "learning_rate": 1.3189084042112237e-05, "loss": 0.8535, "step": 6087 }, { "epoch": 0.41, "learning_rate": 1.318699195566821e-05, "loss": 0.8174, "step": 6088 }, { "epoch": 0.41, "learning_rate": 1.3184899713954095e-05, "loss": 0.7988, "step": 6089 }, { "epoch": 0.42, "learning_rate": 1.3182807317071818e-05, "loss": 0.8076, "step": 6090 }, { "epoch": 0.42, "learning_rate": 1.3180714765123324e-05, "loss": 0.8359, "step": 6091 }, { "epoch": 0.42, "learning_rate": 1.3178622058210564e-05, "loss": 0.7588, "step": 6092 }, { "epoch": 0.42, "learning_rate": 1.317652919643549e-05, "loss": 0.8281, "step": 6093 }, { "epoch": 0.42, "learning_rate": 1.3174436179900068e-05, "loss": 0.7803, "step": 6094 }, { "epoch": 0.42, "learning_rate": 1.3172343008706272e-05, "loss": 0.791, "step": 6095 }, { "epoch": 0.42, "learning_rate": 1.3170249682956078e-05, "loss": 0.8076, "step": 6096 }, { "epoch": 0.42, "learning_rate": 1.3168156202751475e-05, "loss": 0.7715, "step": 6097 }, { "epoch": 0.42, "learning_rate": 1.3166062568194458e-05, "loss": 0.8057, "step": 6098 }, { "epoch": 0.42, "learning_rate": 1.3163968779387021e-05, "loss": 0.7949, "step": 6099 }, { "epoch": 0.42, "learning_rate": 1.3161874836431185e-05, "loss": 0.7871, "step": 6100 }, { "epoch": 0.42, "learning_rate": 1.315978073942896e-05, "loss": 0.8525, "step": 6101 }, { "epoch": 0.42, "learning_rate": 1.3157686488482369e-05, "loss": 0.793, "step": 6102 }, { "epoch": 0.42, "learning_rate": 1.315559208369345e-05, "loss": 0.8291, "step": 6103 }, { "epoch": 0.42, "learning_rate": 1.3153497525164236e-05, "loss": 0.7939, "step": 6104 }, { "epoch": 0.42, "learning_rate": 1.3151402812996778e-05, "loss": 0.8438, "step": 6105 }, { "epoch": 0.42, "learning_rate": 1.3149307947293126e-05, "loss": 0.8076, "step": 6106 }, { "epoch": 0.42, "learning_rate": 1.3147212928155349e-05, "loss": 0.8115, "step": 6107 }, { "epoch": 0.42, "learning_rate": 1.3145117755685508e-05, "loss": 0.834, "step": 6108 }, { "epoch": 0.42, "learning_rate": 1.3143022429985684e-05, "loss": 0.8682, "step": 6109 }, { "epoch": 0.42, "learning_rate": 1.3140926951157961e-05, "loss": 0.7773, "step": 6110 }, { "epoch": 0.42, "learning_rate": 1.3138831319304428e-05, "loss": 0.79, "step": 6111 }, { "epoch": 0.42, "learning_rate": 1.3136735534527187e-05, "loss": 0.8916, "step": 6112 }, { "epoch": 0.42, "learning_rate": 1.3134639596928346e-05, "loss": 0.8066, "step": 6113 }, { "epoch": 0.42, "learning_rate": 1.3132543506610014e-05, "loss": 0.8369, "step": 6114 }, { "epoch": 0.42, "learning_rate": 1.3130447263674317e-05, "loss": 0.8672, "step": 6115 }, { "epoch": 0.42, "learning_rate": 1.3128350868223385e-05, "loss": 0.8711, "step": 6116 }, { "epoch": 0.42, "learning_rate": 1.3126254320359344e-05, "loss": 0.8203, "step": 6117 }, { "epoch": 0.42, "learning_rate": 1.312415762018435e-05, "loss": 0.8438, "step": 6118 }, { "epoch": 0.42, "learning_rate": 1.3122060767800547e-05, "loss": 0.8428, "step": 6119 }, { "epoch": 0.42, "learning_rate": 1.3119963763310095e-05, "loss": 0.8008, "step": 6120 }, { "epoch": 0.42, "learning_rate": 1.3117866606815165e-05, "loss": 0.8701, "step": 6121 }, { "epoch": 0.42, "learning_rate": 1.3115769298417923e-05, "loss": 0.8779, "step": 6122 }, { "epoch": 0.42, "learning_rate": 1.3113671838220552e-05, "loss": 0.7861, "step": 6123 }, { "epoch": 0.42, "learning_rate": 1.311157422632524e-05, "loss": 0.8838, "step": 6124 }, { "epoch": 0.42, "learning_rate": 1.3109476462834186e-05, "loss": 0.9043, "step": 6125 }, { "epoch": 0.42, "learning_rate": 1.310737854784959e-05, "loss": 0.8818, "step": 6126 }, { "epoch": 0.42, "learning_rate": 1.3105280481473661e-05, "loss": 0.7568, "step": 6127 }, { "epoch": 0.42, "learning_rate": 1.3103182263808617e-05, "loss": 0.9395, "step": 6128 }, { "epoch": 0.42, "learning_rate": 1.310108389495669e-05, "loss": 0.7979, "step": 6129 }, { "epoch": 0.42, "learning_rate": 1.3098985375020104e-05, "loss": 0.8789, "step": 6130 }, { "epoch": 0.42, "learning_rate": 1.30968867041011e-05, "loss": 0.8018, "step": 6131 }, { "epoch": 0.42, "learning_rate": 1.3094787882301927e-05, "loss": 0.8984, "step": 6132 }, { "epoch": 0.42, "learning_rate": 1.3092688909724842e-05, "loss": 0.7607, "step": 6133 }, { "epoch": 0.42, "learning_rate": 1.3090589786472104e-05, "loss": 0.8037, "step": 6134 }, { "epoch": 0.42, "learning_rate": 1.3088490512645979e-05, "loss": 0.8984, "step": 6135 }, { "epoch": 0.42, "learning_rate": 1.308639108834875e-05, "loss": 0.917, "step": 6136 }, { "epoch": 0.42, "learning_rate": 1.3084291513682697e-05, "loss": 0.875, "step": 6137 }, { "epoch": 0.42, "learning_rate": 1.308219178875011e-05, "loss": 0.834, "step": 6138 }, { "epoch": 0.42, "learning_rate": 1.3080091913653292e-05, "loss": 0.8711, "step": 6139 }, { "epoch": 0.42, "learning_rate": 1.307799188849454e-05, "loss": 0.7354, "step": 6140 }, { "epoch": 0.42, "learning_rate": 1.3075891713376181e-05, "loss": 0.8457, "step": 6141 }, { "epoch": 0.42, "learning_rate": 1.3073791388400528e-05, "loss": 0.8115, "step": 6142 }, { "epoch": 0.42, "learning_rate": 1.3071690913669902e-05, "loss": 0.8242, "step": 6143 }, { "epoch": 0.42, "learning_rate": 1.306959028928665e-05, "loss": 0.835, "step": 6144 }, { "epoch": 0.42, "learning_rate": 1.3067489515353105e-05, "loss": 0.8301, "step": 6145 }, { "epoch": 0.42, "learning_rate": 1.3065388591971622e-05, "loss": 0.791, "step": 6146 }, { "epoch": 0.42, "learning_rate": 1.3063287519244556e-05, "loss": 0.7617, "step": 6147 }, { "epoch": 0.42, "learning_rate": 1.3061186297274273e-05, "loss": 0.8262, "step": 6148 }, { "epoch": 0.42, "learning_rate": 1.3059084926163141e-05, "loss": 0.8135, "step": 6149 }, { "epoch": 0.42, "learning_rate": 1.3056983406013541e-05, "loss": 0.8887, "step": 6150 }, { "epoch": 0.42, "learning_rate": 1.305488173692786e-05, "loss": 0.8486, "step": 6151 }, { "epoch": 0.42, "learning_rate": 1.3052779919008487e-05, "loss": 0.7656, "step": 6152 }, { "epoch": 0.42, "learning_rate": 1.3050677952357826e-05, "loss": 0.7949, "step": 6153 }, { "epoch": 0.42, "learning_rate": 1.3048575837078286e-05, "loss": 0.8184, "step": 6154 }, { "epoch": 0.42, "learning_rate": 1.3046473573272279e-05, "loss": 0.8984, "step": 6155 }, { "epoch": 0.42, "learning_rate": 1.3044371161042226e-05, "loss": 0.7773, "step": 6156 }, { "epoch": 0.42, "learning_rate": 1.3042268600490562e-05, "loss": 0.8262, "step": 6157 }, { "epoch": 0.42, "learning_rate": 1.3040165891719716e-05, "loss": 0.8818, "step": 6158 }, { "epoch": 0.42, "learning_rate": 1.303806303483214e-05, "loss": 0.7754, "step": 6159 }, { "epoch": 0.42, "learning_rate": 1.303596002993028e-05, "loss": 0.8828, "step": 6160 }, { "epoch": 0.42, "learning_rate": 1.3033856877116593e-05, "loss": 0.8994, "step": 6161 }, { "epoch": 0.42, "learning_rate": 1.3031753576493549e-05, "loss": 0.7373, "step": 6162 }, { "epoch": 0.42, "learning_rate": 1.3029650128163618e-05, "loss": 0.8477, "step": 6163 }, { "epoch": 0.42, "learning_rate": 1.302754653222928e-05, "loss": 0.8369, "step": 6164 }, { "epoch": 0.42, "learning_rate": 1.3025442788793026e-05, "loss": 0.8398, "step": 6165 }, { "epoch": 0.42, "learning_rate": 1.3023338897957342e-05, "loss": 0.8125, "step": 6166 }, { "epoch": 0.42, "learning_rate": 1.3021234859824737e-05, "loss": 0.8311, "step": 6167 }, { "epoch": 0.42, "learning_rate": 1.3019130674497717e-05, "loss": 0.8262, "step": 6168 }, { "epoch": 0.42, "learning_rate": 1.3017026342078798e-05, "loss": 0.8574, "step": 6169 }, { "epoch": 0.42, "learning_rate": 1.3014921862670499e-05, "loss": 0.8438, "step": 6170 }, { "epoch": 0.42, "learning_rate": 1.3012817236375359e-05, "loss": 0.79, "step": 6171 }, { "epoch": 0.42, "learning_rate": 1.3010712463295909e-05, "loss": 0.8223, "step": 6172 }, { "epoch": 0.42, "learning_rate": 1.3008607543534693e-05, "loss": 0.8525, "step": 6173 }, { "epoch": 0.42, "learning_rate": 1.3006502477194265e-05, "loss": 0.8281, "step": 6174 }, { "epoch": 0.42, "learning_rate": 1.3004397264377184e-05, "loss": 0.8457, "step": 6175 }, { "epoch": 0.42, "learning_rate": 1.300229190518601e-05, "loss": 0.7539, "step": 6176 }, { "epoch": 0.42, "learning_rate": 1.3000186399723326e-05, "loss": 0.8174, "step": 6177 }, { "epoch": 0.42, "learning_rate": 1.2998080748091708e-05, "loss": 0.8447, "step": 6178 }, { "epoch": 0.42, "learning_rate": 1.2995974950393738e-05, "loss": 0.7949, "step": 6179 }, { "epoch": 0.42, "learning_rate": 1.2993869006732016e-05, "loss": 0.874, "step": 6180 }, { "epoch": 0.42, "learning_rate": 1.2991762917209142e-05, "loss": 0.8311, "step": 6181 }, { "epoch": 0.42, "learning_rate": 1.2989656681927723e-05, "loss": 0.8291, "step": 6182 }, { "epoch": 0.42, "learning_rate": 1.2987550300990379e-05, "loss": 0.793, "step": 6183 }, { "epoch": 0.42, "learning_rate": 1.2985443774499729e-05, "loss": 0.8379, "step": 6184 }, { "epoch": 0.42, "learning_rate": 1.2983337102558405e-05, "loss": 0.8379, "step": 6185 }, { "epoch": 0.42, "learning_rate": 1.2981230285269042e-05, "loss": 0.8682, "step": 6186 }, { "epoch": 0.42, "learning_rate": 1.2979123322734283e-05, "loss": 0.75, "step": 6187 }, { "epoch": 0.42, "learning_rate": 1.2977016215056781e-05, "loss": 0.793, "step": 6188 }, { "epoch": 0.42, "learning_rate": 1.2974908962339197e-05, "loss": 0.8564, "step": 6189 }, { "epoch": 0.42, "learning_rate": 1.2972801564684192e-05, "loss": 0.792, "step": 6190 }, { "epoch": 0.42, "learning_rate": 1.2970694022194441e-05, "loss": 0.8799, "step": 6191 }, { "epoch": 0.42, "learning_rate": 1.296858633497262e-05, "loss": 0.8291, "step": 6192 }, { "epoch": 0.42, "learning_rate": 1.296647850312142e-05, "loss": 0.8398, "step": 6193 }, { "epoch": 0.42, "learning_rate": 1.296437052674353e-05, "loss": 0.832, "step": 6194 }, { "epoch": 0.42, "learning_rate": 1.2962262405941652e-05, "loss": 0.8721, "step": 6195 }, { "epoch": 0.42, "learning_rate": 1.2960154140818495e-05, "loss": 0.8408, "step": 6196 }, { "epoch": 0.42, "learning_rate": 1.2958045731476772e-05, "loss": 0.8066, "step": 6197 }, { "epoch": 0.42, "learning_rate": 1.2955937178019207e-05, "loss": 0.8877, "step": 6198 }, { "epoch": 0.42, "learning_rate": 1.2953828480548524e-05, "loss": 0.8613, "step": 6199 }, { "epoch": 0.42, "learning_rate": 1.2951719639167464e-05, "loss": 0.8643, "step": 6200 }, { "epoch": 0.42, "learning_rate": 1.2949610653978768e-05, "loss": 0.9385, "step": 6201 }, { "epoch": 0.42, "learning_rate": 1.2947501525085182e-05, "loss": 0.8555, "step": 6202 }, { "epoch": 0.42, "learning_rate": 1.2945392252589466e-05, "loss": 0.8711, "step": 6203 }, { "epoch": 0.42, "learning_rate": 1.2943282836594384e-05, "loss": 0.8584, "step": 6204 }, { "epoch": 0.42, "learning_rate": 1.2941173277202706e-05, "loss": 0.8184, "step": 6205 }, { "epoch": 0.42, "learning_rate": 1.2939063574517208e-05, "loss": 0.8145, "step": 6206 }, { "epoch": 0.42, "learning_rate": 1.2936953728640675e-05, "loss": 0.8008, "step": 6207 }, { "epoch": 0.42, "learning_rate": 1.2934843739675902e-05, "loss": 0.8213, "step": 6208 }, { "epoch": 0.42, "learning_rate": 1.2932733607725685e-05, "loss": 0.8516, "step": 6209 }, { "epoch": 0.42, "learning_rate": 1.293062333289283e-05, "loss": 0.7861, "step": 6210 }, { "epoch": 0.42, "learning_rate": 1.292851291528015e-05, "loss": 0.834, "step": 6211 }, { "epoch": 0.42, "learning_rate": 1.2926402354990459e-05, "loss": 0.8193, "step": 6212 }, { "epoch": 0.42, "learning_rate": 1.292429165212659e-05, "loss": 0.835, "step": 6213 }, { "epoch": 0.42, "learning_rate": 1.2922180806791378e-05, "loss": 0.8916, "step": 6214 }, { "epoch": 0.42, "learning_rate": 1.2920069819087654e-05, "loss": 0.832, "step": 6215 }, { "epoch": 0.42, "learning_rate": 1.2917958689118275e-05, "loss": 0.8467, "step": 6216 }, { "epoch": 0.42, "learning_rate": 1.2915847416986086e-05, "loss": 0.834, "step": 6217 }, { "epoch": 0.42, "learning_rate": 1.2913736002793957e-05, "loss": 0.7627, "step": 6218 }, { "epoch": 0.42, "learning_rate": 1.2911624446644753e-05, "loss": 0.8389, "step": 6219 }, { "epoch": 0.42, "learning_rate": 1.2909512748641346e-05, "loss": 0.7881, "step": 6220 }, { "epoch": 0.42, "learning_rate": 1.290740090888662e-05, "loss": 0.7637, "step": 6221 }, { "epoch": 0.42, "learning_rate": 1.2905288927483466e-05, "loss": 0.8281, "step": 6222 }, { "epoch": 0.42, "learning_rate": 1.2903176804534773e-05, "loss": 0.8291, "step": 6223 }, { "epoch": 0.42, "learning_rate": 1.2901064540143448e-05, "loss": 0.8008, "step": 6224 }, { "epoch": 0.42, "learning_rate": 1.2898952134412404e-05, "loss": 0.877, "step": 6225 }, { "epoch": 0.42, "learning_rate": 1.2896839587444552e-05, "loss": 0.8379, "step": 6226 }, { "epoch": 0.42, "learning_rate": 1.2894726899342814e-05, "loss": 0.8662, "step": 6227 }, { "epoch": 0.42, "learning_rate": 1.2892614070210123e-05, "loss": 0.8779, "step": 6228 }, { "epoch": 0.42, "learning_rate": 1.2890501100149417e-05, "loss": 0.8086, "step": 6229 }, { "epoch": 0.42, "learning_rate": 1.288838798926364e-05, "loss": 0.8525, "step": 6230 }, { "epoch": 0.42, "learning_rate": 1.2886274737655738e-05, "loss": 0.7393, "step": 6231 }, { "epoch": 0.42, "learning_rate": 1.2884161345428673e-05, "loss": 0.9102, "step": 6232 }, { "epoch": 0.42, "learning_rate": 1.2882047812685405e-05, "loss": 0.7295, "step": 6233 }, { "epoch": 0.42, "learning_rate": 1.2879934139528913e-05, "loss": 0.8672, "step": 6234 }, { "epoch": 0.42, "learning_rate": 1.2877820326062167e-05, "loss": 0.7871, "step": 6235 }, { "epoch": 0.42, "learning_rate": 1.2875706372388155e-05, "loss": 0.7627, "step": 6236 }, { "epoch": 0.43, "learning_rate": 1.2873592278609871e-05, "loss": 0.8652, "step": 6237 }, { "epoch": 0.43, "learning_rate": 1.287147804483031e-05, "loss": 0.8398, "step": 6238 }, { "epoch": 0.43, "learning_rate": 1.2869363671152478e-05, "loss": 0.8252, "step": 6239 }, { "epoch": 0.43, "learning_rate": 1.286724915767939e-05, "loss": 0.7832, "step": 6240 }, { "epoch": 0.43, "learning_rate": 1.2865134504514061e-05, "loss": 0.835, "step": 6241 }, { "epoch": 0.43, "learning_rate": 1.286301971175952e-05, "loss": 0.6895, "step": 6242 }, { "epoch": 0.43, "learning_rate": 1.2860904779518795e-05, "loss": 0.8359, "step": 6243 }, { "epoch": 0.43, "learning_rate": 1.2858789707894929e-05, "loss": 0.7803, "step": 6244 }, { "epoch": 0.43, "learning_rate": 1.2856674496990973e-05, "loss": 0.8281, "step": 6245 }, { "epoch": 0.43, "learning_rate": 1.285455914690997e-05, "loss": 0.8174, "step": 6246 }, { "epoch": 0.43, "learning_rate": 1.2852443657754987e-05, "loss": 0.9365, "step": 6247 }, { "epoch": 0.43, "learning_rate": 1.2850328029629088e-05, "loss": 0.79, "step": 6248 }, { "epoch": 0.43, "learning_rate": 1.2848212262635347e-05, "loss": 0.8184, "step": 6249 }, { "epoch": 0.43, "learning_rate": 1.284609635687684e-05, "loss": 0.8594, "step": 6250 }, { "epoch": 0.43, "learning_rate": 1.2843980312456659e-05, "loss": 0.7656, "step": 6251 }, { "epoch": 0.43, "learning_rate": 1.2841864129477898e-05, "loss": 0.8145, "step": 6252 }, { "epoch": 0.43, "learning_rate": 1.2839747808043652e-05, "loss": 0.9189, "step": 6253 }, { "epoch": 0.43, "learning_rate": 1.2837631348257034e-05, "loss": 0.8242, "step": 6254 }, { "epoch": 0.43, "learning_rate": 1.2835514750221155e-05, "loss": 0.832, "step": 6255 }, { "epoch": 0.43, "learning_rate": 1.2833398014039133e-05, "loss": 0.8213, "step": 6256 }, { "epoch": 0.43, "learning_rate": 1.2831281139814098e-05, "loss": 0.7734, "step": 6257 }, { "epoch": 0.43, "learning_rate": 1.2829164127649189e-05, "loss": 0.7734, "step": 6258 }, { "epoch": 0.43, "learning_rate": 1.2827046977647535e-05, "loss": 0.8389, "step": 6259 }, { "epoch": 0.43, "learning_rate": 1.2824929689912295e-05, "loss": 0.7998, "step": 6260 }, { "epoch": 0.43, "learning_rate": 1.2822812264546616e-05, "loss": 0.8584, "step": 6261 }, { "epoch": 0.43, "learning_rate": 1.282069470165366e-05, "loss": 0.7646, "step": 6262 }, { "epoch": 0.43, "learning_rate": 1.2818577001336598e-05, "loss": 0.7646, "step": 6263 }, { "epoch": 0.43, "learning_rate": 1.2816459163698602e-05, "loss": 0.8213, "step": 6264 }, { "epoch": 0.43, "learning_rate": 1.2814341188842852e-05, "loss": 0.9482, "step": 6265 }, { "epoch": 0.43, "learning_rate": 1.2812223076872536e-05, "loss": 0.7842, "step": 6266 }, { "epoch": 0.43, "learning_rate": 1.281010482789085e-05, "loss": 0.8809, "step": 6267 }, { "epoch": 0.43, "learning_rate": 1.2807986442000992e-05, "loss": 0.7793, "step": 6268 }, { "epoch": 0.43, "learning_rate": 1.2805867919306174e-05, "loss": 0.7949, "step": 6269 }, { "epoch": 0.43, "learning_rate": 1.2803749259909608e-05, "loss": 0.7676, "step": 6270 }, { "epoch": 0.43, "learning_rate": 1.2801630463914512e-05, "loss": 0.9121, "step": 6271 }, { "epoch": 0.43, "learning_rate": 1.2799511531424117e-05, "loss": 0.8047, "step": 6272 }, { "epoch": 0.43, "learning_rate": 1.279739246254166e-05, "loss": 0.8076, "step": 6273 }, { "epoch": 0.43, "learning_rate": 1.2795273257370375e-05, "loss": 0.9219, "step": 6274 }, { "epoch": 0.43, "learning_rate": 1.2793153916013514e-05, "loss": 0.8525, "step": 6275 }, { "epoch": 0.43, "learning_rate": 1.2791034438574332e-05, "loss": 0.8418, "step": 6276 }, { "epoch": 0.43, "learning_rate": 1.2788914825156084e-05, "loss": 0.8027, "step": 6277 }, { "epoch": 0.43, "learning_rate": 1.2786795075862047e-05, "loss": 0.8584, "step": 6278 }, { "epoch": 0.43, "learning_rate": 1.2784675190795487e-05, "loss": 0.8389, "step": 6279 }, { "epoch": 0.43, "learning_rate": 1.2782555170059688e-05, "loss": 0.7393, "step": 6280 }, { "epoch": 0.43, "learning_rate": 1.2780435013757937e-05, "loss": 0.8115, "step": 6281 }, { "epoch": 0.43, "learning_rate": 1.2778314721993528e-05, "loss": 0.8926, "step": 6282 }, { "epoch": 0.43, "learning_rate": 1.2776194294869758e-05, "loss": 0.832, "step": 6283 }, { "epoch": 0.43, "learning_rate": 1.2774073732489945e-05, "loss": 0.8066, "step": 6284 }, { "epoch": 0.43, "learning_rate": 1.2771953034957389e-05, "loss": 0.8027, "step": 6285 }, { "epoch": 0.43, "learning_rate": 1.2769832202375416e-05, "loss": 0.8145, "step": 6286 }, { "epoch": 0.43, "learning_rate": 1.2767711234847355e-05, "loss": 0.8223, "step": 6287 }, { "epoch": 0.43, "learning_rate": 1.276559013247654e-05, "loss": 0.7988, "step": 6288 }, { "epoch": 0.43, "learning_rate": 1.2763468895366304e-05, "loss": 0.8936, "step": 6289 }, { "epoch": 0.43, "learning_rate": 1.276134752362e-05, "loss": 0.7578, "step": 6290 }, { "epoch": 0.43, "learning_rate": 1.2759226017340983e-05, "loss": 0.8965, "step": 6291 }, { "epoch": 0.43, "learning_rate": 1.2757104376632603e-05, "loss": 0.8975, "step": 6292 }, { "epoch": 0.43, "learning_rate": 1.2754982601598234e-05, "loss": 0.8438, "step": 6293 }, { "epoch": 0.43, "learning_rate": 1.275286069234125e-05, "loss": 0.8066, "step": 6294 }, { "epoch": 0.43, "learning_rate": 1.2750738648965021e-05, "loss": 0.8115, "step": 6295 }, { "epoch": 0.43, "learning_rate": 1.2748616471572946e-05, "loss": 0.7793, "step": 6296 }, { "epoch": 0.43, "learning_rate": 1.2746494160268406e-05, "loss": 0.8066, "step": 6297 }, { "epoch": 0.43, "learning_rate": 1.2744371715154807e-05, "loss": 0.8438, "step": 6298 }, { "epoch": 0.43, "learning_rate": 1.2742249136335552e-05, "loss": 0.793, "step": 6299 }, { "epoch": 0.43, "learning_rate": 1.274012642391405e-05, "loss": 0.7861, "step": 6300 }, { "epoch": 0.43, "learning_rate": 1.2738003577993725e-05, "loss": 0.9014, "step": 6301 }, { "epoch": 0.43, "learning_rate": 1.2735880598678e-05, "loss": 0.8076, "step": 6302 }, { "epoch": 0.43, "learning_rate": 1.2733757486070301e-05, "loss": 0.8096, "step": 6303 }, { "epoch": 0.43, "learning_rate": 1.2731634240274074e-05, "loss": 0.8447, "step": 6304 }, { "epoch": 0.43, "learning_rate": 1.272951086139276e-05, "loss": 0.8369, "step": 6305 }, { "epoch": 0.43, "learning_rate": 1.272738734952981e-05, "loss": 0.7646, "step": 6306 }, { "epoch": 0.43, "learning_rate": 1.2725263704788682e-05, "loss": 0.8096, "step": 6307 }, { "epoch": 0.43, "learning_rate": 1.2723139927272836e-05, "loss": 0.8096, "step": 6308 }, { "epoch": 0.43, "learning_rate": 1.272101601708575e-05, "loss": 0.8203, "step": 6309 }, { "epoch": 0.43, "learning_rate": 1.2718891974330893e-05, "loss": 0.8057, "step": 6310 }, { "epoch": 0.43, "learning_rate": 1.2716767799111751e-05, "loss": 0.8018, "step": 6311 }, { "epoch": 0.43, "learning_rate": 1.2714643491531818e-05, "loss": 0.8555, "step": 6312 }, { "epoch": 0.43, "learning_rate": 1.2712519051694581e-05, "loss": 0.8525, "step": 6313 }, { "epoch": 0.43, "learning_rate": 1.2710394479703553e-05, "loss": 0.8818, "step": 6314 }, { "epoch": 0.43, "learning_rate": 1.270826977566224e-05, "loss": 0.8486, "step": 6315 }, { "epoch": 0.43, "learning_rate": 1.2706144939674147e-05, "loss": 0.7529, "step": 6316 }, { "epoch": 0.43, "learning_rate": 1.2704019971842811e-05, "loss": 0.8857, "step": 6317 }, { "epoch": 0.43, "learning_rate": 1.2701894872271754e-05, "loss": 0.6592, "step": 6318 }, { "epoch": 0.43, "learning_rate": 1.2699769641064508e-05, "loss": 0.7842, "step": 6319 }, { "epoch": 0.43, "learning_rate": 1.2697644278324619e-05, "loss": 0.8154, "step": 6320 }, { "epoch": 0.43, "learning_rate": 1.269551878415563e-05, "loss": 0.8076, "step": 6321 }, { "epoch": 0.43, "learning_rate": 1.2693393158661098e-05, "loss": 0.7578, "step": 6322 }, { "epoch": 0.43, "learning_rate": 1.2691267401944582e-05, "loss": 0.8252, "step": 6323 }, { "epoch": 0.43, "learning_rate": 1.2689141514109653e-05, "loss": 0.791, "step": 6324 }, { "epoch": 0.43, "learning_rate": 1.2687015495259878e-05, "loss": 0.8896, "step": 6325 }, { "epoch": 0.43, "learning_rate": 1.2684889345498838e-05, "loss": 0.8652, "step": 6326 }, { "epoch": 0.43, "learning_rate": 1.268276306493012e-05, "loss": 0.8057, "step": 6327 }, { "epoch": 0.43, "learning_rate": 1.268063665365732e-05, "loss": 0.8721, "step": 6328 }, { "epoch": 0.43, "learning_rate": 1.267851011178403e-05, "loss": 0.8721, "step": 6329 }, { "epoch": 0.43, "learning_rate": 1.267638343941386e-05, "loss": 0.8018, "step": 6330 }, { "epoch": 0.43, "learning_rate": 1.2674256636650415e-05, "loss": 0.8984, "step": 6331 }, { "epoch": 0.43, "learning_rate": 1.2672129703597321e-05, "loss": 0.9033, "step": 6332 }, { "epoch": 0.43, "learning_rate": 1.2670002640358198e-05, "loss": 0.8496, "step": 6333 }, { "epoch": 0.43, "learning_rate": 1.2667875447036672e-05, "loss": 0.8369, "step": 6334 }, { "epoch": 0.43, "learning_rate": 1.266574812373639e-05, "loss": 0.8066, "step": 6335 }, { "epoch": 0.43, "learning_rate": 1.2663620670560988e-05, "loss": 0.7158, "step": 6336 }, { "epoch": 0.43, "learning_rate": 1.2661493087614117e-05, "loss": 0.8164, "step": 6337 }, { "epoch": 0.43, "learning_rate": 1.2659365374999433e-05, "loss": 0.835, "step": 6338 }, { "epoch": 0.43, "learning_rate": 1.2657237532820594e-05, "loss": 0.8242, "step": 6339 }, { "epoch": 0.43, "learning_rate": 1.2655109561181274e-05, "loss": 0.9014, "step": 6340 }, { "epoch": 0.43, "learning_rate": 1.2652981460185147e-05, "loss": 0.8135, "step": 6341 }, { "epoch": 0.43, "learning_rate": 1.2650853229935892e-05, "loss": 0.833, "step": 6342 }, { "epoch": 0.43, "learning_rate": 1.2648724870537194e-05, "loss": 0.7939, "step": 6343 }, { "epoch": 0.43, "learning_rate": 1.2646596382092753e-05, "loss": 0.9355, "step": 6344 }, { "epoch": 0.43, "learning_rate": 1.2644467764706265e-05, "loss": 0.7578, "step": 6345 }, { "epoch": 0.43, "learning_rate": 1.2642339018481435e-05, "loss": 0.7891, "step": 6346 }, { "epoch": 0.43, "learning_rate": 1.2640210143521978e-05, "loss": 0.8467, "step": 6347 }, { "epoch": 0.43, "learning_rate": 1.2638081139931613e-05, "loss": 0.7578, "step": 6348 }, { "epoch": 0.43, "learning_rate": 1.2635952007814058e-05, "loss": 0.8389, "step": 6349 }, { "epoch": 0.43, "learning_rate": 1.2633822747273055e-05, "loss": 0.8398, "step": 6350 }, { "epoch": 0.43, "learning_rate": 1.2631693358412336e-05, "loss": 0.8857, "step": 6351 }, { "epoch": 0.43, "learning_rate": 1.2629563841335642e-05, "loss": 0.8174, "step": 6352 }, { "epoch": 0.43, "learning_rate": 1.2627434196146729e-05, "loss": 0.8281, "step": 6353 }, { "epoch": 0.43, "learning_rate": 1.2625304422949346e-05, "loss": 0.7988, "step": 6354 }, { "epoch": 0.43, "learning_rate": 1.2623174521847263e-05, "loss": 0.8096, "step": 6355 }, { "epoch": 0.43, "learning_rate": 1.2621044492944246e-05, "loss": 0.7627, "step": 6356 }, { "epoch": 0.43, "learning_rate": 1.2618914336344066e-05, "loss": 0.7441, "step": 6357 }, { "epoch": 0.43, "learning_rate": 1.2616784052150508e-05, "loss": 0.7725, "step": 6358 }, { "epoch": 0.43, "learning_rate": 1.2614653640467362e-05, "loss": 0.917, "step": 6359 }, { "epoch": 0.43, "learning_rate": 1.2612523101398415e-05, "loss": 0.7842, "step": 6360 }, { "epoch": 0.43, "learning_rate": 1.2610392435047469e-05, "loss": 0.8398, "step": 6361 }, { "epoch": 0.43, "learning_rate": 1.2608261641518333e-05, "loss": 0.7461, "step": 6362 }, { "epoch": 0.43, "learning_rate": 1.2606130720914815e-05, "loss": 0.8223, "step": 6363 }, { "epoch": 0.43, "learning_rate": 1.260399967334074e-05, "loss": 0.8379, "step": 6364 }, { "epoch": 0.43, "learning_rate": 1.2601868498899924e-05, "loss": 0.7754, "step": 6365 }, { "epoch": 0.43, "learning_rate": 1.2599737197696201e-05, "loss": 0.7891, "step": 6366 }, { "epoch": 0.43, "learning_rate": 1.2597605769833407e-05, "loss": 0.8086, "step": 6367 }, { "epoch": 0.43, "learning_rate": 1.259547421541539e-05, "loss": 0.8184, "step": 6368 }, { "epoch": 0.43, "learning_rate": 1.2593342534545996e-05, "loss": 0.7686, "step": 6369 }, { "epoch": 0.43, "learning_rate": 1.2591210727329077e-05, "loss": 0.8135, "step": 6370 }, { "epoch": 0.43, "learning_rate": 1.2589078793868503e-05, "loss": 0.8105, "step": 6371 }, { "epoch": 0.43, "learning_rate": 1.2586946734268133e-05, "loss": 0.8428, "step": 6372 }, { "epoch": 0.43, "learning_rate": 1.2584814548631843e-05, "loss": 0.8291, "step": 6373 }, { "epoch": 0.43, "learning_rate": 1.2582682237063517e-05, "loss": 0.8408, "step": 6374 }, { "epoch": 0.43, "learning_rate": 1.2580549799667034e-05, "loss": 0.8984, "step": 6375 }, { "epoch": 0.43, "learning_rate": 1.2578417236546296e-05, "loss": 0.8545, "step": 6376 }, { "epoch": 0.43, "learning_rate": 1.2576284547805196e-05, "loss": 0.8311, "step": 6377 }, { "epoch": 0.43, "learning_rate": 1.2574151733547636e-05, "loss": 0.7939, "step": 6378 }, { "epoch": 0.43, "learning_rate": 1.2572018793877527e-05, "loss": 0.75, "step": 6379 }, { "epoch": 0.43, "learning_rate": 1.256988572889879e-05, "loss": 0.7783, "step": 6380 }, { "epoch": 0.43, "learning_rate": 1.2567752538715345e-05, "loss": 0.8096, "step": 6381 }, { "epoch": 0.43, "learning_rate": 1.2565619223431124e-05, "loss": 0.8066, "step": 6382 }, { "epoch": 0.43, "learning_rate": 1.2563485783150058e-05, "loss": 0.8301, "step": 6383 }, { "epoch": 0.44, "learning_rate": 1.2561352217976089e-05, "loss": 0.9043, "step": 6384 }, { "epoch": 0.44, "learning_rate": 1.2559218528013166e-05, "loss": 0.8164, "step": 6385 }, { "epoch": 0.44, "learning_rate": 1.255708471336524e-05, "loss": 0.8223, "step": 6386 }, { "epoch": 0.44, "learning_rate": 1.2554950774136271e-05, "loss": 0.8291, "step": 6387 }, { "epoch": 0.44, "learning_rate": 1.2552816710430226e-05, "loss": 0.7783, "step": 6388 }, { "epoch": 0.44, "learning_rate": 1.2550682522351077e-05, "loss": 0.8779, "step": 6389 }, { "epoch": 0.44, "learning_rate": 1.2548548210002798e-05, "loss": 0.8076, "step": 6390 }, { "epoch": 0.44, "learning_rate": 1.2546413773489374e-05, "loss": 0.8301, "step": 6391 }, { "epoch": 0.44, "learning_rate": 1.2544279212914796e-05, "loss": 0.7285, "step": 6392 }, { "epoch": 0.44, "learning_rate": 1.2542144528383056e-05, "loss": 0.8242, "step": 6393 }, { "epoch": 0.44, "learning_rate": 1.2540009719998163e-05, "loss": 0.8096, "step": 6394 }, { "epoch": 0.44, "learning_rate": 1.253787478786412e-05, "loss": 0.8164, "step": 6395 }, { "epoch": 0.44, "learning_rate": 1.2535739732084938e-05, "loss": 0.832, "step": 6396 }, { "epoch": 0.44, "learning_rate": 1.2533604552764642e-05, "loss": 0.8555, "step": 6397 }, { "epoch": 0.44, "learning_rate": 1.2531469250007253e-05, "loss": 0.9131, "step": 6398 }, { "epoch": 0.44, "learning_rate": 1.2529333823916807e-05, "loss": 0.7725, "step": 6399 }, { "epoch": 0.44, "learning_rate": 1.2527198274597343e-05, "loss": 0.8594, "step": 6400 }, { "epoch": 0.44, "learning_rate": 1.2525062602152899e-05, "loss": 0.8223, "step": 6401 }, { "epoch": 0.44, "learning_rate": 1.2522926806687529e-05, "loss": 0.8291, "step": 6402 }, { "epoch": 0.44, "learning_rate": 1.2520790888305291e-05, "loss": 0.7539, "step": 6403 }, { "epoch": 0.44, "learning_rate": 1.251865484711024e-05, "loss": 0.8164, "step": 6404 }, { "epoch": 0.44, "learning_rate": 1.251651868320645e-05, "loss": 0.874, "step": 6405 }, { "epoch": 0.44, "learning_rate": 1.251438239669799e-05, "loss": 0.8916, "step": 6406 }, { "epoch": 0.44, "learning_rate": 1.2512245987688946e-05, "loss": 0.8418, "step": 6407 }, { "epoch": 0.44, "learning_rate": 1.2510109456283396e-05, "loss": 0.8877, "step": 6408 }, { "epoch": 0.44, "learning_rate": 1.250797280258544e-05, "loss": 0.8398, "step": 6409 }, { "epoch": 0.44, "learning_rate": 1.250583602669917e-05, "loss": 0.8535, "step": 6410 }, { "epoch": 0.44, "learning_rate": 1.2503699128728689e-05, "loss": 0.8271, "step": 6411 }, { "epoch": 0.44, "learning_rate": 1.2501562108778109e-05, "loss": 0.7959, "step": 6412 }, { "epoch": 0.44, "learning_rate": 1.2499424966951547e-05, "loss": 0.8848, "step": 6413 }, { "epoch": 0.44, "learning_rate": 1.2497287703353118e-05, "loss": 0.8389, "step": 6414 }, { "epoch": 0.44, "learning_rate": 1.2495150318086959e-05, "loss": 0.7979, "step": 6415 }, { "epoch": 0.44, "learning_rate": 1.2493012811257194e-05, "loss": 0.8096, "step": 6416 }, { "epoch": 0.44, "learning_rate": 1.2490875182967969e-05, "loss": 0.8594, "step": 6417 }, { "epoch": 0.44, "learning_rate": 1.2488737433323429e-05, "loss": 0.7744, "step": 6418 }, { "epoch": 0.44, "learning_rate": 1.2486599562427718e-05, "loss": 0.8037, "step": 6419 }, { "epoch": 0.44, "learning_rate": 1.2484461570384997e-05, "loss": 0.8818, "step": 6420 }, { "epoch": 0.44, "learning_rate": 1.2482323457299434e-05, "loss": 0.8008, "step": 6421 }, { "epoch": 0.44, "learning_rate": 1.248018522327519e-05, "loss": 0.8203, "step": 6422 }, { "epoch": 0.44, "learning_rate": 1.2478046868416445e-05, "loss": 0.7725, "step": 6423 }, { "epoch": 0.44, "learning_rate": 1.2475908392827374e-05, "loss": 0.8174, "step": 6424 }, { "epoch": 0.44, "learning_rate": 1.2473769796612172e-05, "loss": 0.8896, "step": 6425 }, { "epoch": 0.44, "learning_rate": 1.2471631079875021e-05, "loss": 0.79, "step": 6426 }, { "epoch": 0.44, "learning_rate": 1.2469492242720126e-05, "loss": 0.8066, "step": 6427 }, { "epoch": 0.44, "learning_rate": 1.2467353285251691e-05, "loss": 0.7959, "step": 6428 }, { "epoch": 0.44, "learning_rate": 1.2465214207573923e-05, "loss": 0.8672, "step": 6429 }, { "epoch": 0.44, "learning_rate": 1.246307500979104e-05, "loss": 0.8037, "step": 6430 }, { "epoch": 0.44, "learning_rate": 1.2460935692007263e-05, "loss": 0.8037, "step": 6431 }, { "epoch": 0.44, "learning_rate": 1.2458796254326815e-05, "loss": 0.8574, "step": 6432 }, { "epoch": 0.44, "learning_rate": 1.2456656696853936e-05, "loss": 0.8711, "step": 6433 }, { "epoch": 0.44, "learning_rate": 1.2454517019692864e-05, "loss": 0.71, "step": 6434 }, { "epoch": 0.44, "learning_rate": 1.245237722294784e-05, "loss": 0.8223, "step": 6435 }, { "epoch": 0.44, "learning_rate": 1.2450237306723122e-05, "loss": 0.791, "step": 6436 }, { "epoch": 0.44, "learning_rate": 1.2448097271122956e-05, "loss": 0.8721, "step": 6437 }, { "epoch": 0.44, "learning_rate": 1.2445957116251613e-05, "loss": 0.8066, "step": 6438 }, { "epoch": 0.44, "learning_rate": 1.2443816842213358e-05, "loss": 0.8965, "step": 6439 }, { "epoch": 0.44, "learning_rate": 1.2441676449112467e-05, "loss": 0.7871, "step": 6440 }, { "epoch": 0.44, "learning_rate": 1.2439535937053218e-05, "loss": 0.8604, "step": 6441 }, { "epoch": 0.44, "learning_rate": 1.2437395306139895e-05, "loss": 0.8545, "step": 6442 }, { "epoch": 0.44, "learning_rate": 1.2435254556476794e-05, "loss": 0.8711, "step": 6443 }, { "epoch": 0.44, "learning_rate": 1.243311368816821e-05, "loss": 0.832, "step": 6444 }, { "epoch": 0.44, "learning_rate": 1.2430972701318442e-05, "loss": 0.8252, "step": 6445 }, { "epoch": 0.44, "learning_rate": 1.2428831596031808e-05, "loss": 0.7915, "step": 6446 }, { "epoch": 0.44, "learning_rate": 1.2426690372412613e-05, "loss": 0.7764, "step": 6447 }, { "epoch": 0.44, "learning_rate": 1.2424549030565182e-05, "loss": 0.9092, "step": 6448 }, { "epoch": 0.44, "learning_rate": 1.2422407570593844e-05, "loss": 0.8057, "step": 6449 }, { "epoch": 0.44, "learning_rate": 1.2420265992602923e-05, "loss": 0.8662, "step": 6450 }, { "epoch": 0.44, "learning_rate": 1.2418124296696762e-05, "loss": 0.8154, "step": 6451 }, { "epoch": 0.44, "learning_rate": 1.2415982482979703e-05, "loss": 0.8301, "step": 6452 }, { "epoch": 0.44, "learning_rate": 1.2413840551556096e-05, "loss": 0.8877, "step": 6453 }, { "epoch": 0.44, "learning_rate": 1.2411698502530297e-05, "loss": 0.8057, "step": 6454 }, { "epoch": 0.44, "learning_rate": 1.240955633600666e-05, "loss": 0.874, "step": 6455 }, { "epoch": 0.44, "learning_rate": 1.2407414052089559e-05, "loss": 0.7783, "step": 6456 }, { "epoch": 0.44, "learning_rate": 1.2405271650883363e-05, "loss": 0.9297, "step": 6457 }, { "epoch": 0.44, "learning_rate": 1.2403129132492449e-05, "loss": 0.8076, "step": 6458 }, { "epoch": 0.44, "learning_rate": 1.2400986497021199e-05, "loss": 0.7998, "step": 6459 }, { "epoch": 0.44, "learning_rate": 1.2398843744574005e-05, "loss": 0.7158, "step": 6460 }, { "epoch": 0.44, "learning_rate": 1.2396700875255263e-05, "loss": 0.8057, "step": 6461 }, { "epoch": 0.44, "learning_rate": 1.2394557889169368e-05, "loss": 0.7656, "step": 6462 }, { "epoch": 0.44, "learning_rate": 1.239241478642073e-05, "loss": 0.8467, "step": 6463 }, { "epoch": 0.44, "learning_rate": 1.2390271567113764e-05, "loss": 0.8281, "step": 6464 }, { "epoch": 0.44, "learning_rate": 1.2388128231352878e-05, "loss": 0.708, "step": 6465 }, { "epoch": 0.44, "learning_rate": 1.2385984779242504e-05, "loss": 0.7656, "step": 6466 }, { "epoch": 0.44, "learning_rate": 1.2383841210887069e-05, "loss": 0.8242, "step": 6467 }, { "epoch": 0.44, "learning_rate": 1.2381697526391004e-05, "loss": 0.8486, "step": 6468 }, { "epoch": 0.44, "learning_rate": 1.2379553725858752e-05, "loss": 0.8311, "step": 6469 }, { "epoch": 0.44, "learning_rate": 1.2377409809394761e-05, "loss": 0.7998, "step": 6470 }, { "epoch": 0.44, "learning_rate": 1.2375265777103475e-05, "loss": 0.9277, "step": 6471 }, { "epoch": 0.44, "learning_rate": 1.2373121629089363e-05, "loss": 0.8438, "step": 6472 }, { "epoch": 0.44, "learning_rate": 1.2370977365456877e-05, "loss": 0.835, "step": 6473 }, { "epoch": 0.44, "learning_rate": 1.2368832986310488e-05, "loss": 0.8271, "step": 6474 }, { "epoch": 0.44, "learning_rate": 1.2366688491754676e-05, "loss": 0.7881, "step": 6475 }, { "epoch": 0.44, "learning_rate": 1.2364543881893914e-05, "loss": 0.8848, "step": 6476 }, { "epoch": 0.44, "learning_rate": 1.2362399156832688e-05, "loss": 0.7256, "step": 6477 }, { "epoch": 0.44, "learning_rate": 1.236025431667549e-05, "loss": 0.8789, "step": 6478 }, { "epoch": 0.44, "learning_rate": 1.235810936152682e-05, "loss": 0.8203, "step": 6479 }, { "epoch": 0.44, "learning_rate": 1.2355964291491174e-05, "loss": 0.7539, "step": 6480 }, { "epoch": 0.44, "learning_rate": 1.2353819106673062e-05, "loss": 0.7969, "step": 6481 }, { "epoch": 0.44, "learning_rate": 1.2351673807176998e-05, "loss": 0.7607, "step": 6482 }, { "epoch": 0.44, "learning_rate": 1.2349528393107504e-05, "loss": 0.79, "step": 6483 }, { "epoch": 0.44, "learning_rate": 1.23473828645691e-05, "loss": 0.8662, "step": 6484 }, { "epoch": 0.44, "learning_rate": 1.2345237221666314e-05, "loss": 0.7998, "step": 6485 }, { "epoch": 0.44, "learning_rate": 1.2343091464503689e-05, "loss": 0.8184, "step": 6486 }, { "epoch": 0.44, "learning_rate": 1.2340945593185762e-05, "loss": 0.8438, "step": 6487 }, { "epoch": 0.44, "learning_rate": 1.2338799607817079e-05, "loss": 0.8271, "step": 6488 }, { "epoch": 0.44, "learning_rate": 1.233665350850219e-05, "loss": 0.875, "step": 6489 }, { "epoch": 0.44, "learning_rate": 1.2334507295345662e-05, "loss": 0.8105, "step": 6490 }, { "epoch": 0.44, "learning_rate": 1.2332360968452049e-05, "loss": 0.7549, "step": 6491 }, { "epoch": 0.44, "learning_rate": 1.2330214527925921e-05, "loss": 0.7568, "step": 6492 }, { "epoch": 0.44, "learning_rate": 1.232806797387186e-05, "loss": 0.7637, "step": 6493 }, { "epoch": 0.44, "learning_rate": 1.2325921306394435e-05, "loss": 0.9014, "step": 6494 }, { "epoch": 0.44, "learning_rate": 1.2323774525598243e-05, "loss": 0.8311, "step": 6495 }, { "epoch": 0.44, "learning_rate": 1.2321627631587867e-05, "loss": 0.8271, "step": 6496 }, { "epoch": 0.44, "learning_rate": 1.2319480624467905e-05, "loss": 0.8711, "step": 6497 }, { "epoch": 0.44, "learning_rate": 1.2317333504342963e-05, "loss": 0.7861, "step": 6498 }, { "epoch": 0.44, "learning_rate": 1.2315186271317643e-05, "loss": 0.7686, "step": 6499 }, { "epoch": 0.44, "learning_rate": 1.2313038925496561e-05, "loss": 0.7607, "step": 6500 }, { "epoch": 0.44, "learning_rate": 1.2310891466984339e-05, "loss": 0.8428, "step": 6501 }, { "epoch": 0.44, "learning_rate": 1.2308743895885592e-05, "loss": 0.7939, "step": 6502 }, { "epoch": 0.44, "learning_rate": 1.2306596212304958e-05, "loss": 0.8252, "step": 6503 }, { "epoch": 0.44, "learning_rate": 1.2304448416347066e-05, "loss": 0.8203, "step": 6504 }, { "epoch": 0.44, "learning_rate": 1.2302300508116565e-05, "loss": 0.8496, "step": 6505 }, { "epoch": 0.44, "learning_rate": 1.2300152487718091e-05, "loss": 0.751, "step": 6506 }, { "epoch": 0.44, "learning_rate": 1.2298004355256302e-05, "loss": 0.7017, "step": 6507 }, { "epoch": 0.44, "learning_rate": 1.2295856110835854e-05, "loss": 0.7969, "step": 6508 }, { "epoch": 0.44, "learning_rate": 1.2293707754561403e-05, "loss": 0.9492, "step": 6509 }, { "epoch": 0.44, "learning_rate": 1.2291559286537626e-05, "loss": 0.8555, "step": 6510 }, { "epoch": 0.44, "learning_rate": 1.2289410706869193e-05, "loss": 0.8203, "step": 6511 }, { "epoch": 0.44, "learning_rate": 1.228726201566078e-05, "loss": 0.9297, "step": 6512 }, { "epoch": 0.44, "learning_rate": 1.2285113213017074e-05, "loss": 0.834, "step": 6513 }, { "epoch": 0.44, "learning_rate": 1.2282964299042763e-05, "loss": 0.8252, "step": 6514 }, { "epoch": 0.44, "learning_rate": 1.2280815273842544e-05, "loss": 0.8643, "step": 6515 }, { "epoch": 0.44, "learning_rate": 1.2278666137521115e-05, "loss": 0.8242, "step": 6516 }, { "epoch": 0.44, "learning_rate": 1.2276516890183183e-05, "loss": 0.8223, "step": 6517 }, { "epoch": 0.44, "learning_rate": 1.227436753193346e-05, "loss": 0.8018, "step": 6518 }, { "epoch": 0.44, "learning_rate": 1.2272218062876662e-05, "loss": 0.8037, "step": 6519 }, { "epoch": 0.44, "learning_rate": 1.227006848311751e-05, "loss": 0.7412, "step": 6520 }, { "epoch": 0.44, "learning_rate": 1.2267918792760732e-05, "loss": 0.835, "step": 6521 }, { "epoch": 0.44, "learning_rate": 1.226576899191106e-05, "loss": 0.8086, "step": 6522 }, { "epoch": 0.44, "learning_rate": 1.2263619080673237e-05, "loss": 0.7676, "step": 6523 }, { "epoch": 0.44, "learning_rate": 1.2261469059152e-05, "loss": 0.7715, "step": 6524 }, { "epoch": 0.44, "learning_rate": 1.2259318927452099e-05, "loss": 0.7686, "step": 6525 }, { "epoch": 0.44, "learning_rate": 1.2257168685678296e-05, "loss": 0.7861, "step": 6526 }, { "epoch": 0.44, "learning_rate": 1.2255018333935338e-05, "loss": 0.8789, "step": 6527 }, { "epoch": 0.44, "learning_rate": 1.2252867872328001e-05, "loss": 0.7812, "step": 6528 }, { "epoch": 0.44, "learning_rate": 1.225071730096105e-05, "loss": 0.8047, "step": 6529 }, { "epoch": 0.45, "learning_rate": 1.2248566619939259e-05, "loss": 0.8799, "step": 6530 }, { "epoch": 0.45, "learning_rate": 1.2246415829367416e-05, "loss": 0.7812, "step": 6531 }, { "epoch": 0.45, "learning_rate": 1.2244264929350303e-05, "loss": 0.8271, "step": 6532 }, { "epoch": 0.45, "learning_rate": 1.224211391999271e-05, "loss": 0.7822, "step": 6533 }, { "epoch": 0.45, "learning_rate": 1.2239962801399436e-05, "loss": 0.791, "step": 6534 }, { "epoch": 0.45, "learning_rate": 1.2237811573675285e-05, "loss": 0.7695, "step": 6535 }, { "epoch": 0.45, "learning_rate": 1.2235660236925062e-05, "loss": 0.8965, "step": 6536 }, { "epoch": 0.45, "learning_rate": 1.2233508791253584e-05, "loss": 0.7197, "step": 6537 }, { "epoch": 0.45, "learning_rate": 1.2231357236765663e-05, "loss": 0.875, "step": 6538 }, { "epoch": 0.45, "learning_rate": 1.2229205573566128e-05, "loss": 0.7686, "step": 6539 }, { "epoch": 0.45, "learning_rate": 1.2227053801759805e-05, "loss": 0.7754, "step": 6540 }, { "epoch": 0.45, "learning_rate": 1.2224901921451532e-05, "loss": 0.833, "step": 6541 }, { "epoch": 0.45, "learning_rate": 1.2222749932746142e-05, "loss": 0.876, "step": 6542 }, { "epoch": 0.45, "learning_rate": 1.2220597835748486e-05, "loss": 0.8574, "step": 6543 }, { "epoch": 0.45, "learning_rate": 1.2218445630563416e-05, "loss": 0.7266, "step": 6544 }, { "epoch": 0.45, "learning_rate": 1.2216293317295778e-05, "loss": 0.7461, "step": 6545 }, { "epoch": 0.45, "learning_rate": 1.2214140896050437e-05, "loss": 0.7725, "step": 6546 }, { "epoch": 0.45, "learning_rate": 1.2211988366932262e-05, "loss": 0.8594, "step": 6547 }, { "epoch": 0.45, "learning_rate": 1.2209835730046119e-05, "loss": 0.8242, "step": 6548 }, { "epoch": 0.45, "learning_rate": 1.2207682985496889e-05, "loss": 0.8555, "step": 6549 }, { "epoch": 0.45, "learning_rate": 1.2205530133389453e-05, "loss": 0.7119, "step": 6550 }, { "epoch": 0.45, "learning_rate": 1.2203377173828692e-05, "loss": 0.8174, "step": 6551 }, { "epoch": 0.45, "learning_rate": 1.2201224106919507e-05, "loss": 0.8584, "step": 6552 }, { "epoch": 0.45, "learning_rate": 1.219907093276679e-05, "loss": 0.8408, "step": 6553 }, { "epoch": 0.45, "learning_rate": 1.2196917651475442e-05, "loss": 0.8721, "step": 6554 }, { "epoch": 0.45, "learning_rate": 1.2194764263150376e-05, "loss": 0.7949, "step": 6555 }, { "epoch": 0.45, "learning_rate": 1.21926107678965e-05, "loss": 0.8535, "step": 6556 }, { "epoch": 0.45, "learning_rate": 1.2190457165818734e-05, "loss": 0.79, "step": 6557 }, { "epoch": 0.45, "learning_rate": 1.2188303457022003e-05, "loss": 0.8115, "step": 6558 }, { "epoch": 0.45, "learning_rate": 1.2186149641611236e-05, "loss": 0.8408, "step": 6559 }, { "epoch": 0.45, "learning_rate": 1.2183995719691361e-05, "loss": 0.8262, "step": 6560 }, { "epoch": 0.45, "learning_rate": 1.2181841691367324e-05, "loss": 0.8877, "step": 6561 }, { "epoch": 0.45, "learning_rate": 1.2179687556744066e-05, "loss": 0.8525, "step": 6562 }, { "epoch": 0.45, "learning_rate": 1.2177533315926535e-05, "loss": 0.7773, "step": 6563 }, { "epoch": 0.45, "learning_rate": 1.2175378969019688e-05, "loss": 0.8027, "step": 6564 }, { "epoch": 0.45, "learning_rate": 1.2173224516128486e-05, "loss": 0.8066, "step": 6565 }, { "epoch": 0.45, "learning_rate": 1.2171069957357885e-05, "loss": 0.8223, "step": 6566 }, { "epoch": 0.45, "learning_rate": 1.2168915292812868e-05, "loss": 0.8438, "step": 6567 }, { "epoch": 0.45, "learning_rate": 1.2166760522598404e-05, "loss": 0.7842, "step": 6568 }, { "epoch": 0.45, "learning_rate": 1.2164605646819467e-05, "loss": 0.7666, "step": 6569 }, { "epoch": 0.45, "learning_rate": 1.2162450665581054e-05, "loss": 0.8105, "step": 6570 }, { "epoch": 0.45, "learning_rate": 1.2160295578988149e-05, "loss": 0.8408, "step": 6571 }, { "epoch": 0.45, "learning_rate": 1.2158140387145745e-05, "loss": 0.7998, "step": 6572 }, { "epoch": 0.45, "learning_rate": 1.215598509015885e-05, "loss": 0.7881, "step": 6573 }, { "epoch": 0.45, "learning_rate": 1.2153829688132466e-05, "loss": 0.7969, "step": 6574 }, { "epoch": 0.45, "learning_rate": 1.2151674181171604e-05, "loss": 0.8643, "step": 6575 }, { "epoch": 0.45, "learning_rate": 1.2149518569381285e-05, "loss": 0.8594, "step": 6576 }, { "epoch": 0.45, "learning_rate": 1.214736285286652e-05, "loss": 0.8281, "step": 6577 }, { "epoch": 0.45, "learning_rate": 1.2145207031732344e-05, "loss": 0.7422, "step": 6578 }, { "epoch": 0.45, "learning_rate": 1.2143051106083785e-05, "loss": 0.8711, "step": 6579 }, { "epoch": 0.45, "learning_rate": 1.2140895076025885e-05, "loss": 0.7793, "step": 6580 }, { "epoch": 0.45, "learning_rate": 1.2138738941663677e-05, "loss": 0.8564, "step": 6581 }, { "epoch": 0.45, "learning_rate": 1.2136582703102211e-05, "loss": 0.8086, "step": 6582 }, { "epoch": 0.45, "learning_rate": 1.2134426360446542e-05, "loss": 0.7471, "step": 6583 }, { "epoch": 0.45, "learning_rate": 1.2132269913801725e-05, "loss": 0.7725, "step": 6584 }, { "epoch": 0.45, "learning_rate": 1.2130113363272822e-05, "loss": 0.8135, "step": 6585 }, { "epoch": 0.45, "learning_rate": 1.21279567089649e-05, "loss": 0.8096, "step": 6586 }, { "epoch": 0.45, "learning_rate": 1.2125799950983028e-05, "loss": 0.8711, "step": 6587 }, { "epoch": 0.45, "learning_rate": 1.212364308943229e-05, "loss": 0.8525, "step": 6588 }, { "epoch": 0.45, "learning_rate": 1.2121486124417763e-05, "loss": 0.8594, "step": 6589 }, { "epoch": 0.45, "learning_rate": 1.2119329056044533e-05, "loss": 0.6846, "step": 6590 }, { "epoch": 0.45, "learning_rate": 1.2117171884417697e-05, "loss": 0.7598, "step": 6591 }, { "epoch": 0.45, "learning_rate": 1.211501460964235e-05, "loss": 0.7998, "step": 6592 }, { "epoch": 0.45, "learning_rate": 1.2112857231823593e-05, "loss": 0.8613, "step": 6593 }, { "epoch": 0.45, "learning_rate": 1.211069975106654e-05, "loss": 0.8223, "step": 6594 }, { "epoch": 0.45, "learning_rate": 1.2108542167476292e-05, "loss": 0.8799, "step": 6595 }, { "epoch": 0.45, "learning_rate": 1.2106384481157973e-05, "loss": 0.8232, "step": 6596 }, { "epoch": 0.45, "learning_rate": 1.2104226692216705e-05, "loss": 0.8164, "step": 6597 }, { "epoch": 0.45, "learning_rate": 1.2102068800757621e-05, "loss": 0.8535, "step": 6598 }, { "epoch": 0.45, "learning_rate": 1.209991080688584e-05, "loss": 0.7393, "step": 6599 }, { "epoch": 0.45, "learning_rate": 1.209775271070651e-05, "loss": 0.7812, "step": 6600 }, { "epoch": 0.45, "learning_rate": 1.2095594512324768e-05, "loss": 0.7686, "step": 6601 }, { "epoch": 0.45, "learning_rate": 1.2093436211845768e-05, "loss": 0.9004, "step": 6602 }, { "epoch": 0.45, "learning_rate": 1.2091277809374655e-05, "loss": 0.8174, "step": 6603 }, { "epoch": 0.45, "learning_rate": 1.2089119305016587e-05, "loss": 0.7764, "step": 6604 }, { "epoch": 0.45, "learning_rate": 1.2086960698876732e-05, "loss": 0.8359, "step": 6605 }, { "epoch": 0.45, "learning_rate": 1.2084801991060254e-05, "loss": 0.7588, "step": 6606 }, { "epoch": 0.45, "learning_rate": 1.2082643181672322e-05, "loss": 0.7236, "step": 6607 }, { "epoch": 0.45, "learning_rate": 1.2080484270818116e-05, "loss": 0.8057, "step": 6608 }, { "epoch": 0.45, "learning_rate": 1.207832525860282e-05, "loss": 0.8145, "step": 6609 }, { "epoch": 0.45, "learning_rate": 1.2076166145131616e-05, "loss": 0.8545, "step": 6610 }, { "epoch": 0.45, "learning_rate": 1.20740069305097e-05, "loss": 0.7334, "step": 6611 }, { "epoch": 0.45, "learning_rate": 1.2071847614842269e-05, "loss": 0.8594, "step": 6612 }, { "epoch": 0.45, "learning_rate": 1.206968819823452e-05, "loss": 0.8086, "step": 6613 }, { "epoch": 0.45, "learning_rate": 1.2067528680791665e-05, "loss": 0.832, "step": 6614 }, { "epoch": 0.45, "learning_rate": 1.2065369062618913e-05, "loss": 0.8535, "step": 6615 }, { "epoch": 0.45, "learning_rate": 1.2063209343821481e-05, "loss": 0.8027, "step": 6616 }, { "epoch": 0.45, "learning_rate": 1.2061049524504591e-05, "loss": 0.8447, "step": 6617 }, { "epoch": 0.45, "learning_rate": 1.205888960477347e-05, "loss": 0.7041, "step": 6618 }, { "epoch": 0.45, "learning_rate": 1.2056729584733344e-05, "loss": 0.7383, "step": 6619 }, { "epoch": 0.45, "learning_rate": 1.2054569464489456e-05, "loss": 0.8467, "step": 6620 }, { "epoch": 0.45, "learning_rate": 1.2052409244147043e-05, "loss": 0.8047, "step": 6621 }, { "epoch": 0.45, "learning_rate": 1.2050248923811349e-05, "loss": 0.8271, "step": 6622 }, { "epoch": 0.45, "learning_rate": 1.204808850358763e-05, "loss": 0.7539, "step": 6623 }, { "epoch": 0.45, "learning_rate": 1.204592798358114e-05, "loss": 0.8223, "step": 6624 }, { "epoch": 0.45, "learning_rate": 1.204376736389714e-05, "loss": 0.876, "step": 6625 }, { "epoch": 0.45, "learning_rate": 1.2041606644640889e-05, "loss": 0.8115, "step": 6626 }, { "epoch": 0.45, "learning_rate": 1.2039445825917664e-05, "loss": 0.7744, "step": 6627 }, { "epoch": 0.45, "learning_rate": 1.2037284907832735e-05, "loss": 0.7891, "step": 6628 }, { "epoch": 0.45, "learning_rate": 1.203512389049139e-05, "loss": 0.8359, "step": 6629 }, { "epoch": 0.45, "learning_rate": 1.2032962773998906e-05, "loss": 0.8047, "step": 6630 }, { "epoch": 0.45, "learning_rate": 1.2030801558460572e-05, "loss": 0.791, "step": 6631 }, { "epoch": 0.45, "learning_rate": 1.2028640243981689e-05, "loss": 0.7969, "step": 6632 }, { "epoch": 0.45, "learning_rate": 1.2026478830667551e-05, "loss": 0.7588, "step": 6633 }, { "epoch": 0.45, "learning_rate": 1.2024317318623462e-05, "loss": 0.8535, "step": 6634 }, { "epoch": 0.45, "learning_rate": 1.2022155707954735e-05, "loss": 0.7734, "step": 6635 }, { "epoch": 0.45, "learning_rate": 1.2019993998766676e-05, "loss": 0.7275, "step": 6636 }, { "epoch": 0.45, "learning_rate": 1.201783219116461e-05, "loss": 0.8164, "step": 6637 }, { "epoch": 0.45, "learning_rate": 1.2015670285253861e-05, "loss": 0.8486, "step": 6638 }, { "epoch": 0.45, "learning_rate": 1.2013508281139752e-05, "loss": 0.7568, "step": 6639 }, { "epoch": 0.45, "learning_rate": 1.2011346178927616e-05, "loss": 0.8027, "step": 6640 }, { "epoch": 0.45, "learning_rate": 1.2009183978722791e-05, "loss": 0.791, "step": 6641 }, { "epoch": 0.45, "learning_rate": 1.2007021680630626e-05, "loss": 0.8457, "step": 6642 }, { "epoch": 0.45, "learning_rate": 1.2004859284756458e-05, "loss": 0.8018, "step": 6643 }, { "epoch": 0.45, "learning_rate": 1.2002696791205646e-05, "loss": 0.8213, "step": 6644 }, { "epoch": 0.45, "learning_rate": 1.2000534200083544e-05, "loss": 0.8887, "step": 6645 }, { "epoch": 0.45, "learning_rate": 1.1998371511495512e-05, "loss": 0.7529, "step": 6646 }, { "epoch": 0.45, "learning_rate": 1.1996208725546915e-05, "loss": 0.8662, "step": 6647 }, { "epoch": 0.45, "learning_rate": 1.1994045842343131e-05, "loss": 0.8984, "step": 6648 }, { "epoch": 0.45, "learning_rate": 1.1991882861989525e-05, "loss": 0.8105, "step": 6649 }, { "epoch": 0.45, "learning_rate": 1.1989719784591491e-05, "loss": 0.8418, "step": 6650 }, { "epoch": 0.45, "learning_rate": 1.19875566102544e-05, "loss": 0.7686, "step": 6651 }, { "epoch": 0.45, "learning_rate": 1.1985393339083648e-05, "loss": 0.792, "step": 6652 }, { "epoch": 0.45, "learning_rate": 1.1983229971184635e-05, "loss": 0.8496, "step": 6653 }, { "epoch": 0.45, "learning_rate": 1.1981066506662749e-05, "loss": 0.7734, "step": 6654 }, { "epoch": 0.45, "learning_rate": 1.19789029456234e-05, "loss": 0.8389, "step": 6655 }, { "epoch": 0.45, "learning_rate": 1.1976739288172e-05, "loss": 0.7832, "step": 6656 }, { "epoch": 0.45, "learning_rate": 1.1974575534413954e-05, "loss": 0.7754, "step": 6657 }, { "epoch": 0.45, "learning_rate": 1.1972411684454686e-05, "loss": 0.7344, "step": 6658 }, { "epoch": 0.45, "learning_rate": 1.1970247738399616e-05, "loss": 0.7969, "step": 6659 }, { "epoch": 0.45, "learning_rate": 1.1968083696354173e-05, "loss": 0.6895, "step": 6660 }, { "epoch": 0.45, "learning_rate": 1.196591955842379e-05, "loss": 0.8252, "step": 6661 }, { "epoch": 0.45, "learning_rate": 1.1963755324713898e-05, "loss": 0.8369, "step": 6662 }, { "epoch": 0.45, "learning_rate": 1.1961590995329946e-05, "loss": 0.8555, "step": 6663 }, { "epoch": 0.45, "learning_rate": 1.1959426570377374e-05, "loss": 0.7568, "step": 6664 }, { "epoch": 0.45, "learning_rate": 1.1957262049961636e-05, "loss": 0.8848, "step": 6665 }, { "epoch": 0.45, "learning_rate": 1.1955097434188188e-05, "loss": 0.835, "step": 6666 }, { "epoch": 0.45, "learning_rate": 1.1952932723162483e-05, "loss": 0.8711, "step": 6667 }, { "epoch": 0.45, "learning_rate": 1.1950767916989995e-05, "loss": 0.7559, "step": 6668 }, { "epoch": 0.45, "learning_rate": 1.1948603015776188e-05, "loss": 0.9248, "step": 6669 }, { "epoch": 0.45, "learning_rate": 1.1946438019626538e-05, "loss": 0.8652, "step": 6670 }, { "epoch": 0.45, "learning_rate": 1.1944272928646524e-05, "loss": 0.8301, "step": 6671 }, { "epoch": 0.45, "learning_rate": 1.1942107742941627e-05, "loss": 0.8369, "step": 6672 }, { "epoch": 0.45, "learning_rate": 1.1939942462617333e-05, "loss": 0.9248, "step": 6673 }, { "epoch": 0.45, "learning_rate": 1.193777708777914e-05, "loss": 0.752, "step": 6674 }, { "epoch": 0.45, "learning_rate": 1.1935611618532538e-05, "loss": 0.8242, "step": 6675 }, { "epoch": 0.45, "learning_rate": 1.1933446054983035e-05, "loss": 0.8174, "step": 6676 }, { "epoch": 0.46, "learning_rate": 1.1931280397236134e-05, "loss": 0.7646, "step": 6677 }, { "epoch": 0.46, "learning_rate": 1.1929114645397348e-05, "loss": 0.8281, "step": 6678 }, { "epoch": 0.46, "learning_rate": 1.192694879957219e-05, "loss": 0.8154, "step": 6679 }, { "epoch": 0.46, "learning_rate": 1.1924782859866178e-05, "loss": 0.8232, "step": 6680 }, { "epoch": 0.46, "learning_rate": 1.192261682638484e-05, "loss": 0.791, "step": 6681 }, { "epoch": 0.46, "learning_rate": 1.1920450699233706e-05, "loss": 0.7861, "step": 6682 }, { "epoch": 0.46, "learning_rate": 1.1918284478518304e-05, "loss": 0.8984, "step": 6683 }, { "epoch": 0.46, "learning_rate": 1.1916118164344179e-05, "loss": 0.8447, "step": 6684 }, { "epoch": 0.46, "learning_rate": 1.1913951756816866e-05, "loss": 0.8525, "step": 6685 }, { "epoch": 0.46, "learning_rate": 1.1911785256041921e-05, "loss": 0.79, "step": 6686 }, { "epoch": 0.46, "learning_rate": 1.190961866212489e-05, "loss": 0.8418, "step": 6687 }, { "epoch": 0.46, "learning_rate": 1.1907451975171331e-05, "loss": 0.877, "step": 6688 }, { "epoch": 0.46, "learning_rate": 1.1905285195286807e-05, "loss": 0.8232, "step": 6689 }, { "epoch": 0.46, "learning_rate": 1.190311832257688e-05, "loss": 0.835, "step": 6690 }, { "epoch": 0.46, "learning_rate": 1.1900951357147118e-05, "loss": 0.8311, "step": 6691 }, { "epoch": 0.46, "learning_rate": 1.1898784299103104e-05, "loss": 0.834, "step": 6692 }, { "epoch": 0.46, "learning_rate": 1.1896617148550406e-05, "loss": 0.7637, "step": 6693 }, { "epoch": 0.46, "learning_rate": 1.1894449905594616e-05, "loss": 0.8174, "step": 6694 }, { "epoch": 0.46, "learning_rate": 1.1892282570341318e-05, "loss": 0.7754, "step": 6695 }, { "epoch": 0.46, "learning_rate": 1.1890115142896107e-05, "loss": 0.8594, "step": 6696 }, { "epoch": 0.46, "learning_rate": 1.1887947623364577e-05, "loss": 0.8682, "step": 6697 }, { "epoch": 0.46, "learning_rate": 1.188578001185233e-05, "loss": 0.8125, "step": 6698 }, { "epoch": 0.46, "learning_rate": 1.1883612308464976e-05, "loss": 0.834, "step": 6699 }, { "epoch": 0.46, "learning_rate": 1.188144451330812e-05, "loss": 0.7949, "step": 6700 }, { "epoch": 0.46, "learning_rate": 1.187927662648738e-05, "loss": 0.8213, "step": 6701 }, { "epoch": 0.46, "learning_rate": 1.1877108648108373e-05, "loss": 0.9336, "step": 6702 }, { "epoch": 0.46, "learning_rate": 1.1874940578276723e-05, "loss": 0.7676, "step": 6703 }, { "epoch": 0.46, "learning_rate": 1.1872772417098062e-05, "loss": 0.8896, "step": 6704 }, { "epoch": 0.46, "learning_rate": 1.1870604164678018e-05, "loss": 0.7979, "step": 6705 }, { "epoch": 0.46, "learning_rate": 1.1868435821122234e-05, "loss": 0.7754, "step": 6706 }, { "epoch": 0.46, "learning_rate": 1.1866267386536345e-05, "loss": 0.7939, "step": 6707 }, { "epoch": 0.46, "learning_rate": 1.1864098861026001e-05, "loss": 0.7881, "step": 6708 }, { "epoch": 0.46, "learning_rate": 1.186193024469685e-05, "loss": 0.7715, "step": 6709 }, { "epoch": 0.46, "learning_rate": 1.185976153765455e-05, "loss": 0.7646, "step": 6710 }, { "epoch": 0.46, "learning_rate": 1.185759274000476e-05, "loss": 0.8545, "step": 6711 }, { "epoch": 0.46, "learning_rate": 1.1855423851853139e-05, "loss": 0.8027, "step": 6712 }, { "epoch": 0.46, "learning_rate": 1.1853254873305358e-05, "loss": 0.834, "step": 6713 }, { "epoch": 0.46, "learning_rate": 1.1851085804467093e-05, "loss": 0.7871, "step": 6714 }, { "epoch": 0.46, "learning_rate": 1.1848916645444017e-05, "loss": 0.7402, "step": 6715 }, { "epoch": 0.46, "learning_rate": 1.1846747396341812e-05, "loss": 0.8164, "step": 6716 }, { "epoch": 0.46, "learning_rate": 1.1844578057266163e-05, "loss": 0.8408, "step": 6717 }, { "epoch": 0.46, "learning_rate": 1.1842408628322761e-05, "loss": 0.8223, "step": 6718 }, { "epoch": 0.46, "learning_rate": 1.1840239109617302e-05, "loss": 0.832, "step": 6719 }, { "epoch": 0.46, "learning_rate": 1.1838069501255482e-05, "loss": 0.7852, "step": 6720 }, { "epoch": 0.46, "learning_rate": 1.1835899803343005e-05, "loss": 0.8203, "step": 6721 }, { "epoch": 0.46, "learning_rate": 1.183373001598558e-05, "loss": 0.8008, "step": 6722 }, { "epoch": 0.46, "learning_rate": 1.1831560139288918e-05, "loss": 0.7461, "step": 6723 }, { "epoch": 0.46, "learning_rate": 1.1829390173358735e-05, "loss": 0.8203, "step": 6724 }, { "epoch": 0.46, "learning_rate": 1.1827220118300756e-05, "loss": 0.8799, "step": 6725 }, { "epoch": 0.46, "learning_rate": 1.1825049974220697e-05, "loss": 0.7871, "step": 6726 }, { "epoch": 0.46, "learning_rate": 1.1822879741224291e-05, "loss": 0.8486, "step": 6727 }, { "epoch": 0.46, "learning_rate": 1.1820709419417278e-05, "loss": 0.8037, "step": 6728 }, { "epoch": 0.46, "learning_rate": 1.1818539008905385e-05, "loss": 0.8057, "step": 6729 }, { "epoch": 0.46, "learning_rate": 1.1816368509794365e-05, "loss": 0.7627, "step": 6730 }, { "epoch": 0.46, "learning_rate": 1.1814197922189958e-05, "loss": 0.7568, "step": 6731 }, { "epoch": 0.46, "learning_rate": 1.1812027246197917e-05, "loss": 0.8438, "step": 6732 }, { "epoch": 0.46, "learning_rate": 1.1809856481923998e-05, "loss": 0.8291, "step": 6733 }, { "epoch": 0.46, "learning_rate": 1.1807685629473959e-05, "loss": 0.8477, "step": 6734 }, { "epoch": 0.46, "learning_rate": 1.1805514688953562e-05, "loss": 0.8828, "step": 6735 }, { "epoch": 0.46, "learning_rate": 1.1803343660468581e-05, "loss": 0.7803, "step": 6736 }, { "epoch": 0.46, "learning_rate": 1.1801172544124782e-05, "loss": 0.8203, "step": 6737 }, { "epoch": 0.46, "learning_rate": 1.1799001340027944e-05, "loss": 0.7852, "step": 6738 }, { "epoch": 0.46, "learning_rate": 1.1796830048283852e-05, "loss": 0.8486, "step": 6739 }, { "epoch": 0.46, "learning_rate": 1.1794658668998285e-05, "loss": 0.8252, "step": 6740 }, { "epoch": 0.46, "learning_rate": 1.1792487202277037e-05, "loss": 0.8506, "step": 6741 }, { "epoch": 0.46, "learning_rate": 1.1790315648225896e-05, "loss": 0.8916, "step": 6742 }, { "epoch": 0.46, "learning_rate": 1.1788144006950668e-05, "loss": 0.8477, "step": 6743 }, { "epoch": 0.46, "learning_rate": 1.178597227855715e-05, "loss": 0.752, "step": 6744 }, { "epoch": 0.46, "learning_rate": 1.178380046315115e-05, "loss": 0.7969, "step": 6745 }, { "epoch": 0.46, "learning_rate": 1.1781628560838479e-05, "loss": 0.834, "step": 6746 }, { "epoch": 0.46, "learning_rate": 1.1779456571724945e-05, "loss": 0.7998, "step": 6747 }, { "epoch": 0.46, "learning_rate": 1.177728449591638e-05, "loss": 0.8564, "step": 6748 }, { "epoch": 0.46, "learning_rate": 1.1775112333518601e-05, "loss": 0.7822, "step": 6749 }, { "epoch": 0.46, "learning_rate": 1.1772940084637434e-05, "loss": 0.7852, "step": 6750 }, { "epoch": 0.46, "learning_rate": 1.1770767749378716e-05, "loss": 0.7607, "step": 6751 }, { "epoch": 0.46, "learning_rate": 1.1768595327848275e-05, "loss": 0.7764, "step": 6752 }, { "epoch": 0.46, "learning_rate": 1.1766422820151957e-05, "loss": 0.8301, "step": 6753 }, { "epoch": 0.46, "learning_rate": 1.1764250226395607e-05, "loss": 0.8281, "step": 6754 }, { "epoch": 0.46, "learning_rate": 1.1762077546685072e-05, "loss": 0.9316, "step": 6755 }, { "epoch": 0.46, "learning_rate": 1.1759904781126201e-05, "loss": 0.8984, "step": 6756 }, { "epoch": 0.46, "learning_rate": 1.1757731929824859e-05, "loss": 0.8193, "step": 6757 }, { "epoch": 0.46, "learning_rate": 1.1755558992886901e-05, "loss": 0.8096, "step": 6758 }, { "epoch": 0.46, "learning_rate": 1.1753385970418196e-05, "loss": 0.8193, "step": 6759 }, { "epoch": 0.46, "learning_rate": 1.175121286252461e-05, "loss": 0.8086, "step": 6760 }, { "epoch": 0.46, "learning_rate": 1.1749039669312022e-05, "loss": 0.8525, "step": 6761 }, { "epoch": 0.46, "learning_rate": 1.1746866390886304e-05, "loss": 0.793, "step": 6762 }, { "epoch": 0.46, "learning_rate": 1.174469302735334e-05, "loss": 0.792, "step": 6763 }, { "epoch": 0.46, "learning_rate": 1.1742519578819021e-05, "loss": 0.8555, "step": 6764 }, { "epoch": 0.46, "learning_rate": 1.1740346045389225e-05, "loss": 0.749, "step": 6765 }, { "epoch": 0.46, "learning_rate": 1.1738172427169863e-05, "loss": 0.876, "step": 6766 }, { "epoch": 0.46, "learning_rate": 1.1735998724266825e-05, "loss": 0.8281, "step": 6767 }, { "epoch": 0.46, "learning_rate": 1.1733824936786005e-05, "loss": 0.7979, "step": 6768 }, { "epoch": 0.46, "learning_rate": 1.1731651064833327e-05, "loss": 0.8574, "step": 6769 }, { "epoch": 0.46, "learning_rate": 1.172947710851469e-05, "loss": 0.8564, "step": 6770 }, { "epoch": 0.46, "learning_rate": 1.1727303067936013e-05, "loss": 0.7598, "step": 6771 }, { "epoch": 0.46, "learning_rate": 1.1725128943203217e-05, "loss": 0.876, "step": 6772 }, { "epoch": 0.46, "learning_rate": 1.1722954734422221e-05, "loss": 0.834, "step": 6773 }, { "epoch": 0.46, "learning_rate": 1.1720780441698954e-05, "loss": 0.7734, "step": 6774 }, { "epoch": 0.46, "learning_rate": 1.1718606065139346e-05, "loss": 0.7578, "step": 6775 }, { "epoch": 0.46, "learning_rate": 1.171643160484934e-05, "loss": 0.7676, "step": 6776 }, { "epoch": 0.46, "learning_rate": 1.1714257060934864e-05, "loss": 0.7822, "step": 6777 }, { "epoch": 0.46, "learning_rate": 1.171208243350187e-05, "loss": 0.8057, "step": 6778 }, { "epoch": 0.46, "learning_rate": 1.1709907722656303e-05, "loss": 0.8545, "step": 6779 }, { "epoch": 0.46, "learning_rate": 1.1707732928504116e-05, "loss": 0.8252, "step": 6780 }, { "epoch": 0.46, "learning_rate": 1.1705558051151265e-05, "loss": 0.8057, "step": 6781 }, { "epoch": 0.46, "learning_rate": 1.1703383090703709e-05, "loss": 0.7637, "step": 6782 }, { "epoch": 0.46, "learning_rate": 1.1701208047267407e-05, "loss": 0.8428, "step": 6783 }, { "epoch": 0.46, "learning_rate": 1.1699032920948337e-05, "loss": 0.8672, "step": 6784 }, { "epoch": 0.46, "learning_rate": 1.1696857711852464e-05, "loss": 0.8486, "step": 6785 }, { "epoch": 0.46, "learning_rate": 1.1694682420085766e-05, "loss": 0.8223, "step": 6786 }, { "epoch": 0.46, "learning_rate": 1.1692507045754224e-05, "loss": 0.8438, "step": 6787 }, { "epoch": 0.46, "learning_rate": 1.1690331588963821e-05, "loss": 0.751, "step": 6788 }, { "epoch": 0.46, "learning_rate": 1.1688156049820542e-05, "loss": 0.835, "step": 6789 }, { "epoch": 0.46, "learning_rate": 1.1685980428430388e-05, "loss": 0.7812, "step": 6790 }, { "epoch": 0.46, "learning_rate": 1.1683804724899349e-05, "loss": 0.833, "step": 6791 }, { "epoch": 0.46, "learning_rate": 1.1681628939333423e-05, "loss": 0.8447, "step": 6792 }, { "epoch": 0.46, "learning_rate": 1.167945307183862e-05, "loss": 0.8652, "step": 6793 }, { "epoch": 0.46, "learning_rate": 1.1677277122520942e-05, "loss": 0.7891, "step": 6794 }, { "epoch": 0.46, "learning_rate": 1.1675101091486408e-05, "loss": 0.7783, "step": 6795 }, { "epoch": 0.46, "learning_rate": 1.1672924978841027e-05, "loss": 0.9453, "step": 6796 }, { "epoch": 0.46, "learning_rate": 1.1670748784690824e-05, "loss": 0.8135, "step": 6797 }, { "epoch": 0.46, "learning_rate": 1.1668572509141822e-05, "loss": 0.8164, "step": 6798 }, { "epoch": 0.46, "learning_rate": 1.1666396152300047e-05, "loss": 0.8232, "step": 6799 }, { "epoch": 0.46, "learning_rate": 1.1664219714271537e-05, "loss": 0.8262, "step": 6800 }, { "epoch": 0.46, "learning_rate": 1.1662043195162317e-05, "loss": 0.7627, "step": 6801 }, { "epoch": 0.46, "learning_rate": 1.1659866595078442e-05, "loss": 0.8682, "step": 6802 }, { "epoch": 0.46, "learning_rate": 1.1657689914125943e-05, "loss": 0.8701, "step": 6803 }, { "epoch": 0.46, "learning_rate": 1.165551315241087e-05, "loss": 0.7988, "step": 6804 }, { "epoch": 0.46, "learning_rate": 1.165333631003928e-05, "loss": 0.7402, "step": 6805 }, { "epoch": 0.46, "learning_rate": 1.1651159387117226e-05, "loss": 0.7139, "step": 6806 }, { "epoch": 0.46, "learning_rate": 1.1648982383750764e-05, "loss": 0.7295, "step": 6807 }, { "epoch": 0.46, "learning_rate": 1.1646805300045965e-05, "loss": 0.8086, "step": 6808 }, { "epoch": 0.46, "learning_rate": 1.164462813610889e-05, "loss": 0.8691, "step": 6809 }, { "epoch": 0.46, "learning_rate": 1.1642450892045609e-05, "loss": 0.7148, "step": 6810 }, { "epoch": 0.46, "learning_rate": 1.1640273567962205e-05, "loss": 0.7578, "step": 6811 }, { "epoch": 0.46, "learning_rate": 1.1638096163964754e-05, "loss": 0.833, "step": 6812 }, { "epoch": 0.46, "learning_rate": 1.1635918680159333e-05, "loss": 0.8232, "step": 6813 }, { "epoch": 0.46, "learning_rate": 1.1633741116652035e-05, "loss": 0.8467, "step": 6814 }, { "epoch": 0.46, "learning_rate": 1.1631563473548952e-05, "loss": 0.7783, "step": 6815 }, { "epoch": 0.46, "learning_rate": 1.1629385750956175e-05, "loss": 0.8174, "step": 6816 }, { "epoch": 0.46, "learning_rate": 1.1627207948979802e-05, "loss": 0.8564, "step": 6817 }, { "epoch": 0.46, "learning_rate": 1.1625030067725939e-05, "loss": 0.7471, "step": 6818 }, { "epoch": 0.46, "learning_rate": 1.1622852107300688e-05, "loss": 0.7373, "step": 6819 }, { "epoch": 0.46, "learning_rate": 1.1620674067810165e-05, "loss": 0.8037, "step": 6820 }, { "epoch": 0.46, "learning_rate": 1.161849594936048e-05, "loss": 0.8389, "step": 6821 }, { "epoch": 0.46, "learning_rate": 1.1616317752057749e-05, "loss": 0.749, "step": 6822 }, { "epoch": 0.46, "learning_rate": 1.1614139476008098e-05, "loss": 0.8008, "step": 6823 }, { "epoch": 0.47, "learning_rate": 1.1611961121317647e-05, "loss": 0.7461, "step": 6824 }, { "epoch": 0.47, "learning_rate": 1.1609782688092532e-05, "loss": 0.835, "step": 6825 }, { "epoch": 0.47, "learning_rate": 1.1607604176438882e-05, "loss": 0.7666, "step": 6826 }, { "epoch": 0.47, "learning_rate": 1.1605425586462835e-05, "loss": 0.7891, "step": 6827 }, { "epoch": 0.47, "learning_rate": 1.1603246918270532e-05, "loss": 0.7695, "step": 6828 }, { "epoch": 0.47, "learning_rate": 1.1601068171968118e-05, "loss": 0.7969, "step": 6829 }, { "epoch": 0.47, "learning_rate": 1.1598889347661739e-05, "loss": 0.7881, "step": 6830 }, { "epoch": 0.47, "learning_rate": 1.1596710445457549e-05, "loss": 0.8076, "step": 6831 }, { "epoch": 0.47, "learning_rate": 1.1594531465461705e-05, "loss": 0.7744, "step": 6832 }, { "epoch": 0.47, "learning_rate": 1.1592352407780368e-05, "loss": 0.8281, "step": 6833 }, { "epoch": 0.47, "learning_rate": 1.1590173272519695e-05, "loss": 0.8438, "step": 6834 }, { "epoch": 0.47, "learning_rate": 1.1587994059785859e-05, "loss": 0.8018, "step": 6835 }, { "epoch": 0.47, "learning_rate": 1.1585814769685031e-05, "loss": 0.8848, "step": 6836 }, { "epoch": 0.47, "learning_rate": 1.1583635402323383e-05, "loss": 0.8535, "step": 6837 }, { "epoch": 0.47, "learning_rate": 1.1581455957807097e-05, "loss": 0.8486, "step": 6838 }, { "epoch": 0.47, "learning_rate": 1.1579276436242355e-05, "loss": 0.6582, "step": 6839 }, { "epoch": 0.47, "learning_rate": 1.1577096837735338e-05, "loss": 0.7422, "step": 6840 }, { "epoch": 0.47, "learning_rate": 1.1574917162392243e-05, "loss": 0.8779, "step": 6841 }, { "epoch": 0.47, "learning_rate": 1.157273741031926e-05, "loss": 0.7578, "step": 6842 }, { "epoch": 0.47, "learning_rate": 1.1570557581622586e-05, "loss": 0.8359, "step": 6843 }, { "epoch": 0.47, "learning_rate": 1.1568377676408427e-05, "loss": 0.7656, "step": 6844 }, { "epoch": 0.47, "learning_rate": 1.1566197694782978e-05, "loss": 0.8369, "step": 6845 }, { "epoch": 0.47, "learning_rate": 1.1564017636852458e-05, "loss": 0.8857, "step": 6846 }, { "epoch": 0.47, "learning_rate": 1.1561837502723076e-05, "loss": 0.8223, "step": 6847 }, { "epoch": 0.47, "learning_rate": 1.1559657292501044e-05, "loss": 0.71, "step": 6848 }, { "epoch": 0.47, "learning_rate": 1.1557477006292585e-05, "loss": 0.792, "step": 6849 }, { "epoch": 0.47, "learning_rate": 1.1555296644203923e-05, "loss": 0.791, "step": 6850 }, { "epoch": 0.47, "learning_rate": 1.1553116206341283e-05, "loss": 0.8389, "step": 6851 }, { "epoch": 0.47, "learning_rate": 1.1550935692810903e-05, "loss": 0.7656, "step": 6852 }, { "epoch": 0.47, "learning_rate": 1.1548755103719005e-05, "loss": 0.8936, "step": 6853 }, { "epoch": 0.47, "learning_rate": 1.1546574439171836e-05, "loss": 0.8066, "step": 6854 }, { "epoch": 0.47, "learning_rate": 1.1544393699275637e-05, "loss": 0.791, "step": 6855 }, { "epoch": 0.47, "learning_rate": 1.1542212884136652e-05, "loss": 0.8057, "step": 6856 }, { "epoch": 0.47, "learning_rate": 1.154003199386113e-05, "loss": 0.8291, "step": 6857 }, { "epoch": 0.47, "learning_rate": 1.1537851028555323e-05, "loss": 0.8281, "step": 6858 }, { "epoch": 0.47, "learning_rate": 1.153566998832549e-05, "loss": 0.7734, "step": 6859 }, { "epoch": 0.47, "learning_rate": 1.153348887327789e-05, "loss": 0.8262, "step": 6860 }, { "epoch": 0.47, "learning_rate": 1.1531307683518787e-05, "loss": 0.7871, "step": 6861 }, { "epoch": 0.47, "learning_rate": 1.1529126419154448e-05, "loss": 0.8154, "step": 6862 }, { "epoch": 0.47, "learning_rate": 1.1526945080291145e-05, "loss": 0.792, "step": 6863 }, { "epoch": 0.47, "learning_rate": 1.152476366703515e-05, "loss": 0.8418, "step": 6864 }, { "epoch": 0.47, "learning_rate": 1.1522582179492747e-05, "loss": 0.8496, "step": 6865 }, { "epoch": 0.47, "learning_rate": 1.1520400617770211e-05, "loss": 0.8154, "step": 6866 }, { "epoch": 0.47, "learning_rate": 1.1518218981973834e-05, "loss": 0.8086, "step": 6867 }, { "epoch": 0.47, "learning_rate": 1.1516037272209902e-05, "loss": 0.752, "step": 6868 }, { "epoch": 0.47, "learning_rate": 1.1513855488584705e-05, "loss": 0.8408, "step": 6869 }, { "epoch": 0.47, "learning_rate": 1.1511673631204547e-05, "loss": 0.8691, "step": 6870 }, { "epoch": 0.47, "learning_rate": 1.1509491700175719e-05, "loss": 0.75, "step": 6871 }, { "epoch": 0.47, "learning_rate": 1.1507309695604531e-05, "loss": 0.7891, "step": 6872 }, { "epoch": 0.47, "learning_rate": 1.1505127617597289e-05, "loss": 0.7822, "step": 6873 }, { "epoch": 0.47, "learning_rate": 1.1502945466260302e-05, "loss": 0.8291, "step": 6874 }, { "epoch": 0.47, "learning_rate": 1.1500763241699883e-05, "loss": 0.7354, "step": 6875 }, { "epoch": 0.47, "learning_rate": 1.1498580944022356e-05, "loss": 0.8066, "step": 6876 }, { "epoch": 0.47, "learning_rate": 1.1496398573334037e-05, "loss": 0.7393, "step": 6877 }, { "epoch": 0.47, "learning_rate": 1.149421612974125e-05, "loss": 0.7881, "step": 6878 }, { "epoch": 0.47, "learning_rate": 1.1492033613350328e-05, "loss": 0.8018, "step": 6879 }, { "epoch": 0.47, "learning_rate": 1.1489851024267605e-05, "loss": 0.8848, "step": 6880 }, { "epoch": 0.47, "learning_rate": 1.1487668362599407e-05, "loss": 0.7744, "step": 6881 }, { "epoch": 0.47, "learning_rate": 1.148548562845208e-05, "loss": 0.8447, "step": 6882 }, { "epoch": 0.47, "learning_rate": 1.1483302821931969e-05, "loss": 0.9033, "step": 6883 }, { "epoch": 0.47, "learning_rate": 1.1481119943145411e-05, "loss": 0.7881, "step": 6884 }, { "epoch": 0.47, "learning_rate": 1.1478936992198766e-05, "loss": 0.8477, "step": 6885 }, { "epoch": 0.47, "learning_rate": 1.1476753969198381e-05, "loss": 0.8477, "step": 6886 }, { "epoch": 0.47, "learning_rate": 1.1474570874250616e-05, "loss": 0.8086, "step": 6887 }, { "epoch": 0.47, "learning_rate": 1.1472387707461831e-05, "loss": 0.7314, "step": 6888 }, { "epoch": 0.47, "learning_rate": 1.1470204468938387e-05, "loss": 0.8291, "step": 6889 }, { "epoch": 0.47, "learning_rate": 1.1468021158786651e-05, "loss": 0.7393, "step": 6890 }, { "epoch": 0.47, "learning_rate": 1.1465837777113e-05, "loss": 0.8643, "step": 6891 }, { "epoch": 0.47, "learning_rate": 1.1463654324023802e-05, "loss": 0.8174, "step": 6892 }, { "epoch": 0.47, "learning_rate": 1.1461470799625436e-05, "loss": 0.8252, "step": 6893 }, { "epoch": 0.47, "learning_rate": 1.1459287204024284e-05, "loss": 0.7139, "step": 6894 }, { "epoch": 0.47, "learning_rate": 1.1457103537326733e-05, "loss": 0.8379, "step": 6895 }, { "epoch": 0.47, "learning_rate": 1.1454919799639167e-05, "loss": 0.8096, "step": 6896 }, { "epoch": 0.47, "learning_rate": 1.1452735991067976e-05, "loss": 0.7793, "step": 6897 }, { "epoch": 0.47, "learning_rate": 1.1450552111719564e-05, "loss": 0.791, "step": 6898 }, { "epoch": 0.47, "learning_rate": 1.144836816170032e-05, "loss": 0.75, "step": 6899 }, { "epoch": 0.47, "learning_rate": 1.144618414111665e-05, "loss": 0.8428, "step": 6900 }, { "epoch": 0.47, "learning_rate": 1.144400005007496e-05, "loss": 0.7383, "step": 6901 }, { "epoch": 0.47, "learning_rate": 1.1441815888681658e-05, "loss": 0.9434, "step": 6902 }, { "epoch": 0.47, "learning_rate": 1.1439631657043157e-05, "loss": 0.8252, "step": 6903 }, { "epoch": 0.47, "learning_rate": 1.143744735526587e-05, "loss": 0.708, "step": 6904 }, { "epoch": 0.47, "learning_rate": 1.143526298345622e-05, "loss": 0.7666, "step": 6905 }, { "epoch": 0.47, "learning_rate": 1.1433078541720628e-05, "loss": 0.8252, "step": 6906 }, { "epoch": 0.47, "learning_rate": 1.1430894030165518e-05, "loss": 0.7988, "step": 6907 }, { "epoch": 0.47, "learning_rate": 1.1428709448897319e-05, "loss": 0.8613, "step": 6908 }, { "epoch": 0.47, "learning_rate": 1.142652479802247e-05, "loss": 0.7725, "step": 6909 }, { "epoch": 0.47, "learning_rate": 1.1424340077647398e-05, "loss": 0.8828, "step": 6910 }, { "epoch": 0.47, "learning_rate": 1.1422155287878547e-05, "loss": 0.8477, "step": 6911 }, { "epoch": 0.47, "learning_rate": 1.141997042882236e-05, "loss": 0.8291, "step": 6912 }, { "epoch": 0.47, "learning_rate": 1.1417785500585286e-05, "loss": 0.7578, "step": 6913 }, { "epoch": 0.47, "learning_rate": 1.141560050327377e-05, "loss": 0.9014, "step": 6914 }, { "epoch": 0.47, "learning_rate": 1.1413415436994265e-05, "loss": 0.7822, "step": 6915 }, { "epoch": 0.47, "learning_rate": 1.141123030185323e-05, "loss": 0.7959, "step": 6916 }, { "epoch": 0.47, "learning_rate": 1.1409045097957123e-05, "loss": 0.8252, "step": 6917 }, { "epoch": 0.47, "learning_rate": 1.1406859825412408e-05, "loss": 0.8076, "step": 6918 }, { "epoch": 0.47, "learning_rate": 1.1404674484325553e-05, "loss": 0.8027, "step": 6919 }, { "epoch": 0.47, "learning_rate": 1.140248907480302e-05, "loss": 0.8477, "step": 6920 }, { "epoch": 0.47, "learning_rate": 1.1400303596951292e-05, "loss": 0.8447, "step": 6921 }, { "epoch": 0.47, "learning_rate": 1.139811805087684e-05, "loss": 0.875, "step": 6922 }, { "epoch": 0.47, "learning_rate": 1.1395932436686143e-05, "loss": 0.873, "step": 6923 }, { "epoch": 0.47, "learning_rate": 1.139374675448569e-05, "loss": 0.7959, "step": 6924 }, { "epoch": 0.47, "learning_rate": 1.1391561004381962e-05, "loss": 0.8066, "step": 6925 }, { "epoch": 0.47, "learning_rate": 1.1389375186481447e-05, "loss": 0.8213, "step": 6926 }, { "epoch": 0.47, "learning_rate": 1.1387189300890645e-05, "loss": 0.918, "step": 6927 }, { "epoch": 0.47, "learning_rate": 1.1385003347716044e-05, "loss": 0.7275, "step": 6928 }, { "epoch": 0.47, "learning_rate": 1.1382817327064146e-05, "loss": 0.8232, "step": 6929 }, { "epoch": 0.47, "learning_rate": 1.1380631239041458e-05, "loss": 0.8057, "step": 6930 }, { "epoch": 0.47, "learning_rate": 1.1378445083754483e-05, "loss": 0.8193, "step": 6931 }, { "epoch": 0.47, "learning_rate": 1.1376258861309733e-05, "loss": 0.8213, "step": 6932 }, { "epoch": 0.47, "learning_rate": 1.1374072571813715e-05, "loss": 0.791, "step": 6933 }, { "epoch": 0.47, "learning_rate": 1.1371886215372952e-05, "loss": 0.8496, "step": 6934 }, { "epoch": 0.47, "learning_rate": 1.1369699792093956e-05, "loss": 0.7568, "step": 6935 }, { "epoch": 0.47, "learning_rate": 1.1367513302083253e-05, "loss": 0.7949, "step": 6936 }, { "epoch": 0.47, "learning_rate": 1.1365326745447372e-05, "loss": 0.8008, "step": 6937 }, { "epoch": 0.47, "learning_rate": 1.1363140122292832e-05, "loss": 0.8115, "step": 6938 }, { "epoch": 0.47, "learning_rate": 1.1360953432726178e-05, "loss": 0.7344, "step": 6939 }, { "epoch": 0.47, "learning_rate": 1.1358766676853936e-05, "loss": 0.7754, "step": 6940 }, { "epoch": 0.47, "learning_rate": 1.1356579854782648e-05, "loss": 0.8506, "step": 6941 }, { "epoch": 0.47, "learning_rate": 1.1354392966618857e-05, "loss": 0.8379, "step": 6942 }, { "epoch": 0.47, "learning_rate": 1.1352206012469107e-05, "loss": 0.7402, "step": 6943 }, { "epoch": 0.47, "learning_rate": 1.1350018992439945e-05, "loss": 0.8037, "step": 6944 }, { "epoch": 0.47, "learning_rate": 1.1347831906637925e-05, "loss": 0.7529, "step": 6945 }, { "epoch": 0.47, "learning_rate": 1.1345644755169597e-05, "loss": 0.8262, "step": 6946 }, { "epoch": 0.47, "learning_rate": 1.1343457538141524e-05, "loss": 0.8555, "step": 6947 }, { "epoch": 0.47, "learning_rate": 1.1341270255660263e-05, "loss": 0.8164, "step": 6948 }, { "epoch": 0.47, "learning_rate": 1.1339082907832386e-05, "loss": 0.7939, "step": 6949 }, { "epoch": 0.47, "learning_rate": 1.1336895494764451e-05, "loss": 0.8408, "step": 6950 }, { "epoch": 0.47, "learning_rate": 1.1334708016563032e-05, "loss": 0.8467, "step": 6951 }, { "epoch": 0.47, "learning_rate": 1.1332520473334708e-05, "loss": 0.7549, "step": 6952 }, { "epoch": 0.47, "learning_rate": 1.1330332865186047e-05, "loss": 0.8525, "step": 6953 }, { "epoch": 0.47, "learning_rate": 1.1328145192223637e-05, "loss": 0.7939, "step": 6954 }, { "epoch": 0.47, "learning_rate": 1.1325957454554055e-05, "loss": 0.835, "step": 6955 }, { "epoch": 0.47, "learning_rate": 1.132376965228389e-05, "loss": 0.8135, "step": 6956 }, { "epoch": 0.47, "learning_rate": 1.1321581785519736e-05, "loss": 0.7363, "step": 6957 }, { "epoch": 0.47, "learning_rate": 1.1319393854368181e-05, "loss": 0.9062, "step": 6958 }, { "epoch": 0.47, "learning_rate": 1.1317205858935818e-05, "loss": 0.8574, "step": 6959 }, { "epoch": 0.47, "learning_rate": 1.1315017799329254e-05, "loss": 0.7998, "step": 6960 }, { "epoch": 0.47, "learning_rate": 1.1312829675655084e-05, "loss": 0.7988, "step": 6961 }, { "epoch": 0.47, "learning_rate": 1.1310641488019915e-05, "loss": 0.833, "step": 6962 }, { "epoch": 0.47, "learning_rate": 1.1308453236530364e-05, "loss": 0.8486, "step": 6963 }, { "epoch": 0.47, "learning_rate": 1.1306264921293026e-05, "loss": 0.8652, "step": 6964 }, { "epoch": 0.47, "learning_rate": 1.1304076542414531e-05, "loss": 0.8418, "step": 6965 }, { "epoch": 0.47, "learning_rate": 1.1301888100001487e-05, "loss": 0.8555, "step": 6966 }, { "epoch": 0.47, "learning_rate": 1.1299699594160517e-05, "loss": 0.752, "step": 6967 }, { "epoch": 0.47, "learning_rate": 1.1297511024998253e-05, "loss": 0.7109, "step": 6968 }, { "epoch": 0.47, "learning_rate": 1.1295322392621308e-05, "loss": 0.8379, "step": 6969 }, { "epoch": 0.47, "learning_rate": 1.1293133697136322e-05, "loss": 0.8633, "step": 6970 }, { "epoch": 0.48, "learning_rate": 1.1290944938649927e-05, "loss": 0.7773, "step": 6971 }, { "epoch": 0.48, "learning_rate": 1.1288756117268756e-05, "loss": 0.8193, "step": 6972 }, { "epoch": 0.48, "learning_rate": 1.128656723309945e-05, "loss": 0.8984, "step": 6973 }, { "epoch": 0.48, "learning_rate": 1.128437828624865e-05, "loss": 0.7861, "step": 6974 }, { "epoch": 0.48, "learning_rate": 1.1282189276823005e-05, "loss": 0.8398, "step": 6975 }, { "epoch": 0.48, "learning_rate": 1.1280000204929158e-05, "loss": 0.7822, "step": 6976 }, { "epoch": 0.48, "learning_rate": 1.1277811070673765e-05, "loss": 0.8418, "step": 6977 }, { "epoch": 0.48, "learning_rate": 1.127562187416348e-05, "loss": 0.8262, "step": 6978 }, { "epoch": 0.48, "learning_rate": 1.1273432615504958e-05, "loss": 0.8359, "step": 6979 }, { "epoch": 0.48, "learning_rate": 1.1271243294804861e-05, "loss": 0.8291, "step": 6980 }, { "epoch": 0.48, "learning_rate": 1.1269053912169854e-05, "loss": 0.8271, "step": 6981 }, { "epoch": 0.48, "learning_rate": 1.12668644677066e-05, "loss": 0.8584, "step": 6982 }, { "epoch": 0.48, "learning_rate": 1.1264674961521774e-05, "loss": 0.7939, "step": 6983 }, { "epoch": 0.48, "learning_rate": 1.1262485393722044e-05, "loss": 0.7539, "step": 6984 }, { "epoch": 0.48, "learning_rate": 1.1260295764414085e-05, "loss": 0.7617, "step": 6985 }, { "epoch": 0.48, "learning_rate": 1.125810607370458e-05, "loss": 0.8809, "step": 6986 }, { "epoch": 0.48, "learning_rate": 1.1255916321700209e-05, "loss": 0.8408, "step": 6987 }, { "epoch": 0.48, "learning_rate": 1.1253726508507654e-05, "loss": 0.7539, "step": 6988 }, { "epoch": 0.48, "learning_rate": 1.1251536634233608e-05, "loss": 0.8311, "step": 6989 }, { "epoch": 0.48, "learning_rate": 1.1249346698984756e-05, "loss": 0.8223, "step": 6990 }, { "epoch": 0.48, "learning_rate": 1.1247156702867792e-05, "loss": 0.8965, "step": 6991 }, { "epoch": 0.48, "learning_rate": 1.1244966645989417e-05, "loss": 0.8408, "step": 6992 }, { "epoch": 0.48, "learning_rate": 1.1242776528456327e-05, "loss": 0.8721, "step": 6993 }, { "epoch": 0.48, "learning_rate": 1.1240586350375225e-05, "loss": 0.834, "step": 6994 }, { "epoch": 0.48, "learning_rate": 1.1238396111852816e-05, "loss": 0.8496, "step": 6995 }, { "epoch": 0.48, "learning_rate": 1.123620581299581e-05, "loss": 0.8916, "step": 6996 }, { "epoch": 0.48, "learning_rate": 1.1234015453910918e-05, "loss": 0.7988, "step": 6997 }, { "epoch": 0.48, "learning_rate": 1.123182503470485e-05, "loss": 0.7949, "step": 6998 }, { "epoch": 0.48, "learning_rate": 1.122963455548433e-05, "loss": 0.8311, "step": 6999 }, { "epoch": 0.48, "learning_rate": 1.1227444016356071e-05, "loss": 0.8057, "step": 7000 }, { "epoch": 0.48, "learning_rate": 1.12252534174268e-05, "loss": 0.8965, "step": 7001 }, { "epoch": 0.48, "learning_rate": 1.1223062758803245e-05, "loss": 0.7324, "step": 7002 }, { "epoch": 0.48, "learning_rate": 1.1220872040592127e-05, "loss": 0.8389, "step": 7003 }, { "epoch": 0.48, "learning_rate": 1.1218681262900188e-05, "loss": 0.8096, "step": 7004 }, { "epoch": 0.48, "learning_rate": 1.1216490425834155e-05, "loss": 0.8105, "step": 7005 }, { "epoch": 0.48, "learning_rate": 1.1214299529500767e-05, "loss": 0.7861, "step": 7006 }, { "epoch": 0.48, "learning_rate": 1.1212108574006768e-05, "loss": 0.7959, "step": 7007 }, { "epoch": 0.48, "learning_rate": 1.1209917559458896e-05, "loss": 0.832, "step": 7008 }, { "epoch": 0.48, "learning_rate": 1.1207726485963899e-05, "loss": 0.7676, "step": 7009 }, { "epoch": 0.48, "learning_rate": 1.1205535353628528e-05, "loss": 0.8154, "step": 7010 }, { "epoch": 0.48, "learning_rate": 1.1203344162559533e-05, "loss": 0.7725, "step": 7011 }, { "epoch": 0.48, "learning_rate": 1.120115291286367e-05, "loss": 0.7607, "step": 7012 }, { "epoch": 0.48, "learning_rate": 1.1198961604647694e-05, "loss": 0.8291, "step": 7013 }, { "epoch": 0.48, "learning_rate": 1.1196770238018368e-05, "loss": 0.8018, "step": 7014 }, { "epoch": 0.48, "learning_rate": 1.1194578813082455e-05, "loss": 0.75, "step": 7015 }, { "epoch": 0.48, "learning_rate": 1.1192387329946718e-05, "loss": 0.832, "step": 7016 }, { "epoch": 0.48, "learning_rate": 1.1190195788717932e-05, "loss": 0.8604, "step": 7017 }, { "epoch": 0.48, "learning_rate": 1.1188004189502859e-05, "loss": 0.8672, "step": 7018 }, { "epoch": 0.48, "learning_rate": 1.1185812532408287e-05, "loss": 0.8477, "step": 7019 }, { "epoch": 0.48, "learning_rate": 1.1183620817540985e-05, "loss": 0.8018, "step": 7020 }, { "epoch": 0.48, "learning_rate": 1.118142904500773e-05, "loss": 0.8369, "step": 7021 }, { "epoch": 0.48, "learning_rate": 1.1179237214915312e-05, "loss": 0.7666, "step": 7022 }, { "epoch": 0.48, "learning_rate": 1.1177045327370516e-05, "loss": 0.8291, "step": 7023 }, { "epoch": 0.48, "learning_rate": 1.1174853382480126e-05, "loss": 0.7979, "step": 7024 }, { "epoch": 0.48, "learning_rate": 1.117266138035094e-05, "loss": 0.7705, "step": 7025 }, { "epoch": 0.48, "learning_rate": 1.1170469321089747e-05, "loss": 0.8369, "step": 7026 }, { "epoch": 0.48, "learning_rate": 1.1168277204803344e-05, "loss": 0.8174, "step": 7027 }, { "epoch": 0.48, "learning_rate": 1.1166085031598537e-05, "loss": 0.8291, "step": 7028 }, { "epoch": 0.48, "learning_rate": 1.1163892801582121e-05, "loss": 0.7441, "step": 7029 }, { "epoch": 0.48, "learning_rate": 1.1161700514860905e-05, "loss": 0.8857, "step": 7030 }, { "epoch": 0.48, "learning_rate": 1.1159508171541696e-05, "loss": 0.708, "step": 7031 }, { "epoch": 0.48, "learning_rate": 1.1157315771731307e-05, "loss": 0.749, "step": 7032 }, { "epoch": 0.48, "learning_rate": 1.1155123315536546e-05, "loss": 0.8613, "step": 7033 }, { "epoch": 0.48, "learning_rate": 1.1152930803064238e-05, "loss": 0.7451, "step": 7034 }, { "epoch": 0.48, "learning_rate": 1.1150738234421197e-05, "loss": 0.8652, "step": 7035 }, { "epoch": 0.48, "learning_rate": 1.1148545609714241e-05, "loss": 0.8242, "step": 7036 }, { "epoch": 0.48, "learning_rate": 1.1146352929050203e-05, "loss": 0.793, "step": 7037 }, { "epoch": 0.48, "learning_rate": 1.1144160192535906e-05, "loss": 0.791, "step": 7038 }, { "epoch": 0.48, "learning_rate": 1.1141967400278178e-05, "loss": 0.7979, "step": 7039 }, { "epoch": 0.48, "learning_rate": 1.1139774552383858e-05, "loss": 0.8193, "step": 7040 }, { "epoch": 0.48, "learning_rate": 1.1137581648959774e-05, "loss": 0.791, "step": 7041 }, { "epoch": 0.48, "learning_rate": 1.1135388690112768e-05, "loss": 0.9131, "step": 7042 }, { "epoch": 0.48, "learning_rate": 1.1133195675949682e-05, "loss": 0.8232, "step": 7043 }, { "epoch": 0.48, "learning_rate": 1.1131002606577357e-05, "loss": 0.6846, "step": 7044 }, { "epoch": 0.48, "learning_rate": 1.1128809482102638e-05, "loss": 0.7607, "step": 7045 }, { "epoch": 0.48, "learning_rate": 1.112661630263238e-05, "loss": 0.8496, "step": 7046 }, { "epoch": 0.48, "learning_rate": 1.1124423068273428e-05, "loss": 0.8281, "step": 7047 }, { "epoch": 0.48, "learning_rate": 1.1122229779132639e-05, "loss": 0.8018, "step": 7048 }, { "epoch": 0.48, "learning_rate": 1.112003643531687e-05, "loss": 0.7656, "step": 7049 }, { "epoch": 0.48, "learning_rate": 1.1117843036932983e-05, "loss": 0.8428, "step": 7050 }, { "epoch": 0.48, "learning_rate": 1.1115649584087833e-05, "loss": 0.8203, "step": 7051 }, { "epoch": 0.48, "learning_rate": 1.1113456076888294e-05, "loss": 0.8359, "step": 7052 }, { "epoch": 0.48, "learning_rate": 1.1111262515441228e-05, "loss": 0.7686, "step": 7053 }, { "epoch": 0.48, "learning_rate": 1.1109068899853506e-05, "loss": 0.8965, "step": 7054 }, { "epoch": 0.48, "learning_rate": 1.1106875230231999e-05, "loss": 0.8037, "step": 7055 }, { "epoch": 0.48, "learning_rate": 1.110468150668359e-05, "loss": 0.8555, "step": 7056 }, { "epoch": 0.48, "learning_rate": 1.1102487729315146e-05, "loss": 0.8252, "step": 7057 }, { "epoch": 0.48, "learning_rate": 1.1100293898233558e-05, "loss": 0.7949, "step": 7058 }, { "epoch": 0.48, "learning_rate": 1.1098100013545703e-05, "loss": 0.8213, "step": 7059 }, { "epoch": 0.48, "learning_rate": 1.109590607535847e-05, "loss": 0.8311, "step": 7060 }, { "epoch": 0.48, "learning_rate": 1.1093712083778748e-05, "loss": 0.7646, "step": 7061 }, { "epoch": 0.48, "learning_rate": 1.1091518038913422e-05, "loss": 0.7832, "step": 7062 }, { "epoch": 0.48, "learning_rate": 1.1089323940869392e-05, "loss": 0.8008, "step": 7063 }, { "epoch": 0.48, "learning_rate": 1.1087129789753554e-05, "loss": 0.8359, "step": 7064 }, { "epoch": 0.48, "learning_rate": 1.1084935585672807e-05, "loss": 0.8203, "step": 7065 }, { "epoch": 0.48, "learning_rate": 1.1082741328734048e-05, "loss": 0.8477, "step": 7066 }, { "epoch": 0.48, "learning_rate": 1.1080547019044186e-05, "loss": 0.8447, "step": 7067 }, { "epoch": 0.48, "learning_rate": 1.1078352656710125e-05, "loss": 0.835, "step": 7068 }, { "epoch": 0.48, "learning_rate": 1.1076158241838776e-05, "loss": 0.9111, "step": 7069 }, { "epoch": 0.48, "learning_rate": 1.1073963774537049e-05, "loss": 0.7783, "step": 7070 }, { "epoch": 0.48, "learning_rate": 1.1071769254911862e-05, "loss": 0.8281, "step": 7071 }, { "epoch": 0.48, "learning_rate": 1.1069574683070125e-05, "loss": 0.8242, "step": 7072 }, { "epoch": 0.48, "learning_rate": 1.1067380059118765e-05, "loss": 0.6338, "step": 7073 }, { "epoch": 0.48, "learning_rate": 1.1065185383164701e-05, "loss": 0.7979, "step": 7074 }, { "epoch": 0.48, "learning_rate": 1.1062990655314851e-05, "loss": 0.9355, "step": 7075 }, { "epoch": 0.48, "learning_rate": 1.1060795875676153e-05, "loss": 0.8486, "step": 7076 }, { "epoch": 0.48, "learning_rate": 1.1058601044355533e-05, "loss": 0.7832, "step": 7077 }, { "epoch": 0.48, "learning_rate": 1.1056406161459919e-05, "loss": 0.8447, "step": 7078 }, { "epoch": 0.48, "learning_rate": 1.105421122709625e-05, "loss": 0.8203, "step": 7079 }, { "epoch": 0.48, "learning_rate": 1.1052016241371456e-05, "loss": 0.8496, "step": 7080 }, { "epoch": 0.48, "learning_rate": 1.104982120439249e-05, "loss": 0.8174, "step": 7081 }, { "epoch": 0.48, "learning_rate": 1.1047626116266284e-05, "loss": 0.7939, "step": 7082 }, { "epoch": 0.48, "learning_rate": 1.104543097709978e-05, "loss": 0.7998, "step": 7083 }, { "epoch": 0.48, "learning_rate": 1.1043235786999935e-05, "loss": 0.8486, "step": 7084 }, { "epoch": 0.48, "learning_rate": 1.1041040546073692e-05, "loss": 0.8086, "step": 7085 }, { "epoch": 0.48, "learning_rate": 1.1038845254428004e-05, "loss": 0.7988, "step": 7086 }, { "epoch": 0.48, "learning_rate": 1.1036649912169826e-05, "loss": 0.8262, "step": 7087 }, { "epoch": 0.48, "learning_rate": 1.1034454519406114e-05, "loss": 0.874, "step": 7088 }, { "epoch": 0.48, "learning_rate": 1.103225907624383e-05, "loss": 0.8379, "step": 7089 }, { "epoch": 0.48, "learning_rate": 1.1030063582789933e-05, "loss": 0.7773, "step": 7090 }, { "epoch": 0.48, "learning_rate": 1.1027868039151388e-05, "loss": 0.876, "step": 7091 }, { "epoch": 0.48, "learning_rate": 1.1025672445435162e-05, "loss": 0.8623, "step": 7092 }, { "epoch": 0.48, "learning_rate": 1.1023476801748224e-05, "loss": 0.7891, "step": 7093 }, { "epoch": 0.48, "learning_rate": 1.102128110819755e-05, "loss": 0.8428, "step": 7094 }, { "epoch": 0.48, "learning_rate": 1.1019085364890108e-05, "loss": 0.8447, "step": 7095 }, { "epoch": 0.48, "learning_rate": 1.1016889571932876e-05, "loss": 0.873, "step": 7096 }, { "epoch": 0.48, "learning_rate": 1.1014693729432835e-05, "loss": 0.7832, "step": 7097 }, { "epoch": 0.48, "learning_rate": 1.1012497837496962e-05, "loss": 0.8408, "step": 7098 }, { "epoch": 0.48, "learning_rate": 1.1010301896232246e-05, "loss": 0.8789, "step": 7099 }, { "epoch": 0.48, "learning_rate": 1.1008105905745672e-05, "loss": 0.875, "step": 7100 }, { "epoch": 0.48, "learning_rate": 1.1005909866144225e-05, "loss": 0.8281, "step": 7101 }, { "epoch": 0.48, "learning_rate": 1.1003713777534898e-05, "loss": 0.7969, "step": 7102 }, { "epoch": 0.48, "learning_rate": 1.1001517640024686e-05, "loss": 0.7617, "step": 7103 }, { "epoch": 0.48, "learning_rate": 1.0999321453720583e-05, "loss": 0.79, "step": 7104 }, { "epoch": 0.48, "learning_rate": 1.099712521872959e-05, "loss": 0.8154, "step": 7105 }, { "epoch": 0.48, "learning_rate": 1.0994928935158703e-05, "loss": 0.8066, "step": 7106 }, { "epoch": 0.48, "learning_rate": 1.0992732603114926e-05, "loss": 0.7793, "step": 7107 }, { "epoch": 0.48, "learning_rate": 1.0990536222705268e-05, "loss": 0.8467, "step": 7108 }, { "epoch": 0.48, "learning_rate": 1.0988339794036731e-05, "loss": 0.8447, "step": 7109 }, { "epoch": 0.48, "learning_rate": 1.0986143317216326e-05, "loss": 0.8115, "step": 7110 }, { "epoch": 0.48, "learning_rate": 1.0983946792351068e-05, "loss": 0.8799, "step": 7111 }, { "epoch": 0.48, "learning_rate": 1.0981750219547972e-05, "loss": 0.8604, "step": 7112 }, { "epoch": 0.48, "learning_rate": 1.0979553598914053e-05, "loss": 0.7334, "step": 7113 }, { "epoch": 0.48, "learning_rate": 1.0977356930556327e-05, "loss": 0.8672, "step": 7114 }, { "epoch": 0.48, "learning_rate": 1.0975160214581823e-05, "loss": 0.8096, "step": 7115 }, { "epoch": 0.48, "learning_rate": 1.0972963451097557e-05, "loss": 0.8408, "step": 7116 }, { "epoch": 0.49, "learning_rate": 1.0970766640210562e-05, "loss": 0.8174, "step": 7117 }, { "epoch": 0.49, "learning_rate": 1.0968569782027865e-05, "loss": 0.8154, "step": 7118 }, { "epoch": 0.49, "learning_rate": 1.096637287665649e-05, "loss": 0.7539, "step": 7119 }, { "epoch": 0.49, "learning_rate": 1.0964175924203482e-05, "loss": 0.8613, "step": 7120 }, { "epoch": 0.49, "learning_rate": 1.0961978924775865e-05, "loss": 0.833, "step": 7121 }, { "epoch": 0.49, "learning_rate": 1.0959781878480685e-05, "loss": 0.791, "step": 7122 }, { "epoch": 0.49, "learning_rate": 1.0957584785424978e-05, "loss": 0.8018, "step": 7123 }, { "epoch": 0.49, "learning_rate": 1.0955387645715785e-05, "loss": 0.8271, "step": 7124 }, { "epoch": 0.49, "learning_rate": 1.0953190459460152e-05, "loss": 0.8564, "step": 7125 }, { "epoch": 0.49, "learning_rate": 1.095099322676513e-05, "loss": 0.8174, "step": 7126 }, { "epoch": 0.49, "learning_rate": 1.0948795947737762e-05, "loss": 0.8105, "step": 7127 }, { "epoch": 0.49, "learning_rate": 1.0946598622485103e-05, "loss": 0.7793, "step": 7128 }, { "epoch": 0.49, "learning_rate": 1.0944401251114202e-05, "loss": 0.8545, "step": 7129 }, { "epoch": 0.49, "learning_rate": 1.0942203833732124e-05, "loss": 0.835, "step": 7130 }, { "epoch": 0.49, "learning_rate": 1.0940006370445917e-05, "loss": 0.8682, "step": 7131 }, { "epoch": 0.49, "learning_rate": 1.0937808861362645e-05, "loss": 0.7881, "step": 7132 }, { "epoch": 0.49, "learning_rate": 1.0935611306589373e-05, "loss": 0.7334, "step": 7133 }, { "epoch": 0.49, "learning_rate": 1.0933413706233163e-05, "loss": 0.8047, "step": 7134 }, { "epoch": 0.49, "learning_rate": 1.0931216060401083e-05, "loss": 0.7793, "step": 7135 }, { "epoch": 0.49, "learning_rate": 1.0929018369200202e-05, "loss": 0.8447, "step": 7136 }, { "epoch": 0.49, "learning_rate": 1.0926820632737589e-05, "loss": 0.8398, "step": 7137 }, { "epoch": 0.49, "learning_rate": 1.0924622851120324e-05, "loss": 0.8574, "step": 7138 }, { "epoch": 0.49, "learning_rate": 1.0922425024455477e-05, "loss": 0.7188, "step": 7139 }, { "epoch": 0.49, "learning_rate": 1.0920227152850124e-05, "loss": 0.7676, "step": 7140 }, { "epoch": 0.49, "learning_rate": 1.0918029236411357e-05, "loss": 0.833, "step": 7141 }, { "epoch": 0.49, "learning_rate": 1.0915831275246242e-05, "loss": 0.8662, "step": 7142 }, { "epoch": 0.49, "learning_rate": 1.0913633269461876e-05, "loss": 0.8633, "step": 7143 }, { "epoch": 0.49, "learning_rate": 1.0911435219165343e-05, "loss": 0.7764, "step": 7144 }, { "epoch": 0.49, "learning_rate": 1.090923712446373e-05, "loss": 0.7998, "step": 7145 }, { "epoch": 0.49, "learning_rate": 1.0907038985464126e-05, "loss": 0.7383, "step": 7146 }, { "epoch": 0.49, "learning_rate": 1.0904840802273628e-05, "loss": 0.8301, "step": 7147 }, { "epoch": 0.49, "learning_rate": 1.0902642574999334e-05, "loss": 0.8389, "step": 7148 }, { "epoch": 0.49, "learning_rate": 1.0900444303748333e-05, "loss": 0.752, "step": 7149 }, { "epoch": 0.49, "learning_rate": 1.089824598862773e-05, "loss": 0.7373, "step": 7150 }, { "epoch": 0.49, "learning_rate": 1.0896047629744628e-05, "loss": 0.8447, "step": 7151 }, { "epoch": 0.49, "learning_rate": 1.0893849227206129e-05, "loss": 0.8496, "step": 7152 }, { "epoch": 0.49, "learning_rate": 1.0891650781119338e-05, "loss": 0.7666, "step": 7153 }, { "epoch": 0.49, "learning_rate": 1.0889452291591367e-05, "loss": 0.7734, "step": 7154 }, { "epoch": 0.49, "learning_rate": 1.088725375872932e-05, "loss": 0.8008, "step": 7155 }, { "epoch": 0.49, "learning_rate": 1.0885055182640316e-05, "loss": 0.8867, "step": 7156 }, { "epoch": 0.49, "learning_rate": 1.0882856563431465e-05, "loss": 0.8232, "step": 7157 }, { "epoch": 0.49, "learning_rate": 1.0880657901209886e-05, "loss": 0.8115, "step": 7158 }, { "epoch": 0.49, "learning_rate": 1.0878459196082698e-05, "loss": 0.7949, "step": 7159 }, { "epoch": 0.49, "learning_rate": 1.087626044815702e-05, "loss": 0.79, "step": 7160 }, { "epoch": 0.49, "learning_rate": 1.0874061657539974e-05, "loss": 0.7949, "step": 7161 }, { "epoch": 0.49, "learning_rate": 1.0871862824338688e-05, "loss": 0.8701, "step": 7162 }, { "epoch": 0.49, "learning_rate": 1.0869663948660288e-05, "loss": 0.7285, "step": 7163 }, { "epoch": 0.49, "learning_rate": 1.0867465030611901e-05, "loss": 0.7188, "step": 7164 }, { "epoch": 0.49, "learning_rate": 1.0865266070300661e-05, "loss": 0.8213, "step": 7165 }, { "epoch": 0.49, "learning_rate": 1.0863067067833704e-05, "loss": 0.752, "step": 7166 }, { "epoch": 0.49, "learning_rate": 1.0860868023318157e-05, "loss": 0.8887, "step": 7167 }, { "epoch": 0.49, "learning_rate": 1.0858668936861163e-05, "loss": 0.79, "step": 7168 }, { "epoch": 0.49, "learning_rate": 1.0856469808569862e-05, "loss": 0.7949, "step": 7169 }, { "epoch": 0.49, "learning_rate": 1.0854270638551391e-05, "loss": 0.8672, "step": 7170 }, { "epoch": 0.49, "learning_rate": 1.0852071426912898e-05, "loss": 0.749, "step": 7171 }, { "epoch": 0.49, "learning_rate": 1.0849872173761526e-05, "loss": 0.8291, "step": 7172 }, { "epoch": 0.49, "learning_rate": 1.0847672879204422e-05, "loss": 0.7832, "step": 7173 }, { "epoch": 0.49, "learning_rate": 1.084547354334874e-05, "loss": 0.7129, "step": 7174 }, { "epoch": 0.49, "learning_rate": 1.0843274166301626e-05, "loss": 0.9053, "step": 7175 }, { "epoch": 0.49, "learning_rate": 1.0841074748170236e-05, "loss": 0.7949, "step": 7176 }, { "epoch": 0.49, "learning_rate": 1.0838875289061725e-05, "loss": 0.793, "step": 7177 }, { "epoch": 0.49, "learning_rate": 1.0836675789083252e-05, "loss": 0.8955, "step": 7178 }, { "epoch": 0.49, "learning_rate": 1.0834476248341971e-05, "loss": 0.7393, "step": 7179 }, { "epoch": 0.49, "learning_rate": 1.0832276666945054e-05, "loss": 0.8623, "step": 7180 }, { "epoch": 0.49, "learning_rate": 1.0830077044999654e-05, "loss": 0.8389, "step": 7181 }, { "epoch": 0.49, "learning_rate": 1.0827877382612941e-05, "loss": 0.7383, "step": 7182 }, { "epoch": 0.49, "learning_rate": 1.0825677679892084e-05, "loss": 0.8203, "step": 7183 }, { "epoch": 0.49, "learning_rate": 1.0823477936944254e-05, "loss": 0.7842, "step": 7184 }, { "epoch": 0.49, "learning_rate": 1.0821278153876614e-05, "loss": 0.7998, "step": 7185 }, { "epoch": 0.49, "learning_rate": 1.0819078330796342e-05, "loss": 0.7764, "step": 7186 }, { "epoch": 0.49, "learning_rate": 1.0816878467810616e-05, "loss": 0.7861, "step": 7187 }, { "epoch": 0.49, "learning_rate": 1.081467856502661e-05, "loss": 0.71, "step": 7188 }, { "epoch": 0.49, "learning_rate": 1.0812478622551505e-05, "loss": 0.8125, "step": 7189 }, { "epoch": 0.49, "learning_rate": 1.0810278640492483e-05, "loss": 0.7441, "step": 7190 }, { "epoch": 0.49, "learning_rate": 1.080807861895672e-05, "loss": 0.7031, "step": 7191 }, { "epoch": 0.49, "learning_rate": 1.080587855805141e-05, "loss": 0.8486, "step": 7192 }, { "epoch": 0.49, "learning_rate": 1.0803678457883735e-05, "loss": 0.7803, "step": 7193 }, { "epoch": 0.49, "learning_rate": 1.0801478318560883e-05, "loss": 0.7949, "step": 7194 }, { "epoch": 0.49, "learning_rate": 1.0799278140190048e-05, "loss": 0.7979, "step": 7195 }, { "epoch": 0.49, "learning_rate": 1.0797077922878421e-05, "loss": 0.8213, "step": 7196 }, { "epoch": 0.49, "learning_rate": 1.0794877666733197e-05, "loss": 0.7773, "step": 7197 }, { "epoch": 0.49, "learning_rate": 1.0792677371861573e-05, "loss": 0.6943, "step": 7198 }, { "epoch": 0.49, "learning_rate": 1.0790477038370741e-05, "loss": 0.8125, "step": 7199 }, { "epoch": 0.49, "learning_rate": 1.078827666636791e-05, "loss": 0.8486, "step": 7200 }, { "epoch": 0.49, "learning_rate": 1.0786076255960278e-05, "loss": 0.7988, "step": 7201 }, { "epoch": 0.49, "learning_rate": 1.0783875807255049e-05, "loss": 0.793, "step": 7202 }, { "epoch": 0.49, "learning_rate": 1.078167532035943e-05, "loss": 0.7363, "step": 7203 }, { "epoch": 0.49, "learning_rate": 1.0779474795380625e-05, "loss": 0.8164, "step": 7204 }, { "epoch": 0.49, "learning_rate": 1.0777274232425847e-05, "loss": 0.8711, "step": 7205 }, { "epoch": 0.49, "learning_rate": 1.0775073631602308e-05, "loss": 0.7979, "step": 7206 }, { "epoch": 0.49, "learning_rate": 1.0772872993017219e-05, "loss": 0.7607, "step": 7207 }, { "epoch": 0.49, "learning_rate": 1.0770672316777793e-05, "loss": 0.8174, "step": 7208 }, { "epoch": 0.49, "learning_rate": 1.076847160299125e-05, "loss": 0.6836, "step": 7209 }, { "epoch": 0.49, "learning_rate": 1.076627085176481e-05, "loss": 0.7549, "step": 7210 }, { "epoch": 0.49, "learning_rate": 1.0764070063205689e-05, "loss": 0.8193, "step": 7211 }, { "epoch": 0.49, "learning_rate": 1.0761869237421114e-05, "loss": 0.8477, "step": 7212 }, { "epoch": 0.49, "learning_rate": 1.0759668374518307e-05, "loss": 0.8037, "step": 7213 }, { "epoch": 0.49, "learning_rate": 1.0757467474604493e-05, "loss": 0.8271, "step": 7214 }, { "epoch": 0.49, "learning_rate": 1.0755266537786899e-05, "loss": 0.8545, "step": 7215 }, { "epoch": 0.49, "learning_rate": 1.075306556417276e-05, "loss": 0.7422, "step": 7216 }, { "epoch": 0.49, "learning_rate": 1.0750864553869298e-05, "loss": 0.8398, "step": 7217 }, { "epoch": 0.49, "learning_rate": 1.0748663506983754e-05, "loss": 0.7783, "step": 7218 }, { "epoch": 0.49, "learning_rate": 1.0746462423623365e-05, "loss": 0.8193, "step": 7219 }, { "epoch": 0.49, "learning_rate": 1.0744261303895355e-05, "loss": 0.7432, "step": 7220 }, { "epoch": 0.49, "learning_rate": 1.0742060147906976e-05, "loss": 0.7471, "step": 7221 }, { "epoch": 0.49, "learning_rate": 1.0739858955765461e-05, "loss": 0.8203, "step": 7222 }, { "epoch": 0.49, "learning_rate": 1.0737657727578055e-05, "loss": 0.8213, "step": 7223 }, { "epoch": 0.49, "learning_rate": 1.0735456463452e-05, "loss": 0.8369, "step": 7224 }, { "epoch": 0.49, "learning_rate": 1.073325516349454e-05, "loss": 0.8545, "step": 7225 }, { "epoch": 0.49, "learning_rate": 1.0731053827812927e-05, "loss": 0.8633, "step": 7226 }, { "epoch": 0.49, "learning_rate": 1.0728852456514404e-05, "loss": 0.835, "step": 7227 }, { "epoch": 0.49, "learning_rate": 1.0726651049706229e-05, "loss": 0.7686, "step": 7228 }, { "epoch": 0.49, "learning_rate": 1.0724449607495648e-05, "loss": 0.7988, "step": 7229 }, { "epoch": 0.49, "learning_rate": 1.0722248129989916e-05, "loss": 0.8096, "step": 7230 }, { "epoch": 0.49, "learning_rate": 1.0720046617296294e-05, "loss": 0.7607, "step": 7231 }, { "epoch": 0.49, "learning_rate": 1.0717845069522032e-05, "loss": 0.7812, "step": 7232 }, { "epoch": 0.49, "learning_rate": 1.0715643486774396e-05, "loss": 0.8223, "step": 7233 }, { "epoch": 0.49, "learning_rate": 1.0713441869160645e-05, "loss": 0.7979, "step": 7234 }, { "epoch": 0.49, "learning_rate": 1.0711240216788036e-05, "loss": 0.8213, "step": 7235 }, { "epoch": 0.49, "learning_rate": 1.0709038529763844e-05, "loss": 0.7637, "step": 7236 }, { "epoch": 0.49, "learning_rate": 1.0706836808195329e-05, "loss": 0.8027, "step": 7237 }, { "epoch": 0.49, "learning_rate": 1.0704635052189754e-05, "loss": 0.8535, "step": 7238 }, { "epoch": 0.49, "learning_rate": 1.0702433261854398e-05, "loss": 0.792, "step": 7239 }, { "epoch": 0.49, "learning_rate": 1.0700231437296527e-05, "loss": 0.7568, "step": 7240 }, { "epoch": 0.49, "learning_rate": 1.0698029578623413e-05, "loss": 0.7676, "step": 7241 }, { "epoch": 0.49, "learning_rate": 1.0695827685942333e-05, "loss": 0.9004, "step": 7242 }, { "epoch": 0.49, "learning_rate": 1.0693625759360562e-05, "loss": 0.7256, "step": 7243 }, { "epoch": 0.49, "learning_rate": 1.0691423798985376e-05, "loss": 0.7871, "step": 7244 }, { "epoch": 0.49, "learning_rate": 1.0689221804924061e-05, "loss": 0.8105, "step": 7245 }, { "epoch": 0.49, "learning_rate": 1.0687019777283889e-05, "loss": 0.8076, "step": 7246 }, { "epoch": 0.49, "learning_rate": 1.0684817716172148e-05, "loss": 0.8213, "step": 7247 }, { "epoch": 0.49, "learning_rate": 1.0682615621696121e-05, "loss": 0.8545, "step": 7248 }, { "epoch": 0.49, "learning_rate": 1.0680413493963098e-05, "loss": 0.8623, "step": 7249 }, { "epoch": 0.49, "learning_rate": 1.0678211333080357e-05, "loss": 0.8027, "step": 7250 }, { "epoch": 0.49, "learning_rate": 1.0676009139155196e-05, "loss": 0.7861, "step": 7251 }, { "epoch": 0.49, "learning_rate": 1.0673806912294904e-05, "loss": 0.7432, "step": 7252 }, { "epoch": 0.49, "learning_rate": 1.0671604652606767e-05, "loss": 0.7412, "step": 7253 }, { "epoch": 0.49, "learning_rate": 1.066940236019809e-05, "loss": 0.7432, "step": 7254 }, { "epoch": 0.49, "learning_rate": 1.0667200035176162e-05, "loss": 0.7793, "step": 7255 }, { "epoch": 0.49, "learning_rate": 1.0664997677648274e-05, "loss": 0.832, "step": 7256 }, { "epoch": 0.49, "learning_rate": 1.0662795287721739e-05, "loss": 0.7803, "step": 7257 }, { "epoch": 0.49, "learning_rate": 1.0660592865503846e-05, "loss": 0.8066, "step": 7258 }, { "epoch": 0.49, "learning_rate": 1.0658390411101902e-05, "loss": 0.7812, "step": 7259 }, { "epoch": 0.49, "learning_rate": 1.065618792462321e-05, "loss": 0.8652, "step": 7260 }, { "epoch": 0.49, "learning_rate": 1.0653985406175074e-05, "loss": 0.8535, "step": 7261 }, { "epoch": 0.49, "learning_rate": 1.06517828558648e-05, "loss": 0.7676, "step": 7262 }, { "epoch": 0.49, "learning_rate": 1.06495802737997e-05, "loss": 0.7744, "step": 7263 }, { "epoch": 0.5, "learning_rate": 1.0647377660087076e-05, "loss": 0.8457, "step": 7264 }, { "epoch": 0.5, "learning_rate": 1.0645175014834248e-05, "loss": 0.8242, "step": 7265 }, { "epoch": 0.5, "learning_rate": 1.064297233814852e-05, "loss": 0.7129, "step": 7266 }, { "epoch": 0.5, "learning_rate": 1.0640769630137218e-05, "loss": 0.7822, "step": 7267 }, { "epoch": 0.5, "learning_rate": 1.0638566890907647e-05, "loss": 0.8184, "step": 7268 }, { "epoch": 0.5, "learning_rate": 1.0636364120567126e-05, "loss": 0.9141, "step": 7269 }, { "epoch": 0.5, "learning_rate": 1.063416131922298e-05, "loss": 0.7666, "step": 7270 }, { "epoch": 0.5, "learning_rate": 1.063195848698252e-05, "loss": 0.8428, "step": 7271 }, { "epoch": 0.5, "learning_rate": 1.062975562395308e-05, "loss": 0.8008, "step": 7272 }, { "epoch": 0.5, "learning_rate": 1.0627552730241974e-05, "loss": 0.8008, "step": 7273 }, { "epoch": 0.5, "learning_rate": 1.0625349805956529e-05, "loss": 0.8301, "step": 7274 }, { "epoch": 0.5, "learning_rate": 1.0623146851204074e-05, "loss": 0.71, "step": 7275 }, { "epoch": 0.5, "learning_rate": 1.062094386609193e-05, "loss": 0.7861, "step": 7276 }, { "epoch": 0.5, "learning_rate": 1.0618740850727436e-05, "loss": 0.833, "step": 7277 }, { "epoch": 0.5, "learning_rate": 1.0616537805217918e-05, "loss": 0.7637, "step": 7278 }, { "epoch": 0.5, "learning_rate": 1.0614334729670706e-05, "loss": 0.791, "step": 7279 }, { "epoch": 0.5, "learning_rate": 1.0612131624193134e-05, "loss": 0.8281, "step": 7280 }, { "epoch": 0.5, "learning_rate": 1.0609928488892545e-05, "loss": 0.8047, "step": 7281 }, { "epoch": 0.5, "learning_rate": 1.0607725323876263e-05, "loss": 0.8389, "step": 7282 }, { "epoch": 0.5, "learning_rate": 1.0605522129251638e-05, "loss": 0.7598, "step": 7283 }, { "epoch": 0.5, "learning_rate": 1.0603318905126e-05, "loss": 0.8193, "step": 7284 }, { "epoch": 0.5, "learning_rate": 1.0601115651606699e-05, "loss": 0.7871, "step": 7285 }, { "epoch": 0.5, "learning_rate": 1.0598912368801072e-05, "loss": 0.7305, "step": 7286 }, { "epoch": 0.5, "learning_rate": 1.0596709056816459e-05, "loss": 0.8438, "step": 7287 }, { "epoch": 0.5, "learning_rate": 1.0594505715760215e-05, "loss": 0.7686, "step": 7288 }, { "epoch": 0.5, "learning_rate": 1.059230234573968e-05, "loss": 0.8242, "step": 7289 }, { "epoch": 0.5, "learning_rate": 1.0590098946862202e-05, "loss": 0.8506, "step": 7290 }, { "epoch": 0.5, "learning_rate": 1.0587895519235134e-05, "loss": 0.8076, "step": 7291 }, { "epoch": 0.5, "learning_rate": 1.0585692062965823e-05, "loss": 0.8223, "step": 7292 }, { "epoch": 0.5, "learning_rate": 1.0583488578161625e-05, "loss": 0.8135, "step": 7293 }, { "epoch": 0.5, "learning_rate": 1.0581285064929892e-05, "loss": 0.8174, "step": 7294 }, { "epoch": 0.5, "learning_rate": 1.0579081523377977e-05, "loss": 0.8154, "step": 7295 }, { "epoch": 0.5, "learning_rate": 1.057687795361324e-05, "loss": 0.7803, "step": 7296 }, { "epoch": 0.5, "learning_rate": 1.0574674355743038e-05, "loss": 0.7666, "step": 7297 }, { "epoch": 0.5, "learning_rate": 1.0572470729874728e-05, "loss": 0.7988, "step": 7298 }, { "epoch": 0.5, "learning_rate": 1.0570267076115674e-05, "loss": 0.8311, "step": 7299 }, { "epoch": 0.5, "learning_rate": 1.0568063394573234e-05, "loss": 0.8311, "step": 7300 }, { "epoch": 0.5, "learning_rate": 1.056585968535477e-05, "loss": 0.8135, "step": 7301 }, { "epoch": 0.5, "learning_rate": 1.0563655948567654e-05, "loss": 0.8145, "step": 7302 }, { "epoch": 0.5, "learning_rate": 1.0561452184319249e-05, "loss": 0.748, "step": 7303 }, { "epoch": 0.5, "learning_rate": 1.055924839271692e-05, "loss": 0.8057, "step": 7304 }, { "epoch": 0.5, "learning_rate": 1.0557044573868033e-05, "loss": 0.7979, "step": 7305 }, { "epoch": 0.5, "learning_rate": 1.0554840727879964e-05, "loss": 0.7119, "step": 7306 }, { "epoch": 0.5, "learning_rate": 1.0552636854860084e-05, "loss": 0.7588, "step": 7307 }, { "epoch": 0.5, "learning_rate": 1.0550432954915758e-05, "loss": 0.8154, "step": 7308 }, { "epoch": 0.5, "learning_rate": 1.0548229028154372e-05, "loss": 0.8086, "step": 7309 }, { "epoch": 0.5, "learning_rate": 1.0546025074683287e-05, "loss": 0.793, "step": 7310 }, { "epoch": 0.5, "learning_rate": 1.0543821094609892e-05, "loss": 0.8506, "step": 7311 }, { "epoch": 0.5, "learning_rate": 1.0541617088041557e-05, "loss": 0.6885, "step": 7312 }, { "epoch": 0.5, "learning_rate": 1.0539413055085666e-05, "loss": 0.874, "step": 7313 }, { "epoch": 0.5, "learning_rate": 1.0537208995849599e-05, "loss": 0.7656, "step": 7314 }, { "epoch": 0.5, "learning_rate": 1.0535004910440733e-05, "loss": 0.8096, "step": 7315 }, { "epoch": 0.5, "learning_rate": 1.0532800798966453e-05, "loss": 0.8037, "step": 7316 }, { "epoch": 0.5, "learning_rate": 1.0530596661534148e-05, "loss": 0.8115, "step": 7317 }, { "epoch": 0.5, "learning_rate": 1.0528392498251196e-05, "loss": 0.8535, "step": 7318 }, { "epoch": 0.5, "learning_rate": 1.0526188309224988e-05, "loss": 0.8232, "step": 7319 }, { "epoch": 0.5, "learning_rate": 1.0523984094562911e-05, "loss": 0.7676, "step": 7320 }, { "epoch": 0.5, "learning_rate": 1.0521779854372353e-05, "loss": 0.7354, "step": 7321 }, { "epoch": 0.5, "learning_rate": 1.0519575588760711e-05, "loss": 0.7959, "step": 7322 }, { "epoch": 0.5, "learning_rate": 1.0517371297835367e-05, "loss": 0.7676, "step": 7323 }, { "epoch": 0.5, "learning_rate": 1.0515166981703721e-05, "loss": 0.7637, "step": 7324 }, { "epoch": 0.5, "learning_rate": 1.0512962640473165e-05, "loss": 0.7822, "step": 7325 }, { "epoch": 0.5, "learning_rate": 1.0510758274251094e-05, "loss": 0.8496, "step": 7326 }, { "epoch": 0.5, "learning_rate": 1.0508553883144904e-05, "loss": 0.7988, "step": 7327 }, { "epoch": 0.5, "learning_rate": 1.0506349467261992e-05, "loss": 0.7295, "step": 7328 }, { "epoch": 0.5, "learning_rate": 1.050414502670976e-05, "loss": 0.7959, "step": 7329 }, { "epoch": 0.5, "learning_rate": 1.0501940561595607e-05, "loss": 0.8223, "step": 7330 }, { "epoch": 0.5, "learning_rate": 1.0499736072026934e-05, "loss": 0.7305, "step": 7331 }, { "epoch": 0.5, "learning_rate": 1.0497531558111146e-05, "loss": 0.7373, "step": 7332 }, { "epoch": 0.5, "learning_rate": 1.0495327019955644e-05, "loss": 0.8857, "step": 7333 }, { "epoch": 0.5, "learning_rate": 1.049312245766783e-05, "loss": 0.8398, "step": 7334 }, { "epoch": 0.5, "learning_rate": 1.049091787135512e-05, "loss": 0.6836, "step": 7335 }, { "epoch": 0.5, "learning_rate": 1.048871326112491e-05, "loss": 0.7861, "step": 7336 }, { "epoch": 0.5, "learning_rate": 1.0486508627084616e-05, "loss": 0.8076, "step": 7337 }, { "epoch": 0.5, "learning_rate": 1.0484303969341646e-05, "loss": 0.749, "step": 7338 }, { "epoch": 0.5, "learning_rate": 1.0482099288003406e-05, "loss": 0.7773, "step": 7339 }, { "epoch": 0.5, "learning_rate": 1.0479894583177318e-05, "loss": 0.8076, "step": 7340 }, { "epoch": 0.5, "learning_rate": 1.0477689854970787e-05, "loss": 0.8125, "step": 7341 }, { "epoch": 0.5, "learning_rate": 1.047548510349123e-05, "loss": 0.8555, "step": 7342 }, { "epoch": 0.5, "learning_rate": 1.0473280328846063e-05, "loss": 0.7725, "step": 7343 }, { "epoch": 0.5, "learning_rate": 1.0471075531142698e-05, "loss": 0.8496, "step": 7344 }, { "epoch": 0.5, "learning_rate": 1.0468870710488556e-05, "loss": 0.79, "step": 7345 }, { "epoch": 0.5, "learning_rate": 1.046666586699106e-05, "loss": 0.7959, "step": 7346 }, { "epoch": 0.5, "learning_rate": 1.0464461000757625e-05, "loss": 0.7861, "step": 7347 }, { "epoch": 0.5, "learning_rate": 1.046225611189567e-05, "loss": 0.7871, "step": 7348 }, { "epoch": 0.5, "learning_rate": 1.046005120051262e-05, "loss": 0.7705, "step": 7349 }, { "epoch": 0.5, "learning_rate": 1.04578462667159e-05, "loss": 0.8271, "step": 7350 }, { "epoch": 0.5, "learning_rate": 1.0455641310612932e-05, "loss": 0.7061, "step": 7351 }, { "epoch": 0.5, "learning_rate": 1.045343633231114e-05, "loss": 0.7412, "step": 7352 }, { "epoch": 0.5, "learning_rate": 1.0451231331917955e-05, "loss": 0.8643, "step": 7353 }, { "epoch": 0.5, "learning_rate": 1.0449026309540795e-05, "loss": 0.7852, "step": 7354 }, { "epoch": 0.5, "learning_rate": 1.0446821265287101e-05, "loss": 0.7959, "step": 7355 }, { "epoch": 0.5, "learning_rate": 1.0444616199264295e-05, "loss": 0.8193, "step": 7356 }, { "epoch": 0.5, "learning_rate": 1.0442411111579808e-05, "loss": 0.8018, "step": 7357 }, { "epoch": 0.5, "learning_rate": 1.0440206002341077e-05, "loss": 0.8311, "step": 7358 }, { "epoch": 0.5, "learning_rate": 1.043800087165553e-05, "loss": 0.8486, "step": 7359 }, { "epoch": 0.5, "learning_rate": 1.0435795719630599e-05, "loss": 0.8008, "step": 7360 }, { "epoch": 0.5, "learning_rate": 1.0433590546373724e-05, "loss": 0.749, "step": 7361 }, { "epoch": 0.5, "learning_rate": 1.0431385351992338e-05, "loss": 0.8398, "step": 7362 }, { "epoch": 0.5, "learning_rate": 1.042918013659388e-05, "loss": 0.7793, "step": 7363 }, { "epoch": 0.5, "learning_rate": 1.0426974900285784e-05, "loss": 0.7793, "step": 7364 }, { "epoch": 0.5, "learning_rate": 1.0424769643175494e-05, "loss": 0.7793, "step": 7365 }, { "epoch": 0.5, "learning_rate": 1.0422564365370447e-05, "loss": 0.8457, "step": 7366 }, { "epoch": 0.5, "learning_rate": 1.0420359066978082e-05, "loss": 0.8154, "step": 7367 }, { "epoch": 0.5, "learning_rate": 1.0418153748105851e-05, "loss": 0.7129, "step": 7368 }, { "epoch": 0.5, "learning_rate": 1.0415948408861183e-05, "loss": 0.6543, "step": 7369 }, { "epoch": 0.5, "learning_rate": 1.041374304935153e-05, "loss": 0.8164, "step": 7370 }, { "epoch": 0.5, "learning_rate": 1.041153766968434e-05, "loss": 0.8379, "step": 7371 }, { "epoch": 0.5, "learning_rate": 1.0409332269967047e-05, "loss": 0.7939, "step": 7372 }, { "epoch": 0.5, "learning_rate": 1.0407126850307114e-05, "loss": 0.7988, "step": 7373 }, { "epoch": 0.5, "learning_rate": 1.0404921410811977e-05, "loss": 0.7617, "step": 7374 }, { "epoch": 0.5, "learning_rate": 1.0402715951589085e-05, "loss": 0.7871, "step": 7375 }, { "epoch": 0.5, "learning_rate": 1.04005104727459e-05, "loss": 0.8623, "step": 7376 }, { "epoch": 0.5, "learning_rate": 1.039830497438986e-05, "loss": 0.8311, "step": 7377 }, { "epoch": 0.5, "learning_rate": 1.0396099456628417e-05, "loss": 0.7168, "step": 7378 }, { "epoch": 0.5, "learning_rate": 1.0393893919569034e-05, "loss": 0.8506, "step": 7379 }, { "epoch": 0.5, "learning_rate": 1.0391688363319155e-05, "loss": 0.7295, "step": 7380 }, { "epoch": 0.5, "learning_rate": 1.0389482787986238e-05, "loss": 0.8145, "step": 7381 }, { "epoch": 0.5, "learning_rate": 1.0387277193677738e-05, "loss": 0.8057, "step": 7382 }, { "epoch": 0.5, "learning_rate": 1.0385071580501115e-05, "loss": 0.8213, "step": 7383 }, { "epoch": 0.5, "learning_rate": 1.0382865948563823e-05, "loss": 0.8252, "step": 7384 }, { "epoch": 0.5, "learning_rate": 1.0380660297973317e-05, "loss": 0.8887, "step": 7385 }, { "epoch": 0.5, "learning_rate": 1.0378454628837065e-05, "loss": 0.7598, "step": 7386 }, { "epoch": 0.5, "learning_rate": 1.0376248941262519e-05, "loss": 0.8955, "step": 7387 }, { "epoch": 0.5, "learning_rate": 1.0374043235357142e-05, "loss": 0.7119, "step": 7388 }, { "epoch": 0.5, "learning_rate": 1.03718375112284e-05, "loss": 0.8418, "step": 7389 }, { "epoch": 0.5, "learning_rate": 1.0369631768983748e-05, "loss": 0.8154, "step": 7390 }, { "epoch": 0.5, "learning_rate": 1.036742600873066e-05, "loss": 0.7549, "step": 7391 }, { "epoch": 0.5, "learning_rate": 1.0365220230576592e-05, "loss": 0.7988, "step": 7392 }, { "epoch": 0.5, "learning_rate": 1.0363014434629008e-05, "loss": 0.8164, "step": 7393 }, { "epoch": 0.5, "learning_rate": 1.0360808620995384e-05, "loss": 0.8438, "step": 7394 }, { "epoch": 0.5, "learning_rate": 1.035860278978318e-05, "loss": 0.8066, "step": 7395 }, { "epoch": 0.5, "learning_rate": 1.0356396941099865e-05, "loss": 0.6943, "step": 7396 }, { "epoch": 0.5, "learning_rate": 1.0354191075052911e-05, "loss": 0.875, "step": 7397 }, { "epoch": 0.5, "learning_rate": 1.0351985191749781e-05, "loss": 0.8545, "step": 7398 }, { "epoch": 0.5, "learning_rate": 1.034977929129795e-05, "loss": 0.8076, "step": 7399 }, { "epoch": 0.5, "learning_rate": 1.0347573373804891e-05, "loss": 0.876, "step": 7400 }, { "epoch": 0.5, "learning_rate": 1.0345367439378076e-05, "loss": 0.7412, "step": 7401 }, { "epoch": 0.5, "learning_rate": 1.0343161488124973e-05, "loss": 0.7705, "step": 7402 }, { "epoch": 0.5, "learning_rate": 1.0340955520153058e-05, "loss": 0.7725, "step": 7403 }, { "epoch": 0.5, "learning_rate": 1.033874953556981e-05, "loss": 0.8887, "step": 7404 }, { "epoch": 0.5, "learning_rate": 1.0336543534482698e-05, "loss": 0.7568, "step": 7405 }, { "epoch": 0.5, "learning_rate": 1.0334337516999204e-05, "loss": 0.8018, "step": 7406 }, { "epoch": 0.5, "learning_rate": 1.0332131483226805e-05, "loss": 0.7383, "step": 7407 }, { "epoch": 0.5, "learning_rate": 1.032992543327297e-05, "loss": 0.9082, "step": 7408 }, { "epoch": 0.5, "learning_rate": 1.0327719367245188e-05, "loss": 0.8564, "step": 7409 }, { "epoch": 0.5, "learning_rate": 1.0325513285250934e-05, "loss": 0.834, "step": 7410 }, { "epoch": 0.51, "learning_rate": 1.0323307187397687e-05, "loss": 0.7344, "step": 7411 }, { "epoch": 0.51, "learning_rate": 1.0321101073792932e-05, "loss": 0.8164, "step": 7412 }, { "epoch": 0.51, "learning_rate": 1.0318894944544145e-05, "loss": 0.7471, "step": 7413 }, { "epoch": 0.51, "learning_rate": 1.0316688799758813e-05, "loss": 0.8311, "step": 7414 }, { "epoch": 0.51, "learning_rate": 1.031448263954442e-05, "loss": 0.7734, "step": 7415 }, { "epoch": 0.51, "learning_rate": 1.0312276464008445e-05, "loss": 0.8242, "step": 7416 }, { "epoch": 0.51, "learning_rate": 1.031007027325838e-05, "loss": 0.8877, "step": 7417 }, { "epoch": 0.51, "learning_rate": 1.0307864067401703e-05, "loss": 0.8027, "step": 7418 }, { "epoch": 0.51, "learning_rate": 1.0305657846545906e-05, "loss": 0.8662, "step": 7419 }, { "epoch": 0.51, "learning_rate": 1.0303451610798472e-05, "loss": 0.7969, "step": 7420 }, { "epoch": 0.51, "learning_rate": 1.0301245360266892e-05, "loss": 0.7793, "step": 7421 }, { "epoch": 0.51, "learning_rate": 1.0299039095058651e-05, "loss": 0.8203, "step": 7422 }, { "epoch": 0.51, "learning_rate": 1.0296832815281242e-05, "loss": 0.748, "step": 7423 }, { "epoch": 0.51, "learning_rate": 1.029462652104215e-05, "loss": 0.8135, "step": 7424 }, { "epoch": 0.51, "learning_rate": 1.029242021244887e-05, "loss": 0.8213, "step": 7425 }, { "epoch": 0.51, "learning_rate": 1.0290213889608888e-05, "loss": 0.8271, "step": 7426 }, { "epoch": 0.51, "learning_rate": 1.0288007552629707e-05, "loss": 0.7549, "step": 7427 }, { "epoch": 0.51, "learning_rate": 1.0285801201618809e-05, "loss": 0.7012, "step": 7428 }, { "epoch": 0.51, "learning_rate": 1.0283594836683683e-05, "loss": 0.8496, "step": 7429 }, { "epoch": 0.51, "learning_rate": 1.028138845793184e-05, "loss": 0.8154, "step": 7430 }, { "epoch": 0.51, "learning_rate": 1.027918206547076e-05, "loss": 0.8574, "step": 7431 }, { "epoch": 0.51, "learning_rate": 1.0276975659407945e-05, "loss": 0.8652, "step": 7432 }, { "epoch": 0.51, "learning_rate": 1.027476923985089e-05, "loss": 0.7764, "step": 7433 }, { "epoch": 0.51, "learning_rate": 1.0272562806907089e-05, "loss": 0.8359, "step": 7434 }, { "epoch": 0.51, "learning_rate": 1.0270356360684041e-05, "loss": 0.7666, "step": 7435 }, { "epoch": 0.51, "learning_rate": 1.0268149901289248e-05, "loss": 0.8828, "step": 7436 }, { "epoch": 0.51, "learning_rate": 1.0265943428830203e-05, "loss": 0.8135, "step": 7437 }, { "epoch": 0.51, "learning_rate": 1.0263736943414407e-05, "loss": 0.8008, "step": 7438 }, { "epoch": 0.51, "learning_rate": 1.0261530445149358e-05, "loss": 0.8379, "step": 7439 }, { "epoch": 0.51, "learning_rate": 1.025932393414256e-05, "loss": 0.7295, "step": 7440 }, { "epoch": 0.51, "learning_rate": 1.0257117410501513e-05, "loss": 0.8057, "step": 7441 }, { "epoch": 0.51, "learning_rate": 1.0254910874333718e-05, "loss": 0.8125, "step": 7442 }, { "epoch": 0.51, "learning_rate": 1.0252704325746678e-05, "loss": 0.8613, "step": 7443 }, { "epoch": 0.51, "learning_rate": 1.0250497764847895e-05, "loss": 0.8545, "step": 7444 }, { "epoch": 0.51, "learning_rate": 1.0248291191744875e-05, "loss": 0.833, "step": 7445 }, { "epoch": 0.51, "learning_rate": 1.024608460654512e-05, "loss": 0.7637, "step": 7446 }, { "epoch": 0.51, "learning_rate": 1.0243878009356131e-05, "loss": 0.8838, "step": 7447 }, { "epoch": 0.51, "learning_rate": 1.0241671400285422e-05, "loss": 0.8633, "step": 7448 }, { "epoch": 0.51, "learning_rate": 1.0239464779440491e-05, "loss": 0.7871, "step": 7449 }, { "epoch": 0.51, "learning_rate": 1.0237258146928849e-05, "loss": 0.8418, "step": 7450 }, { "epoch": 0.51, "learning_rate": 1.0235051502858003e-05, "loss": 0.9316, "step": 7451 }, { "epoch": 0.51, "learning_rate": 1.0232844847335455e-05, "loss": 0.8291, "step": 7452 }, { "epoch": 0.51, "learning_rate": 1.0230638180468722e-05, "loss": 0.8311, "step": 7453 }, { "epoch": 0.51, "learning_rate": 1.0228431502365305e-05, "loss": 0.8027, "step": 7454 }, { "epoch": 0.51, "learning_rate": 1.0226224813132716e-05, "loss": 0.8486, "step": 7455 }, { "epoch": 0.51, "learning_rate": 1.0224018112878468e-05, "loss": 0.8076, "step": 7456 }, { "epoch": 0.51, "learning_rate": 1.0221811401710067e-05, "loss": 0.8076, "step": 7457 }, { "epoch": 0.51, "learning_rate": 1.0219604679735025e-05, "loss": 0.8457, "step": 7458 }, { "epoch": 0.51, "learning_rate": 1.0217397947060857e-05, "loss": 0.7686, "step": 7459 }, { "epoch": 0.51, "learning_rate": 1.0215191203795067e-05, "loss": 0.8291, "step": 7460 }, { "epoch": 0.51, "learning_rate": 1.0212984450045174e-05, "loss": 0.7744, "step": 7461 }, { "epoch": 0.51, "learning_rate": 1.0210777685918688e-05, "loss": 0.8711, "step": 7462 }, { "epoch": 0.51, "learning_rate": 1.0208570911523126e-05, "loss": 0.7979, "step": 7463 }, { "epoch": 0.51, "learning_rate": 1.0206364126965994e-05, "loss": 0.8047, "step": 7464 }, { "epoch": 0.51, "learning_rate": 1.0204157332354816e-05, "loss": 0.8135, "step": 7465 }, { "epoch": 0.51, "learning_rate": 1.0201950527797103e-05, "loss": 0.7812, "step": 7466 }, { "epoch": 0.51, "learning_rate": 1.019974371340037e-05, "loss": 0.7969, "step": 7467 }, { "epoch": 0.51, "learning_rate": 1.0197536889272131e-05, "loss": 0.8154, "step": 7468 }, { "epoch": 0.51, "learning_rate": 1.0195330055519907e-05, "loss": 0.8018, "step": 7469 }, { "epoch": 0.51, "learning_rate": 1.0193123212251209e-05, "loss": 0.8867, "step": 7470 }, { "epoch": 0.51, "learning_rate": 1.019091635957356e-05, "loss": 0.8057, "step": 7471 }, { "epoch": 0.51, "learning_rate": 1.0188709497594478e-05, "loss": 0.7881, "step": 7472 }, { "epoch": 0.51, "learning_rate": 1.018650262642147e-05, "loss": 0.8125, "step": 7473 }, { "epoch": 0.51, "learning_rate": 1.0184295746162072e-05, "loss": 0.8613, "step": 7474 }, { "epoch": 0.51, "learning_rate": 1.0182088856923789e-05, "loss": 0.7988, "step": 7475 }, { "epoch": 0.51, "learning_rate": 1.0179881958814146e-05, "loss": 0.7842, "step": 7476 }, { "epoch": 0.51, "learning_rate": 1.0177675051940666e-05, "loss": 0.7754, "step": 7477 }, { "epoch": 0.51, "learning_rate": 1.0175468136410865e-05, "loss": 0.7109, "step": 7478 }, { "epoch": 0.51, "learning_rate": 1.0173261212332262e-05, "loss": 0.7119, "step": 7479 }, { "epoch": 0.51, "learning_rate": 1.0171054279812385e-05, "loss": 0.8252, "step": 7480 }, { "epoch": 0.51, "learning_rate": 1.016884733895875e-05, "loss": 0.7939, "step": 7481 }, { "epoch": 0.51, "learning_rate": 1.0166640389878879e-05, "loss": 0.7734, "step": 7482 }, { "epoch": 0.51, "learning_rate": 1.0164433432680299e-05, "loss": 0.8809, "step": 7483 }, { "epoch": 0.51, "learning_rate": 1.0162226467470531e-05, "loss": 0.8232, "step": 7484 }, { "epoch": 0.51, "learning_rate": 1.0160019494357095e-05, "loss": 0.8145, "step": 7485 }, { "epoch": 0.51, "learning_rate": 1.0157812513447516e-05, "loss": 0.8428, "step": 7486 }, { "epoch": 0.51, "learning_rate": 1.0155605524849324e-05, "loss": 0.7959, "step": 7487 }, { "epoch": 0.51, "learning_rate": 1.0153398528670032e-05, "loss": 0.7363, "step": 7488 }, { "epoch": 0.51, "learning_rate": 1.0151191525017176e-05, "loss": 0.7588, "step": 7489 }, { "epoch": 0.51, "learning_rate": 1.0148984513998276e-05, "loss": 0.7969, "step": 7490 }, { "epoch": 0.51, "learning_rate": 1.0146777495720855e-05, "loss": 0.7695, "step": 7491 }, { "epoch": 0.51, "learning_rate": 1.0144570470292442e-05, "loss": 0.792, "step": 7492 }, { "epoch": 0.51, "learning_rate": 1.0142363437820566e-05, "loss": 0.8906, "step": 7493 }, { "epoch": 0.51, "learning_rate": 1.0140156398412746e-05, "loss": 0.8369, "step": 7494 }, { "epoch": 0.51, "learning_rate": 1.0137949352176517e-05, "loss": 0.8379, "step": 7495 }, { "epoch": 0.51, "learning_rate": 1.01357422992194e-05, "loss": 0.7549, "step": 7496 }, { "epoch": 0.51, "learning_rate": 1.0133535239648926e-05, "loss": 0.707, "step": 7497 }, { "epoch": 0.51, "learning_rate": 1.0131328173572622e-05, "loss": 0.7715, "step": 7498 }, { "epoch": 0.51, "learning_rate": 1.0129121101098014e-05, "loss": 0.8564, "step": 7499 }, { "epoch": 0.51, "learning_rate": 1.0126914022332633e-05, "loss": 0.8682, "step": 7500 }, { "epoch": 0.51, "learning_rate": 1.0124706937384007e-05, "loss": 0.8496, "step": 7501 }, { "epoch": 0.51, "learning_rate": 1.0122499846359665e-05, "loss": 0.8447, "step": 7502 }, { "epoch": 0.51, "learning_rate": 1.0120292749367135e-05, "loss": 0.8203, "step": 7503 }, { "epoch": 0.51, "learning_rate": 1.0118085646513951e-05, "loss": 0.751, "step": 7504 }, { "epoch": 0.51, "learning_rate": 1.011587853790764e-05, "loss": 0.8096, "step": 7505 }, { "epoch": 0.51, "learning_rate": 1.0113671423655731e-05, "loss": 0.8086, "step": 7506 }, { "epoch": 0.51, "learning_rate": 1.0111464303865754e-05, "loss": 0.8076, "step": 7507 }, { "epoch": 0.51, "learning_rate": 1.0109257178645245e-05, "loss": 0.8076, "step": 7508 }, { "epoch": 0.51, "learning_rate": 1.0107050048101727e-05, "loss": 0.8125, "step": 7509 }, { "epoch": 0.51, "learning_rate": 1.010484291234274e-05, "loss": 0.7559, "step": 7510 }, { "epoch": 0.51, "learning_rate": 1.010263577147581e-05, "loss": 0.8281, "step": 7511 }, { "epoch": 0.51, "learning_rate": 1.010042862560847e-05, "loss": 0.8164, "step": 7512 }, { "epoch": 0.51, "learning_rate": 1.0098221474848256e-05, "loss": 0.7373, "step": 7513 }, { "epoch": 0.51, "learning_rate": 1.0096014319302691e-05, "loss": 0.79, "step": 7514 }, { "epoch": 0.51, "learning_rate": 1.0093807159079314e-05, "loss": 0.8027, "step": 7515 }, { "epoch": 0.51, "learning_rate": 1.0091599994285662e-05, "loss": 0.7627, "step": 7516 }, { "epoch": 0.51, "learning_rate": 1.0089392825029256e-05, "loss": 0.7822, "step": 7517 }, { "epoch": 0.51, "learning_rate": 1.0087185651417638e-05, "loss": 0.8135, "step": 7518 }, { "epoch": 0.51, "learning_rate": 1.008497847355834e-05, "loss": 0.9209, "step": 7519 }, { "epoch": 0.51, "learning_rate": 1.0082771291558896e-05, "loss": 0.7783, "step": 7520 }, { "epoch": 0.51, "learning_rate": 1.0080564105526837e-05, "loss": 0.8223, "step": 7521 }, { "epoch": 0.51, "learning_rate": 1.00783569155697e-05, "loss": 0.7568, "step": 7522 }, { "epoch": 0.51, "learning_rate": 1.0076149721795019e-05, "loss": 0.7744, "step": 7523 }, { "epoch": 0.51, "learning_rate": 1.0073942524310325e-05, "loss": 0.7979, "step": 7524 }, { "epoch": 0.51, "learning_rate": 1.0071735323223156e-05, "loss": 0.8066, "step": 7525 }, { "epoch": 0.51, "learning_rate": 1.0069528118641046e-05, "loss": 0.8037, "step": 7526 }, { "epoch": 0.51, "learning_rate": 1.0067320910671526e-05, "loss": 0.7461, "step": 7527 }, { "epoch": 0.51, "learning_rate": 1.0065113699422137e-05, "loss": 0.7295, "step": 7528 }, { "epoch": 0.51, "learning_rate": 1.0062906485000413e-05, "loss": 0.7959, "step": 7529 }, { "epoch": 0.51, "learning_rate": 1.0060699267513885e-05, "loss": 0.7705, "step": 7530 }, { "epoch": 0.51, "learning_rate": 1.0058492047070094e-05, "loss": 0.6855, "step": 7531 }, { "epoch": 0.51, "learning_rate": 1.0056284823776572e-05, "loss": 0.8359, "step": 7532 }, { "epoch": 0.51, "learning_rate": 1.0054077597740857e-05, "loss": 0.79, "step": 7533 }, { "epoch": 0.51, "learning_rate": 1.0051870369070484e-05, "loss": 0.792, "step": 7534 }, { "epoch": 0.51, "learning_rate": 1.004966313787299e-05, "loss": 0.8047, "step": 7535 }, { "epoch": 0.51, "learning_rate": 1.004745590425591e-05, "loss": 0.8115, "step": 7536 }, { "epoch": 0.51, "learning_rate": 1.0045248668326778e-05, "loss": 0.8594, "step": 7537 }, { "epoch": 0.51, "learning_rate": 1.0043041430193137e-05, "loss": 0.7539, "step": 7538 }, { "epoch": 0.51, "learning_rate": 1.0040834189962516e-05, "loss": 0.7646, "step": 7539 }, { "epoch": 0.51, "learning_rate": 1.0038626947742458e-05, "loss": 0.7832, "step": 7540 }, { "epoch": 0.51, "learning_rate": 1.0036419703640496e-05, "loss": 0.7432, "step": 7541 }, { "epoch": 0.51, "learning_rate": 1.0034212457764168e-05, "loss": 0.8369, "step": 7542 }, { "epoch": 0.51, "learning_rate": 1.003200521022101e-05, "loss": 0.7354, "step": 7543 }, { "epoch": 0.51, "learning_rate": 1.0029797961118562e-05, "loss": 0.8086, "step": 7544 }, { "epoch": 0.51, "learning_rate": 1.0027590710564355e-05, "loss": 0.8252, "step": 7545 }, { "epoch": 0.51, "learning_rate": 1.0025383458665934e-05, "loss": 0.877, "step": 7546 }, { "epoch": 0.51, "learning_rate": 1.0023176205530829e-05, "loss": 0.7793, "step": 7547 }, { "epoch": 0.51, "learning_rate": 1.002096895126658e-05, "loss": 0.7256, "step": 7548 }, { "epoch": 0.51, "learning_rate": 1.0018761695980728e-05, "loss": 0.7744, "step": 7549 }, { "epoch": 0.51, "learning_rate": 1.0016554439780806e-05, "loss": 0.7129, "step": 7550 }, { "epoch": 0.51, "learning_rate": 1.0014347182774352e-05, "loss": 0.7607, "step": 7551 }, { "epoch": 0.51, "learning_rate": 1.0012139925068904e-05, "loss": 0.7266, "step": 7552 }, { "epoch": 0.51, "learning_rate": 1.0009932666771998e-05, "loss": 0.7939, "step": 7553 }, { "epoch": 0.51, "learning_rate": 1.0007725407991174e-05, "loss": 0.7803, "step": 7554 }, { "epoch": 0.51, "learning_rate": 1.0005518148833969e-05, "loss": 0.8027, "step": 7555 }, { "epoch": 0.51, "learning_rate": 1.000331088940792e-05, "loss": 0.9229, "step": 7556 }, { "epoch": 0.51, "learning_rate": 1.0001103629820563e-05, "loss": 0.751, "step": 7557 }, { "epoch": 0.52, "learning_rate": 9.998896370179438e-06, "loss": 0.8018, "step": 7558 }, { "epoch": 0.52, "learning_rate": 9.996689110592085e-06, "loss": 0.7363, "step": 7559 }, { "epoch": 0.52, "learning_rate": 9.994481851166035e-06, "loss": 0.8818, "step": 7560 }, { "epoch": 0.52, "learning_rate": 9.992274592008826e-06, "loss": 0.7695, "step": 7561 }, { "epoch": 0.52, "learning_rate": 9.990067333228005e-06, "loss": 0.7285, "step": 7562 }, { "epoch": 0.52, "learning_rate": 9.9878600749311e-06, "loss": 0.7881, "step": 7563 }, { "epoch": 0.52, "learning_rate": 9.985652817225653e-06, "loss": 0.7988, "step": 7564 }, { "epoch": 0.52, "learning_rate": 9.983445560219199e-06, "loss": 0.6992, "step": 7565 }, { "epoch": 0.52, "learning_rate": 9.981238304019277e-06, "loss": 0.79, "step": 7566 }, { "epoch": 0.52, "learning_rate": 9.979031048733421e-06, "loss": 0.8232, "step": 7567 }, { "epoch": 0.52, "learning_rate": 9.976823794469175e-06, "loss": 0.7314, "step": 7568 }, { "epoch": 0.52, "learning_rate": 9.97461654133407e-06, "loss": 0.7051, "step": 7569 }, { "epoch": 0.52, "learning_rate": 9.972409289435648e-06, "loss": 0.7031, "step": 7570 }, { "epoch": 0.52, "learning_rate": 9.970202038881443e-06, "loss": 0.7373, "step": 7571 }, { "epoch": 0.52, "learning_rate": 9.967994789778996e-06, "loss": 0.7471, "step": 7572 }, { "epoch": 0.52, "learning_rate": 9.965787542235835e-06, "loss": 0.8887, "step": 7573 }, { "epoch": 0.52, "learning_rate": 9.963580296359506e-06, "loss": 0.8838, "step": 7574 }, { "epoch": 0.52, "learning_rate": 9.961373052257546e-06, "loss": 0.6924, "step": 7575 }, { "epoch": 0.52, "learning_rate": 9.959165810037486e-06, "loss": 0.7656, "step": 7576 }, { "epoch": 0.52, "learning_rate": 9.956958569806868e-06, "loss": 0.8633, "step": 7577 }, { "epoch": 0.52, "learning_rate": 9.954751331673224e-06, "loss": 0.8242, "step": 7578 }, { "epoch": 0.52, "learning_rate": 9.952544095744092e-06, "loss": 0.8711, "step": 7579 }, { "epoch": 0.52, "learning_rate": 9.950336862127014e-06, "loss": 0.7979, "step": 7580 }, { "epoch": 0.52, "learning_rate": 9.948129630929518e-06, "loss": 0.874, "step": 7581 }, { "epoch": 0.52, "learning_rate": 9.945922402259146e-06, "loss": 0.8545, "step": 7582 }, { "epoch": 0.52, "learning_rate": 9.943715176223433e-06, "loss": 0.752, "step": 7583 }, { "epoch": 0.52, "learning_rate": 9.941507952929911e-06, "loss": 0.8369, "step": 7584 }, { "epoch": 0.52, "learning_rate": 9.939300732486117e-06, "loss": 0.8027, "step": 7585 }, { "epoch": 0.52, "learning_rate": 9.937093514999592e-06, "loss": 0.9102, "step": 7586 }, { "epoch": 0.52, "learning_rate": 9.934886300577866e-06, "loss": 0.7969, "step": 7587 }, { "epoch": 0.52, "learning_rate": 9.932679089328479e-06, "loss": 0.8164, "step": 7588 }, { "epoch": 0.52, "learning_rate": 9.930471881358959e-06, "loss": 0.7607, "step": 7589 }, { "epoch": 0.52, "learning_rate": 9.92826467677685e-06, "loss": 0.7646, "step": 7590 }, { "epoch": 0.52, "learning_rate": 9.926057475689679e-06, "loss": 0.8115, "step": 7591 }, { "epoch": 0.52, "learning_rate": 9.923850278204985e-06, "loss": 0.8428, "step": 7592 }, { "epoch": 0.52, "learning_rate": 9.921643084430304e-06, "loss": 0.709, "step": 7593 }, { "epoch": 0.52, "learning_rate": 9.919435894473165e-06, "loss": 0.7422, "step": 7594 }, { "epoch": 0.52, "learning_rate": 9.917228708441109e-06, "loss": 0.8096, "step": 7595 }, { "epoch": 0.52, "learning_rate": 9.915021526441663e-06, "loss": 0.7793, "step": 7596 }, { "epoch": 0.52, "learning_rate": 9.912814348582362e-06, "loss": 0.7988, "step": 7597 }, { "epoch": 0.52, "learning_rate": 9.910607174970746e-06, "loss": 0.832, "step": 7598 }, { "epoch": 0.52, "learning_rate": 9.908400005714343e-06, "loss": 0.8008, "step": 7599 }, { "epoch": 0.52, "learning_rate": 9.906192840920688e-06, "loss": 0.8086, "step": 7600 }, { "epoch": 0.52, "learning_rate": 9.903985680697314e-06, "loss": 0.7676, "step": 7601 }, { "epoch": 0.52, "learning_rate": 9.90177852515175e-06, "loss": 0.8223, "step": 7602 }, { "epoch": 0.52, "learning_rate": 9.89957137439153e-06, "loss": 0.7295, "step": 7603 }, { "epoch": 0.52, "learning_rate": 9.897364228524193e-06, "loss": 0.7471, "step": 7604 }, { "epoch": 0.52, "learning_rate": 9.895157087657262e-06, "loss": 0.7754, "step": 7605 }, { "epoch": 0.52, "learning_rate": 9.892949951898274e-06, "loss": 0.8525, "step": 7606 }, { "epoch": 0.52, "learning_rate": 9.890742821354759e-06, "loss": 0.8154, "step": 7607 }, { "epoch": 0.52, "learning_rate": 9.88853569613425e-06, "loss": 0.8125, "step": 7608 }, { "epoch": 0.52, "learning_rate": 9.886328576344272e-06, "loss": 0.791, "step": 7609 }, { "epoch": 0.52, "learning_rate": 9.884121462092363e-06, "loss": 0.7988, "step": 7610 }, { "epoch": 0.52, "learning_rate": 9.881914353486052e-06, "loss": 0.8115, "step": 7611 }, { "epoch": 0.52, "learning_rate": 9.879707250632867e-06, "loss": 0.8389, "step": 7612 }, { "epoch": 0.52, "learning_rate": 9.87750015364034e-06, "loss": 0.8398, "step": 7613 }, { "epoch": 0.52, "learning_rate": 9.875293062615997e-06, "loss": 0.8184, "step": 7614 }, { "epoch": 0.52, "learning_rate": 9.873085977667369e-06, "loss": 0.7656, "step": 7615 }, { "epoch": 0.52, "learning_rate": 9.87087889890199e-06, "loss": 0.7539, "step": 7616 }, { "epoch": 0.52, "learning_rate": 9.86867182642738e-06, "loss": 0.8555, "step": 7617 }, { "epoch": 0.52, "learning_rate": 9.866464760351078e-06, "loss": 0.8359, "step": 7618 }, { "epoch": 0.52, "learning_rate": 9.864257700780605e-06, "loss": 0.7832, "step": 7619 }, { "epoch": 0.52, "learning_rate": 9.862050647823486e-06, "loss": 0.7783, "step": 7620 }, { "epoch": 0.52, "learning_rate": 9.859843601587254e-06, "loss": 0.8018, "step": 7621 }, { "epoch": 0.52, "learning_rate": 9.857636562179439e-06, "loss": 0.709, "step": 7622 }, { "epoch": 0.52, "learning_rate": 9.85542952970756e-06, "loss": 0.8682, "step": 7623 }, { "epoch": 0.52, "learning_rate": 9.853222504279148e-06, "loss": 0.8223, "step": 7624 }, { "epoch": 0.52, "learning_rate": 9.851015486001729e-06, "loss": 0.8076, "step": 7625 }, { "epoch": 0.52, "learning_rate": 9.848808474982826e-06, "loss": 0.8281, "step": 7626 }, { "epoch": 0.52, "learning_rate": 9.846601471329968e-06, "loss": 0.7285, "step": 7627 }, { "epoch": 0.52, "learning_rate": 9.84439447515068e-06, "loss": 0.8389, "step": 7628 }, { "epoch": 0.52, "learning_rate": 9.842187486552486e-06, "loss": 0.8691, "step": 7629 }, { "epoch": 0.52, "learning_rate": 9.839980505642909e-06, "loss": 0.7998, "step": 7630 }, { "epoch": 0.52, "learning_rate": 9.837773532529474e-06, "loss": 0.8232, "step": 7631 }, { "epoch": 0.52, "learning_rate": 9.835566567319701e-06, "loss": 0.8027, "step": 7632 }, { "epoch": 0.52, "learning_rate": 9.833359610121121e-06, "loss": 0.7959, "step": 7633 }, { "epoch": 0.52, "learning_rate": 9.831152661041253e-06, "loss": 0.8633, "step": 7634 }, { "epoch": 0.52, "learning_rate": 9.828945720187619e-06, "loss": 0.7412, "step": 7635 }, { "epoch": 0.52, "learning_rate": 9.826738787667741e-06, "loss": 0.8516, "step": 7636 }, { "epoch": 0.52, "learning_rate": 9.824531863589142e-06, "loss": 0.7861, "step": 7637 }, { "epoch": 0.52, "learning_rate": 9.822324948059337e-06, "loss": 0.8086, "step": 7638 }, { "epoch": 0.52, "learning_rate": 9.820118041185854e-06, "loss": 0.7598, "step": 7639 }, { "epoch": 0.52, "learning_rate": 9.817911143076214e-06, "loss": 0.8691, "step": 7640 }, { "epoch": 0.52, "learning_rate": 9.815704253837932e-06, "loss": 0.7637, "step": 7641 }, { "epoch": 0.52, "learning_rate": 9.813497373578532e-06, "loss": 0.8115, "step": 7642 }, { "epoch": 0.52, "learning_rate": 9.811290502405529e-06, "loss": 0.8213, "step": 7643 }, { "epoch": 0.52, "learning_rate": 9.80908364042644e-06, "loss": 0.7949, "step": 7644 }, { "epoch": 0.52, "learning_rate": 9.806876787748793e-06, "loss": 0.8193, "step": 7645 }, { "epoch": 0.52, "learning_rate": 9.804669944480095e-06, "loss": 0.832, "step": 7646 }, { "epoch": 0.52, "learning_rate": 9.80246311072787e-06, "loss": 0.7783, "step": 7647 }, { "epoch": 0.52, "learning_rate": 9.800256286599633e-06, "loss": 0.8223, "step": 7648 }, { "epoch": 0.52, "learning_rate": 9.7980494722029e-06, "loss": 0.7754, "step": 7649 }, { "epoch": 0.52, "learning_rate": 9.795842667645184e-06, "loss": 0.8301, "step": 7650 }, { "epoch": 0.52, "learning_rate": 9.793635873034006e-06, "loss": 0.8145, "step": 7651 }, { "epoch": 0.52, "learning_rate": 9.791429088476877e-06, "loss": 0.7676, "step": 7652 }, { "epoch": 0.52, "learning_rate": 9.789222314081316e-06, "loss": 0.8916, "step": 7653 }, { "epoch": 0.52, "learning_rate": 9.78701554995483e-06, "loss": 0.8008, "step": 7654 }, { "epoch": 0.52, "learning_rate": 9.784808796204938e-06, "loss": 0.7793, "step": 7655 }, { "epoch": 0.52, "learning_rate": 9.782602052939148e-06, "loss": 0.7041, "step": 7656 }, { "epoch": 0.52, "learning_rate": 9.780395320264975e-06, "loss": 0.7842, "step": 7657 }, { "epoch": 0.52, "learning_rate": 9.778188598289936e-06, "loss": 0.8135, "step": 7658 }, { "epoch": 0.52, "learning_rate": 9.775981887121533e-06, "loss": 0.7686, "step": 7659 }, { "epoch": 0.52, "learning_rate": 9.773775186867287e-06, "loss": 0.7617, "step": 7660 }, { "epoch": 0.52, "learning_rate": 9.771568497634698e-06, "loss": 0.7793, "step": 7661 }, { "epoch": 0.52, "learning_rate": 9.76936181953128e-06, "loss": 0.7861, "step": 7662 }, { "epoch": 0.52, "learning_rate": 9.767155152664545e-06, "loss": 0.8057, "step": 7663 }, { "epoch": 0.52, "learning_rate": 9.764948497142e-06, "loss": 0.8848, "step": 7664 }, { "epoch": 0.52, "learning_rate": 9.762741853071153e-06, "loss": 0.8379, "step": 7665 }, { "epoch": 0.52, "learning_rate": 9.760535220559512e-06, "loss": 0.7676, "step": 7666 }, { "epoch": 0.52, "learning_rate": 9.758328599714583e-06, "loss": 0.7637, "step": 7667 }, { "epoch": 0.52, "learning_rate": 9.75612199064387e-06, "loss": 0.8398, "step": 7668 }, { "epoch": 0.52, "learning_rate": 9.753915393454882e-06, "loss": 0.7402, "step": 7669 }, { "epoch": 0.52, "learning_rate": 9.751708808255129e-06, "loss": 0.7734, "step": 7670 }, { "epoch": 0.52, "learning_rate": 9.749502235152107e-06, "loss": 0.8027, "step": 7671 }, { "epoch": 0.52, "learning_rate": 9.747295674253324e-06, "loss": 0.8281, "step": 7672 }, { "epoch": 0.52, "learning_rate": 9.745089125666287e-06, "loss": 0.8066, "step": 7673 }, { "epoch": 0.52, "learning_rate": 9.742882589498489e-06, "loss": 0.9131, "step": 7674 }, { "epoch": 0.52, "learning_rate": 9.740676065857441e-06, "loss": 0.8037, "step": 7675 }, { "epoch": 0.52, "learning_rate": 9.738469554850645e-06, "loss": 0.7686, "step": 7676 }, { "epoch": 0.52, "learning_rate": 9.736263056585596e-06, "loss": 0.7656, "step": 7677 }, { "epoch": 0.52, "learning_rate": 9.734056571169802e-06, "loss": 0.7686, "step": 7678 }, { "epoch": 0.52, "learning_rate": 9.731850098710755e-06, "loss": 0.7646, "step": 7679 }, { "epoch": 0.52, "learning_rate": 9.729643639315957e-06, "loss": 0.8164, "step": 7680 }, { "epoch": 0.52, "learning_rate": 9.727437193092913e-06, "loss": 0.7842, "step": 7681 }, { "epoch": 0.52, "learning_rate": 9.725230760149112e-06, "loss": 0.7285, "step": 7682 }, { "epoch": 0.52, "learning_rate": 9.723024340592059e-06, "loss": 0.8389, "step": 7683 }, { "epoch": 0.52, "learning_rate": 9.720817934529243e-06, "loss": 0.8096, "step": 7684 }, { "epoch": 0.52, "learning_rate": 9.718611542068166e-06, "loss": 0.7764, "step": 7685 }, { "epoch": 0.52, "learning_rate": 9.716405163316315e-06, "loss": 0.7617, "step": 7686 }, { "epoch": 0.52, "learning_rate": 9.714198798381196e-06, "loss": 0.7939, "step": 7687 }, { "epoch": 0.52, "learning_rate": 9.711992447370298e-06, "loss": 0.7676, "step": 7688 }, { "epoch": 0.52, "learning_rate": 9.709786110391114e-06, "loss": 0.8125, "step": 7689 }, { "epoch": 0.52, "learning_rate": 9.707579787551133e-06, "loss": 0.8623, "step": 7690 }, { "epoch": 0.52, "learning_rate": 9.705373478957855e-06, "loss": 0.8213, "step": 7691 }, { "epoch": 0.52, "learning_rate": 9.703167184718762e-06, "loss": 0.8047, "step": 7692 }, { "epoch": 0.52, "learning_rate": 9.70096090494135e-06, "loss": 0.7803, "step": 7693 }, { "epoch": 0.52, "learning_rate": 9.698754639733113e-06, "loss": 0.7295, "step": 7694 }, { "epoch": 0.52, "learning_rate": 9.69654838920153e-06, "loss": 0.8301, "step": 7695 }, { "epoch": 0.52, "learning_rate": 9.694342153454099e-06, "loss": 0.7607, "step": 7696 }, { "epoch": 0.52, "learning_rate": 9.6921359325983e-06, "loss": 0.7363, "step": 7697 }, { "epoch": 0.52, "learning_rate": 9.689929726741622e-06, "loss": 0.7539, "step": 7698 }, { "epoch": 0.52, "learning_rate": 9.687723535991556e-06, "loss": 0.7832, "step": 7699 }, { "epoch": 0.52, "learning_rate": 9.685517360455581e-06, "loss": 0.7637, "step": 7700 }, { "epoch": 0.52, "learning_rate": 9.68331120024119e-06, "loss": 0.749, "step": 7701 }, { "epoch": 0.52, "learning_rate": 9.681105055455857e-06, "loss": 0.8145, "step": 7702 }, { "epoch": 0.52, "learning_rate": 9.678898926207074e-06, "loss": 0.8135, "step": 7703 }, { "epoch": 0.53, "learning_rate": 9.676692812602315e-06, "loss": 0.7998, "step": 7704 }, { "epoch": 0.53, "learning_rate": 9.674486714749068e-06, "loss": 0.8027, "step": 7705 }, { "epoch": 0.53, "learning_rate": 9.672280632754815e-06, "loss": 0.8135, "step": 7706 }, { "epoch": 0.53, "learning_rate": 9.670074566727034e-06, "loss": 0.7891, "step": 7707 }, { "epoch": 0.53, "learning_rate": 9.6678685167732e-06, "loss": 0.8301, "step": 7708 }, { "epoch": 0.53, "learning_rate": 9.665662483000801e-06, "loss": 0.7695, "step": 7709 }, { "epoch": 0.53, "learning_rate": 9.663456465517303e-06, "loss": 0.7588, "step": 7710 }, { "epoch": 0.53, "learning_rate": 9.661250464430191e-06, "loss": 0.8027, "step": 7711 }, { "epoch": 0.53, "learning_rate": 9.659044479846943e-06, "loss": 0.793, "step": 7712 }, { "epoch": 0.53, "learning_rate": 9.65683851187503e-06, "loss": 0.7158, "step": 7713 }, { "epoch": 0.53, "learning_rate": 9.65463256062193e-06, "loss": 0.8535, "step": 7714 }, { "epoch": 0.53, "learning_rate": 9.652426626195112e-06, "loss": 0.7822, "step": 7715 }, { "epoch": 0.53, "learning_rate": 9.65022070870205e-06, "loss": 0.792, "step": 7716 }, { "epoch": 0.53, "learning_rate": 9.648014808250222e-06, "loss": 0.877, "step": 7717 }, { "epoch": 0.53, "learning_rate": 9.645808924947094e-06, "loss": 0.6768, "step": 7718 }, { "epoch": 0.53, "learning_rate": 9.643603058900139e-06, "loss": 0.79, "step": 7719 }, { "epoch": 0.53, "learning_rate": 9.641397210216822e-06, "loss": 0.8701, "step": 7720 }, { "epoch": 0.53, "learning_rate": 9.63919137900462e-06, "loss": 0.7676, "step": 7721 }, { "epoch": 0.53, "learning_rate": 9.636985565370992e-06, "loss": 0.8242, "step": 7722 }, { "epoch": 0.53, "learning_rate": 9.634779769423412e-06, "loss": 0.7236, "step": 7723 }, { "epoch": 0.53, "learning_rate": 9.632573991269346e-06, "loss": 0.7324, "step": 7724 }, { "epoch": 0.53, "learning_rate": 9.630368231016255e-06, "loss": 0.7197, "step": 7725 }, { "epoch": 0.53, "learning_rate": 9.628162488771605e-06, "loss": 0.7969, "step": 7726 }, { "epoch": 0.53, "learning_rate": 9.625956764642863e-06, "loss": 0.8008, "step": 7727 }, { "epoch": 0.53, "learning_rate": 9.623751058737483e-06, "loss": 0.79, "step": 7728 }, { "epoch": 0.53, "learning_rate": 9.621545371162938e-06, "loss": 0.8174, "step": 7729 }, { "epoch": 0.53, "learning_rate": 9.619339702026685e-06, "loss": 0.7314, "step": 7730 }, { "epoch": 0.53, "learning_rate": 9.61713405143618e-06, "loss": 0.7891, "step": 7731 }, { "epoch": 0.53, "learning_rate": 9.61492841949889e-06, "loss": 0.7842, "step": 7732 }, { "epoch": 0.53, "learning_rate": 9.612722806322264e-06, "loss": 0.6729, "step": 7733 }, { "epoch": 0.53, "learning_rate": 9.610517212013762e-06, "loss": 0.7324, "step": 7734 }, { "epoch": 0.53, "learning_rate": 9.608311636680849e-06, "loss": 0.7871, "step": 7735 }, { "epoch": 0.53, "learning_rate": 9.60610608043097e-06, "loss": 0.7754, "step": 7736 }, { "epoch": 0.53, "learning_rate": 9.603900543371584e-06, "loss": 0.6406, "step": 7737 }, { "epoch": 0.53, "learning_rate": 9.601695025610144e-06, "loss": 0.8086, "step": 7738 }, { "epoch": 0.53, "learning_rate": 9.599489527254101e-06, "loss": 0.7617, "step": 7739 }, { "epoch": 0.53, "learning_rate": 9.597284048410913e-06, "loss": 0.9062, "step": 7740 }, { "epoch": 0.53, "learning_rate": 9.595078589188028e-06, "loss": 0.8525, "step": 7741 }, { "epoch": 0.53, "learning_rate": 9.592873149692889e-06, "loss": 0.7998, "step": 7742 }, { "epoch": 0.53, "learning_rate": 9.590667730032955e-06, "loss": 0.8789, "step": 7743 }, { "epoch": 0.53, "learning_rate": 9.588462330315666e-06, "loss": 0.8027, "step": 7744 }, { "epoch": 0.53, "learning_rate": 9.58625695064847e-06, "loss": 0.7871, "step": 7745 }, { "epoch": 0.53, "learning_rate": 9.584051591138818e-06, "loss": 0.8149, "step": 7746 }, { "epoch": 0.53, "learning_rate": 9.581846251894152e-06, "loss": 0.8613, "step": 7747 }, { "epoch": 0.53, "learning_rate": 9.57964093302192e-06, "loss": 0.8525, "step": 7748 }, { "epoch": 0.53, "learning_rate": 9.577435634629556e-06, "loss": 0.7861, "step": 7749 }, { "epoch": 0.53, "learning_rate": 9.575230356824511e-06, "loss": 0.7627, "step": 7750 }, { "epoch": 0.53, "learning_rate": 9.573025099714218e-06, "loss": 0.8838, "step": 7751 }, { "epoch": 0.53, "learning_rate": 9.570819863406121e-06, "loss": 0.8379, "step": 7752 }, { "epoch": 0.53, "learning_rate": 9.568614648007664e-06, "loss": 0.7734, "step": 7753 }, { "epoch": 0.53, "learning_rate": 9.566409453626279e-06, "loss": 0.8398, "step": 7754 }, { "epoch": 0.53, "learning_rate": 9.564204280369405e-06, "loss": 0.6904, "step": 7755 }, { "epoch": 0.53, "learning_rate": 9.561999128344475e-06, "loss": 0.833, "step": 7756 }, { "epoch": 0.53, "learning_rate": 9.559793997658924e-06, "loss": 0.8105, "step": 7757 }, { "epoch": 0.53, "learning_rate": 9.557588888420192e-06, "loss": 0.7979, "step": 7758 }, { "epoch": 0.53, "learning_rate": 9.555383800735709e-06, "loss": 0.8125, "step": 7759 }, { "epoch": 0.53, "learning_rate": 9.5531787347129e-06, "loss": 0.7881, "step": 7760 }, { "epoch": 0.53, "learning_rate": 9.550973690459207e-06, "loss": 0.8301, "step": 7761 }, { "epoch": 0.53, "learning_rate": 9.548768668082051e-06, "loss": 0.751, "step": 7762 }, { "epoch": 0.53, "learning_rate": 9.54656366768886e-06, "loss": 0.8027, "step": 7763 }, { "epoch": 0.53, "learning_rate": 9.544358689387071e-06, "loss": 0.8574, "step": 7764 }, { "epoch": 0.53, "learning_rate": 9.542153733284101e-06, "loss": 0.7979, "step": 7765 }, { "epoch": 0.53, "learning_rate": 9.539948799487383e-06, "loss": 0.8105, "step": 7766 }, { "epoch": 0.53, "learning_rate": 9.537743888104333e-06, "loss": 0.7881, "step": 7767 }, { "epoch": 0.53, "learning_rate": 9.53553899924238e-06, "loss": 0.7324, "step": 7768 }, { "epoch": 0.53, "learning_rate": 9.533334133008942e-06, "loss": 0.7695, "step": 7769 }, { "epoch": 0.53, "learning_rate": 9.531129289511444e-06, "loss": 0.8174, "step": 7770 }, { "epoch": 0.53, "learning_rate": 9.528924468857304e-06, "loss": 0.7256, "step": 7771 }, { "epoch": 0.53, "learning_rate": 9.526719671153942e-06, "loss": 0.8271, "step": 7772 }, { "epoch": 0.53, "learning_rate": 9.524514896508774e-06, "loss": 0.8174, "step": 7773 }, { "epoch": 0.53, "learning_rate": 9.522310145029218e-06, "loss": 0.708, "step": 7774 }, { "epoch": 0.53, "learning_rate": 9.520105416822681e-06, "loss": 0.7549, "step": 7775 }, { "epoch": 0.53, "learning_rate": 9.517900711996592e-06, "loss": 0.793, "step": 7776 }, { "epoch": 0.53, "learning_rate": 9.515696030658358e-06, "loss": 0.8564, "step": 7777 }, { "epoch": 0.53, "learning_rate": 9.513491372915386e-06, "loss": 0.8359, "step": 7778 }, { "epoch": 0.53, "learning_rate": 9.511286738875093e-06, "loss": 0.8232, "step": 7779 }, { "epoch": 0.53, "learning_rate": 9.509082128644885e-06, "loss": 0.8818, "step": 7780 }, { "epoch": 0.53, "learning_rate": 9.50687754233217e-06, "loss": 0.8389, "step": 7781 }, { "epoch": 0.53, "learning_rate": 9.504672980044361e-06, "loss": 0.8701, "step": 7782 }, { "epoch": 0.53, "learning_rate": 9.502468441888857e-06, "loss": 0.7773, "step": 7783 }, { "epoch": 0.53, "learning_rate": 9.500263927973068e-06, "loss": 0.7793, "step": 7784 }, { "epoch": 0.53, "learning_rate": 9.498059438404395e-06, "loss": 0.793, "step": 7785 }, { "epoch": 0.53, "learning_rate": 9.495854973290244e-06, "loss": 0.7783, "step": 7786 }, { "epoch": 0.53, "learning_rate": 9.49365053273801e-06, "loss": 0.8369, "step": 7787 }, { "epoch": 0.53, "learning_rate": 9.491446116855098e-06, "loss": 0.8047, "step": 7788 }, { "epoch": 0.53, "learning_rate": 9.48924172574891e-06, "loss": 0.7871, "step": 7789 }, { "epoch": 0.53, "learning_rate": 9.487037359526838e-06, "loss": 0.7393, "step": 7790 }, { "epoch": 0.53, "learning_rate": 9.484833018296282e-06, "loss": 0.7949, "step": 7791 }, { "epoch": 0.53, "learning_rate": 9.482628702164638e-06, "loss": 0.793, "step": 7792 }, { "epoch": 0.53, "learning_rate": 9.480424411239289e-06, "loss": 0.8047, "step": 7793 }, { "epoch": 0.53, "learning_rate": 9.478220145627645e-06, "loss": 0.7393, "step": 7794 }, { "epoch": 0.53, "learning_rate": 9.476015905437092e-06, "loss": 0.8584, "step": 7795 }, { "epoch": 0.53, "learning_rate": 9.473811690775014e-06, "loss": 0.8467, "step": 7796 }, { "epoch": 0.53, "learning_rate": 9.471607501748808e-06, "loss": 0.8096, "step": 7797 }, { "epoch": 0.53, "learning_rate": 9.469403338465857e-06, "loss": 0.7578, "step": 7798 }, { "epoch": 0.53, "learning_rate": 9.467199201033546e-06, "loss": 0.8291, "step": 7799 }, { "epoch": 0.53, "learning_rate": 9.46499508955927e-06, "loss": 0.8047, "step": 7800 }, { "epoch": 0.53, "learning_rate": 9.462791004150404e-06, "loss": 0.8193, "step": 7801 }, { "epoch": 0.53, "learning_rate": 9.460586944914335e-06, "loss": 0.7822, "step": 7802 }, { "epoch": 0.53, "learning_rate": 9.458382911958444e-06, "loss": 0.7871, "step": 7803 }, { "epoch": 0.53, "learning_rate": 9.456178905390111e-06, "loss": 0.8096, "step": 7804 }, { "epoch": 0.53, "learning_rate": 9.453974925316713e-06, "loss": 0.7881, "step": 7805 }, { "epoch": 0.53, "learning_rate": 9.451770971845632e-06, "loss": 0.7236, "step": 7806 }, { "epoch": 0.53, "learning_rate": 9.449567045084243e-06, "loss": 0.793, "step": 7807 }, { "epoch": 0.53, "learning_rate": 9.447363145139921e-06, "loss": 0.7959, "step": 7808 }, { "epoch": 0.53, "learning_rate": 9.44515927212004e-06, "loss": 0.8721, "step": 7809 }, { "epoch": 0.53, "learning_rate": 9.442955426131972e-06, "loss": 0.8477, "step": 7810 }, { "epoch": 0.53, "learning_rate": 9.440751607283084e-06, "loss": 0.9102, "step": 7811 }, { "epoch": 0.53, "learning_rate": 9.438547815680754e-06, "loss": 0.7969, "step": 7812 }, { "epoch": 0.53, "learning_rate": 9.436344051432347e-06, "loss": 0.7998, "step": 7813 }, { "epoch": 0.53, "learning_rate": 9.434140314645231e-06, "loss": 0.7812, "step": 7814 }, { "epoch": 0.53, "learning_rate": 9.43193660542677e-06, "loss": 0.7637, "step": 7815 }, { "epoch": 0.53, "learning_rate": 9.429732923884331e-06, "loss": 0.7354, "step": 7816 }, { "epoch": 0.53, "learning_rate": 9.427529270125273e-06, "loss": 0.7949, "step": 7817 }, { "epoch": 0.53, "learning_rate": 9.425325644256966e-06, "loss": 0.834, "step": 7818 }, { "epoch": 0.53, "learning_rate": 9.423122046386761e-06, "loss": 0.8359, "step": 7819 }, { "epoch": 0.53, "learning_rate": 9.420918476622027e-06, "loss": 0.8232, "step": 7820 }, { "epoch": 0.53, "learning_rate": 9.418714935070111e-06, "loss": 0.7715, "step": 7821 }, { "epoch": 0.53, "learning_rate": 9.41651142183838e-06, "loss": 0.8184, "step": 7822 }, { "epoch": 0.53, "learning_rate": 9.414307937034179e-06, "loss": 0.7705, "step": 7823 }, { "epoch": 0.53, "learning_rate": 9.412104480764868e-06, "loss": 0.792, "step": 7824 }, { "epoch": 0.53, "learning_rate": 9.409901053137801e-06, "loss": 0.834, "step": 7825 }, { "epoch": 0.53, "learning_rate": 9.407697654260324e-06, "loss": 0.8057, "step": 7826 }, { "epoch": 0.53, "learning_rate": 9.40549428423979e-06, "loss": 0.7715, "step": 7827 }, { "epoch": 0.53, "learning_rate": 9.403290943183545e-06, "loss": 0.7197, "step": 7828 }, { "epoch": 0.53, "learning_rate": 9.401087631198934e-06, "loss": 0.752, "step": 7829 }, { "epoch": 0.53, "learning_rate": 9.398884348393303e-06, "loss": 0.7178, "step": 7830 }, { "epoch": 0.53, "learning_rate": 9.396681094874001e-06, "loss": 0.7578, "step": 7831 }, { "epoch": 0.53, "learning_rate": 9.394477870748367e-06, "loss": 0.7305, "step": 7832 }, { "epoch": 0.53, "learning_rate": 9.39227467612374e-06, "loss": 0.8906, "step": 7833 }, { "epoch": 0.53, "learning_rate": 9.390071511107462e-06, "loss": 0.7842, "step": 7834 }, { "epoch": 0.53, "learning_rate": 9.387868375806866e-06, "loss": 0.7725, "step": 7835 }, { "epoch": 0.53, "learning_rate": 9.385665270329298e-06, "loss": 0.8115, "step": 7836 }, { "epoch": 0.53, "learning_rate": 9.383462194782086e-06, "loss": 0.7031, "step": 7837 }, { "epoch": 0.53, "learning_rate": 9.381259149272568e-06, "loss": 0.7832, "step": 7838 }, { "epoch": 0.53, "learning_rate": 9.379056133908072e-06, "loss": 0.7764, "step": 7839 }, { "epoch": 0.53, "learning_rate": 9.376853148795933e-06, "loss": 0.8848, "step": 7840 }, { "epoch": 0.53, "learning_rate": 9.374650194043473e-06, "loss": 0.749, "step": 7841 }, { "epoch": 0.53, "learning_rate": 9.372447269758027e-06, "loss": 0.7686, "step": 7842 }, { "epoch": 0.53, "learning_rate": 9.370244376046924e-06, "loss": 0.8076, "step": 7843 }, { "epoch": 0.53, "learning_rate": 9.368041513017481e-06, "loss": 0.7676, "step": 7844 }, { "epoch": 0.53, "learning_rate": 9.365838680777024e-06, "loss": 0.8916, "step": 7845 }, { "epoch": 0.53, "learning_rate": 9.363635879432878e-06, "loss": 0.7607, "step": 7846 }, { "epoch": 0.53, "learning_rate": 9.361433109092357e-06, "loss": 0.7451, "step": 7847 }, { "epoch": 0.53, "learning_rate": 9.359230369862785e-06, "loss": 0.7891, "step": 7848 }, { "epoch": 0.53, "learning_rate": 9.357027661851481e-06, "loss": 0.8398, "step": 7849 }, { "epoch": 0.53, "learning_rate": 9.354824985165755e-06, "loss": 0.7764, "step": 7850 }, { "epoch": 0.54, "learning_rate": 9.352622339912929e-06, "loss": 0.8701, "step": 7851 }, { "epoch": 0.54, "learning_rate": 9.350419726200306e-06, "loss": 0.792, "step": 7852 }, { "epoch": 0.54, "learning_rate": 9.348217144135202e-06, "loss": 0.7734, "step": 7853 }, { "epoch": 0.54, "learning_rate": 9.346014593824928e-06, "loss": 0.8574, "step": 7854 }, { "epoch": 0.54, "learning_rate": 9.34381207537679e-06, "loss": 0.8467, "step": 7855 }, { "epoch": 0.54, "learning_rate": 9.3416095888981e-06, "loss": 0.8662, "step": 7856 }, { "epoch": 0.54, "learning_rate": 9.339407134496157e-06, "loss": 0.7617, "step": 7857 }, { "epoch": 0.54, "learning_rate": 9.337204712278262e-06, "loss": 0.8545, "step": 7858 }, { "epoch": 0.54, "learning_rate": 9.335002322351725e-06, "loss": 0.8369, "step": 7859 }, { "epoch": 0.54, "learning_rate": 9.332799964823841e-06, "loss": 0.7451, "step": 7860 }, { "epoch": 0.54, "learning_rate": 9.330597639801914e-06, "loss": 0.7832, "step": 7861 }, { "epoch": 0.54, "learning_rate": 9.328395347393235e-06, "loss": 0.7773, "step": 7862 }, { "epoch": 0.54, "learning_rate": 9.326193087705101e-06, "loss": 0.7959, "step": 7863 }, { "epoch": 0.54, "learning_rate": 9.323990860844806e-06, "loss": 0.7949, "step": 7864 }, { "epoch": 0.54, "learning_rate": 9.321788666919644e-06, "loss": 0.834, "step": 7865 }, { "epoch": 0.54, "learning_rate": 9.319586506036907e-06, "loss": 0.7285, "step": 7866 }, { "epoch": 0.54, "learning_rate": 9.31738437830388e-06, "loss": 0.8145, "step": 7867 }, { "epoch": 0.54, "learning_rate": 9.315182283827853e-06, "loss": 0.79, "step": 7868 }, { "epoch": 0.54, "learning_rate": 9.312980222716115e-06, "loss": 0.8516, "step": 7869 }, { "epoch": 0.54, "learning_rate": 9.310778195075942e-06, "loss": 0.7266, "step": 7870 }, { "epoch": 0.54, "learning_rate": 9.308576201014624e-06, "loss": 0.749, "step": 7871 }, { "epoch": 0.54, "learning_rate": 9.306374240639441e-06, "loss": 0.7471, "step": 7872 }, { "epoch": 0.54, "learning_rate": 9.304172314057668e-06, "loss": 0.7939, "step": 7873 }, { "epoch": 0.54, "learning_rate": 9.30197042137659e-06, "loss": 0.79, "step": 7874 }, { "epoch": 0.54, "learning_rate": 9.299768562703477e-06, "loss": 0.7334, "step": 7875 }, { "epoch": 0.54, "learning_rate": 9.297566738145602e-06, "loss": 0.7549, "step": 7876 }, { "epoch": 0.54, "learning_rate": 9.295364947810246e-06, "loss": 0.7764, "step": 7877 }, { "epoch": 0.54, "learning_rate": 9.293163191804675e-06, "loss": 0.7979, "step": 7878 }, { "epoch": 0.54, "learning_rate": 9.29096147023616e-06, "loss": 0.751, "step": 7879 }, { "epoch": 0.54, "learning_rate": 9.288759783211967e-06, "loss": 0.7998, "step": 7880 }, { "epoch": 0.54, "learning_rate": 9.28655813083936e-06, "loss": 0.877, "step": 7881 }, { "epoch": 0.54, "learning_rate": 9.284356513225604e-06, "loss": 0.8066, "step": 7882 }, { "epoch": 0.54, "learning_rate": 9.28215493047797e-06, "loss": 0.8096, "step": 7883 }, { "epoch": 0.54, "learning_rate": 9.279953382703708e-06, "loss": 0.7861, "step": 7884 }, { "epoch": 0.54, "learning_rate": 9.277751870010085e-06, "loss": 0.7715, "step": 7885 }, { "epoch": 0.54, "learning_rate": 9.275550392504356e-06, "loss": 0.835, "step": 7886 }, { "epoch": 0.54, "learning_rate": 9.273348950293776e-06, "loss": 0.7734, "step": 7887 }, { "epoch": 0.54, "learning_rate": 9.271147543485596e-06, "loss": 0.751, "step": 7888 }, { "epoch": 0.54, "learning_rate": 9.268946172187075e-06, "loss": 0.7852, "step": 7889 }, { "epoch": 0.54, "learning_rate": 9.266744836505462e-06, "loss": 0.7432, "step": 7890 }, { "epoch": 0.54, "learning_rate": 9.264543536548003e-06, "loss": 0.7705, "step": 7891 }, { "epoch": 0.54, "learning_rate": 9.26234227242195e-06, "loss": 0.7588, "step": 7892 }, { "epoch": 0.54, "learning_rate": 9.260141044234542e-06, "loss": 0.7314, "step": 7893 }, { "epoch": 0.54, "learning_rate": 9.257939852093024e-06, "loss": 0.7246, "step": 7894 }, { "epoch": 0.54, "learning_rate": 9.255738696104647e-06, "loss": 0.8496, "step": 7895 }, { "epoch": 0.54, "learning_rate": 9.253537576376639e-06, "loss": 0.7607, "step": 7896 }, { "epoch": 0.54, "learning_rate": 9.251336493016248e-06, "loss": 0.7939, "step": 7897 }, { "epoch": 0.54, "learning_rate": 9.249135446130707e-06, "loss": 0.8145, "step": 7898 }, { "epoch": 0.54, "learning_rate": 9.246934435827246e-06, "loss": 0.8086, "step": 7899 }, { "epoch": 0.54, "learning_rate": 9.244733462213101e-06, "loss": 0.7852, "step": 7900 }, { "epoch": 0.54, "learning_rate": 9.24253252539551e-06, "loss": 0.8711, "step": 7901 }, { "epoch": 0.54, "learning_rate": 9.240331625481695e-06, "loss": 0.7852, "step": 7902 }, { "epoch": 0.54, "learning_rate": 9.23813076257889e-06, "loss": 0.8184, "step": 7903 }, { "epoch": 0.54, "learning_rate": 9.235929936794313e-06, "loss": 0.8115, "step": 7904 }, { "epoch": 0.54, "learning_rate": 9.233729148235196e-06, "loss": 0.8584, "step": 7905 }, { "epoch": 0.54, "learning_rate": 9.231528397008752e-06, "loss": 0.7598, "step": 7906 }, { "epoch": 0.54, "learning_rate": 9.229327683222209e-06, "loss": 0.8594, "step": 7907 }, { "epoch": 0.54, "learning_rate": 9.227127006982786e-06, "loss": 0.7949, "step": 7908 }, { "epoch": 0.54, "learning_rate": 9.224926368397695e-06, "loss": 0.835, "step": 7909 }, { "epoch": 0.54, "learning_rate": 9.222725767574156e-06, "loss": 0.7656, "step": 7910 }, { "epoch": 0.54, "learning_rate": 9.220525204619378e-06, "loss": 0.7451, "step": 7911 }, { "epoch": 0.54, "learning_rate": 9.218324679640572e-06, "loss": 0.7578, "step": 7912 }, { "epoch": 0.54, "learning_rate": 9.216124192744953e-06, "loss": 0.7412, "step": 7913 }, { "epoch": 0.54, "learning_rate": 9.213923744039726e-06, "loss": 0.8477, "step": 7914 }, { "epoch": 0.54, "learning_rate": 9.211723333632092e-06, "loss": 0.835, "step": 7915 }, { "epoch": 0.54, "learning_rate": 9.209522961629262e-06, "loss": 0.7764, "step": 7916 }, { "epoch": 0.54, "learning_rate": 9.207322628138433e-06, "loss": 0.833, "step": 7917 }, { "epoch": 0.54, "learning_rate": 9.205122333266805e-06, "loss": 0.8555, "step": 7918 }, { "epoch": 0.54, "learning_rate": 9.20292207712158e-06, "loss": 0.8135, "step": 7919 }, { "epoch": 0.54, "learning_rate": 9.200721859809954e-06, "loss": 0.8379, "step": 7920 }, { "epoch": 0.54, "learning_rate": 9.198521681439122e-06, "loss": 0.748, "step": 7921 }, { "epoch": 0.54, "learning_rate": 9.19632154211627e-06, "loss": 0.8145, "step": 7922 }, { "epoch": 0.54, "learning_rate": 9.194121441948596e-06, "loss": 0.8066, "step": 7923 }, { "epoch": 0.54, "learning_rate": 9.191921381043282e-06, "loss": 0.7969, "step": 7924 }, { "epoch": 0.54, "learning_rate": 9.18972135950752e-06, "loss": 0.666, "step": 7925 }, { "epoch": 0.54, "learning_rate": 9.187521377448499e-06, "loss": 0.8301, "step": 7926 }, { "epoch": 0.54, "learning_rate": 9.185321434973393e-06, "loss": 0.7939, "step": 7927 }, { "epoch": 0.54, "learning_rate": 9.183121532189387e-06, "loss": 0.8125, "step": 7928 }, { "epoch": 0.54, "learning_rate": 9.18092166920366e-06, "loss": 0.8486, "step": 7929 }, { "epoch": 0.54, "learning_rate": 9.178721846123388e-06, "loss": 0.7871, "step": 7930 }, { "epoch": 0.54, "learning_rate": 9.176522063055751e-06, "loss": 0.7705, "step": 7931 }, { "epoch": 0.54, "learning_rate": 9.17432232010792e-06, "loss": 0.7832, "step": 7932 }, { "epoch": 0.54, "learning_rate": 9.17212261738706e-06, "loss": 0.8076, "step": 7933 }, { "epoch": 0.54, "learning_rate": 9.169922955000351e-06, "loss": 0.7656, "step": 7934 }, { "epoch": 0.54, "learning_rate": 9.167723333054952e-06, "loss": 0.8242, "step": 7935 }, { "epoch": 0.54, "learning_rate": 9.165523751658029e-06, "loss": 0.8174, "step": 7936 }, { "epoch": 0.54, "learning_rate": 9.163324210916753e-06, "loss": 0.7861, "step": 7937 }, { "epoch": 0.54, "learning_rate": 9.161124710938278e-06, "loss": 0.8154, "step": 7938 }, { "epoch": 0.54, "learning_rate": 9.15892525182977e-06, "loss": 0.7725, "step": 7939 }, { "epoch": 0.54, "learning_rate": 9.156725833698377e-06, "loss": 0.6953, "step": 7940 }, { "epoch": 0.54, "learning_rate": 9.154526456651265e-06, "loss": 0.8516, "step": 7941 }, { "epoch": 0.54, "learning_rate": 9.15232712079558e-06, "loss": 0.8184, "step": 7942 }, { "epoch": 0.54, "learning_rate": 9.150127826238476e-06, "loss": 0.8838, "step": 7943 }, { "epoch": 0.54, "learning_rate": 9.147928573087104e-06, "loss": 0.8193, "step": 7944 }, { "epoch": 0.54, "learning_rate": 9.14572936144861e-06, "loss": 0.834, "step": 7945 }, { "epoch": 0.54, "learning_rate": 9.143530191430143e-06, "loss": 0.8379, "step": 7946 }, { "epoch": 0.54, "learning_rate": 9.14133106313884e-06, "loss": 0.7783, "step": 7947 }, { "epoch": 0.54, "learning_rate": 9.139131976681843e-06, "loss": 0.7881, "step": 7948 }, { "epoch": 0.54, "learning_rate": 9.136932932166299e-06, "loss": 0.8516, "step": 7949 }, { "epoch": 0.54, "learning_rate": 9.13473392969934e-06, "loss": 0.7432, "step": 7950 }, { "epoch": 0.54, "learning_rate": 9.1325349693881e-06, "loss": 0.834, "step": 7951 }, { "epoch": 0.54, "learning_rate": 9.130336051339717e-06, "loss": 0.8486, "step": 7952 }, { "epoch": 0.54, "learning_rate": 9.128137175661316e-06, "loss": 0.8203, "step": 7953 }, { "epoch": 0.54, "learning_rate": 9.125938342460028e-06, "loss": 0.833, "step": 7954 }, { "epoch": 0.54, "learning_rate": 9.123739551842985e-06, "loss": 0.8506, "step": 7955 }, { "epoch": 0.54, "learning_rate": 9.121540803917305e-06, "loss": 0.8193, "step": 7956 }, { "epoch": 0.54, "learning_rate": 9.119342098790118e-06, "loss": 0.7393, "step": 7957 }, { "epoch": 0.54, "learning_rate": 9.117143436568539e-06, "loss": 0.7959, "step": 7958 }, { "epoch": 0.54, "learning_rate": 9.11494481735969e-06, "loss": 0.8232, "step": 7959 }, { "epoch": 0.54, "learning_rate": 9.112746241270682e-06, "loss": 0.7783, "step": 7960 }, { "epoch": 0.54, "learning_rate": 9.110547708408635e-06, "loss": 0.8232, "step": 7961 }, { "epoch": 0.54, "learning_rate": 9.108349218880665e-06, "loss": 0.7949, "step": 7962 }, { "epoch": 0.54, "learning_rate": 9.106150772793873e-06, "loss": 0.8506, "step": 7963 }, { "epoch": 0.54, "learning_rate": 9.103952370255376e-06, "loss": 0.7393, "step": 7964 }, { "epoch": 0.54, "learning_rate": 9.101754011372275e-06, "loss": 0.8291, "step": 7965 }, { "epoch": 0.54, "learning_rate": 9.099555696251667e-06, "loss": 0.792, "step": 7966 }, { "epoch": 0.54, "learning_rate": 9.09735742500067e-06, "loss": 0.8066, "step": 7967 }, { "epoch": 0.54, "learning_rate": 9.095159197726374e-06, "loss": 0.8633, "step": 7968 }, { "epoch": 0.54, "learning_rate": 9.092961014535876e-06, "loss": 0.8252, "step": 7969 }, { "epoch": 0.54, "learning_rate": 9.090762875536276e-06, "loss": 0.7939, "step": 7970 }, { "epoch": 0.54, "learning_rate": 9.08856478083466e-06, "loss": 0.7812, "step": 7971 }, { "epoch": 0.54, "learning_rate": 9.086366730538124e-06, "loss": 0.8252, "step": 7972 }, { "epoch": 0.54, "learning_rate": 9.08416872475376e-06, "loss": 0.8076, "step": 7973 }, { "epoch": 0.54, "learning_rate": 9.081970763588648e-06, "loss": 0.877, "step": 7974 }, { "epoch": 0.54, "learning_rate": 9.079772847149878e-06, "loss": 0.8164, "step": 7975 }, { "epoch": 0.54, "learning_rate": 9.077574975544527e-06, "loss": 0.7686, "step": 7976 }, { "epoch": 0.54, "learning_rate": 9.075377148879678e-06, "loss": 0.7812, "step": 7977 }, { "epoch": 0.54, "learning_rate": 9.073179367262413e-06, "loss": 0.749, "step": 7978 }, { "epoch": 0.54, "learning_rate": 9.0709816307998e-06, "loss": 0.7812, "step": 7979 }, { "epoch": 0.54, "learning_rate": 9.06878393959892e-06, "loss": 0.7588, "step": 7980 }, { "epoch": 0.54, "learning_rate": 9.06658629376684e-06, "loss": 0.8701, "step": 7981 }, { "epoch": 0.54, "learning_rate": 9.064388693410632e-06, "loss": 0.7256, "step": 7982 }, { "epoch": 0.54, "learning_rate": 9.062191138637357e-06, "loss": 0.7822, "step": 7983 }, { "epoch": 0.54, "learning_rate": 9.059993629554084e-06, "loss": 0.8125, "step": 7984 }, { "epoch": 0.54, "learning_rate": 9.057796166267879e-06, "loss": 0.7832, "step": 7985 }, { "epoch": 0.54, "learning_rate": 9.0555987488858e-06, "loss": 0.7451, "step": 7986 }, { "epoch": 0.54, "learning_rate": 9.053401377514902e-06, "loss": 0.7861, "step": 7987 }, { "epoch": 0.54, "learning_rate": 9.051204052262243e-06, "loss": 0.8594, "step": 7988 }, { "epoch": 0.54, "learning_rate": 9.049006773234872e-06, "loss": 0.7959, "step": 7989 }, { "epoch": 0.54, "learning_rate": 9.046809540539848e-06, "loss": 0.8975, "step": 7990 }, { "epoch": 0.54, "learning_rate": 9.044612354284218e-06, "loss": 0.9102, "step": 7991 }, { "epoch": 0.54, "learning_rate": 9.042415214575026e-06, "loss": 0.7803, "step": 7992 }, { "epoch": 0.54, "learning_rate": 9.04021812151932e-06, "loss": 0.7891, "step": 7993 }, { "epoch": 0.54, "learning_rate": 9.038021075224137e-06, "loss": 0.8428, "step": 7994 }, { "epoch": 0.54, "learning_rate": 9.03582407579652e-06, "loss": 0.8223, "step": 7995 }, { "epoch": 0.54, "learning_rate": 9.03362712334351e-06, "loss": 0.8154, "step": 7996 }, { "epoch": 0.54, "learning_rate": 9.031430217972138e-06, "loss": 0.7734, "step": 7997 }, { "epoch": 0.55, "learning_rate": 9.02923335978944e-06, "loss": 0.7979, "step": 7998 }, { "epoch": 0.55, "learning_rate": 9.027036548902444e-06, "loss": 0.791, "step": 7999 }, { "epoch": 0.55, "learning_rate": 9.024839785418182e-06, "loss": 0.7979, "step": 8000 }, { "epoch": 0.55, "learning_rate": 9.022643069443673e-06, "loss": 0.7539, "step": 8001 }, { "epoch": 0.55, "learning_rate": 9.020446401085952e-06, "loss": 0.8262, "step": 8002 }, { "epoch": 0.55, "learning_rate": 9.018249780452031e-06, "loss": 0.7158, "step": 8003 }, { "epoch": 0.55, "learning_rate": 9.016053207648934e-06, "loss": 0.7314, "step": 8004 }, { "epoch": 0.55, "learning_rate": 9.013856682783677e-06, "loss": 0.8457, "step": 8005 }, { "epoch": 0.55, "learning_rate": 9.011660205963276e-06, "loss": 0.751, "step": 8006 }, { "epoch": 0.55, "learning_rate": 9.009463777294735e-06, "loss": 0.8369, "step": 8007 }, { "epoch": 0.55, "learning_rate": 9.007267396885074e-06, "loss": 0.8008, "step": 8008 }, { "epoch": 0.55, "learning_rate": 9.005071064841299e-06, "loss": 0.79, "step": 8009 }, { "epoch": 0.55, "learning_rate": 9.002874781270412e-06, "loss": 0.7959, "step": 8010 }, { "epoch": 0.55, "learning_rate": 9.000678546279418e-06, "loss": 0.7969, "step": 8011 }, { "epoch": 0.55, "learning_rate": 8.998482359975316e-06, "loss": 0.7324, "step": 8012 }, { "epoch": 0.55, "learning_rate": 8.996286222465102e-06, "loss": 0.8047, "step": 8013 }, { "epoch": 0.55, "learning_rate": 8.994090133855777e-06, "loss": 0.8232, "step": 8014 }, { "epoch": 0.55, "learning_rate": 8.991894094254331e-06, "loss": 0.8135, "step": 8015 }, { "epoch": 0.55, "learning_rate": 8.989698103767756e-06, "loss": 0.8008, "step": 8016 }, { "epoch": 0.55, "learning_rate": 8.98750216250304e-06, "loss": 0.7266, "step": 8017 }, { "epoch": 0.55, "learning_rate": 8.98530627056717e-06, "loss": 0.7803, "step": 8018 }, { "epoch": 0.55, "learning_rate": 8.983110428067125e-06, "loss": 0.8311, "step": 8019 }, { "epoch": 0.55, "learning_rate": 8.980914635109895e-06, "loss": 0.8047, "step": 8020 }, { "epoch": 0.55, "learning_rate": 8.978718891802452e-06, "loss": 0.792, "step": 8021 }, { "epoch": 0.55, "learning_rate": 8.976523198251777e-06, "loss": 0.7529, "step": 8022 }, { "epoch": 0.55, "learning_rate": 8.97432755456484e-06, "loss": 0.7334, "step": 8023 }, { "epoch": 0.55, "learning_rate": 8.972131960848617e-06, "loss": 0.7451, "step": 8024 }, { "epoch": 0.55, "learning_rate": 8.969936417210068e-06, "loss": 0.9297, "step": 8025 }, { "epoch": 0.55, "learning_rate": 8.967740923756172e-06, "loss": 0.8086, "step": 8026 }, { "epoch": 0.55, "learning_rate": 8.965545480593888e-06, "loss": 0.7686, "step": 8027 }, { "epoch": 0.55, "learning_rate": 8.963350087830176e-06, "loss": 0.7842, "step": 8028 }, { "epoch": 0.55, "learning_rate": 8.961154745571999e-06, "loss": 0.7754, "step": 8029 }, { "epoch": 0.55, "learning_rate": 8.958959453926311e-06, "loss": 0.7139, "step": 8030 }, { "epoch": 0.55, "learning_rate": 8.956764213000064e-06, "loss": 0.7383, "step": 8031 }, { "epoch": 0.55, "learning_rate": 8.95456902290022e-06, "loss": 0.6787, "step": 8032 }, { "epoch": 0.55, "learning_rate": 8.952373883733718e-06, "loss": 0.7148, "step": 8033 }, { "epoch": 0.55, "learning_rate": 8.950178795607513e-06, "loss": 0.7461, "step": 8034 }, { "epoch": 0.55, "learning_rate": 8.947983758628545e-06, "loss": 0.7969, "step": 8035 }, { "epoch": 0.55, "learning_rate": 8.945788772903755e-06, "loss": 0.792, "step": 8036 }, { "epoch": 0.55, "learning_rate": 8.943593838540083e-06, "loss": 0.8125, "step": 8037 }, { "epoch": 0.55, "learning_rate": 8.941398955644472e-06, "loss": 0.749, "step": 8038 }, { "epoch": 0.55, "learning_rate": 8.939204124323849e-06, "loss": 0.834, "step": 8039 }, { "epoch": 0.55, "learning_rate": 8.93700934468515e-06, "loss": 0.7432, "step": 8040 }, { "epoch": 0.55, "learning_rate": 8.934814616835306e-06, "loss": 0.8447, "step": 8041 }, { "epoch": 0.55, "learning_rate": 8.93261994088124e-06, "loss": 0.7637, "step": 8042 }, { "epoch": 0.55, "learning_rate": 8.930425316929878e-06, "loss": 0.8096, "step": 8043 }, { "epoch": 0.55, "learning_rate": 8.928230745088142e-06, "loss": 0.7861, "step": 8044 }, { "epoch": 0.55, "learning_rate": 8.926036225462955e-06, "loss": 0.8467, "step": 8045 }, { "epoch": 0.55, "learning_rate": 8.923841758161227e-06, "loss": 0.8213, "step": 8046 }, { "epoch": 0.55, "learning_rate": 8.921647343289878e-06, "loss": 0.9111, "step": 8047 }, { "epoch": 0.55, "learning_rate": 8.919452980955819e-06, "loss": 0.79, "step": 8048 }, { "epoch": 0.55, "learning_rate": 8.917258671265952e-06, "loss": 0.7744, "step": 8049 }, { "epoch": 0.55, "learning_rate": 8.915064414327196e-06, "loss": 0.7646, "step": 8050 }, { "epoch": 0.55, "learning_rate": 8.912870210246448e-06, "loss": 0.8096, "step": 8051 }, { "epoch": 0.55, "learning_rate": 8.910676059130611e-06, "loss": 0.8311, "step": 8052 }, { "epoch": 0.55, "learning_rate": 8.908481961086583e-06, "loss": 0.7559, "step": 8053 }, { "epoch": 0.55, "learning_rate": 8.906287916221259e-06, "loss": 0.8086, "step": 8054 }, { "epoch": 0.55, "learning_rate": 8.904093924641532e-06, "loss": 0.8047, "step": 8055 }, { "epoch": 0.55, "learning_rate": 8.9018999864543e-06, "loss": 0.7754, "step": 8056 }, { "epoch": 0.55, "learning_rate": 8.899706101766445e-06, "loss": 0.7812, "step": 8057 }, { "epoch": 0.55, "learning_rate": 8.897512270684857e-06, "loss": 0.7559, "step": 8058 }, { "epoch": 0.55, "learning_rate": 8.895318493316415e-06, "loss": 0.8369, "step": 8059 }, { "epoch": 0.55, "learning_rate": 8.893124769768005e-06, "loss": 0.9004, "step": 8060 }, { "epoch": 0.55, "learning_rate": 8.890931100146497e-06, "loss": 0.8232, "step": 8061 }, { "epoch": 0.55, "learning_rate": 8.888737484558775e-06, "loss": 0.7744, "step": 8062 }, { "epoch": 0.55, "learning_rate": 8.88654392311171e-06, "loss": 0.7305, "step": 8063 }, { "epoch": 0.55, "learning_rate": 8.884350415912168e-06, "loss": 0.8047, "step": 8064 }, { "epoch": 0.55, "learning_rate": 8.882156963067024e-06, "loss": 0.8203, "step": 8065 }, { "epoch": 0.55, "learning_rate": 8.879963564683134e-06, "loss": 0.7783, "step": 8066 }, { "epoch": 0.55, "learning_rate": 8.877770220867362e-06, "loss": 0.8262, "step": 8067 }, { "epoch": 0.55, "learning_rate": 8.875576931726575e-06, "loss": 0.8135, "step": 8068 }, { "epoch": 0.55, "learning_rate": 8.873383697367623e-06, "loss": 0.8428, "step": 8069 }, { "epoch": 0.55, "learning_rate": 8.871190517897364e-06, "loss": 0.7344, "step": 8070 }, { "epoch": 0.55, "learning_rate": 8.86899739342265e-06, "loss": 0.8154, "step": 8071 }, { "epoch": 0.55, "learning_rate": 8.866804324050323e-06, "loss": 0.8486, "step": 8072 }, { "epoch": 0.55, "learning_rate": 8.864611309887234e-06, "loss": 0.7422, "step": 8073 }, { "epoch": 0.55, "learning_rate": 8.86241835104023e-06, "loss": 0.8496, "step": 8074 }, { "epoch": 0.55, "learning_rate": 8.860225447616145e-06, "loss": 0.7393, "step": 8075 }, { "epoch": 0.55, "learning_rate": 8.858032599721824e-06, "loss": 0.8145, "step": 8076 }, { "epoch": 0.55, "learning_rate": 8.855839807464097e-06, "loss": 0.8398, "step": 8077 }, { "epoch": 0.55, "learning_rate": 8.853647070949802e-06, "loss": 0.7285, "step": 8078 }, { "epoch": 0.55, "learning_rate": 8.851454390285759e-06, "loss": 0.835, "step": 8079 }, { "epoch": 0.55, "learning_rate": 8.849261765578807e-06, "loss": 0.8125, "step": 8080 }, { "epoch": 0.55, "learning_rate": 8.847069196935766e-06, "loss": 0.7588, "step": 8081 }, { "epoch": 0.55, "learning_rate": 8.844876684463455e-06, "loss": 0.8057, "step": 8082 }, { "epoch": 0.55, "learning_rate": 8.842684228268698e-06, "loss": 0.7344, "step": 8083 }, { "epoch": 0.55, "learning_rate": 8.840491828458307e-06, "loss": 0.7949, "step": 8084 }, { "epoch": 0.55, "learning_rate": 8.838299485139097e-06, "loss": 0.8516, "step": 8085 }, { "epoch": 0.55, "learning_rate": 8.836107198417882e-06, "loss": 0.7959, "step": 8086 }, { "epoch": 0.55, "learning_rate": 8.833914968401466e-06, "loss": 0.7627, "step": 8087 }, { "epoch": 0.55, "learning_rate": 8.831722795196658e-06, "loss": 0.7373, "step": 8088 }, { "epoch": 0.55, "learning_rate": 8.82953067891026e-06, "loss": 0.7842, "step": 8089 }, { "epoch": 0.55, "learning_rate": 8.827338619649063e-06, "loss": 0.79, "step": 8090 }, { "epoch": 0.55, "learning_rate": 8.825146617519874e-06, "loss": 0.7793, "step": 8091 }, { "epoch": 0.55, "learning_rate": 8.822954672629486e-06, "loss": 0.7783, "step": 8092 }, { "epoch": 0.55, "learning_rate": 8.82076278508469e-06, "loss": 0.875, "step": 8093 }, { "epoch": 0.55, "learning_rate": 8.818570954992274e-06, "loss": 0.8027, "step": 8094 }, { "epoch": 0.55, "learning_rate": 8.81637918245902e-06, "loss": 0.8486, "step": 8095 }, { "epoch": 0.55, "learning_rate": 8.814187467591713e-06, "loss": 0.8164, "step": 8096 }, { "epoch": 0.55, "learning_rate": 8.811995810497141e-06, "loss": 0.7959, "step": 8097 }, { "epoch": 0.55, "learning_rate": 8.809804211282071e-06, "loss": 0.8135, "step": 8098 }, { "epoch": 0.55, "learning_rate": 8.807612670053285e-06, "loss": 0.8477, "step": 8099 }, { "epoch": 0.55, "learning_rate": 8.805421186917548e-06, "loss": 0.7803, "step": 8100 }, { "epoch": 0.55, "learning_rate": 8.803229761981637e-06, "loss": 0.7754, "step": 8101 }, { "epoch": 0.55, "learning_rate": 8.801038395352308e-06, "loss": 0.7646, "step": 8102 }, { "epoch": 0.55, "learning_rate": 8.79884708713633e-06, "loss": 0.793, "step": 8103 }, { "epoch": 0.55, "learning_rate": 8.796655837440469e-06, "loss": 0.708, "step": 8104 }, { "epoch": 0.55, "learning_rate": 8.794464646371476e-06, "loss": 0.6689, "step": 8105 }, { "epoch": 0.55, "learning_rate": 8.792273514036103e-06, "loss": 0.8428, "step": 8106 }, { "epoch": 0.55, "learning_rate": 8.790082440541109e-06, "loss": 0.7969, "step": 8107 }, { "epoch": 0.55, "learning_rate": 8.787891425993235e-06, "loss": 0.8135, "step": 8108 }, { "epoch": 0.55, "learning_rate": 8.785700470499233e-06, "loss": 0.7578, "step": 8109 }, { "epoch": 0.55, "learning_rate": 8.783509574165847e-06, "loss": 0.791, "step": 8110 }, { "epoch": 0.55, "learning_rate": 8.781318737099815e-06, "loss": 0.7656, "step": 8111 }, { "epoch": 0.55, "learning_rate": 8.779127959407874e-06, "loss": 0.7744, "step": 8112 }, { "epoch": 0.55, "learning_rate": 8.776937241196759e-06, "loss": 0.8174, "step": 8113 }, { "epoch": 0.55, "learning_rate": 8.7747465825732e-06, "loss": 0.873, "step": 8114 }, { "epoch": 0.55, "learning_rate": 8.77255598364393e-06, "loss": 0.7373, "step": 8115 }, { "epoch": 0.55, "learning_rate": 8.770365444515673e-06, "loss": 0.7695, "step": 8116 }, { "epoch": 0.55, "learning_rate": 8.768174965295153e-06, "loss": 0.7695, "step": 8117 }, { "epoch": 0.55, "learning_rate": 8.765984546089085e-06, "loss": 0.7471, "step": 8118 }, { "epoch": 0.55, "learning_rate": 8.763794187004195e-06, "loss": 0.7363, "step": 8119 }, { "epoch": 0.55, "learning_rate": 8.761603888147184e-06, "loss": 0.7852, "step": 8120 }, { "epoch": 0.55, "learning_rate": 8.759413649624775e-06, "loss": 0.7197, "step": 8121 }, { "epoch": 0.55, "learning_rate": 8.757223471543675e-06, "loss": 0.7529, "step": 8122 }, { "epoch": 0.55, "learning_rate": 8.755033354010587e-06, "loss": 0.8154, "step": 8123 }, { "epoch": 0.55, "learning_rate": 8.75284329713221e-06, "loss": 0.7891, "step": 8124 }, { "epoch": 0.55, "learning_rate": 8.750653301015249e-06, "loss": 0.8477, "step": 8125 }, { "epoch": 0.55, "learning_rate": 8.748463365766396e-06, "loss": 0.7529, "step": 8126 }, { "epoch": 0.55, "learning_rate": 8.746273491492346e-06, "loss": 0.6992, "step": 8127 }, { "epoch": 0.55, "learning_rate": 8.744083678299795e-06, "loss": 0.8262, "step": 8128 }, { "epoch": 0.55, "learning_rate": 8.741893926295422e-06, "loss": 0.7881, "step": 8129 }, { "epoch": 0.55, "learning_rate": 8.739704235585919e-06, "loss": 0.8135, "step": 8130 }, { "epoch": 0.55, "learning_rate": 8.737514606277961e-06, "loss": 0.7041, "step": 8131 }, { "epoch": 0.55, "learning_rate": 8.735325038478228e-06, "loss": 0.7441, "step": 8132 }, { "epoch": 0.55, "learning_rate": 8.733135532293402e-06, "loss": 0.7314, "step": 8133 }, { "epoch": 0.55, "learning_rate": 8.730946087830148e-06, "loss": 0.7012, "step": 8134 }, { "epoch": 0.55, "learning_rate": 8.728756705195142e-06, "loss": 0.7705, "step": 8135 }, { "epoch": 0.55, "learning_rate": 8.726567384495045e-06, "loss": 0.8301, "step": 8136 }, { "epoch": 0.55, "learning_rate": 8.724378125836525e-06, "loss": 0.8467, "step": 8137 }, { "epoch": 0.55, "learning_rate": 8.722188929326237e-06, "loss": 0.707, "step": 8138 }, { "epoch": 0.55, "learning_rate": 8.719999795070842e-06, "loss": 0.7305, "step": 8139 }, { "epoch": 0.55, "learning_rate": 8.717810723176998e-06, "loss": 0.8096, "step": 8140 }, { "epoch": 0.55, "learning_rate": 8.715621713751353e-06, "loss": 0.7695, "step": 8141 }, { "epoch": 0.55, "learning_rate": 8.713432766900554e-06, "loss": 0.8721, "step": 8142 }, { "epoch": 0.55, "learning_rate": 8.711243882731249e-06, "loss": 0.6748, "step": 8143 }, { "epoch": 0.55, "learning_rate": 8.709055061350074e-06, "loss": 0.8398, "step": 8144 }, { "epoch": 0.56, "learning_rate": 8.706866302863678e-06, "loss": 0.8213, "step": 8145 }, { "epoch": 0.56, "learning_rate": 8.704677607378694e-06, "loss": 0.7441, "step": 8146 }, { "epoch": 0.56, "learning_rate": 8.70248897500175e-06, "loss": 0.7695, "step": 8147 }, { "epoch": 0.56, "learning_rate": 8.700300405839484e-06, "loss": 0.7744, "step": 8148 }, { "epoch": 0.56, "learning_rate": 8.698111899998516e-06, "loss": 0.832, "step": 8149 }, { "epoch": 0.56, "learning_rate": 8.69592345758547e-06, "loss": 0.8701, "step": 8150 }, { "epoch": 0.56, "learning_rate": 8.693735078706976e-06, "loss": 0.7012, "step": 8151 }, { "epoch": 0.56, "learning_rate": 8.69154676346964e-06, "loss": 0.8018, "step": 8152 }, { "epoch": 0.56, "learning_rate": 8.689358511980087e-06, "loss": 0.7539, "step": 8153 }, { "epoch": 0.56, "learning_rate": 8.68717032434492e-06, "loss": 0.8145, "step": 8154 }, { "epoch": 0.56, "learning_rate": 8.684982200670751e-06, "loss": 0.7852, "step": 8155 }, { "epoch": 0.56, "learning_rate": 8.682794141064184e-06, "loss": 0.7451, "step": 8156 }, { "epoch": 0.56, "learning_rate": 8.680606145631822e-06, "loss": 0.7842, "step": 8157 }, { "epoch": 0.56, "learning_rate": 8.678418214480268e-06, "loss": 0.7969, "step": 8158 }, { "epoch": 0.56, "learning_rate": 8.676230347716112e-06, "loss": 0.8037, "step": 8159 }, { "epoch": 0.56, "learning_rate": 8.674042545445948e-06, "loss": 0.7988, "step": 8160 }, { "epoch": 0.56, "learning_rate": 8.67185480777637e-06, "loss": 0.8262, "step": 8161 }, { "epoch": 0.56, "learning_rate": 8.669667134813954e-06, "loss": 0.8057, "step": 8162 }, { "epoch": 0.56, "learning_rate": 8.667479526665295e-06, "loss": 0.668, "step": 8163 }, { "epoch": 0.56, "learning_rate": 8.66529198343697e-06, "loss": 0.8203, "step": 8164 }, { "epoch": 0.56, "learning_rate": 8.663104505235552e-06, "loss": 0.7969, "step": 8165 }, { "epoch": 0.56, "learning_rate": 8.66091709216762e-06, "loss": 0.7373, "step": 8166 }, { "epoch": 0.56, "learning_rate": 8.658729744339738e-06, "loss": 0.75, "step": 8167 }, { "epoch": 0.56, "learning_rate": 8.656542461858478e-06, "loss": 0.7812, "step": 8168 }, { "epoch": 0.56, "learning_rate": 8.654355244830406e-06, "loss": 0.7119, "step": 8169 }, { "epoch": 0.56, "learning_rate": 8.65216809336208e-06, "loss": 0.748, "step": 8170 }, { "epoch": 0.56, "learning_rate": 8.649981007560059e-06, "loss": 0.8105, "step": 8171 }, { "epoch": 0.56, "learning_rate": 8.647793987530896e-06, "loss": 0.7988, "step": 8172 }, { "epoch": 0.56, "learning_rate": 8.645607033381146e-06, "loss": 0.7725, "step": 8173 }, { "epoch": 0.56, "learning_rate": 8.643420145217354e-06, "loss": 0.8076, "step": 8174 }, { "epoch": 0.56, "learning_rate": 8.641233323146068e-06, "loss": 0.7783, "step": 8175 }, { "epoch": 0.56, "learning_rate": 8.639046567273825e-06, "loss": 0.833, "step": 8176 }, { "epoch": 0.56, "learning_rate": 8.636859877707171e-06, "loss": 0.8818, "step": 8177 }, { "epoch": 0.56, "learning_rate": 8.634673254552635e-06, "loss": 0.7598, "step": 8178 }, { "epoch": 0.56, "learning_rate": 8.632486697916753e-06, "loss": 0.7275, "step": 8179 }, { "epoch": 0.56, "learning_rate": 8.630300207906049e-06, "loss": 0.8076, "step": 8180 }, { "epoch": 0.56, "learning_rate": 8.628113784627053e-06, "loss": 0.7285, "step": 8181 }, { "epoch": 0.56, "learning_rate": 8.625927428186289e-06, "loss": 0.8232, "step": 8182 }, { "epoch": 0.56, "learning_rate": 8.623741138690272e-06, "loss": 0.8467, "step": 8183 }, { "epoch": 0.56, "learning_rate": 8.62155491624552e-06, "loss": 0.7012, "step": 8184 }, { "epoch": 0.56, "learning_rate": 8.619368760958545e-06, "loss": 0.8252, "step": 8185 }, { "epoch": 0.56, "learning_rate": 8.617182672935854e-06, "loss": 0.7549, "step": 8186 }, { "epoch": 0.56, "learning_rate": 8.61499665228396e-06, "loss": 0.8213, "step": 8187 }, { "epoch": 0.56, "learning_rate": 8.61281069910936e-06, "loss": 0.8154, "step": 8188 }, { "epoch": 0.56, "learning_rate": 8.610624813518555e-06, "loss": 0.8203, "step": 8189 }, { "epoch": 0.56, "learning_rate": 8.608438995618043e-06, "loss": 0.8184, "step": 8190 }, { "epoch": 0.56, "learning_rate": 8.606253245514315e-06, "loss": 0.7559, "step": 8191 }, { "epoch": 0.56, "learning_rate": 8.604067563313857e-06, "loss": 0.7988, "step": 8192 }, { "epoch": 0.56, "learning_rate": 8.601881949123163e-06, "loss": 0.8672, "step": 8193 }, { "epoch": 0.56, "learning_rate": 8.59969640304871e-06, "loss": 0.793, "step": 8194 }, { "epoch": 0.56, "learning_rate": 8.597510925196983e-06, "loss": 0.8164, "step": 8195 }, { "epoch": 0.56, "learning_rate": 8.595325515674453e-06, "loss": 0.7305, "step": 8196 }, { "epoch": 0.56, "learning_rate": 8.593140174587597e-06, "loss": 0.8037, "step": 8197 }, { "epoch": 0.56, "learning_rate": 8.590954902042879e-06, "loss": 0.7295, "step": 8198 }, { "epoch": 0.56, "learning_rate": 8.588769698146771e-06, "loss": 0.7539, "step": 8199 }, { "epoch": 0.56, "learning_rate": 8.586584563005737e-06, "loss": 0.7715, "step": 8200 }, { "epoch": 0.56, "learning_rate": 8.584399496726234e-06, "loss": 0.8213, "step": 8201 }, { "epoch": 0.56, "learning_rate": 8.582214499414719e-06, "loss": 0.7686, "step": 8202 }, { "epoch": 0.56, "learning_rate": 8.580029571177642e-06, "loss": 0.835, "step": 8203 }, { "epoch": 0.56, "learning_rate": 8.577844712121453e-06, "loss": 0.7588, "step": 8204 }, { "epoch": 0.56, "learning_rate": 8.575659922352605e-06, "loss": 0.8477, "step": 8205 }, { "epoch": 0.56, "learning_rate": 8.573475201977534e-06, "loss": 0.7598, "step": 8206 }, { "epoch": 0.56, "learning_rate": 8.571290551102683e-06, "loss": 0.8252, "step": 8207 }, { "epoch": 0.56, "learning_rate": 8.569105969834486e-06, "loss": 0.7422, "step": 8208 }, { "epoch": 0.56, "learning_rate": 8.566921458279377e-06, "loss": 0.8252, "step": 8209 }, { "epoch": 0.56, "learning_rate": 8.56473701654378e-06, "loss": 0.7695, "step": 8210 }, { "epoch": 0.56, "learning_rate": 8.562552644734132e-06, "loss": 0.7646, "step": 8211 }, { "epoch": 0.56, "learning_rate": 8.560368342956845e-06, "loss": 0.7676, "step": 8212 }, { "epoch": 0.56, "learning_rate": 8.558184111318346e-06, "loss": 0.7891, "step": 8213 }, { "epoch": 0.56, "learning_rate": 8.555999949925043e-06, "loss": 0.7051, "step": 8214 }, { "epoch": 0.56, "learning_rate": 8.553815858883354e-06, "loss": 0.7656, "step": 8215 }, { "epoch": 0.56, "learning_rate": 8.551631838299683e-06, "loss": 0.7871, "step": 8216 }, { "epoch": 0.56, "learning_rate": 8.54944788828044e-06, "loss": 0.8193, "step": 8217 }, { "epoch": 0.56, "learning_rate": 8.547264008932027e-06, "loss": 0.8105, "step": 8218 }, { "epoch": 0.56, "learning_rate": 8.545080200360838e-06, "loss": 0.8125, "step": 8219 }, { "epoch": 0.56, "learning_rate": 8.542896462673274e-06, "loss": 0.7363, "step": 8220 }, { "epoch": 0.56, "learning_rate": 8.540712795975718e-06, "loss": 0.8232, "step": 8221 }, { "epoch": 0.56, "learning_rate": 8.538529200374565e-06, "loss": 0.8008, "step": 8222 }, { "epoch": 0.56, "learning_rate": 8.5363456759762e-06, "loss": 0.7607, "step": 8223 }, { "epoch": 0.56, "learning_rate": 8.534162222887003e-06, "loss": 0.8242, "step": 8224 }, { "epoch": 0.56, "learning_rate": 8.53197884121335e-06, "loss": 0.7998, "step": 8225 }, { "epoch": 0.56, "learning_rate": 8.529795531061618e-06, "loss": 0.8447, "step": 8226 }, { "epoch": 0.56, "learning_rate": 8.52761229253817e-06, "loss": 0.8086, "step": 8227 }, { "epoch": 0.56, "learning_rate": 8.525429125749386e-06, "loss": 0.6191, "step": 8228 }, { "epoch": 0.56, "learning_rate": 8.52324603080162e-06, "loss": 0.6426, "step": 8229 }, { "epoch": 0.56, "learning_rate": 8.521063007801235e-06, "loss": 0.7842, "step": 8230 }, { "epoch": 0.56, "learning_rate": 8.518880056854592e-06, "loss": 0.7686, "step": 8231 }, { "epoch": 0.56, "learning_rate": 8.516697178068036e-06, "loss": 0.6992, "step": 8232 }, { "epoch": 0.56, "learning_rate": 8.51451437154792e-06, "loss": 0.8252, "step": 8233 }, { "epoch": 0.56, "learning_rate": 8.512331637400597e-06, "loss": 0.7422, "step": 8234 }, { "epoch": 0.56, "learning_rate": 8.5101489757324e-06, "loss": 0.791, "step": 8235 }, { "epoch": 0.56, "learning_rate": 8.507966386649674e-06, "loss": 0.8174, "step": 8236 }, { "epoch": 0.56, "learning_rate": 8.505783870258751e-06, "loss": 0.7637, "step": 8237 }, { "epoch": 0.56, "learning_rate": 8.503601426665968e-06, "loss": 0.7148, "step": 8238 }, { "epoch": 0.56, "learning_rate": 8.501419055977646e-06, "loss": 0.8408, "step": 8239 }, { "epoch": 0.56, "learning_rate": 8.499236758300117e-06, "loss": 0.8105, "step": 8240 }, { "epoch": 0.56, "learning_rate": 8.497054533739702e-06, "loss": 0.7656, "step": 8241 }, { "epoch": 0.56, "learning_rate": 8.494872382402713e-06, "loss": 0.7988, "step": 8242 }, { "epoch": 0.56, "learning_rate": 8.492690304395472e-06, "loss": 0.8164, "step": 8243 }, { "epoch": 0.56, "learning_rate": 8.490508299824284e-06, "loss": 0.8711, "step": 8244 }, { "epoch": 0.56, "learning_rate": 8.488326368795454e-06, "loss": 0.7979, "step": 8245 }, { "epoch": 0.56, "learning_rate": 8.486144511415295e-06, "loss": 0.832, "step": 8246 }, { "epoch": 0.56, "learning_rate": 8.483962727790103e-06, "loss": 0.8369, "step": 8247 }, { "epoch": 0.56, "learning_rate": 8.481781018026168e-06, "loss": 0.7627, "step": 8248 }, { "epoch": 0.56, "learning_rate": 8.479599382229792e-06, "loss": 0.6895, "step": 8249 }, { "epoch": 0.56, "learning_rate": 8.477417820507256e-06, "loss": 0.8096, "step": 8250 }, { "epoch": 0.56, "learning_rate": 8.475236332964848e-06, "loss": 0.9043, "step": 8251 }, { "epoch": 0.56, "learning_rate": 8.473054919708858e-06, "loss": 0.8145, "step": 8252 }, { "epoch": 0.56, "learning_rate": 8.470873580845554e-06, "loss": 0.7637, "step": 8253 }, { "epoch": 0.56, "learning_rate": 8.468692316481217e-06, "loss": 0.7891, "step": 8254 }, { "epoch": 0.56, "learning_rate": 8.466511126722113e-06, "loss": 0.8193, "step": 8255 }, { "epoch": 0.56, "learning_rate": 8.464330011674514e-06, "loss": 0.7617, "step": 8256 }, { "epoch": 0.56, "learning_rate": 8.462148971444678e-06, "loss": 0.7744, "step": 8257 }, { "epoch": 0.56, "learning_rate": 8.459968006138872e-06, "loss": 0.7627, "step": 8258 }, { "epoch": 0.56, "learning_rate": 8.457787115863352e-06, "loss": 0.7842, "step": 8259 }, { "epoch": 0.56, "learning_rate": 8.455606300724364e-06, "loss": 0.7842, "step": 8260 }, { "epoch": 0.56, "learning_rate": 8.453425560828168e-06, "loss": 0.8057, "step": 8261 }, { "epoch": 0.56, "learning_rate": 8.451244896281e-06, "loss": 0.7783, "step": 8262 }, { "epoch": 0.56, "learning_rate": 8.4490643071891e-06, "loss": 0.8535, "step": 8263 }, { "epoch": 0.56, "learning_rate": 8.446883793658715e-06, "loss": 0.7363, "step": 8264 }, { "epoch": 0.56, "learning_rate": 8.444703355796078e-06, "loss": 0.75, "step": 8265 }, { "epoch": 0.56, "learning_rate": 8.442522993707416e-06, "loss": 0.8672, "step": 8266 }, { "epoch": 0.56, "learning_rate": 8.440342707498961e-06, "loss": 0.835, "step": 8267 }, { "epoch": 0.56, "learning_rate": 8.438162497276929e-06, "loss": 0.8408, "step": 8268 }, { "epoch": 0.56, "learning_rate": 8.435982363147542e-06, "loss": 0.8428, "step": 8269 }, { "epoch": 0.56, "learning_rate": 8.433802305217022e-06, "loss": 0.7656, "step": 8270 }, { "epoch": 0.56, "learning_rate": 8.431622323591576e-06, "loss": 0.8145, "step": 8271 }, { "epoch": 0.56, "learning_rate": 8.429442418377415e-06, "loss": 0.7705, "step": 8272 }, { "epoch": 0.56, "learning_rate": 8.427262589680742e-06, "loss": 0.7783, "step": 8273 }, { "epoch": 0.56, "learning_rate": 8.425082837607762e-06, "loss": 0.6582, "step": 8274 }, { "epoch": 0.56, "learning_rate": 8.422903162264664e-06, "loss": 0.8076, "step": 8275 }, { "epoch": 0.56, "learning_rate": 8.420723563757649e-06, "loss": 0.7432, "step": 8276 }, { "epoch": 0.56, "learning_rate": 8.418544042192906e-06, "loss": 0.7393, "step": 8277 }, { "epoch": 0.56, "learning_rate": 8.416364597676618e-06, "loss": 0.7539, "step": 8278 }, { "epoch": 0.56, "learning_rate": 8.414185230314972e-06, "loss": 0.8906, "step": 8279 }, { "epoch": 0.56, "learning_rate": 8.412005940214146e-06, "loss": 0.8447, "step": 8280 }, { "epoch": 0.56, "learning_rate": 8.409826727480308e-06, "loss": 0.7881, "step": 8281 }, { "epoch": 0.56, "learning_rate": 8.407647592219637e-06, "loss": 0.7197, "step": 8282 }, { "epoch": 0.56, "learning_rate": 8.405468534538299e-06, "loss": 0.7832, "step": 8283 }, { "epoch": 0.56, "learning_rate": 8.403289554542453e-06, "loss": 0.6377, "step": 8284 }, { "epoch": 0.56, "learning_rate": 8.401110652338266e-06, "loss": 0.7842, "step": 8285 }, { "epoch": 0.56, "learning_rate": 8.398931828031886e-06, "loss": 0.8467, "step": 8286 }, { "epoch": 0.56, "learning_rate": 8.39675308172947e-06, "loss": 0.7783, "step": 8287 }, { "epoch": 0.56, "learning_rate": 8.394574413537168e-06, "loss": 0.7559, "step": 8288 }, { "epoch": 0.56, "learning_rate": 8.39239582356112e-06, "loss": 0.7598, "step": 8289 }, { "epoch": 0.56, "learning_rate": 8.390217311907472e-06, "loss": 0.7949, "step": 8290 }, { "epoch": 0.57, "learning_rate": 8.388038878682356e-06, "loss": 0.7822, "step": 8291 }, { "epoch": 0.57, "learning_rate": 8.385860523991907e-06, "loss": 0.8203, "step": 8292 }, { "epoch": 0.57, "learning_rate": 8.383682247942253e-06, "loss": 0.7529, "step": 8293 }, { "epoch": 0.57, "learning_rate": 8.381504050639521e-06, "loss": 0.8311, "step": 8294 }, { "epoch": 0.57, "learning_rate": 8.379325932189836e-06, "loss": 0.8037, "step": 8295 }, { "epoch": 0.57, "learning_rate": 8.377147892699314e-06, "loss": 0.8154, "step": 8296 }, { "epoch": 0.57, "learning_rate": 8.374969932274064e-06, "loss": 0.749, "step": 8297 }, { "epoch": 0.57, "learning_rate": 8.372792051020201e-06, "loss": 0.8184, "step": 8298 }, { "epoch": 0.57, "learning_rate": 8.370614249043828e-06, "loss": 0.8838, "step": 8299 }, { "epoch": 0.57, "learning_rate": 8.36843652645105e-06, "loss": 0.791, "step": 8300 }, { "epoch": 0.57, "learning_rate": 8.366258883347967e-06, "loss": 0.8105, "step": 8301 }, { "epoch": 0.57, "learning_rate": 8.364081319840669e-06, "loss": 0.8203, "step": 8302 }, { "epoch": 0.57, "learning_rate": 8.361903836035253e-06, "loss": 0.7812, "step": 8303 }, { "epoch": 0.57, "learning_rate": 8.359726432037798e-06, "loss": 0.707, "step": 8304 }, { "epoch": 0.57, "learning_rate": 8.35754910795439e-06, "loss": 0.8506, "step": 8305 }, { "epoch": 0.57, "learning_rate": 8.355371863891114e-06, "loss": 0.7549, "step": 8306 }, { "epoch": 0.57, "learning_rate": 8.353194699954038e-06, "loss": 0.8193, "step": 8307 }, { "epoch": 0.57, "learning_rate": 8.351017616249239e-06, "loss": 0.752, "step": 8308 }, { "epoch": 0.57, "learning_rate": 8.348840612882778e-06, "loss": 0.834, "step": 8309 }, { "epoch": 0.57, "learning_rate": 8.346663689960724e-06, "loss": 0.8271, "step": 8310 }, { "epoch": 0.57, "learning_rate": 8.34448684758913e-06, "loss": 0.8047, "step": 8311 }, { "epoch": 0.57, "learning_rate": 8.342310085874059e-06, "loss": 0.7617, "step": 8312 }, { "epoch": 0.57, "learning_rate": 8.340133404921561e-06, "loss": 0.7432, "step": 8313 }, { "epoch": 0.57, "learning_rate": 8.337956804837684e-06, "loss": 0.7656, "step": 8314 }, { "epoch": 0.57, "learning_rate": 8.335780285728468e-06, "loss": 0.8154, "step": 8315 }, { "epoch": 0.57, "learning_rate": 8.333603847699956e-06, "loss": 0.7393, "step": 8316 }, { "epoch": 0.57, "learning_rate": 8.33142749085818e-06, "loss": 0.8037, "step": 8317 }, { "epoch": 0.57, "learning_rate": 8.329251215309178e-06, "loss": 0.79, "step": 8318 }, { "epoch": 0.57, "learning_rate": 8.327075021158976e-06, "loss": 0.8242, "step": 8319 }, { "epoch": 0.57, "learning_rate": 8.324898908513597e-06, "loss": 0.8223, "step": 8320 }, { "epoch": 0.57, "learning_rate": 8.322722877479063e-06, "loss": 0.8203, "step": 8321 }, { "epoch": 0.57, "learning_rate": 8.320546928161385e-06, "loss": 0.8105, "step": 8322 }, { "epoch": 0.57, "learning_rate": 8.318371060666577e-06, "loss": 0.7773, "step": 8323 }, { "epoch": 0.57, "learning_rate": 8.316195275100655e-06, "loss": 0.833, "step": 8324 }, { "epoch": 0.57, "learning_rate": 8.314019571569614e-06, "loss": 0.9141, "step": 8325 }, { "epoch": 0.57, "learning_rate": 8.31184395017946e-06, "loss": 0.8037, "step": 8326 }, { "epoch": 0.57, "learning_rate": 8.309668411036182e-06, "loss": 0.8145, "step": 8327 }, { "epoch": 0.57, "learning_rate": 8.307492954245781e-06, "loss": 0.7227, "step": 8328 }, { "epoch": 0.57, "learning_rate": 8.305317579914236e-06, "loss": 0.7451, "step": 8329 }, { "epoch": 0.57, "learning_rate": 8.303142288147537e-06, "loss": 0.8135, "step": 8330 }, { "epoch": 0.57, "learning_rate": 8.300967079051666e-06, "loss": 0.7871, "step": 8331 }, { "epoch": 0.57, "learning_rate": 8.298791952732596e-06, "loss": 0.7812, "step": 8332 }, { "epoch": 0.57, "learning_rate": 8.296616909296296e-06, "loss": 0.8662, "step": 8333 }, { "epoch": 0.57, "learning_rate": 8.294441948848742e-06, "loss": 0.7676, "step": 8334 }, { "epoch": 0.57, "learning_rate": 8.292267071495886e-06, "loss": 0.8281, "step": 8335 }, { "epoch": 0.57, "learning_rate": 8.290092277343698e-06, "loss": 0.833, "step": 8336 }, { "epoch": 0.57, "learning_rate": 8.287917566498133e-06, "loss": 0.8223, "step": 8337 }, { "epoch": 0.57, "learning_rate": 8.285742939065138e-06, "loss": 0.7334, "step": 8338 }, { "epoch": 0.57, "learning_rate": 8.283568395150666e-06, "loss": 0.7646, "step": 8339 }, { "epoch": 0.57, "learning_rate": 8.281393934860654e-06, "loss": 0.8389, "step": 8340 }, { "epoch": 0.57, "learning_rate": 8.279219558301048e-06, "loss": 0.7041, "step": 8341 }, { "epoch": 0.57, "learning_rate": 8.277045265577784e-06, "loss": 0.791, "step": 8342 }, { "epoch": 0.57, "learning_rate": 8.274871056796786e-06, "loss": 0.7939, "step": 8343 }, { "epoch": 0.57, "learning_rate": 8.27269693206399e-06, "loss": 0.7607, "step": 8344 }, { "epoch": 0.57, "learning_rate": 8.270522891485313e-06, "loss": 0.8525, "step": 8345 }, { "epoch": 0.57, "learning_rate": 8.268348935166674e-06, "loss": 0.7383, "step": 8346 }, { "epoch": 0.57, "learning_rate": 8.266175063213995e-06, "loss": 0.7656, "step": 8347 }, { "epoch": 0.57, "learning_rate": 8.26400127573318e-06, "loss": 0.8174, "step": 8348 }, { "epoch": 0.57, "learning_rate": 8.26182757283014e-06, "loss": 0.7432, "step": 8349 }, { "epoch": 0.57, "learning_rate": 8.259653954610776e-06, "loss": 0.7979, "step": 8350 }, { "epoch": 0.57, "learning_rate": 8.257480421180986e-06, "loss": 0.8154, "step": 8351 }, { "epoch": 0.57, "learning_rate": 8.255306972646661e-06, "loss": 0.7402, "step": 8352 }, { "epoch": 0.57, "learning_rate": 8.253133609113699e-06, "loss": 0.8369, "step": 8353 }, { "epoch": 0.57, "learning_rate": 8.25096033068798e-06, "loss": 0.835, "step": 8354 }, { "epoch": 0.57, "learning_rate": 8.248787137475393e-06, "loss": 0.7441, "step": 8355 }, { "epoch": 0.57, "learning_rate": 8.246614029581807e-06, "loss": 0.7773, "step": 8356 }, { "epoch": 0.57, "learning_rate": 8.244441007113104e-06, "loss": 0.7676, "step": 8357 }, { "epoch": 0.57, "learning_rate": 8.242268070175143e-06, "loss": 0.7773, "step": 8358 }, { "epoch": 0.57, "learning_rate": 8.240095218873799e-06, "loss": 0.7598, "step": 8359 }, { "epoch": 0.57, "learning_rate": 8.237922453314933e-06, "loss": 0.791, "step": 8360 }, { "epoch": 0.57, "learning_rate": 8.235749773604395e-06, "loss": 0.7637, "step": 8361 }, { "epoch": 0.57, "learning_rate": 8.233577179848047e-06, "loss": 0.707, "step": 8362 }, { "epoch": 0.57, "learning_rate": 8.231404672151728e-06, "loss": 0.8281, "step": 8363 }, { "epoch": 0.57, "learning_rate": 8.229232250621286e-06, "loss": 0.8184, "step": 8364 }, { "epoch": 0.57, "learning_rate": 8.227059915362566e-06, "loss": 0.8125, "step": 8365 }, { "epoch": 0.57, "learning_rate": 8.2248876664814e-06, "loss": 0.748, "step": 8366 }, { "epoch": 0.57, "learning_rate": 8.222715504083621e-06, "loss": 0.832, "step": 8367 }, { "epoch": 0.57, "learning_rate": 8.220543428275057e-06, "loss": 0.7832, "step": 8368 }, { "epoch": 0.57, "learning_rate": 8.218371439161528e-06, "loss": 0.7803, "step": 8369 }, { "epoch": 0.57, "learning_rate": 8.216199536848852e-06, "loss": 0.6963, "step": 8370 }, { "epoch": 0.57, "learning_rate": 8.214027721442854e-06, "loss": 0.75, "step": 8371 }, { "epoch": 0.57, "learning_rate": 8.211855993049334e-06, "loss": 0.7822, "step": 8372 }, { "epoch": 0.57, "learning_rate": 8.209684351774106e-06, "loss": 0.8027, "step": 8373 }, { "epoch": 0.57, "learning_rate": 8.207512797722967e-06, "loss": 0.7441, "step": 8374 }, { "epoch": 0.57, "learning_rate": 8.205341331001719e-06, "loss": 0.8691, "step": 8375 }, { "epoch": 0.57, "learning_rate": 8.20316995171615e-06, "loss": 0.7217, "step": 8376 }, { "epoch": 0.57, "learning_rate": 8.200998659972054e-06, "loss": 0.7783, "step": 8377 }, { "epoch": 0.57, "learning_rate": 8.19882745587522e-06, "loss": 0.8242, "step": 8378 }, { "epoch": 0.57, "learning_rate": 8.19665633953142e-06, "loss": 0.833, "step": 8379 }, { "epoch": 0.57, "learning_rate": 8.194485311046441e-06, "loss": 0.7402, "step": 8380 }, { "epoch": 0.57, "learning_rate": 8.192314370526044e-06, "loss": 0.7998, "step": 8381 }, { "epoch": 0.57, "learning_rate": 8.190143518076002e-06, "loss": 0.8008, "step": 8382 }, { "epoch": 0.57, "learning_rate": 8.187972753802084e-06, "loss": 0.8086, "step": 8383 }, { "epoch": 0.57, "learning_rate": 8.185802077810045e-06, "loss": 0.8125, "step": 8384 }, { "epoch": 0.57, "learning_rate": 8.183631490205636e-06, "loss": 0.7744, "step": 8385 }, { "epoch": 0.57, "learning_rate": 8.181460991094617e-06, "loss": 0.7607, "step": 8386 }, { "epoch": 0.57, "learning_rate": 8.179290580582727e-06, "loss": 0.7822, "step": 8387 }, { "epoch": 0.57, "learning_rate": 8.177120258775707e-06, "loss": 0.7861, "step": 8388 }, { "epoch": 0.57, "learning_rate": 8.174950025779308e-06, "loss": 0.8037, "step": 8389 }, { "epoch": 0.57, "learning_rate": 8.17277988169925e-06, "loss": 0.8184, "step": 8390 }, { "epoch": 0.57, "learning_rate": 8.170609826641267e-06, "loss": 0.7617, "step": 8391 }, { "epoch": 0.57, "learning_rate": 8.168439860711084e-06, "loss": 0.8623, "step": 8392 }, { "epoch": 0.57, "learning_rate": 8.166269984014425e-06, "loss": 0.8428, "step": 8393 }, { "epoch": 0.57, "learning_rate": 8.164100196656997e-06, "loss": 0.7998, "step": 8394 }, { "epoch": 0.57, "learning_rate": 8.16193049874452e-06, "loss": 0.8105, "step": 8395 }, { "epoch": 0.57, "learning_rate": 8.159760890382703e-06, "loss": 0.8125, "step": 8396 }, { "epoch": 0.57, "learning_rate": 8.15759137167724e-06, "loss": 0.7578, "step": 8397 }, { "epoch": 0.57, "learning_rate": 8.15542194273384e-06, "loss": 0.7275, "step": 8398 }, { "epoch": 0.57, "learning_rate": 8.153252603658193e-06, "loss": 0.8105, "step": 8399 }, { "epoch": 0.57, "learning_rate": 8.151083354555985e-06, "loss": 0.8623, "step": 8400 }, { "epoch": 0.57, "learning_rate": 8.148914195532908e-06, "loss": 0.7559, "step": 8401 }, { "epoch": 0.57, "learning_rate": 8.146745126694644e-06, "loss": 0.7646, "step": 8402 }, { "epoch": 0.57, "learning_rate": 8.144576148146865e-06, "loss": 0.7578, "step": 8403 }, { "epoch": 0.57, "learning_rate": 8.142407259995246e-06, "loss": 0.7969, "step": 8404 }, { "epoch": 0.57, "learning_rate": 8.140238462345453e-06, "loss": 0.8555, "step": 8405 }, { "epoch": 0.57, "learning_rate": 8.138069755303151e-06, "loss": 0.748, "step": 8406 }, { "epoch": 0.57, "learning_rate": 8.135901138974002e-06, "loss": 0.873, "step": 8407 }, { "epoch": 0.57, "learning_rate": 8.133732613463657e-06, "loss": 0.8008, "step": 8408 }, { "epoch": 0.57, "learning_rate": 8.13156417887777e-06, "loss": 0.8545, "step": 8409 }, { "epoch": 0.57, "learning_rate": 8.129395835321983e-06, "loss": 0.7305, "step": 8410 }, { "epoch": 0.57, "learning_rate": 8.127227582901941e-06, "loss": 0.8145, "step": 8411 }, { "epoch": 0.57, "learning_rate": 8.125059421723278e-06, "loss": 0.8115, "step": 8412 }, { "epoch": 0.57, "learning_rate": 8.12289135189163e-06, "loss": 0.8301, "step": 8413 }, { "epoch": 0.57, "learning_rate": 8.120723373512625e-06, "loss": 0.833, "step": 8414 }, { "epoch": 0.57, "learning_rate": 8.118555486691883e-06, "loss": 0.8008, "step": 8415 }, { "epoch": 0.57, "learning_rate": 8.116387691535029e-06, "loss": 0.8008, "step": 8416 }, { "epoch": 0.57, "learning_rate": 8.114219988147675e-06, "loss": 0.8008, "step": 8417 }, { "epoch": 0.57, "learning_rate": 8.112052376635424e-06, "loss": 0.708, "step": 8418 }, { "epoch": 0.57, "learning_rate": 8.109884857103896e-06, "loss": 0.7881, "step": 8419 }, { "epoch": 0.57, "learning_rate": 8.107717429658686e-06, "loss": 0.8701, "step": 8420 }, { "epoch": 0.57, "learning_rate": 8.105550094405387e-06, "loss": 0.7461, "step": 8421 }, { "epoch": 0.57, "learning_rate": 8.103382851449597e-06, "loss": 0.752, "step": 8422 }, { "epoch": 0.57, "learning_rate": 8.101215700896903e-06, "loss": 0.8525, "step": 8423 }, { "epoch": 0.57, "learning_rate": 8.099048642852883e-06, "loss": 0.7607, "step": 8424 }, { "epoch": 0.57, "learning_rate": 8.096881677423126e-06, "loss": 0.708, "step": 8425 }, { "epoch": 0.57, "learning_rate": 8.094714804713196e-06, "loss": 0.7793, "step": 8426 }, { "epoch": 0.57, "learning_rate": 8.092548024828672e-06, "loss": 0.8154, "step": 8427 }, { "epoch": 0.57, "learning_rate": 8.090381337875113e-06, "loss": 0.8516, "step": 8428 }, { "epoch": 0.57, "learning_rate": 8.088214743958084e-06, "loss": 0.7129, "step": 8429 }, { "epoch": 0.57, "learning_rate": 8.086048243183135e-06, "loss": 0.8721, "step": 8430 }, { "epoch": 0.57, "learning_rate": 8.083881835655823e-06, "loss": 0.8115, "step": 8431 }, { "epoch": 0.57, "learning_rate": 8.081715521481699e-06, "loss": 0.8311, "step": 8432 }, { "epoch": 0.57, "learning_rate": 8.079549300766299e-06, "loss": 0.7773, "step": 8433 }, { "epoch": 0.57, "learning_rate": 8.077383173615164e-06, "loss": 0.8545, "step": 8434 }, { "epoch": 0.57, "learning_rate": 8.075217140133829e-06, "loss": 0.8037, "step": 8435 }, { "epoch": 0.57, "learning_rate": 8.073051200427814e-06, "loss": 0.8496, "step": 8436 }, { "epoch": 0.57, "learning_rate": 8.070885354602654e-06, "loss": 0.7852, "step": 8437 }, { "epoch": 0.58, "learning_rate": 8.068719602763868e-06, "loss": 0.7754, "step": 8438 }, { "epoch": 0.58, "learning_rate": 8.066553945016968e-06, "loss": 0.7861, "step": 8439 }, { "epoch": 0.58, "learning_rate": 8.064388381467465e-06, "loss": 0.793, "step": 8440 }, { "epoch": 0.58, "learning_rate": 8.062222912220864e-06, "loss": 0.7539, "step": 8441 }, { "epoch": 0.58, "learning_rate": 8.060057537382669e-06, "loss": 0.8203, "step": 8442 }, { "epoch": 0.58, "learning_rate": 8.057892257058378e-06, "loss": 0.8164, "step": 8443 }, { "epoch": 0.58, "learning_rate": 8.055727071353478e-06, "loss": 0.8467, "step": 8444 }, { "epoch": 0.58, "learning_rate": 8.053561980373464e-06, "loss": 0.7646, "step": 8445 }, { "epoch": 0.58, "learning_rate": 8.051396984223814e-06, "loss": 0.7705, "step": 8446 }, { "epoch": 0.58, "learning_rate": 8.04923208301001e-06, "loss": 0.6973, "step": 8447 }, { "epoch": 0.58, "learning_rate": 8.047067276837517e-06, "loss": 0.7764, "step": 8448 }, { "epoch": 0.58, "learning_rate": 8.044902565811816e-06, "loss": 0.7305, "step": 8449 }, { "epoch": 0.58, "learning_rate": 8.042737950038367e-06, "loss": 0.8398, "step": 8450 }, { "epoch": 0.58, "learning_rate": 8.040573429622629e-06, "loss": 0.7646, "step": 8451 }, { "epoch": 0.58, "learning_rate": 8.038409004670059e-06, "loss": 0.7139, "step": 8452 }, { "epoch": 0.58, "learning_rate": 8.036244675286107e-06, "loss": 0.7627, "step": 8453 }, { "epoch": 0.58, "learning_rate": 8.034080441576214e-06, "loss": 0.7588, "step": 8454 }, { "epoch": 0.58, "learning_rate": 8.031916303645828e-06, "loss": 0.75, "step": 8455 }, { "epoch": 0.58, "learning_rate": 8.029752261600387e-06, "loss": 0.6709, "step": 8456 }, { "epoch": 0.58, "learning_rate": 8.027588315545317e-06, "loss": 0.7256, "step": 8457 }, { "epoch": 0.58, "learning_rate": 8.02542446558605e-06, "loss": 0.8613, "step": 8458 }, { "epoch": 0.58, "learning_rate": 8.023260711828002e-06, "loss": 0.8418, "step": 8459 }, { "epoch": 0.58, "learning_rate": 8.0210970543766e-06, "loss": 0.7754, "step": 8460 }, { "epoch": 0.58, "learning_rate": 8.018933493337253e-06, "loss": 0.7666, "step": 8461 }, { "epoch": 0.58, "learning_rate": 8.016770028815368e-06, "loss": 0.7178, "step": 8462 }, { "epoch": 0.58, "learning_rate": 8.014606660916354e-06, "loss": 0.7402, "step": 8463 }, { "epoch": 0.58, "learning_rate": 8.012443389745603e-06, "loss": 0.7461, "step": 8464 }, { "epoch": 0.58, "learning_rate": 8.01028021540851e-06, "loss": 0.7822, "step": 8465 }, { "epoch": 0.58, "learning_rate": 8.008117138010473e-06, "loss": 0.7529, "step": 8466 }, { "epoch": 0.58, "learning_rate": 8.00595415765687e-06, "loss": 0.7725, "step": 8467 }, { "epoch": 0.58, "learning_rate": 8.003791274453086e-06, "loss": 0.8164, "step": 8468 }, { "epoch": 0.58, "learning_rate": 8.001628488504492e-06, "loss": 0.752, "step": 8469 }, { "epoch": 0.58, "learning_rate": 7.999465799916461e-06, "loss": 0.832, "step": 8470 }, { "epoch": 0.58, "learning_rate": 7.997303208794355e-06, "loss": 0.8555, "step": 8471 }, { "epoch": 0.58, "learning_rate": 7.995140715243543e-06, "loss": 0.791, "step": 8472 }, { "epoch": 0.58, "learning_rate": 7.992978319369376e-06, "loss": 0.7646, "step": 8473 }, { "epoch": 0.58, "learning_rate": 7.99081602127721e-06, "loss": 0.8525, "step": 8474 }, { "epoch": 0.58, "learning_rate": 7.988653821072387e-06, "loss": 0.7783, "step": 8475 }, { "epoch": 0.58, "learning_rate": 7.986491718860255e-06, "loss": 0.7832, "step": 8476 }, { "epoch": 0.58, "learning_rate": 7.984329714746142e-06, "loss": 0.8037, "step": 8477 }, { "epoch": 0.58, "learning_rate": 7.98216780883539e-06, "loss": 0.8096, "step": 8478 }, { "epoch": 0.58, "learning_rate": 7.980006001233325e-06, "loss": 0.7725, "step": 8479 }, { "epoch": 0.58, "learning_rate": 7.977844292045268e-06, "loss": 0.8262, "step": 8480 }, { "epoch": 0.58, "learning_rate": 7.975682681376542e-06, "loss": 0.7871, "step": 8481 }, { "epoch": 0.58, "learning_rate": 7.973521169332452e-06, "loss": 0.7441, "step": 8482 }, { "epoch": 0.58, "learning_rate": 7.971359756018311e-06, "loss": 0.8086, "step": 8483 }, { "epoch": 0.58, "learning_rate": 7.969198441539428e-06, "loss": 0.79, "step": 8484 }, { "epoch": 0.58, "learning_rate": 7.967037226001095e-06, "loss": 0.7344, "step": 8485 }, { "epoch": 0.58, "learning_rate": 7.964876109508614e-06, "loss": 0.8086, "step": 8486 }, { "epoch": 0.58, "learning_rate": 7.962715092167266e-06, "loss": 0.7959, "step": 8487 }, { "epoch": 0.58, "learning_rate": 7.96055417408234e-06, "loss": 0.7617, "step": 8488 }, { "epoch": 0.58, "learning_rate": 7.958393355359113e-06, "loss": 0.708, "step": 8489 }, { "epoch": 0.58, "learning_rate": 7.956232636102866e-06, "loss": 0.7529, "step": 8490 }, { "epoch": 0.58, "learning_rate": 7.954072016418862e-06, "loss": 0.833, "step": 8491 }, { "epoch": 0.58, "learning_rate": 7.951911496412372e-06, "loss": 0.7764, "step": 8492 }, { "epoch": 0.58, "learning_rate": 7.949751076188653e-06, "loss": 0.7451, "step": 8493 }, { "epoch": 0.58, "learning_rate": 7.947590755852963e-06, "loss": 0.8379, "step": 8494 }, { "epoch": 0.58, "learning_rate": 7.945430535510547e-06, "loss": 0.8359, "step": 8495 }, { "epoch": 0.58, "learning_rate": 7.943270415266658e-06, "loss": 0.6533, "step": 8496 }, { "epoch": 0.58, "learning_rate": 7.941110395226534e-06, "loss": 0.7305, "step": 8497 }, { "epoch": 0.58, "learning_rate": 7.93895047549541e-06, "loss": 0.7686, "step": 8498 }, { "epoch": 0.58, "learning_rate": 7.936790656178522e-06, "loss": 0.8057, "step": 8499 }, { "epoch": 0.58, "learning_rate": 7.934630937381089e-06, "loss": 0.752, "step": 8500 }, { "epoch": 0.58, "learning_rate": 7.932471319208335e-06, "loss": 0.8096, "step": 8501 }, { "epoch": 0.58, "learning_rate": 7.930311801765482e-06, "loss": 0.7578, "step": 8502 }, { "epoch": 0.58, "learning_rate": 7.928152385157733e-06, "loss": 0.7266, "step": 8503 }, { "epoch": 0.58, "learning_rate": 7.925993069490303e-06, "loss": 0.8818, "step": 8504 }, { "epoch": 0.58, "learning_rate": 7.923833854868389e-06, "loss": 0.8115, "step": 8505 }, { "epoch": 0.58, "learning_rate": 7.921674741397184e-06, "loss": 0.8389, "step": 8506 }, { "epoch": 0.58, "learning_rate": 7.919515729181884e-06, "loss": 0.79, "step": 8507 }, { "epoch": 0.58, "learning_rate": 7.917356818327681e-06, "loss": 0.7695, "step": 8508 }, { "epoch": 0.58, "learning_rate": 7.915198008939748e-06, "loss": 0.749, "step": 8509 }, { "epoch": 0.58, "learning_rate": 7.913039301123271e-06, "loss": 0.8369, "step": 8510 }, { "epoch": 0.58, "learning_rate": 7.910880694983414e-06, "loss": 0.8389, "step": 8511 }, { "epoch": 0.58, "learning_rate": 7.90872219062535e-06, "loss": 0.7734, "step": 8512 }, { "epoch": 0.58, "learning_rate": 7.906563788154234e-06, "loss": 0.8105, "step": 8513 }, { "epoch": 0.58, "learning_rate": 7.904405487675232e-06, "loss": 0.8555, "step": 8514 }, { "epoch": 0.58, "learning_rate": 7.902247289293494e-06, "loss": 0.7119, "step": 8515 }, { "epoch": 0.58, "learning_rate": 7.900089193114161e-06, "loss": 0.7236, "step": 8516 }, { "epoch": 0.58, "learning_rate": 7.897931199242386e-06, "loss": 0.7725, "step": 8517 }, { "epoch": 0.58, "learning_rate": 7.895773307783297e-06, "loss": 0.7871, "step": 8518 }, { "epoch": 0.58, "learning_rate": 7.893615518842027e-06, "loss": 0.7354, "step": 8519 }, { "epoch": 0.58, "learning_rate": 7.89145783252371e-06, "loss": 0.8623, "step": 8520 }, { "epoch": 0.58, "learning_rate": 7.889300248933465e-06, "loss": 0.8291, "step": 8521 }, { "epoch": 0.58, "learning_rate": 7.887142768176409e-06, "loss": 0.7783, "step": 8522 }, { "epoch": 0.58, "learning_rate": 7.884985390357655e-06, "loss": 0.7568, "step": 8523 }, { "epoch": 0.58, "learning_rate": 7.882828115582306e-06, "loss": 0.7217, "step": 8524 }, { "epoch": 0.58, "learning_rate": 7.880670943955467e-06, "loss": 0.8047, "step": 8525 }, { "epoch": 0.58, "learning_rate": 7.878513875582242e-06, "loss": 0.8115, "step": 8526 }, { "epoch": 0.58, "learning_rate": 7.876356910567712e-06, "loss": 0.7891, "step": 8527 }, { "epoch": 0.58, "learning_rate": 7.874200049016975e-06, "loss": 0.7109, "step": 8528 }, { "epoch": 0.58, "learning_rate": 7.872043291035104e-06, "loss": 0.7559, "step": 8529 }, { "epoch": 0.58, "learning_rate": 7.869886636727183e-06, "loss": 0.8203, "step": 8530 }, { "epoch": 0.58, "learning_rate": 7.867730086198277e-06, "loss": 0.7588, "step": 8531 }, { "epoch": 0.58, "learning_rate": 7.86557363955346e-06, "loss": 0.8066, "step": 8532 }, { "epoch": 0.58, "learning_rate": 7.863417296897792e-06, "loss": 0.6982, "step": 8533 }, { "epoch": 0.58, "learning_rate": 7.861261058336327e-06, "loss": 0.6621, "step": 8534 }, { "epoch": 0.58, "learning_rate": 7.859104923974122e-06, "loss": 0.8477, "step": 8535 }, { "epoch": 0.58, "learning_rate": 7.856948893916218e-06, "loss": 0.7979, "step": 8536 }, { "epoch": 0.58, "learning_rate": 7.854792968267658e-06, "loss": 0.7871, "step": 8537 }, { "epoch": 0.58, "learning_rate": 7.852637147133482e-06, "loss": 0.7695, "step": 8538 }, { "epoch": 0.58, "learning_rate": 7.85048143061872e-06, "loss": 0.749, "step": 8539 }, { "epoch": 0.58, "learning_rate": 7.8483258188284e-06, "loss": 0.7646, "step": 8540 }, { "epoch": 0.58, "learning_rate": 7.846170311867539e-06, "loss": 0.6953, "step": 8541 }, { "epoch": 0.58, "learning_rate": 7.844014909841153e-06, "loss": 0.8018, "step": 8542 }, { "epoch": 0.58, "learning_rate": 7.841859612854255e-06, "loss": 0.8018, "step": 8543 }, { "epoch": 0.58, "learning_rate": 7.839704421011856e-06, "loss": 0.8193, "step": 8544 }, { "epoch": 0.58, "learning_rate": 7.83754933441895e-06, "loss": 0.8379, "step": 8545 }, { "epoch": 0.58, "learning_rate": 7.835394353180535e-06, "loss": 0.7607, "step": 8546 }, { "epoch": 0.58, "learning_rate": 7.833239477401601e-06, "loss": 0.7852, "step": 8547 }, { "epoch": 0.58, "learning_rate": 7.831084707187137e-06, "loss": 0.7559, "step": 8548 }, { "epoch": 0.58, "learning_rate": 7.828930042642115e-06, "loss": 0.7744, "step": 8549 }, { "epoch": 0.58, "learning_rate": 7.826775483871518e-06, "loss": 0.8701, "step": 8550 }, { "epoch": 0.58, "learning_rate": 7.824621030980313e-06, "loss": 0.7588, "step": 8551 }, { "epoch": 0.58, "learning_rate": 7.822466684073466e-06, "loss": 0.8086, "step": 8552 }, { "epoch": 0.58, "learning_rate": 7.82031244325594e-06, "loss": 0.7803, "step": 8553 }, { "epoch": 0.58, "learning_rate": 7.81815830863268e-06, "loss": 0.8018, "step": 8554 }, { "epoch": 0.58, "learning_rate": 7.816004280308637e-06, "loss": 0.7197, "step": 8555 }, { "epoch": 0.58, "learning_rate": 7.813850358388767e-06, "loss": 0.8076, "step": 8556 }, { "epoch": 0.58, "learning_rate": 7.811696542978e-06, "loss": 0.7783, "step": 8557 }, { "epoch": 0.58, "learning_rate": 7.809542834181269e-06, "loss": 0.791, "step": 8558 }, { "epoch": 0.58, "learning_rate": 7.807389232103505e-06, "loss": 0.751, "step": 8559 }, { "epoch": 0.58, "learning_rate": 7.80523573684963e-06, "loss": 0.7266, "step": 8560 }, { "epoch": 0.58, "learning_rate": 7.803082348524558e-06, "loss": 0.8174, "step": 8561 }, { "epoch": 0.58, "learning_rate": 7.800929067233214e-06, "loss": 0.7666, "step": 8562 }, { "epoch": 0.58, "learning_rate": 7.798775893080496e-06, "loss": 0.79, "step": 8563 }, { "epoch": 0.58, "learning_rate": 7.796622826171311e-06, "loss": 0.7432, "step": 8564 }, { "epoch": 0.58, "learning_rate": 7.794469866610552e-06, "loss": 0.8369, "step": 8565 }, { "epoch": 0.58, "learning_rate": 7.792317014503116e-06, "loss": 0.7354, "step": 8566 }, { "epoch": 0.58, "learning_rate": 7.790164269953883e-06, "loss": 0.8164, "step": 8567 }, { "epoch": 0.58, "learning_rate": 7.78801163306774e-06, "loss": 0.667, "step": 8568 }, { "epoch": 0.58, "learning_rate": 7.785859103949566e-06, "loss": 0.8662, "step": 8569 }, { "epoch": 0.58, "learning_rate": 7.783706682704227e-06, "loss": 0.8594, "step": 8570 }, { "epoch": 0.58, "learning_rate": 7.78155436943659e-06, "loss": 0.8018, "step": 8571 }, { "epoch": 0.58, "learning_rate": 7.779402164251516e-06, "loss": 0.6953, "step": 8572 }, { "epoch": 0.58, "learning_rate": 7.777250067253856e-06, "loss": 0.832, "step": 8573 }, { "epoch": 0.58, "learning_rate": 7.775098078548471e-06, "loss": 0.834, "step": 8574 }, { "epoch": 0.58, "learning_rate": 7.772946198240198e-06, "loss": 0.7578, "step": 8575 }, { "epoch": 0.58, "learning_rate": 7.770794426433876e-06, "loss": 0.8174, "step": 8576 }, { "epoch": 0.58, "learning_rate": 7.768642763234342e-06, "loss": 0.709, "step": 8577 }, { "epoch": 0.58, "learning_rate": 7.76649120874642e-06, "loss": 0.7949, "step": 8578 }, { "epoch": 0.58, "learning_rate": 7.76433976307494e-06, "loss": 0.7764, "step": 8579 }, { "epoch": 0.58, "learning_rate": 7.762188426324719e-06, "loss": 0.8223, "step": 8580 }, { "epoch": 0.58, "learning_rate": 7.760037198600566e-06, "loss": 0.793, "step": 8581 }, { "epoch": 0.58, "learning_rate": 7.757886080007296e-06, "loss": 0.8164, "step": 8582 }, { "epoch": 0.58, "learning_rate": 7.755735070649702e-06, "loss": 0.8379, "step": 8583 }, { "epoch": 0.58, "learning_rate": 7.753584170632586e-06, "loss": 0.7676, "step": 8584 }, { "epoch": 0.59, "learning_rate": 7.751433380060743e-06, "loss": 0.7871, "step": 8585 }, { "epoch": 0.59, "learning_rate": 7.749282699038954e-06, "loss": 0.834, "step": 8586 }, { "epoch": 0.59, "learning_rate": 7.747132127672004e-06, "loss": 0.8672, "step": 8587 }, { "epoch": 0.59, "learning_rate": 7.744981666064664e-06, "loss": 0.7637, "step": 8588 }, { "epoch": 0.59, "learning_rate": 7.74283131432171e-06, "loss": 0.751, "step": 8589 }, { "epoch": 0.59, "learning_rate": 7.740681072547901e-06, "loss": 0.7715, "step": 8590 }, { "epoch": 0.59, "learning_rate": 7.738530940848002e-06, "loss": 0.8672, "step": 8591 }, { "epoch": 0.59, "learning_rate": 7.736380919326765e-06, "loss": 0.7441, "step": 8592 }, { "epoch": 0.59, "learning_rate": 7.734231008088942e-06, "loss": 0.7646, "step": 8593 }, { "epoch": 0.59, "learning_rate": 7.73208120723927e-06, "loss": 0.7354, "step": 8594 }, { "epoch": 0.59, "learning_rate": 7.729931516882495e-06, "loss": 0.7734, "step": 8595 }, { "epoch": 0.59, "learning_rate": 7.72778193712334e-06, "loss": 0.8174, "step": 8596 }, { "epoch": 0.59, "learning_rate": 7.725632468066541e-06, "loss": 0.7314, "step": 8597 }, { "epoch": 0.59, "learning_rate": 7.723483109816819e-06, "loss": 0.7725, "step": 8598 }, { "epoch": 0.59, "learning_rate": 7.721333862478886e-06, "loss": 0.8018, "step": 8599 }, { "epoch": 0.59, "learning_rate": 7.71918472615746e-06, "loss": 0.8037, "step": 8600 }, { "epoch": 0.59, "learning_rate": 7.71703570095724e-06, "loss": 0.7998, "step": 8601 }, { "epoch": 0.59, "learning_rate": 7.714886786982927e-06, "loss": 0.7998, "step": 8602 }, { "epoch": 0.59, "learning_rate": 7.712737984339222e-06, "loss": 0.8203, "step": 8603 }, { "epoch": 0.59, "learning_rate": 7.710589293130809e-06, "loss": 0.8027, "step": 8604 }, { "epoch": 0.59, "learning_rate": 7.708440713462377e-06, "loss": 0.7803, "step": 8605 }, { "epoch": 0.59, "learning_rate": 7.706292245438599e-06, "loss": 0.7715, "step": 8606 }, { "epoch": 0.59, "learning_rate": 7.704143889164153e-06, "loss": 0.8945, "step": 8607 }, { "epoch": 0.59, "learning_rate": 7.7019956447437e-06, "loss": 0.8135, "step": 8608 }, { "epoch": 0.59, "learning_rate": 7.69984751228191e-06, "loss": 0.7969, "step": 8609 }, { "epoch": 0.59, "learning_rate": 7.697699491883438e-06, "loss": 0.7695, "step": 8610 }, { "epoch": 0.59, "learning_rate": 7.695551583652935e-06, "loss": 0.8262, "step": 8611 }, { "epoch": 0.59, "learning_rate": 7.693403787695047e-06, "loss": 0.7373, "step": 8612 }, { "epoch": 0.59, "learning_rate": 7.691256104114413e-06, "loss": 0.7451, "step": 8613 }, { "epoch": 0.59, "learning_rate": 7.689108533015666e-06, "loss": 0.792, "step": 8614 }, { "epoch": 0.59, "learning_rate": 7.68696107450344e-06, "loss": 0.7734, "step": 8615 }, { "epoch": 0.59, "learning_rate": 7.68481372868236e-06, "loss": 0.8213, "step": 8616 }, { "epoch": 0.59, "learning_rate": 7.68266649565704e-06, "loss": 0.7891, "step": 8617 }, { "epoch": 0.59, "learning_rate": 7.680519375532099e-06, "loss": 0.8154, "step": 8618 }, { "epoch": 0.59, "learning_rate": 7.678372368412136e-06, "loss": 0.7686, "step": 8619 }, { "epoch": 0.59, "learning_rate": 7.676225474401759e-06, "loss": 0.8125, "step": 8620 }, { "epoch": 0.59, "learning_rate": 7.674078693605566e-06, "loss": 0.7568, "step": 8621 }, { "epoch": 0.59, "learning_rate": 7.671932026128143e-06, "loss": 0.8623, "step": 8622 }, { "epoch": 0.59, "learning_rate": 7.66978547207408e-06, "loss": 0.8525, "step": 8623 }, { "epoch": 0.59, "learning_rate": 7.667639031547955e-06, "loss": 0.8027, "step": 8624 }, { "epoch": 0.59, "learning_rate": 7.665492704654343e-06, "loss": 0.8057, "step": 8625 }, { "epoch": 0.59, "learning_rate": 7.663346491497809e-06, "loss": 0.6963, "step": 8626 }, { "epoch": 0.59, "learning_rate": 7.661200392182925e-06, "loss": 0.791, "step": 8627 }, { "epoch": 0.59, "learning_rate": 7.659054406814241e-06, "loss": 0.7861, "step": 8628 }, { "epoch": 0.59, "learning_rate": 7.656908535496314e-06, "loss": 0.8477, "step": 8629 }, { "epoch": 0.59, "learning_rate": 7.654762778333687e-06, "loss": 0.666, "step": 8630 }, { "epoch": 0.59, "learning_rate": 7.652617135430905e-06, "loss": 0.8037, "step": 8631 }, { "epoch": 0.59, "learning_rate": 7.650471606892498e-06, "loss": 0.7861, "step": 8632 }, { "epoch": 0.59, "learning_rate": 7.648326192823002e-06, "loss": 0.8164, "step": 8633 }, { "epoch": 0.59, "learning_rate": 7.64618089332694e-06, "loss": 0.7158, "step": 8634 }, { "epoch": 0.59, "learning_rate": 7.644035708508829e-06, "loss": 0.8301, "step": 8635 }, { "epoch": 0.59, "learning_rate": 7.641890638473186e-06, "loss": 0.7261, "step": 8636 }, { "epoch": 0.59, "learning_rate": 7.639745683324513e-06, "loss": 0.7842, "step": 8637 }, { "epoch": 0.59, "learning_rate": 7.637600843167314e-06, "loss": 0.7871, "step": 8638 }, { "epoch": 0.59, "learning_rate": 7.635456118106091e-06, "loss": 0.8057, "step": 8639 }, { "epoch": 0.59, "learning_rate": 7.633311508245327e-06, "loss": 0.6904, "step": 8640 }, { "epoch": 0.59, "learning_rate": 7.631167013689513e-06, "loss": 0.8105, "step": 8641 }, { "epoch": 0.59, "learning_rate": 7.629022634543126e-06, "loss": 0.7822, "step": 8642 }, { "epoch": 0.59, "learning_rate": 7.626878370910642e-06, "loss": 0.749, "step": 8643 }, { "epoch": 0.59, "learning_rate": 7.624734222896524e-06, "loss": 0.8408, "step": 8644 }, { "epoch": 0.59, "learning_rate": 7.622590190605242e-06, "loss": 0.8291, "step": 8645 }, { "epoch": 0.59, "learning_rate": 7.62044627414125e-06, "loss": 0.7842, "step": 8646 }, { "epoch": 0.59, "learning_rate": 7.618302473609001e-06, "loss": 0.7871, "step": 8647 }, { "epoch": 0.59, "learning_rate": 7.616158789112935e-06, "loss": 0.8027, "step": 8648 }, { "epoch": 0.59, "learning_rate": 7.6140152207575e-06, "loss": 0.7842, "step": 8649 }, { "epoch": 0.59, "learning_rate": 7.611871768647123e-06, "loss": 0.7988, "step": 8650 }, { "epoch": 0.59, "learning_rate": 7.609728432886241e-06, "loss": 0.8174, "step": 8651 }, { "epoch": 0.59, "learning_rate": 7.6075852135792725e-06, "loss": 0.75, "step": 8652 }, { "epoch": 0.59, "learning_rate": 7.605442110830634e-06, "loss": 0.8037, "step": 8653 }, { "epoch": 0.59, "learning_rate": 7.603299124744743e-06, "loss": 0.7393, "step": 8654 }, { "epoch": 0.59, "learning_rate": 7.601156255425999e-06, "loss": 0.7725, "step": 8655 }, { "epoch": 0.59, "learning_rate": 7.599013502978801e-06, "loss": 0.7324, "step": 8656 }, { "epoch": 0.59, "learning_rate": 7.596870867507554e-06, "loss": 0.8018, "step": 8657 }, { "epoch": 0.59, "learning_rate": 7.59472834911664e-06, "loss": 0.8906, "step": 8658 }, { "epoch": 0.59, "learning_rate": 7.592585947910444e-06, "loss": 0.8262, "step": 8659 }, { "epoch": 0.59, "learning_rate": 7.590443663993342e-06, "loss": 0.7402, "step": 8660 }, { "epoch": 0.59, "learning_rate": 7.588301497469709e-06, "loss": 0.7715, "step": 8661 }, { "epoch": 0.59, "learning_rate": 7.586159448443905e-06, "loss": 0.7676, "step": 8662 }, { "epoch": 0.59, "learning_rate": 7.584017517020299e-06, "loss": 0.7783, "step": 8663 }, { "epoch": 0.59, "learning_rate": 7.581875703303241e-06, "loss": 0.7529, "step": 8664 }, { "epoch": 0.59, "learning_rate": 7.579734007397081e-06, "loss": 0.8105, "step": 8665 }, { "epoch": 0.59, "learning_rate": 7.577592429406161e-06, "loss": 0.79, "step": 8666 }, { "epoch": 0.59, "learning_rate": 7.575450969434822e-06, "loss": 0.8164, "step": 8667 }, { "epoch": 0.59, "learning_rate": 7.573309627587389e-06, "loss": 0.8184, "step": 8668 }, { "epoch": 0.59, "learning_rate": 7.5711684039681945e-06, "loss": 0.792, "step": 8669 }, { "epoch": 0.59, "learning_rate": 7.5690272986815596e-06, "loss": 0.7852, "step": 8670 }, { "epoch": 0.59, "learning_rate": 7.5668863118317935e-06, "loss": 0.6973, "step": 8671 }, { "epoch": 0.59, "learning_rate": 7.56474544352321e-06, "loss": 0.7773, "step": 8672 }, { "epoch": 0.59, "learning_rate": 7.562604693860107e-06, "loss": 0.7139, "step": 8673 }, { "epoch": 0.59, "learning_rate": 7.560464062946784e-06, "loss": 0.7002, "step": 8674 }, { "epoch": 0.59, "learning_rate": 7.558323550887537e-06, "loss": 0.8154, "step": 8675 }, { "epoch": 0.59, "learning_rate": 7.556183157786643e-06, "loss": 0.7725, "step": 8676 }, { "epoch": 0.59, "learning_rate": 7.554042883748391e-06, "loss": 0.75, "step": 8677 }, { "epoch": 0.59, "learning_rate": 7.551902728877049e-06, "loss": 0.7744, "step": 8678 }, { "epoch": 0.59, "learning_rate": 7.549762693276884e-06, "loss": 0.8008, "step": 8679 }, { "epoch": 0.59, "learning_rate": 7.547622777052161e-06, "loss": 0.8115, "step": 8680 }, { "epoch": 0.59, "learning_rate": 7.54548298030714e-06, "loss": 0.6963, "step": 8681 }, { "epoch": 0.59, "learning_rate": 7.543343303146066e-06, "loss": 0.7812, "step": 8682 }, { "epoch": 0.59, "learning_rate": 7.541203745673189e-06, "loss": 0.7803, "step": 8683 }, { "epoch": 0.59, "learning_rate": 7.539064307992743e-06, "loss": 0.834, "step": 8684 }, { "epoch": 0.59, "learning_rate": 7.536924990208966e-06, "loss": 0.7686, "step": 8685 }, { "epoch": 0.59, "learning_rate": 7.534785792426079e-06, "loss": 0.7578, "step": 8686 }, { "epoch": 0.59, "learning_rate": 7.532646714748311e-06, "loss": 0.7812, "step": 8687 }, { "epoch": 0.59, "learning_rate": 7.530507757279877e-06, "loss": 0.8135, "step": 8688 }, { "epoch": 0.59, "learning_rate": 7.528368920124981e-06, "loss": 0.7676, "step": 8689 }, { "epoch": 0.59, "learning_rate": 7.526230203387834e-06, "loss": 0.7891, "step": 8690 }, { "epoch": 0.59, "learning_rate": 7.524091607172629e-06, "loss": 0.79, "step": 8691 }, { "epoch": 0.59, "learning_rate": 7.521953131583557e-06, "loss": 0.8486, "step": 8692 }, { "epoch": 0.59, "learning_rate": 7.519814776724812e-06, "loss": 0.8828, "step": 8693 }, { "epoch": 0.59, "learning_rate": 7.517676542700568e-06, "loss": 0.8301, "step": 8694 }, { "epoch": 0.59, "learning_rate": 7.515538429615005e-06, "loss": 0.8223, "step": 8695 }, { "epoch": 0.59, "learning_rate": 7.513400437572288e-06, "loss": 0.7588, "step": 8696 }, { "epoch": 0.59, "learning_rate": 7.511262566676574e-06, "loss": 0.8301, "step": 8697 }, { "epoch": 0.59, "learning_rate": 7.509124817032032e-06, "loss": 0.709, "step": 8698 }, { "epoch": 0.59, "learning_rate": 7.506987188742808e-06, "loss": 0.7676, "step": 8699 }, { "epoch": 0.59, "learning_rate": 7.504849681913045e-06, "loss": 0.752, "step": 8700 }, { "epoch": 0.59, "learning_rate": 7.502712296646885e-06, "loss": 0.7578, "step": 8701 }, { "epoch": 0.59, "learning_rate": 7.500575033048458e-06, "loss": 0.8809, "step": 8702 }, { "epoch": 0.59, "learning_rate": 7.4984378912218925e-06, "loss": 0.751, "step": 8703 }, { "epoch": 0.59, "learning_rate": 7.496300871271314e-06, "loss": 0.7021, "step": 8704 }, { "epoch": 0.59, "learning_rate": 7.494163973300835e-06, "loss": 0.749, "step": 8705 }, { "epoch": 0.59, "learning_rate": 7.492027197414564e-06, "loss": 0.7754, "step": 8706 }, { "epoch": 0.59, "learning_rate": 7.4898905437166044e-06, "loss": 0.7461, "step": 8707 }, { "epoch": 0.59, "learning_rate": 7.487754012311058e-06, "loss": 0.8018, "step": 8708 }, { "epoch": 0.59, "learning_rate": 7.485617603302009e-06, "loss": 0.7773, "step": 8709 }, { "epoch": 0.59, "learning_rate": 7.4834813167935504e-06, "loss": 0.7607, "step": 8710 }, { "epoch": 0.59, "learning_rate": 7.481345152889761e-06, "loss": 0.7666, "step": 8711 }, { "epoch": 0.59, "learning_rate": 7.479209111694712e-06, "loss": 0.8271, "step": 8712 }, { "epoch": 0.59, "learning_rate": 7.477073193312472e-06, "loss": 0.8662, "step": 8713 }, { "epoch": 0.59, "learning_rate": 7.474937397847104e-06, "loss": 0.7705, "step": 8714 }, { "epoch": 0.59, "learning_rate": 7.472801725402658e-06, "loss": 0.6758, "step": 8715 }, { "epoch": 0.59, "learning_rate": 7.470666176083193e-06, "loss": 0.8467, "step": 8716 }, { "epoch": 0.59, "learning_rate": 7.468530749992748e-06, "loss": 0.8447, "step": 8717 }, { "epoch": 0.59, "learning_rate": 7.466395447235362e-06, "loss": 0.8418, "step": 8718 }, { "epoch": 0.59, "learning_rate": 7.4642602679150664e-06, "loss": 0.8193, "step": 8719 }, { "epoch": 0.59, "learning_rate": 7.462125212135884e-06, "loss": 0.7715, "step": 8720 }, { "epoch": 0.59, "learning_rate": 7.459990280001837e-06, "loss": 0.7881, "step": 8721 }, { "epoch": 0.59, "learning_rate": 7.457855471616943e-06, "loss": 0.8604, "step": 8722 }, { "epoch": 0.59, "learning_rate": 7.455720787085205e-06, "loss": 0.8096, "step": 8723 }, { "epoch": 0.59, "learning_rate": 7.4535862265106295e-06, "loss": 0.7705, "step": 8724 }, { "epoch": 0.59, "learning_rate": 7.451451789997206e-06, "loss": 0.8359, "step": 8725 }, { "epoch": 0.59, "learning_rate": 7.449317477648928e-06, "loss": 0.8467, "step": 8726 }, { "epoch": 0.59, "learning_rate": 7.447183289569775e-06, "loss": 0.7715, "step": 8727 }, { "epoch": 0.59, "learning_rate": 7.445049225863729e-06, "loss": 0.7598, "step": 8728 }, { "epoch": 0.59, "learning_rate": 7.442915286634762e-06, "loss": 0.8359, "step": 8729 }, { "epoch": 0.59, "learning_rate": 7.440781471986835e-06, "loss": 0.8467, "step": 8730 }, { "epoch": 0.59, "learning_rate": 7.4386477820239136e-06, "loss": 0.835, "step": 8731 }, { "epoch": 0.6, "learning_rate": 7.436514216849947e-06, "loss": 0.8037, "step": 8732 }, { "epoch": 0.6, "learning_rate": 7.434380776568878e-06, "loss": 0.8271, "step": 8733 }, { "epoch": 0.6, "learning_rate": 7.432247461284654e-06, "loss": 0.8252, "step": 8734 }, { "epoch": 0.6, "learning_rate": 7.430114271101212e-06, "loss": 0.7871, "step": 8735 }, { "epoch": 0.6, "learning_rate": 7.427981206122475e-06, "loss": 0.7656, "step": 8736 }, { "epoch": 0.6, "learning_rate": 7.425848266452369e-06, "loss": 0.7803, "step": 8737 }, { "epoch": 0.6, "learning_rate": 7.423715452194809e-06, "loss": 0.7354, "step": 8738 }, { "epoch": 0.6, "learning_rate": 7.421582763453704e-06, "loss": 0.7344, "step": 8739 }, { "epoch": 0.6, "learning_rate": 7.419450200332965e-06, "loss": 0.7363, "step": 8740 }, { "epoch": 0.6, "learning_rate": 7.417317762936485e-06, "loss": 0.7646, "step": 8741 }, { "epoch": 0.6, "learning_rate": 7.415185451368159e-06, "loss": 0.7812, "step": 8742 }, { "epoch": 0.6, "learning_rate": 7.413053265731871e-06, "loss": 0.8037, "step": 8743 }, { "epoch": 0.6, "learning_rate": 7.410921206131502e-06, "loss": 0.7988, "step": 8744 }, { "epoch": 0.6, "learning_rate": 7.408789272670922e-06, "loss": 0.7822, "step": 8745 }, { "epoch": 0.6, "learning_rate": 7.406657465454005e-06, "loss": 0.7607, "step": 8746 }, { "epoch": 0.6, "learning_rate": 7.404525784584611e-06, "loss": 0.8105, "step": 8747 }, { "epoch": 0.6, "learning_rate": 7.402394230166595e-06, "loss": 0.8232, "step": 8748 }, { "epoch": 0.6, "learning_rate": 7.400262802303803e-06, "loss": 0.7559, "step": 8749 }, { "epoch": 0.6, "learning_rate": 7.398131501100083e-06, "loss": 0.8789, "step": 8750 }, { "epoch": 0.6, "learning_rate": 7.396000326659265e-06, "loss": 0.8066, "step": 8751 }, { "epoch": 0.6, "learning_rate": 7.393869279085187e-06, "loss": 0.7441, "step": 8752 }, { "epoch": 0.6, "learning_rate": 7.391738358481671e-06, "loss": 0.8271, "step": 8753 }, { "epoch": 0.6, "learning_rate": 7.389607564952534e-06, "loss": 0.7607, "step": 8754 }, { "epoch": 0.6, "learning_rate": 7.38747689860159e-06, "loss": 0.752, "step": 8755 }, { "epoch": 0.6, "learning_rate": 7.3853463595326435e-06, "loss": 0.7393, "step": 8756 }, { "epoch": 0.6, "learning_rate": 7.383215947849491e-06, "loss": 0.7734, "step": 8757 }, { "epoch": 0.6, "learning_rate": 7.381085663655936e-06, "loss": 0.8203, "step": 8758 }, { "epoch": 0.6, "learning_rate": 7.3789555070557564e-06, "loss": 0.8223, "step": 8759 }, { "epoch": 0.6, "learning_rate": 7.376825478152739e-06, "loss": 0.7285, "step": 8760 }, { "epoch": 0.6, "learning_rate": 7.3746955770506545e-06, "loss": 0.749, "step": 8761 }, { "epoch": 0.6, "learning_rate": 7.372565803853276e-06, "loss": 0.7715, "step": 8762 }, { "epoch": 0.6, "learning_rate": 7.370436158664358e-06, "loss": 0.7109, "step": 8763 }, { "epoch": 0.6, "learning_rate": 7.368306641587666e-06, "loss": 0.7705, "step": 8764 }, { "epoch": 0.6, "learning_rate": 7.366177252726947e-06, "loss": 0.7871, "step": 8765 }, { "epoch": 0.6, "learning_rate": 7.364047992185945e-06, "loss": 0.7793, "step": 8766 }, { "epoch": 0.6, "learning_rate": 7.361918860068392e-06, "loss": 0.8477, "step": 8767 }, { "epoch": 0.6, "learning_rate": 7.359789856478027e-06, "loss": 0.7334, "step": 8768 }, { "epoch": 0.6, "learning_rate": 7.357660981518566e-06, "loss": 0.7344, "step": 8769 }, { "epoch": 0.6, "learning_rate": 7.355532235293736e-06, "loss": 0.7793, "step": 8770 }, { "epoch": 0.6, "learning_rate": 7.35340361790725e-06, "loss": 0.6973, "step": 8771 }, { "epoch": 0.6, "learning_rate": 7.351275129462807e-06, "loss": 0.8193, "step": 8772 }, { "epoch": 0.6, "learning_rate": 7.3491467700641125e-06, "loss": 0.7627, "step": 8773 }, { "epoch": 0.6, "learning_rate": 7.347018539814857e-06, "loss": 0.7227, "step": 8774 }, { "epoch": 0.6, "learning_rate": 7.344890438818727e-06, "loss": 0.8154, "step": 8775 }, { "epoch": 0.6, "learning_rate": 7.342762467179408e-06, "loss": 0.792, "step": 8776 }, { "epoch": 0.6, "learning_rate": 7.340634625000571e-06, "loss": 0.7373, "step": 8777 }, { "epoch": 0.6, "learning_rate": 7.338506912385888e-06, "loss": 0.8721, "step": 8778 }, { "epoch": 0.6, "learning_rate": 7.336379329439015e-06, "loss": 0.7959, "step": 8779 }, { "epoch": 0.6, "learning_rate": 7.334251876263614e-06, "loss": 0.7881, "step": 8780 }, { "epoch": 0.6, "learning_rate": 7.332124552963327e-06, "loss": 0.7979, "step": 8781 }, { "epoch": 0.6, "learning_rate": 7.329997359641805e-06, "loss": 0.8281, "step": 8782 }, { "epoch": 0.6, "learning_rate": 7.327870296402682e-06, "loss": 0.7432, "step": 8783 }, { "epoch": 0.6, "learning_rate": 7.325743363349589e-06, "loss": 0.7773, "step": 8784 }, { "epoch": 0.6, "learning_rate": 7.3236165605861455e-06, "loss": 0.8184, "step": 8785 }, { "epoch": 0.6, "learning_rate": 7.3214898882159755e-06, "loss": 0.7627, "step": 8786 }, { "epoch": 0.6, "learning_rate": 7.319363346342683e-06, "loss": 0.8027, "step": 8787 }, { "epoch": 0.6, "learning_rate": 7.31723693506988e-06, "loss": 0.6689, "step": 8788 }, { "epoch": 0.6, "learning_rate": 7.315110654501165e-06, "loss": 0.7842, "step": 8789 }, { "epoch": 0.6, "learning_rate": 7.312984504740126e-06, "loss": 0.7451, "step": 8790 }, { "epoch": 0.6, "learning_rate": 7.310858485890352e-06, "loss": 0.8047, "step": 8791 }, { "epoch": 0.6, "learning_rate": 7.30873259805542e-06, "loss": 0.8115, "step": 8792 }, { "epoch": 0.6, "learning_rate": 7.306606841338902e-06, "loss": 0.8018, "step": 8793 }, { "epoch": 0.6, "learning_rate": 7.304481215844373e-06, "loss": 0.7939, "step": 8794 }, { "epoch": 0.6, "learning_rate": 7.302355721675384e-06, "loss": 0.7891, "step": 8795 }, { "epoch": 0.6, "learning_rate": 7.300230358935495e-06, "loss": 0.7959, "step": 8796 }, { "epoch": 0.6, "learning_rate": 7.29810512772825e-06, "loss": 0.7969, "step": 8797 }, { "epoch": 0.6, "learning_rate": 7.2959800281571925e-06, "loss": 0.7852, "step": 8798 }, { "epoch": 0.6, "learning_rate": 7.2938550603258525e-06, "loss": 0.8271, "step": 8799 }, { "epoch": 0.6, "learning_rate": 7.291730224337764e-06, "loss": 0.8174, "step": 8800 }, { "epoch": 0.6, "learning_rate": 7.28960552029645e-06, "loss": 0.7432, "step": 8801 }, { "epoch": 0.6, "learning_rate": 7.287480948305421e-06, "loss": 0.7822, "step": 8802 }, { "epoch": 0.6, "learning_rate": 7.285356508468186e-06, "loss": 0.7686, "step": 8803 }, { "epoch": 0.6, "learning_rate": 7.283232200888253e-06, "loss": 0.8115, "step": 8804 }, { "epoch": 0.6, "learning_rate": 7.2811080256691105e-06, "loss": 0.8086, "step": 8805 }, { "epoch": 0.6, "learning_rate": 7.278983982914254e-06, "loss": 0.7754, "step": 8806 }, { "epoch": 0.6, "learning_rate": 7.2768600727271665e-06, "loss": 0.7822, "step": 8807 }, { "epoch": 0.6, "learning_rate": 7.274736295211322e-06, "loss": 0.7246, "step": 8808 }, { "epoch": 0.6, "learning_rate": 7.272612650470194e-06, "loss": 0.75, "step": 8809 }, { "epoch": 0.6, "learning_rate": 7.270489138607244e-06, "loss": 0.751, "step": 8810 }, { "epoch": 0.6, "learning_rate": 7.2683657597259264e-06, "loss": 0.7861, "step": 8811 }, { "epoch": 0.6, "learning_rate": 7.2662425139297e-06, "loss": 0.8291, "step": 8812 }, { "epoch": 0.6, "learning_rate": 7.264119401322004e-06, "loss": 0.8828, "step": 8813 }, { "epoch": 0.6, "learning_rate": 7.261996422006279e-06, "loss": 0.7676, "step": 8814 }, { "epoch": 0.6, "learning_rate": 7.259873576085951e-06, "loss": 0.7627, "step": 8815 }, { "epoch": 0.6, "learning_rate": 7.25775086366445e-06, "loss": 0.7842, "step": 8816 }, { "epoch": 0.6, "learning_rate": 7.255628284845195e-06, "loss": 0.7754, "step": 8817 }, { "epoch": 0.6, "learning_rate": 7.253505839731596e-06, "loss": 0.7109, "step": 8818 }, { "epoch": 0.6, "learning_rate": 7.251383528427058e-06, "loss": 0.7803, "step": 8819 }, { "epoch": 0.6, "learning_rate": 7.249261351034982e-06, "loss": 0.7432, "step": 8820 }, { "epoch": 0.6, "learning_rate": 7.247139307658756e-06, "loss": 0.8115, "step": 8821 }, { "epoch": 0.6, "learning_rate": 7.245017398401767e-06, "loss": 0.7129, "step": 8822 }, { "epoch": 0.6, "learning_rate": 7.242895623367401e-06, "loss": 0.8203, "step": 8823 }, { "epoch": 0.6, "learning_rate": 7.240773982659022e-06, "loss": 0.7988, "step": 8824 }, { "epoch": 0.6, "learning_rate": 7.238652476380003e-06, "loss": 0.7871, "step": 8825 }, { "epoch": 0.6, "learning_rate": 7.236531104633699e-06, "loss": 0.8281, "step": 8826 }, { "epoch": 0.6, "learning_rate": 7.234409867523466e-06, "loss": 0.7568, "step": 8827 }, { "epoch": 0.6, "learning_rate": 7.232288765152646e-06, "loss": 0.7461, "step": 8828 }, { "epoch": 0.6, "learning_rate": 7.230167797624583e-06, "loss": 0.7402, "step": 8829 }, { "epoch": 0.6, "learning_rate": 7.228046965042614e-06, "loss": 0.8613, "step": 8830 }, { "epoch": 0.6, "learning_rate": 7.22592626751006e-06, "loss": 0.7969, "step": 8831 }, { "epoch": 0.6, "learning_rate": 7.223805705130242e-06, "loss": 0.7725, "step": 8832 }, { "epoch": 0.6, "learning_rate": 7.221685278006474e-06, "loss": 0.8389, "step": 8833 }, { "epoch": 0.6, "learning_rate": 7.219564986242063e-06, "loss": 0.748, "step": 8834 }, { "epoch": 0.6, "learning_rate": 7.217444829940313e-06, "loss": 0.8184, "step": 8835 }, { "epoch": 0.6, "learning_rate": 7.215324809204516e-06, "loss": 0.7588, "step": 8836 }, { "epoch": 0.6, "learning_rate": 7.213204924137956e-06, "loss": 0.7461, "step": 8837 }, { "epoch": 0.6, "learning_rate": 7.2110851748439185e-06, "loss": 0.6943, "step": 8838 }, { "epoch": 0.6, "learning_rate": 7.208965561425673e-06, "loss": 0.7529, "step": 8839 }, { "epoch": 0.6, "learning_rate": 7.206846083986487e-06, "loss": 0.7451, "step": 8840 }, { "epoch": 0.6, "learning_rate": 7.204726742629627e-06, "loss": 0.8711, "step": 8841 }, { "epoch": 0.6, "learning_rate": 7.202607537458344e-06, "loss": 0.7695, "step": 8842 }, { "epoch": 0.6, "learning_rate": 7.200488468575886e-06, "loss": 0.876, "step": 8843 }, { "epoch": 0.6, "learning_rate": 7.19836953608549e-06, "loss": 0.8281, "step": 8844 }, { "epoch": 0.6, "learning_rate": 7.196250740090398e-06, "loss": 0.7793, "step": 8845 }, { "epoch": 0.6, "learning_rate": 7.194132080693827e-06, "loss": 0.8096, "step": 8846 }, { "epoch": 0.6, "learning_rate": 7.192013557999007e-06, "loss": 0.8369, "step": 8847 }, { "epoch": 0.6, "learning_rate": 7.189895172109152e-06, "loss": 0.7832, "step": 8848 }, { "epoch": 0.6, "learning_rate": 7.187776923127465e-06, "loss": 0.8184, "step": 8849 }, { "epoch": 0.6, "learning_rate": 7.185658811157151e-06, "loss": 0.8594, "step": 8850 }, { "epoch": 0.6, "learning_rate": 7.183540836301402e-06, "loss": 0.7402, "step": 8851 }, { "epoch": 0.6, "learning_rate": 7.181422998663401e-06, "loss": 0.7559, "step": 8852 }, { "epoch": 0.6, "learning_rate": 7.17930529834634e-06, "loss": 0.8076, "step": 8853 }, { "epoch": 0.6, "learning_rate": 7.177187735453388e-06, "loss": 0.7607, "step": 8854 }, { "epoch": 0.6, "learning_rate": 7.175070310087709e-06, "loss": 0.749, "step": 8855 }, { "epoch": 0.6, "learning_rate": 7.172953022352468e-06, "loss": 0.7568, "step": 8856 }, { "epoch": 0.6, "learning_rate": 7.170835872350816e-06, "loss": 0.7812, "step": 8857 }, { "epoch": 0.6, "learning_rate": 7.168718860185902e-06, "loss": 0.8955, "step": 8858 }, { "epoch": 0.6, "learning_rate": 7.166601985960869e-06, "loss": 0.8154, "step": 8859 }, { "epoch": 0.6, "learning_rate": 7.164485249778848e-06, "loss": 0.835, "step": 8860 }, { "epoch": 0.6, "learning_rate": 7.16236865174297e-06, "loss": 0.7676, "step": 8861 }, { "epoch": 0.6, "learning_rate": 7.160252191956349e-06, "loss": 0.7822, "step": 8862 }, { "epoch": 0.6, "learning_rate": 7.158135870522107e-06, "loss": 0.7549, "step": 8863 }, { "epoch": 0.6, "learning_rate": 7.156019687543342e-06, "loss": 0.7969, "step": 8864 }, { "epoch": 0.6, "learning_rate": 7.153903643123161e-06, "loss": 0.7852, "step": 8865 }, { "epoch": 0.6, "learning_rate": 7.151787737364657e-06, "loss": 0.8105, "step": 8866 }, { "epoch": 0.6, "learning_rate": 7.149671970370915e-06, "loss": 0.8545, "step": 8867 }, { "epoch": 0.6, "learning_rate": 7.147556342245016e-06, "loss": 0.7939, "step": 8868 }, { "epoch": 0.6, "learning_rate": 7.145440853090033e-06, "loss": 0.8037, "step": 8869 }, { "epoch": 0.6, "learning_rate": 7.143325503009027e-06, "loss": 0.835, "step": 8870 }, { "epoch": 0.6, "learning_rate": 7.141210292105069e-06, "loss": 0.71, "step": 8871 }, { "epoch": 0.6, "learning_rate": 7.139095220481207e-06, "loss": 0.8301, "step": 8872 }, { "epoch": 0.6, "learning_rate": 7.136980288240485e-06, "loss": 0.7812, "step": 8873 }, { "epoch": 0.6, "learning_rate": 7.1348654954859444e-06, "loss": 0.6895, "step": 8874 }, { "epoch": 0.6, "learning_rate": 7.1327508423206146e-06, "loss": 0.7773, "step": 8875 }, { "epoch": 0.6, "learning_rate": 7.130636328847522e-06, "loss": 0.8506, "step": 8876 }, { "epoch": 0.6, "learning_rate": 7.128521955169693e-06, "loss": 0.7295, "step": 8877 }, { "epoch": 0.61, "learning_rate": 7.126407721390132e-06, "loss": 0.7998, "step": 8878 }, { "epoch": 0.61, "learning_rate": 7.124293627611847e-06, "loss": 0.7148, "step": 8879 }, { "epoch": 0.61, "learning_rate": 7.122179673937835e-06, "loss": 0.71, "step": 8880 }, { "epoch": 0.61, "learning_rate": 7.120065860471093e-06, "loss": 0.7227, "step": 8881 }, { "epoch": 0.61, "learning_rate": 7.117952187314595e-06, "loss": 0.8037, "step": 8882 }, { "epoch": 0.61, "learning_rate": 7.11583865457133e-06, "loss": 0.7246, "step": 8883 }, { "epoch": 0.61, "learning_rate": 7.113725262344265e-06, "loss": 0.8281, "step": 8884 }, { "epoch": 0.61, "learning_rate": 7.111612010736364e-06, "loss": 0.7871, "step": 8885 }, { "epoch": 0.61, "learning_rate": 7.109498899850587e-06, "loss": 0.8477, "step": 8886 }, { "epoch": 0.61, "learning_rate": 7.107385929789882e-06, "loss": 0.7637, "step": 8887 }, { "epoch": 0.61, "learning_rate": 7.105273100657188e-06, "loss": 0.7998, "step": 8888 }, { "epoch": 0.61, "learning_rate": 7.103160412555452e-06, "loss": 0.7334, "step": 8889 }, { "epoch": 0.61, "learning_rate": 7.1010478655876e-06, "loss": 0.8037, "step": 8890 }, { "epoch": 0.61, "learning_rate": 7.098935459856553e-06, "loss": 0.8525, "step": 8891 }, { "epoch": 0.61, "learning_rate": 7.096823195465232e-06, "loss": 0.8145, "step": 8892 }, { "epoch": 0.61, "learning_rate": 7.0947110725165405e-06, "loss": 0.7549, "step": 8893 }, { "epoch": 0.61, "learning_rate": 7.092599091113381e-06, "loss": 0.7559, "step": 8894 }, { "epoch": 0.61, "learning_rate": 7.090487251358656e-06, "loss": 0.7588, "step": 8895 }, { "epoch": 0.61, "learning_rate": 7.088375553355249e-06, "loss": 0.7168, "step": 8896 }, { "epoch": 0.61, "learning_rate": 7.086263997206046e-06, "loss": 0.8096, "step": 8897 }, { "epoch": 0.61, "learning_rate": 7.0841525830139146e-06, "loss": 0.8477, "step": 8898 }, { "epoch": 0.61, "learning_rate": 7.082041310881731e-06, "loss": 0.7402, "step": 8899 }, { "epoch": 0.61, "learning_rate": 7.079930180912348e-06, "loss": 0.7852, "step": 8900 }, { "epoch": 0.61, "learning_rate": 7.077819193208626e-06, "loss": 0.7979, "step": 8901 }, { "epoch": 0.61, "learning_rate": 7.075708347873413e-06, "loss": 0.7852, "step": 8902 }, { "epoch": 0.61, "learning_rate": 7.073597645009544e-06, "loss": 0.7295, "step": 8903 }, { "epoch": 0.61, "learning_rate": 7.071487084719857e-06, "loss": 0.8027, "step": 8904 }, { "epoch": 0.61, "learning_rate": 7.069376667107177e-06, "loss": 0.7256, "step": 8905 }, { "epoch": 0.61, "learning_rate": 7.067266392274318e-06, "loss": 0.8066, "step": 8906 }, { "epoch": 0.61, "learning_rate": 7.0651562603241e-06, "loss": 0.7812, "step": 8907 }, { "epoch": 0.61, "learning_rate": 7.063046271359327e-06, "loss": 0.8193, "step": 8908 }, { "epoch": 0.61, "learning_rate": 7.060936425482796e-06, "loss": 0.8105, "step": 8909 }, { "epoch": 0.61, "learning_rate": 7.0588267227973e-06, "loss": 0.79, "step": 8910 }, { "epoch": 0.61, "learning_rate": 7.05671716340562e-06, "loss": 0.7236, "step": 8911 }, { "epoch": 0.61, "learning_rate": 7.054607747410535e-06, "loss": 0.7344, "step": 8912 }, { "epoch": 0.61, "learning_rate": 7.052498474914822e-06, "loss": 0.8213, "step": 8913 }, { "epoch": 0.61, "learning_rate": 7.0503893460212355e-06, "loss": 0.7041, "step": 8914 }, { "epoch": 0.61, "learning_rate": 7.04828036083254e-06, "loss": 0.8711, "step": 8915 }, { "epoch": 0.61, "learning_rate": 7.046171519451479e-06, "loss": 0.8193, "step": 8916 }, { "epoch": 0.61, "learning_rate": 7.044062821980799e-06, "loss": 0.8018, "step": 8917 }, { "epoch": 0.61, "learning_rate": 7.04195426852323e-06, "loss": 0.8135, "step": 8918 }, { "epoch": 0.61, "learning_rate": 7.039845859181507e-06, "loss": 0.75, "step": 8919 }, { "epoch": 0.61, "learning_rate": 7.0377375940583514e-06, "loss": 0.791, "step": 8920 }, { "epoch": 0.61, "learning_rate": 7.035629473256474e-06, "loss": 0.7256, "step": 8921 }, { "epoch": 0.61, "learning_rate": 7.0335214968785855e-06, "loss": 0.833, "step": 8922 }, { "epoch": 0.61, "learning_rate": 7.0314136650273855e-06, "loss": 0.7646, "step": 8923 }, { "epoch": 0.61, "learning_rate": 7.029305977805563e-06, "loss": 0.8037, "step": 8924 }, { "epoch": 0.61, "learning_rate": 7.027198435315809e-06, "loss": 0.7939, "step": 8925 }, { "epoch": 0.61, "learning_rate": 7.025091037660807e-06, "loss": 0.8008, "step": 8926 }, { "epoch": 0.61, "learning_rate": 7.02298378494322e-06, "loss": 0.8018, "step": 8927 }, { "epoch": 0.61, "learning_rate": 7.020876677265722e-06, "loss": 0.7744, "step": 8928 }, { "epoch": 0.61, "learning_rate": 7.0187697147309645e-06, "loss": 0.7861, "step": 8929 }, { "epoch": 0.61, "learning_rate": 7.016662897441598e-06, "loss": 0.835, "step": 8930 }, { "epoch": 0.61, "learning_rate": 7.014556225500273e-06, "loss": 0.8125, "step": 8931 }, { "epoch": 0.61, "learning_rate": 7.012449699009622e-06, "loss": 0.7637, "step": 8932 }, { "epoch": 0.61, "learning_rate": 7.010343318072279e-06, "loss": 0.7949, "step": 8933 }, { "epoch": 0.61, "learning_rate": 7.008237082790861e-06, "loss": 0.7637, "step": 8934 }, { "epoch": 0.61, "learning_rate": 7.006130993267986e-06, "loss": 0.8057, "step": 8935 }, { "epoch": 0.61, "learning_rate": 7.004025049606265e-06, "loss": 0.6846, "step": 8936 }, { "epoch": 0.61, "learning_rate": 7.001919251908296e-06, "loss": 0.7627, "step": 8937 }, { "epoch": 0.61, "learning_rate": 6.999813600276676e-06, "loss": 0.8057, "step": 8938 }, { "epoch": 0.61, "learning_rate": 6.997708094813992e-06, "loss": 0.7979, "step": 8939 }, { "epoch": 0.61, "learning_rate": 6.9956027356228215e-06, "loss": 0.7139, "step": 8940 }, { "epoch": 0.61, "learning_rate": 6.993497522805737e-06, "loss": 0.7627, "step": 8941 }, { "epoch": 0.61, "learning_rate": 6.991392456465309e-06, "loss": 0.7705, "step": 8942 }, { "epoch": 0.61, "learning_rate": 6.9892875367040934e-06, "loss": 0.8311, "step": 8943 }, { "epoch": 0.61, "learning_rate": 6.9871827636246445e-06, "loss": 0.8027, "step": 8944 }, { "epoch": 0.61, "learning_rate": 6.985078137329502e-06, "loss": 0.8789, "step": 8945 }, { "epoch": 0.61, "learning_rate": 6.982973657921207e-06, "loss": 0.8389, "step": 8946 }, { "epoch": 0.61, "learning_rate": 6.9808693255022846e-06, "loss": 0.6846, "step": 8947 }, { "epoch": 0.61, "learning_rate": 6.978765140175263e-06, "loss": 0.9053, "step": 8948 }, { "epoch": 0.61, "learning_rate": 6.97666110204266e-06, "loss": 0.749, "step": 8949 }, { "epoch": 0.61, "learning_rate": 6.9745572112069784e-06, "loss": 0.8379, "step": 8950 }, { "epoch": 0.61, "learning_rate": 6.9724534677707225e-06, "loss": 0.8564, "step": 8951 }, { "epoch": 0.61, "learning_rate": 6.970349871836383e-06, "loss": 0.7344, "step": 8952 }, { "epoch": 0.61, "learning_rate": 6.96824642350645e-06, "loss": 0.7783, "step": 8953 }, { "epoch": 0.61, "learning_rate": 6.966143122883408e-06, "loss": 0.833, "step": 8954 }, { "epoch": 0.61, "learning_rate": 6.964039970069722e-06, "loss": 0.792, "step": 8955 }, { "epoch": 0.61, "learning_rate": 6.961936965167864e-06, "loss": 0.7705, "step": 8956 }, { "epoch": 0.61, "learning_rate": 6.959834108280288e-06, "loss": 0.7832, "step": 8957 }, { "epoch": 0.61, "learning_rate": 6.957731399509443e-06, "loss": 0.7705, "step": 8958 }, { "epoch": 0.61, "learning_rate": 6.955628838957774e-06, "loss": 0.8672, "step": 8959 }, { "epoch": 0.61, "learning_rate": 6.953526426727724e-06, "loss": 0.8389, "step": 8960 }, { "epoch": 0.61, "learning_rate": 6.951424162921716e-06, "loss": 0.8496, "step": 8961 }, { "epoch": 0.61, "learning_rate": 6.949322047642176e-06, "loss": 0.7246, "step": 8962 }, { "epoch": 0.61, "learning_rate": 6.947220080991516e-06, "loss": 0.8584, "step": 8963 }, { "epoch": 0.61, "learning_rate": 6.945118263072146e-06, "loss": 0.748, "step": 8964 }, { "epoch": 0.61, "learning_rate": 6.94301659398646e-06, "loss": 0.7734, "step": 8965 }, { "epoch": 0.61, "learning_rate": 6.94091507383686e-06, "loss": 0.8428, "step": 8966 }, { "epoch": 0.61, "learning_rate": 6.9388137027257305e-06, "loss": 0.7686, "step": 8967 }, { "epoch": 0.61, "learning_rate": 6.936712480755445e-06, "loss": 0.7822, "step": 8968 }, { "epoch": 0.61, "learning_rate": 6.934611408028382e-06, "loss": 0.8291, "step": 8969 }, { "epoch": 0.61, "learning_rate": 6.932510484646898e-06, "loss": 0.7598, "step": 8970 }, { "epoch": 0.61, "learning_rate": 6.930409710713351e-06, "loss": 0.8584, "step": 8971 }, { "epoch": 0.61, "learning_rate": 6.928309086330099e-06, "loss": 0.7344, "step": 8972 }, { "epoch": 0.61, "learning_rate": 6.926208611599476e-06, "loss": 0.7227, "step": 8973 }, { "epoch": 0.61, "learning_rate": 6.92410828662382e-06, "loss": 0.7402, "step": 8974 }, { "epoch": 0.61, "learning_rate": 6.92200811150546e-06, "loss": 0.6895, "step": 8975 }, { "epoch": 0.61, "learning_rate": 6.919908086346714e-06, "loss": 0.7773, "step": 8976 }, { "epoch": 0.61, "learning_rate": 6.917808211249891e-06, "loss": 0.7881, "step": 8977 }, { "epoch": 0.61, "learning_rate": 6.915708486317307e-06, "loss": 0.9102, "step": 8978 }, { "epoch": 0.61, "learning_rate": 6.913608911651253e-06, "loss": 0.7627, "step": 8979 }, { "epoch": 0.61, "learning_rate": 6.911509487354024e-06, "loss": 0.8037, "step": 8980 }, { "epoch": 0.61, "learning_rate": 6.9094102135279005e-06, "loss": 0.832, "step": 8981 }, { "epoch": 0.61, "learning_rate": 6.907311090275163e-06, "loss": 0.7217, "step": 8982 }, { "epoch": 0.61, "learning_rate": 6.905212117698074e-06, "loss": 0.7949, "step": 8983 }, { "epoch": 0.61, "learning_rate": 6.9031132958989015e-06, "loss": 0.7676, "step": 8984 }, { "epoch": 0.61, "learning_rate": 6.9010146249799e-06, "loss": 0.7354, "step": 8985 }, { "epoch": 0.61, "learning_rate": 6.898916105043314e-06, "loss": 0.833, "step": 8986 }, { "epoch": 0.61, "learning_rate": 6.896817736191384e-06, "loss": 0.7207, "step": 8987 }, { "epoch": 0.61, "learning_rate": 6.894719518526343e-06, "loss": 0.8193, "step": 8988 }, { "epoch": 0.61, "learning_rate": 6.892621452150412e-06, "loss": 0.7715, "step": 8989 }, { "epoch": 0.61, "learning_rate": 6.8905235371658165e-06, "loss": 0.8076, "step": 8990 }, { "epoch": 0.61, "learning_rate": 6.888425773674761e-06, "loss": 0.749, "step": 8991 }, { "epoch": 0.61, "learning_rate": 6.886328161779452e-06, "loss": 0.7471, "step": 8992 }, { "epoch": 0.61, "learning_rate": 6.884230701582083e-06, "loss": 0.7539, "step": 8993 }, { "epoch": 0.61, "learning_rate": 6.8821333931848396e-06, "loss": 0.7598, "step": 8994 }, { "epoch": 0.61, "learning_rate": 6.880036236689904e-06, "loss": 0.6963, "step": 8995 }, { "epoch": 0.61, "learning_rate": 6.877939232199456e-06, "loss": 0.7979, "step": 8996 }, { "epoch": 0.61, "learning_rate": 6.875842379815654e-06, "loss": 0.7686, "step": 8997 }, { "epoch": 0.61, "learning_rate": 6.8737456796406594e-06, "loss": 0.791, "step": 8998 }, { "epoch": 0.61, "learning_rate": 6.871649131776621e-06, "loss": 0.751, "step": 8999 }, { "epoch": 0.61, "learning_rate": 6.869552736325687e-06, "loss": 0.7305, "step": 9000 }, { "epoch": 0.61, "learning_rate": 6.867456493389987e-06, "loss": 0.8164, "step": 9001 }, { "epoch": 0.61, "learning_rate": 6.865360403071655e-06, "loss": 0.7998, "step": 9002 }, { "epoch": 0.61, "learning_rate": 6.863264465472814e-06, "loss": 0.7061, "step": 9003 }, { "epoch": 0.61, "learning_rate": 6.861168680695574e-06, "loss": 0.7852, "step": 9004 }, { "epoch": 0.61, "learning_rate": 6.8590730488420445e-06, "loss": 0.6709, "step": 9005 }, { "epoch": 0.61, "learning_rate": 6.85697757001432e-06, "loss": 0.6562, "step": 9006 }, { "epoch": 0.61, "learning_rate": 6.854882244314494e-06, "loss": 0.6914, "step": 9007 }, { "epoch": 0.61, "learning_rate": 6.852787071844655e-06, "loss": 0.8535, "step": 9008 }, { "epoch": 0.61, "learning_rate": 6.850692052706877e-06, "loss": 0.7783, "step": 9009 }, { "epoch": 0.61, "learning_rate": 6.8485971870032255e-06, "loss": 0.8115, "step": 9010 }, { "epoch": 0.61, "learning_rate": 6.846502474835768e-06, "loss": 0.7959, "step": 9011 }, { "epoch": 0.61, "learning_rate": 6.844407916306554e-06, "loss": 0.7705, "step": 9012 }, { "epoch": 0.61, "learning_rate": 6.842313511517631e-06, "loss": 0.8115, "step": 9013 }, { "epoch": 0.61, "learning_rate": 6.8402192605710435e-06, "loss": 0.8369, "step": 9014 }, { "epoch": 0.61, "learning_rate": 6.838125163568817e-06, "loss": 0.7871, "step": 9015 }, { "epoch": 0.61, "learning_rate": 6.836031220612981e-06, "loss": 0.7949, "step": 9016 }, { "epoch": 0.61, "learning_rate": 6.833937431805548e-06, "loss": 0.7812, "step": 9017 }, { "epoch": 0.61, "learning_rate": 6.8318437972485295e-06, "loss": 0.7344, "step": 9018 }, { "epoch": 0.61, "learning_rate": 6.829750317043924e-06, "loss": 0.7422, "step": 9019 }, { "epoch": 0.61, "learning_rate": 6.827656991293729e-06, "loss": 0.8135, "step": 9020 }, { "epoch": 0.61, "learning_rate": 6.825563820099934e-06, "loss": 0.8555, "step": 9021 }, { "epoch": 0.61, "learning_rate": 6.823470803564513e-06, "loss": 0.8369, "step": 9022 }, { "epoch": 0.61, "learning_rate": 6.8213779417894414e-06, "loss": 0.6841, "step": 9023 }, { "epoch": 0.61, "learning_rate": 6.819285234876678e-06, "loss": 0.7549, "step": 9024 }, { "epoch": 0.62, "learning_rate": 6.817192682928182e-06, "loss": 0.8135, "step": 9025 }, { "epoch": 0.62, "learning_rate": 6.815100286045908e-06, "loss": 0.7168, "step": 9026 }, { "epoch": 0.62, "learning_rate": 6.813008044331791e-06, "loss": 0.7891, "step": 9027 }, { "epoch": 0.62, "learning_rate": 6.8109159578877655e-06, "loss": 0.8896, "step": 9028 }, { "epoch": 0.62, "learning_rate": 6.808824026815761e-06, "loss": 0.6904, "step": 9029 }, { "epoch": 0.62, "learning_rate": 6.806732251217694e-06, "loss": 0.7725, "step": 9030 }, { "epoch": 0.62, "learning_rate": 6.804640631195471e-06, "loss": 0.7139, "step": 9031 }, { "epoch": 0.62, "learning_rate": 6.802549166851007e-06, "loss": 0.7842, "step": 9032 }, { "epoch": 0.62, "learning_rate": 6.800457858286189e-06, "loss": 0.7568, "step": 9033 }, { "epoch": 0.62, "learning_rate": 6.798366705602909e-06, "loss": 0.7324, "step": 9034 }, { "epoch": 0.62, "learning_rate": 6.796275708903046e-06, "loss": 0.7402, "step": 9035 }, { "epoch": 0.62, "learning_rate": 6.7941848682884756e-06, "loss": 0.8535, "step": 9036 }, { "epoch": 0.62, "learning_rate": 6.7920941838610585e-06, "loss": 0.7861, "step": 9037 }, { "epoch": 0.62, "learning_rate": 6.790003655722659e-06, "loss": 0.8076, "step": 9038 }, { "epoch": 0.62, "learning_rate": 6.787913283975126e-06, "loss": 0.7832, "step": 9039 }, { "epoch": 0.62, "learning_rate": 6.785823068720299e-06, "loss": 0.8389, "step": 9040 }, { "epoch": 0.62, "learning_rate": 6.783733010060018e-06, "loss": 0.8662, "step": 9041 }, { "epoch": 0.62, "learning_rate": 6.781643108096106e-06, "loss": 0.75, "step": 9042 }, { "epoch": 0.62, "learning_rate": 6.779553362930382e-06, "loss": 0.7051, "step": 9043 }, { "epoch": 0.62, "learning_rate": 6.777463774664665e-06, "loss": 0.7979, "step": 9044 }, { "epoch": 0.62, "learning_rate": 6.775374343400757e-06, "loss": 0.7656, "step": 9045 }, { "epoch": 0.62, "learning_rate": 6.773285069240451e-06, "loss": 0.7891, "step": 9046 }, { "epoch": 0.62, "learning_rate": 6.771195952285541e-06, "loss": 0.8047, "step": 9047 }, { "epoch": 0.62, "learning_rate": 6.769106992637804e-06, "loss": 0.75, "step": 9048 }, { "epoch": 0.62, "learning_rate": 6.767018190399016e-06, "loss": 0.8457, "step": 9049 }, { "epoch": 0.62, "learning_rate": 6.7649295456709485e-06, "loss": 0.8418, "step": 9050 }, { "epoch": 0.62, "learning_rate": 6.762841058555352e-06, "loss": 0.7109, "step": 9051 }, { "epoch": 0.62, "learning_rate": 6.760752729153985e-06, "loss": 0.7949, "step": 9052 }, { "epoch": 0.62, "learning_rate": 6.758664557568584e-06, "loss": 0.7666, "step": 9053 }, { "epoch": 0.62, "learning_rate": 6.7565765439008856e-06, "loss": 0.8271, "step": 9054 }, { "epoch": 0.62, "learning_rate": 6.754488688252625e-06, "loss": 0.8545, "step": 9055 }, { "epoch": 0.62, "learning_rate": 6.752400990725514e-06, "loss": 0.8164, "step": 9056 }, { "epoch": 0.62, "learning_rate": 6.750313451421271e-06, "loss": 0.7422, "step": 9057 }, { "epoch": 0.62, "learning_rate": 6.7482260704415955e-06, "loss": 0.793, "step": 9058 }, { "epoch": 0.62, "learning_rate": 6.746138847888191e-06, "loss": 0.8018, "step": 9059 }, { "epoch": 0.62, "learning_rate": 6.744051783862737e-06, "loss": 0.7959, "step": 9060 }, { "epoch": 0.62, "learning_rate": 6.741964878466924e-06, "loss": 0.8066, "step": 9061 }, { "epoch": 0.62, "learning_rate": 6.739878131802426e-06, "loss": 0.7568, "step": 9062 }, { "epoch": 0.62, "learning_rate": 6.737791543970905e-06, "loss": 0.7188, "step": 9063 }, { "epoch": 0.62, "learning_rate": 6.73570511507402e-06, "loss": 0.7656, "step": 9064 }, { "epoch": 0.62, "learning_rate": 6.733618845213424e-06, "loss": 0.7764, "step": 9065 }, { "epoch": 0.62, "learning_rate": 6.731532734490756e-06, "loss": 0.7568, "step": 9066 }, { "epoch": 0.62, "learning_rate": 6.729446783007654e-06, "loss": 0.7891, "step": 9067 }, { "epoch": 0.62, "learning_rate": 6.727360990865748e-06, "loss": 0.7949, "step": 9068 }, { "epoch": 0.62, "learning_rate": 6.725275358166652e-06, "loss": 0.79, "step": 9069 }, { "epoch": 0.62, "learning_rate": 6.7231898850119846e-06, "loss": 0.8252, "step": 9070 }, { "epoch": 0.62, "learning_rate": 6.721104571503343e-06, "loss": 0.7197, "step": 9071 }, { "epoch": 0.62, "learning_rate": 6.719019417742325e-06, "loss": 0.7461, "step": 9072 }, { "epoch": 0.62, "learning_rate": 6.716934423830526e-06, "loss": 0.8252, "step": 9073 }, { "epoch": 0.62, "learning_rate": 6.714849589869519e-06, "loss": 0.8506, "step": 9074 }, { "epoch": 0.62, "learning_rate": 6.712764915960881e-06, "loss": 0.8193, "step": 9075 }, { "epoch": 0.62, "learning_rate": 6.7106804022061736e-06, "loss": 0.8037, "step": 9076 }, { "epoch": 0.62, "learning_rate": 6.7085960487069605e-06, "loss": 0.7422, "step": 9077 }, { "epoch": 0.62, "learning_rate": 6.7065118555647825e-06, "loss": 0.7939, "step": 9078 }, { "epoch": 0.62, "learning_rate": 6.70442782288119e-06, "loss": 0.8008, "step": 9079 }, { "epoch": 0.62, "learning_rate": 6.702343950757711e-06, "loss": 0.7129, "step": 9080 }, { "epoch": 0.62, "learning_rate": 6.700260239295877e-06, "loss": 0.7939, "step": 9081 }, { "epoch": 0.62, "learning_rate": 6.6981766885971995e-06, "loss": 0.7861, "step": 9082 }, { "epoch": 0.62, "learning_rate": 6.696093298763198e-06, "loss": 0.7539, "step": 9083 }, { "epoch": 0.62, "learning_rate": 6.694010069895363e-06, "loss": 0.79, "step": 9084 }, { "epoch": 0.62, "learning_rate": 6.691927002095198e-06, "loss": 0.875, "step": 9085 }, { "epoch": 0.62, "learning_rate": 6.6898440954641904e-06, "loss": 0.7871, "step": 9086 }, { "epoch": 0.62, "learning_rate": 6.687761350103816e-06, "loss": 0.8525, "step": 9087 }, { "epoch": 0.62, "learning_rate": 6.68567876611555e-06, "loss": 0.7334, "step": 9088 }, { "epoch": 0.62, "learning_rate": 6.6835963436008486e-06, "loss": 0.8154, "step": 9089 }, { "epoch": 0.62, "learning_rate": 6.681514082661171e-06, "loss": 0.7197, "step": 9090 }, { "epoch": 0.62, "learning_rate": 6.6794319833979696e-06, "loss": 0.8369, "step": 9091 }, { "epoch": 0.62, "learning_rate": 6.677350045912677e-06, "loss": 0.8145, "step": 9092 }, { "epoch": 0.62, "learning_rate": 6.6752682703067315e-06, "loss": 0.8535, "step": 9093 }, { "epoch": 0.62, "learning_rate": 6.6731866566815504e-06, "loss": 0.8193, "step": 9094 }, { "epoch": 0.62, "learning_rate": 6.6711052051385565e-06, "loss": 0.7812, "step": 9095 }, { "epoch": 0.62, "learning_rate": 6.669023915779149e-06, "loss": 0.6719, "step": 9096 }, { "epoch": 0.62, "learning_rate": 6.6669427887047385e-06, "loss": 0.748, "step": 9097 }, { "epoch": 0.62, "learning_rate": 6.664861824016711e-06, "loss": 0.6777, "step": 9098 }, { "epoch": 0.62, "learning_rate": 6.6627810218164555e-06, "loss": 0.7979, "step": 9099 }, { "epoch": 0.62, "learning_rate": 6.660700382205343e-06, "loss": 0.7998, "step": 9100 }, { "epoch": 0.62, "learning_rate": 6.658619905284747e-06, "loss": 0.8525, "step": 9101 }, { "epoch": 0.62, "learning_rate": 6.6565395911560225e-06, "loss": 0.8145, "step": 9102 }, { "epoch": 0.62, "learning_rate": 6.654459439920529e-06, "loss": 0.7734, "step": 9103 }, { "epoch": 0.62, "learning_rate": 6.652379451679609e-06, "loss": 0.7842, "step": 9104 }, { "epoch": 0.62, "learning_rate": 6.650299626534598e-06, "loss": 0.7783, "step": 9105 }, { "epoch": 0.62, "learning_rate": 6.648219964586826e-06, "loss": 0.7285, "step": 9106 }, { "epoch": 0.62, "learning_rate": 6.646140465937614e-06, "loss": 0.7871, "step": 9107 }, { "epoch": 0.62, "learning_rate": 6.644061130688271e-06, "loss": 0.7275, "step": 9108 }, { "epoch": 0.62, "learning_rate": 6.641981958940111e-06, "loss": 0.71, "step": 9109 }, { "epoch": 0.62, "learning_rate": 6.639902950794424e-06, "loss": 0.7402, "step": 9110 }, { "epoch": 0.62, "learning_rate": 6.637824106352504e-06, "loss": 0.8545, "step": 9111 }, { "epoch": 0.62, "learning_rate": 6.635745425715627e-06, "loss": 0.8242, "step": 9112 }, { "epoch": 0.62, "learning_rate": 6.633666908985072e-06, "loss": 0.8545, "step": 9113 }, { "epoch": 0.62, "learning_rate": 6.6315885562620954e-06, "loss": 0.7676, "step": 9114 }, { "epoch": 0.62, "learning_rate": 6.629510367647965e-06, "loss": 0.7861, "step": 9115 }, { "epoch": 0.62, "learning_rate": 6.627432343243922e-06, "loss": 0.7305, "step": 9116 }, { "epoch": 0.62, "learning_rate": 6.625354483151214e-06, "loss": 0.8105, "step": 9117 }, { "epoch": 0.62, "learning_rate": 6.623276787471069e-06, "loss": 0.8066, "step": 9118 }, { "epoch": 0.62, "learning_rate": 6.621199256304716e-06, "loss": 0.7939, "step": 9119 }, { "epoch": 0.62, "learning_rate": 6.619121889753366e-06, "loss": 0.7861, "step": 9120 }, { "epoch": 0.62, "learning_rate": 6.617044687918235e-06, "loss": 0.8047, "step": 9121 }, { "epoch": 0.62, "learning_rate": 6.6149676509005234e-06, "loss": 0.7725, "step": 9122 }, { "epoch": 0.62, "learning_rate": 6.612890778801422e-06, "loss": 0.793, "step": 9123 }, { "epoch": 0.62, "learning_rate": 6.610814071722118e-06, "loss": 0.709, "step": 9124 }, { "epoch": 0.62, "learning_rate": 6.608737529763785e-06, "loss": 0.8057, "step": 9125 }, { "epoch": 0.62, "learning_rate": 6.606661153027592e-06, "loss": 0.7793, "step": 9126 }, { "epoch": 0.62, "learning_rate": 6.604584941614706e-06, "loss": 0.8057, "step": 9127 }, { "epoch": 0.62, "learning_rate": 6.602508895626274e-06, "loss": 0.792, "step": 9128 }, { "epoch": 0.62, "learning_rate": 6.6004330151634456e-06, "loss": 0.8477, "step": 9129 }, { "epoch": 0.62, "learning_rate": 6.598357300327355e-06, "loss": 0.7705, "step": 9130 }, { "epoch": 0.62, "learning_rate": 6.596281751219128e-06, "loss": 0.7744, "step": 9131 }, { "epoch": 0.62, "learning_rate": 6.594206367939886e-06, "loss": 0.7764, "step": 9132 }, { "epoch": 0.62, "learning_rate": 6.592131150590748e-06, "loss": 0.8359, "step": 9133 }, { "epoch": 0.62, "learning_rate": 6.590056099272812e-06, "loss": 0.8555, "step": 9134 }, { "epoch": 0.62, "learning_rate": 6.58798121408718e-06, "loss": 0.8076, "step": 9135 }, { "epoch": 0.62, "learning_rate": 6.5859064951349335e-06, "loss": 0.8516, "step": 9136 }, { "epoch": 0.62, "learning_rate": 6.583831942517158e-06, "loss": 0.9014, "step": 9137 }, { "epoch": 0.62, "learning_rate": 6.58175755633492e-06, "loss": 0.7969, "step": 9138 }, { "epoch": 0.62, "learning_rate": 6.5796833366892896e-06, "loss": 0.7666, "step": 9139 }, { "epoch": 0.62, "learning_rate": 6.577609283681322e-06, "loss": 0.7559, "step": 9140 }, { "epoch": 0.62, "learning_rate": 6.575535397412061e-06, "loss": 0.7998, "step": 9141 }, { "epoch": 0.62, "learning_rate": 6.573461677982551e-06, "loss": 0.7949, "step": 9142 }, { "epoch": 0.62, "learning_rate": 6.571388125493818e-06, "loss": 0.7646, "step": 9143 }, { "epoch": 0.62, "learning_rate": 6.569314740046886e-06, "loss": 0.7334, "step": 9144 }, { "epoch": 0.62, "learning_rate": 6.567241521742777e-06, "loss": 0.7793, "step": 9145 }, { "epoch": 0.62, "learning_rate": 6.565168470682492e-06, "loss": 0.7686, "step": 9146 }, { "epoch": 0.62, "learning_rate": 6.563095586967034e-06, "loss": 0.8633, "step": 9147 }, { "epoch": 0.62, "learning_rate": 6.561022870697391e-06, "loss": 0.7402, "step": 9148 }, { "epoch": 0.62, "learning_rate": 6.558950321974544e-06, "loss": 0.7783, "step": 9149 }, { "epoch": 0.62, "learning_rate": 6.5568779408994675e-06, "loss": 0.793, "step": 9150 }, { "epoch": 0.62, "learning_rate": 6.5548057275731334e-06, "loss": 0.6748, "step": 9151 }, { "epoch": 0.62, "learning_rate": 6.552733682096495e-06, "loss": 0.8135, "step": 9152 }, { "epoch": 0.62, "learning_rate": 6.550661804570505e-06, "loss": 0.7744, "step": 9153 }, { "epoch": 0.62, "learning_rate": 6.5485900950961014e-06, "loss": 0.8076, "step": 9154 }, { "epoch": 0.62, "learning_rate": 6.5465185537742235e-06, "loss": 0.6348, "step": 9155 }, { "epoch": 0.62, "learning_rate": 6.544447180705788e-06, "loss": 0.7471, "step": 9156 }, { "epoch": 0.62, "learning_rate": 6.54237597599172e-06, "loss": 0.7861, "step": 9157 }, { "epoch": 0.62, "learning_rate": 6.540304939732927e-06, "loss": 0.7393, "step": 9158 }, { "epoch": 0.62, "learning_rate": 6.538234072030307e-06, "loss": 0.7178, "step": 9159 }, { "epoch": 0.62, "learning_rate": 6.536163372984756e-06, "loss": 0.7275, "step": 9160 }, { "epoch": 0.62, "learning_rate": 6.5340928426971555e-06, "loss": 0.7559, "step": 9161 }, { "epoch": 0.62, "learning_rate": 6.532022481268378e-06, "loss": 0.8564, "step": 9162 }, { "epoch": 0.62, "learning_rate": 6.5299522887993025e-06, "loss": 0.749, "step": 9163 }, { "epoch": 0.62, "learning_rate": 6.527882265390779e-06, "loss": 0.8154, "step": 9164 }, { "epoch": 0.62, "learning_rate": 6.525812411143666e-06, "loss": 0.7793, "step": 9165 }, { "epoch": 0.62, "learning_rate": 6.523742726158802e-06, "loss": 0.7705, "step": 9166 }, { "epoch": 0.62, "learning_rate": 6.52167321053702e-06, "loss": 0.7471, "step": 9167 }, { "epoch": 0.62, "learning_rate": 6.51960386437915e-06, "loss": 0.7783, "step": 9168 }, { "epoch": 0.62, "learning_rate": 6.517534687786011e-06, "loss": 0.7744, "step": 9169 }, { "epoch": 0.62, "learning_rate": 6.515465680858412e-06, "loss": 0.7617, "step": 9170 }, { "epoch": 0.62, "learning_rate": 6.513396843697156e-06, "loss": 0.6865, "step": 9171 }, { "epoch": 0.63, "learning_rate": 6.511328176403035e-06, "loss": 0.7764, "step": 9172 }, { "epoch": 0.63, "learning_rate": 6.5092596790768314e-06, "loss": 0.8223, "step": 9173 }, { "epoch": 0.63, "learning_rate": 6.5071913518193305e-06, "loss": 0.8047, "step": 9174 }, { "epoch": 0.63, "learning_rate": 6.505123194731295e-06, "loss": 0.6426, "step": 9175 }, { "epoch": 0.63, "learning_rate": 6.50305520791349e-06, "loss": 0.7666, "step": 9176 }, { "epoch": 0.63, "learning_rate": 6.500987391466662e-06, "loss": 0.7832, "step": 9177 }, { "epoch": 0.63, "learning_rate": 6.49891974549156e-06, "loss": 0.668, "step": 9178 }, { "epoch": 0.63, "learning_rate": 6.4968522700889125e-06, "loss": 0.7842, "step": 9179 }, { "epoch": 0.63, "learning_rate": 6.494784965359453e-06, "loss": 0.7617, "step": 9180 }, { "epoch": 0.63, "learning_rate": 6.492717831403903e-06, "loss": 0.8135, "step": 9181 }, { "epoch": 0.63, "learning_rate": 6.490650868322965e-06, "loss": 0.7295, "step": 9182 }, { "epoch": 0.63, "learning_rate": 6.488584076217351e-06, "loss": 0.7842, "step": 9183 }, { "epoch": 0.63, "learning_rate": 6.4865174551877465e-06, "loss": 0.8037, "step": 9184 }, { "epoch": 0.63, "learning_rate": 6.484451005334837e-06, "loss": 0.8027, "step": 9185 }, { "epoch": 0.63, "learning_rate": 6.482384726759304e-06, "loss": 0.7695, "step": 9186 }, { "epoch": 0.63, "learning_rate": 6.480318619561819e-06, "loss": 0.8066, "step": 9187 }, { "epoch": 0.63, "learning_rate": 6.478252683843037e-06, "loss": 0.792, "step": 9188 }, { "epoch": 0.63, "learning_rate": 6.476186919703615e-06, "loss": 0.7646, "step": 9189 }, { "epoch": 0.63, "learning_rate": 6.4741213272441915e-06, "loss": 0.79, "step": 9190 }, { "epoch": 0.63, "learning_rate": 6.472055906565402e-06, "loss": 0.7695, "step": 9191 }, { "epoch": 0.63, "learning_rate": 6.469990657767883e-06, "loss": 0.8506, "step": 9192 }, { "epoch": 0.63, "learning_rate": 6.467925580952243e-06, "loss": 0.7715, "step": 9193 }, { "epoch": 0.63, "learning_rate": 6.4658606762191e-06, "loss": 0.8369, "step": 9194 }, { "epoch": 0.63, "learning_rate": 6.46379594366905e-06, "loss": 0.7363, "step": 9195 }, { "epoch": 0.63, "learning_rate": 6.461731383402692e-06, "loss": 0.8252, "step": 9196 }, { "epoch": 0.63, "learning_rate": 6.4596669955206025e-06, "loss": 0.7578, "step": 9197 }, { "epoch": 0.63, "learning_rate": 6.457602780123368e-06, "loss": 0.6992, "step": 9198 }, { "epoch": 0.63, "learning_rate": 6.455538737311555e-06, "loss": 0.7939, "step": 9199 }, { "epoch": 0.63, "learning_rate": 6.453474867185721e-06, "loss": 0.8057, "step": 9200 }, { "epoch": 0.63, "learning_rate": 6.451411169846418e-06, "loss": 0.7666, "step": 9201 }, { "epoch": 0.63, "learning_rate": 6.449347645394191e-06, "loss": 0.7373, "step": 9202 }, { "epoch": 0.63, "learning_rate": 6.447284293929568e-06, "loss": 0.79, "step": 9203 }, { "epoch": 0.63, "learning_rate": 6.445221115553084e-06, "loss": 0.6885, "step": 9204 }, { "epoch": 0.63, "learning_rate": 6.443158110365257e-06, "loss": 0.8076, "step": 9205 }, { "epoch": 0.63, "learning_rate": 6.441095278466591e-06, "loss": 0.7705, "step": 9206 }, { "epoch": 0.63, "learning_rate": 6.439032619957591e-06, "loss": 0.8252, "step": 9207 }, { "epoch": 0.63, "learning_rate": 6.436970134938746e-06, "loss": 0.835, "step": 9208 }, { "epoch": 0.63, "learning_rate": 6.43490782351054e-06, "loss": 0.7578, "step": 9209 }, { "epoch": 0.63, "learning_rate": 6.4328456857734555e-06, "loss": 0.8047, "step": 9210 }, { "epoch": 0.63, "learning_rate": 6.4307837218279536e-06, "loss": 0.7705, "step": 9211 }, { "epoch": 0.63, "learning_rate": 6.428721931774496e-06, "loss": 0.7627, "step": 9212 }, { "epoch": 0.63, "learning_rate": 6.4266603157135295e-06, "loss": 0.7568, "step": 9213 }, { "epoch": 0.63, "learning_rate": 6.4245988737455016e-06, "loss": 0.7334, "step": 9214 }, { "epoch": 0.63, "learning_rate": 6.422537605970838e-06, "loss": 0.7822, "step": 9215 }, { "epoch": 0.63, "learning_rate": 6.420476512489968e-06, "loss": 0.8193, "step": 9216 }, { "epoch": 0.63, "learning_rate": 6.418415593403311e-06, "loss": 0.7734, "step": 9217 }, { "epoch": 0.63, "learning_rate": 6.416354848811272e-06, "loss": 0.8018, "step": 9218 }, { "epoch": 0.63, "learning_rate": 6.414294278814247e-06, "loss": 0.8164, "step": 9219 }, { "epoch": 0.63, "learning_rate": 6.412233883512633e-06, "loss": 0.8047, "step": 9220 }, { "epoch": 0.63, "learning_rate": 6.410173663006803e-06, "loss": 0.7764, "step": 9221 }, { "epoch": 0.63, "learning_rate": 6.408113617397142e-06, "loss": 0.7793, "step": 9222 }, { "epoch": 0.63, "learning_rate": 6.406053746784011e-06, "loss": 0.835, "step": 9223 }, { "epoch": 0.63, "learning_rate": 6.403994051267764e-06, "loss": 0.8105, "step": 9224 }, { "epoch": 0.63, "learning_rate": 6.401934530948753e-06, "loss": 0.8047, "step": 9225 }, { "epoch": 0.63, "learning_rate": 6.399875185927316e-06, "loss": 0.8125, "step": 9226 }, { "epoch": 0.63, "learning_rate": 6.39781601630378e-06, "loss": 0.7412, "step": 9227 }, { "epoch": 0.63, "learning_rate": 6.3957570221784774e-06, "loss": 0.8369, "step": 9228 }, { "epoch": 0.63, "learning_rate": 6.393698203651715e-06, "loss": 0.7158, "step": 9229 }, { "epoch": 0.63, "learning_rate": 6.391639560823802e-06, "loss": 0.8076, "step": 9230 }, { "epoch": 0.63, "learning_rate": 6.389581093795032e-06, "loss": 0.7305, "step": 9231 }, { "epoch": 0.63, "learning_rate": 6.3875228026656965e-06, "loss": 0.8193, "step": 9232 }, { "epoch": 0.63, "learning_rate": 6.385464687536069e-06, "loss": 0.8066, "step": 9233 }, { "epoch": 0.63, "learning_rate": 6.383406748506429e-06, "loss": 0.708, "step": 9234 }, { "epoch": 0.63, "learning_rate": 6.381348985677038e-06, "loss": 0.8252, "step": 9235 }, { "epoch": 0.63, "learning_rate": 6.3792913991481485e-06, "loss": 0.7461, "step": 9236 }, { "epoch": 0.63, "learning_rate": 6.377233989020002e-06, "loss": 0.8018, "step": 9237 }, { "epoch": 0.63, "learning_rate": 6.375176755392841e-06, "loss": 0.8535, "step": 9238 }, { "epoch": 0.63, "learning_rate": 6.373119698366887e-06, "loss": 0.8066, "step": 9239 }, { "epoch": 0.63, "learning_rate": 6.371062818042368e-06, "loss": 0.7402, "step": 9240 }, { "epoch": 0.63, "learning_rate": 6.369006114519494e-06, "loss": 0.7812, "step": 9241 }, { "epoch": 0.63, "learning_rate": 6.366949587898461e-06, "loss": 0.8105, "step": 9242 }, { "epoch": 0.63, "learning_rate": 6.36489323827947e-06, "loss": 0.7285, "step": 9243 }, { "epoch": 0.63, "learning_rate": 6.362837065762701e-06, "loss": 0.7793, "step": 9244 }, { "epoch": 0.63, "learning_rate": 6.360781070448332e-06, "loss": 0.7725, "step": 9245 }, { "epoch": 0.63, "learning_rate": 6.358725252436535e-06, "loss": 0.8184, "step": 9246 }, { "epoch": 0.63, "learning_rate": 6.356669611827464e-06, "loss": 0.835, "step": 9247 }, { "epoch": 0.63, "learning_rate": 6.354614148721273e-06, "loss": 0.6914, "step": 9248 }, { "epoch": 0.63, "learning_rate": 6.352558863218101e-06, "loss": 0.7432, "step": 9249 }, { "epoch": 0.63, "learning_rate": 6.350503755418087e-06, "loss": 0.7539, "step": 9250 }, { "epoch": 0.63, "learning_rate": 6.348448825421347e-06, "loss": 0.8398, "step": 9251 }, { "epoch": 0.63, "learning_rate": 6.346394073328004e-06, "loss": 0.7871, "step": 9252 }, { "epoch": 0.63, "learning_rate": 6.344339499238166e-06, "loss": 0.7344, "step": 9253 }, { "epoch": 0.63, "learning_rate": 6.342285103251928e-06, "loss": 0.8418, "step": 9254 }, { "epoch": 0.63, "learning_rate": 6.340230885469381e-06, "loss": 0.7598, "step": 9255 }, { "epoch": 0.63, "learning_rate": 6.338176845990608e-06, "loss": 0.791, "step": 9256 }, { "epoch": 0.63, "learning_rate": 6.336122984915675e-06, "loss": 0.7285, "step": 9257 }, { "epoch": 0.63, "learning_rate": 6.334069302344657e-06, "loss": 0.8418, "step": 9258 }, { "epoch": 0.63, "learning_rate": 6.332015798377604e-06, "loss": 0.7969, "step": 9259 }, { "epoch": 0.63, "learning_rate": 6.32996247311456e-06, "loss": 0.7666, "step": 9260 }, { "epoch": 0.63, "learning_rate": 6.327909326655568e-06, "loss": 0.8691, "step": 9261 }, { "epoch": 0.63, "learning_rate": 6.3258563591006526e-06, "loss": 0.8027, "step": 9262 }, { "epoch": 0.63, "learning_rate": 6.323803570549833e-06, "loss": 0.8408, "step": 9263 }, { "epoch": 0.63, "learning_rate": 6.321750961103129e-06, "loss": 0.7363, "step": 9264 }, { "epoch": 0.63, "learning_rate": 6.3196985308605366e-06, "loss": 0.877, "step": 9265 }, { "epoch": 0.63, "learning_rate": 6.317646279922055e-06, "loss": 0.8223, "step": 9266 }, { "epoch": 0.63, "learning_rate": 6.315594208387665e-06, "loss": 0.7822, "step": 9267 }, { "epoch": 0.63, "learning_rate": 6.313542316357346e-06, "loss": 0.8213, "step": 9268 }, { "epoch": 0.63, "learning_rate": 6.311490603931063e-06, "loss": 0.7861, "step": 9269 }, { "epoch": 0.63, "learning_rate": 6.309439071208783e-06, "loss": 0.835, "step": 9270 }, { "epoch": 0.63, "learning_rate": 6.307387718290447e-06, "loss": 0.75, "step": 9271 }, { "epoch": 0.63, "learning_rate": 6.305336545276004e-06, "loss": 0.7773, "step": 9272 }, { "epoch": 0.63, "learning_rate": 6.3032855522653834e-06, "loss": 0.8037, "step": 9273 }, { "epoch": 0.63, "learning_rate": 6.301234739358512e-06, "loss": 0.7314, "step": 9274 }, { "epoch": 0.63, "learning_rate": 6.299184106655298e-06, "loss": 0.8867, "step": 9275 }, { "epoch": 0.63, "learning_rate": 6.297133654255658e-06, "loss": 0.7412, "step": 9276 }, { "epoch": 0.63, "learning_rate": 6.295083382259487e-06, "loss": 0.7373, "step": 9277 }, { "epoch": 0.63, "learning_rate": 6.29303329076667e-06, "loss": 0.8447, "step": 9278 }, { "epoch": 0.63, "learning_rate": 6.290983379877094e-06, "loss": 0.7354, "step": 9279 }, { "epoch": 0.63, "learning_rate": 6.288933649690625e-06, "loss": 0.7764, "step": 9280 }, { "epoch": 0.63, "learning_rate": 6.286884100307124e-06, "loss": 0.7842, "step": 9281 }, { "epoch": 0.63, "learning_rate": 6.284834731826454e-06, "loss": 0.7275, "step": 9282 }, { "epoch": 0.63, "learning_rate": 6.282785544348451e-06, "loss": 0.8135, "step": 9283 }, { "epoch": 0.63, "learning_rate": 6.280736537972958e-06, "loss": 0.8154, "step": 9284 }, { "epoch": 0.63, "learning_rate": 6.278687712799798e-06, "loss": 0.7744, "step": 9285 }, { "epoch": 0.63, "learning_rate": 6.276639068928793e-06, "loss": 0.7373, "step": 9286 }, { "epoch": 0.63, "learning_rate": 6.274590606459746e-06, "loss": 0.8086, "step": 9287 }, { "epoch": 0.63, "learning_rate": 6.272542325492468e-06, "loss": 0.8184, "step": 9288 }, { "epoch": 0.63, "learning_rate": 6.2704942261267445e-06, "loss": 0.876, "step": 9289 }, { "epoch": 0.63, "learning_rate": 6.268446308462361e-06, "loss": 0.8262, "step": 9290 }, { "epoch": 0.63, "learning_rate": 6.2663985725990905e-06, "loss": 0.8105, "step": 9291 }, { "epoch": 0.63, "learning_rate": 6.2643510186366965e-06, "loss": 0.7344, "step": 9292 }, { "epoch": 0.63, "learning_rate": 6.262303646674943e-06, "loss": 0.708, "step": 9293 }, { "epoch": 0.63, "learning_rate": 6.260256456813571e-06, "loss": 0.8115, "step": 9294 }, { "epoch": 0.63, "learning_rate": 6.258209449152326e-06, "loss": 0.7949, "step": 9295 }, { "epoch": 0.63, "learning_rate": 6.256162623790931e-06, "loss": 0.7676, "step": 9296 }, { "epoch": 0.63, "learning_rate": 6.254115980829112e-06, "loss": 0.8242, "step": 9297 }, { "epoch": 0.63, "learning_rate": 6.252069520366576e-06, "loss": 0.8037, "step": 9298 }, { "epoch": 0.63, "learning_rate": 6.250023242503031e-06, "loss": 0.7695, "step": 9299 }, { "epoch": 0.63, "learning_rate": 6.247977147338176e-06, "loss": 0.7715, "step": 9300 }, { "epoch": 0.63, "learning_rate": 6.245931234971687e-06, "loss": 0.7695, "step": 9301 }, { "epoch": 0.63, "learning_rate": 6.2438855055032476e-06, "loss": 0.8252, "step": 9302 }, { "epoch": 0.63, "learning_rate": 6.241839959032521e-06, "loss": 0.7793, "step": 9303 }, { "epoch": 0.63, "learning_rate": 6.239794595659167e-06, "loss": 0.8037, "step": 9304 }, { "epoch": 0.63, "learning_rate": 6.23774941548284e-06, "loss": 0.8125, "step": 9305 }, { "epoch": 0.63, "learning_rate": 6.235704418603179e-06, "loss": 0.7334, "step": 9306 }, { "epoch": 0.63, "learning_rate": 6.233659605119813e-06, "loss": 0.8037, "step": 9307 }, { "epoch": 0.63, "learning_rate": 6.231614975132369e-06, "loss": 0.7188, "step": 9308 }, { "epoch": 0.63, "learning_rate": 6.229570528740456e-06, "loss": 0.7578, "step": 9309 }, { "epoch": 0.63, "learning_rate": 6.227526266043684e-06, "loss": 0.7578, "step": 9310 }, { "epoch": 0.63, "learning_rate": 6.225482187141651e-06, "loss": 0.7979, "step": 9311 }, { "epoch": 0.63, "learning_rate": 6.223438292133939e-06, "loss": 0.8262, "step": 9312 }, { "epoch": 0.63, "learning_rate": 6.221394581120133e-06, "loss": 0.8008, "step": 9313 }, { "epoch": 0.63, "learning_rate": 6.2193510541997946e-06, "loss": 0.7832, "step": 9314 }, { "epoch": 0.63, "learning_rate": 6.217307711472491e-06, "loss": 0.7266, "step": 9315 }, { "epoch": 0.63, "learning_rate": 6.2152645530377684e-06, "loss": 0.7471, "step": 9316 }, { "epoch": 0.63, "learning_rate": 6.213221578995174e-06, "loss": 0.6846, "step": 9317 }, { "epoch": 0.64, "learning_rate": 6.211178789444241e-06, "loss": 0.8291, "step": 9318 }, { "epoch": 0.64, "learning_rate": 6.209136184484491e-06, "loss": 0.7529, "step": 9319 }, { "epoch": 0.64, "learning_rate": 6.207093764215443e-06, "loss": 0.7705, "step": 9320 }, { "epoch": 0.64, "learning_rate": 6.205051528736602e-06, "loss": 0.8574, "step": 9321 }, { "epoch": 0.64, "learning_rate": 6.2030094781474596e-06, "loss": 0.7695, "step": 9322 }, { "epoch": 0.64, "learning_rate": 6.200967612547515e-06, "loss": 0.7358, "step": 9323 }, { "epoch": 0.64, "learning_rate": 6.198925932036244e-06, "loss": 0.7588, "step": 9324 }, { "epoch": 0.64, "learning_rate": 6.196884436713115e-06, "loss": 0.8086, "step": 9325 }, { "epoch": 0.64, "learning_rate": 6.194843126677592e-06, "loss": 0.8379, "step": 9326 }, { "epoch": 0.64, "learning_rate": 6.192802002029123e-06, "loss": 0.7539, "step": 9327 }, { "epoch": 0.64, "learning_rate": 6.1907610628671556e-06, "loss": 0.7129, "step": 9328 }, { "epoch": 0.64, "learning_rate": 6.188720309291125e-06, "loss": 0.7129, "step": 9329 }, { "epoch": 0.64, "learning_rate": 6.186679741400454e-06, "loss": 0.793, "step": 9330 }, { "epoch": 0.64, "learning_rate": 6.184639359294563e-06, "loss": 0.7969, "step": 9331 }, { "epoch": 0.64, "learning_rate": 6.182599163072854e-06, "loss": 0.7764, "step": 9332 }, { "epoch": 0.64, "learning_rate": 6.180559152834729e-06, "loss": 0.7578, "step": 9333 }, { "epoch": 0.64, "learning_rate": 6.178519328679571e-06, "loss": 0.8037, "step": 9334 }, { "epoch": 0.64, "learning_rate": 6.176479690706768e-06, "loss": 0.7539, "step": 9335 }, { "epoch": 0.64, "learning_rate": 6.17444023901569e-06, "loss": 0.7852, "step": 9336 }, { "epoch": 0.64, "learning_rate": 6.172400973705694e-06, "loss": 0.71, "step": 9337 }, { "epoch": 0.64, "learning_rate": 6.17036189487614e-06, "loss": 0.8105, "step": 9338 }, { "epoch": 0.64, "learning_rate": 6.1683230026263666e-06, "loss": 0.8359, "step": 9339 }, { "epoch": 0.64, "learning_rate": 6.166284297055705e-06, "loss": 0.7695, "step": 9340 }, { "epoch": 0.64, "learning_rate": 6.164245778263488e-06, "loss": 0.7158, "step": 9341 }, { "epoch": 0.64, "learning_rate": 6.162207446349031e-06, "loss": 0.7783, "step": 9342 }, { "epoch": 0.64, "learning_rate": 6.16016930141164e-06, "loss": 0.8027, "step": 9343 }, { "epoch": 0.64, "learning_rate": 6.158131343550613e-06, "loss": 0.7471, "step": 9344 }, { "epoch": 0.64, "learning_rate": 6.156093572865239e-06, "loss": 0.7471, "step": 9345 }, { "epoch": 0.64, "learning_rate": 6.154055989454797e-06, "loss": 0.8125, "step": 9346 }, { "epoch": 0.64, "learning_rate": 6.152018593418563e-06, "loss": 0.7441, "step": 9347 }, { "epoch": 0.64, "learning_rate": 6.149981384855792e-06, "loss": 0.8604, "step": 9348 }, { "epoch": 0.64, "learning_rate": 6.147944363865744e-06, "loss": 0.7939, "step": 9349 }, { "epoch": 0.64, "learning_rate": 6.145907530547657e-06, "loss": 0.7637, "step": 9350 }, { "epoch": 0.64, "learning_rate": 6.143870885000769e-06, "loss": 0.7178, "step": 9351 }, { "epoch": 0.64, "learning_rate": 6.141834427324298e-06, "loss": 0.8193, "step": 9352 }, { "epoch": 0.64, "learning_rate": 6.139798157617469e-06, "loss": 0.8408, "step": 9353 }, { "epoch": 0.64, "learning_rate": 6.137762075979487e-06, "loss": 0.792, "step": 9354 }, { "epoch": 0.64, "learning_rate": 6.135726182509546e-06, "loss": 0.8223, "step": 9355 }, { "epoch": 0.64, "learning_rate": 6.13369047730684e-06, "loss": 0.7666, "step": 9356 }, { "epoch": 0.64, "learning_rate": 6.131654960470545e-06, "loss": 0.8281, "step": 9357 }, { "epoch": 0.64, "learning_rate": 6.129619632099826e-06, "loss": 0.7715, "step": 9358 }, { "epoch": 0.64, "learning_rate": 6.127584492293854e-06, "loss": 0.7305, "step": 9359 }, { "epoch": 0.64, "learning_rate": 6.125549541151777e-06, "loss": 0.8896, "step": 9360 }, { "epoch": 0.64, "learning_rate": 6.123514778772737e-06, "loss": 0.8154, "step": 9361 }, { "epoch": 0.64, "learning_rate": 6.12148020525587e-06, "loss": 0.7354, "step": 9362 }, { "epoch": 0.64, "learning_rate": 6.119445820700294e-06, "loss": 0.8438, "step": 9363 }, { "epoch": 0.64, "learning_rate": 6.117411625205127e-06, "loss": 0.8027, "step": 9364 }, { "epoch": 0.64, "learning_rate": 6.1153776188694825e-06, "loss": 0.7646, "step": 9365 }, { "epoch": 0.64, "learning_rate": 6.113343801792447e-06, "loss": 0.8115, "step": 9366 }, { "epoch": 0.64, "learning_rate": 6.111310174073115e-06, "loss": 0.7695, "step": 9367 }, { "epoch": 0.64, "learning_rate": 6.109276735810559e-06, "loss": 0.7979, "step": 9368 }, { "epoch": 0.64, "learning_rate": 6.1072434871038535e-06, "loss": 0.7773, "step": 9369 }, { "epoch": 0.64, "learning_rate": 6.105210428052051e-06, "loss": 0.7988, "step": 9370 }, { "epoch": 0.64, "learning_rate": 6.103177558754208e-06, "loss": 0.7529, "step": 9371 }, { "epoch": 0.64, "learning_rate": 6.101144879309367e-06, "loss": 0.7256, "step": 9372 }, { "epoch": 0.64, "learning_rate": 6.099112389816554e-06, "loss": 0.7852, "step": 9373 }, { "epoch": 0.64, "learning_rate": 6.0970800903747985e-06, "loss": 0.7715, "step": 9374 }, { "epoch": 0.64, "learning_rate": 6.0950479810831096e-06, "loss": 0.7744, "step": 9375 }, { "epoch": 0.64, "learning_rate": 6.09301606204049e-06, "loss": 0.6943, "step": 9376 }, { "epoch": 0.64, "learning_rate": 6.090984333345938e-06, "loss": 0.7686, "step": 9377 }, { "epoch": 0.64, "learning_rate": 6.088952795098442e-06, "loss": 0.7783, "step": 9378 }, { "epoch": 0.64, "learning_rate": 6.086921447396972e-06, "loss": 0.8359, "step": 9379 }, { "epoch": 0.64, "learning_rate": 6.0848902903405006e-06, "loss": 0.7578, "step": 9380 }, { "epoch": 0.64, "learning_rate": 6.082859324027981e-06, "loss": 0.749, "step": 9381 }, { "epoch": 0.64, "learning_rate": 6.0808285485583625e-06, "loss": 0.8281, "step": 9382 }, { "epoch": 0.64, "learning_rate": 6.0787979640305906e-06, "loss": 0.8506, "step": 9383 }, { "epoch": 0.64, "learning_rate": 6.076767570543588e-06, "loss": 0.7402, "step": 9384 }, { "epoch": 0.64, "learning_rate": 6.074737368196279e-06, "loss": 0.8721, "step": 9385 }, { "epoch": 0.64, "learning_rate": 6.072707357087574e-06, "loss": 0.8623, "step": 9386 }, { "epoch": 0.64, "learning_rate": 6.0706775373163764e-06, "loss": 0.7939, "step": 9387 }, { "epoch": 0.64, "learning_rate": 6.0686479089815735e-06, "loss": 0.7969, "step": 9388 }, { "epoch": 0.64, "learning_rate": 6.066618472182054e-06, "loss": 0.7363, "step": 9389 }, { "epoch": 0.64, "learning_rate": 6.064589227016693e-06, "loss": 0.875, "step": 9390 }, { "epoch": 0.64, "learning_rate": 6.062560173584353e-06, "loss": 0.7734, "step": 9391 }, { "epoch": 0.64, "learning_rate": 6.0605313119838885e-06, "loss": 0.8281, "step": 9392 }, { "epoch": 0.64, "learning_rate": 6.0585026423141465e-06, "loss": 0.7754, "step": 9393 }, { "epoch": 0.64, "learning_rate": 6.0564741646739615e-06, "loss": 0.7832, "step": 9394 }, { "epoch": 0.64, "learning_rate": 6.054445879162163e-06, "loss": 0.7939, "step": 9395 }, { "epoch": 0.64, "learning_rate": 6.052417785877571e-06, "loss": 0.8535, "step": 9396 }, { "epoch": 0.64, "learning_rate": 6.050389884918992e-06, "loss": 0.7617, "step": 9397 }, { "epoch": 0.64, "learning_rate": 6.048362176385225e-06, "loss": 0.749, "step": 9398 }, { "epoch": 0.64, "learning_rate": 6.046334660375059e-06, "loss": 0.875, "step": 9399 }, { "epoch": 0.64, "learning_rate": 6.044307336987274e-06, "loss": 0.7695, "step": 9400 }, { "epoch": 0.64, "learning_rate": 6.042280206320645e-06, "loss": 0.8125, "step": 9401 }, { "epoch": 0.64, "learning_rate": 6.040253268473931e-06, "loss": 0.6934, "step": 9402 }, { "epoch": 0.64, "learning_rate": 6.038226523545887e-06, "loss": 0.7949, "step": 9403 }, { "epoch": 0.64, "learning_rate": 6.03619997163525e-06, "loss": 0.8438, "step": 9404 }, { "epoch": 0.64, "learning_rate": 6.034173612840759e-06, "loss": 0.7715, "step": 9405 }, { "epoch": 0.64, "learning_rate": 6.032147447261134e-06, "loss": 0.8193, "step": 9406 }, { "epoch": 0.64, "learning_rate": 6.0301214749950925e-06, "loss": 0.6885, "step": 9407 }, { "epoch": 0.64, "learning_rate": 6.0280956961413406e-06, "loss": 0.7676, "step": 9408 }, { "epoch": 0.64, "learning_rate": 6.026070110798574e-06, "loss": 0.7832, "step": 9409 }, { "epoch": 0.64, "learning_rate": 6.024044719065476e-06, "loss": 0.7139, "step": 9410 }, { "epoch": 0.64, "learning_rate": 6.022019521040726e-06, "loss": 0.8086, "step": 9411 }, { "epoch": 0.64, "learning_rate": 6.019994516822988e-06, "loss": 0.8467, "step": 9412 }, { "epoch": 0.64, "learning_rate": 6.017969706510924e-06, "loss": 0.8076, "step": 9413 }, { "epoch": 0.64, "learning_rate": 6.015945090203186e-06, "loss": 0.7646, "step": 9414 }, { "epoch": 0.64, "learning_rate": 6.013920667998404e-06, "loss": 0.8252, "step": 9415 }, { "epoch": 0.64, "learning_rate": 6.011896439995217e-06, "loss": 0.6992, "step": 9416 }, { "epoch": 0.64, "learning_rate": 6.009872406292236e-06, "loss": 0.7734, "step": 9417 }, { "epoch": 0.64, "learning_rate": 6.007848566988078e-06, "loss": 0.7676, "step": 9418 }, { "epoch": 0.64, "learning_rate": 6.005824922181346e-06, "loss": 0.7344, "step": 9419 }, { "epoch": 0.64, "learning_rate": 6.003801471970627e-06, "loss": 0.7422, "step": 9420 }, { "epoch": 0.64, "learning_rate": 6.0017782164545065e-06, "loss": 0.7656, "step": 9421 }, { "epoch": 0.64, "learning_rate": 5.999755155731556e-06, "loss": 0.7188, "step": 9422 }, { "epoch": 0.64, "learning_rate": 5.997732289900336e-06, "loss": 0.7793, "step": 9423 }, { "epoch": 0.64, "learning_rate": 5.995709619059408e-06, "loss": 0.7646, "step": 9424 }, { "epoch": 0.64, "learning_rate": 5.99368714330731e-06, "loss": 0.8115, "step": 9425 }, { "epoch": 0.64, "learning_rate": 5.9916648627425815e-06, "loss": 0.7422, "step": 9426 }, { "epoch": 0.64, "learning_rate": 5.9896427774637445e-06, "loss": 0.79, "step": 9427 }, { "epoch": 0.64, "learning_rate": 5.987620887569314e-06, "loss": 0.8154, "step": 9428 }, { "epoch": 0.64, "learning_rate": 5.985599193157796e-06, "loss": 0.8389, "step": 9429 }, { "epoch": 0.64, "learning_rate": 5.9835776943276946e-06, "loss": 0.7852, "step": 9430 }, { "epoch": 0.64, "learning_rate": 5.98155639117749e-06, "loss": 0.793, "step": 9431 }, { "epoch": 0.64, "learning_rate": 5.979535283805663e-06, "loss": 0.8145, "step": 9432 }, { "epoch": 0.64, "learning_rate": 5.97751437231068e-06, "loss": 0.7402, "step": 9433 }, { "epoch": 0.64, "learning_rate": 5.975493656791001e-06, "loss": 0.7812, "step": 9434 }, { "epoch": 0.64, "learning_rate": 5.973473137345073e-06, "loss": 0.791, "step": 9435 }, { "epoch": 0.64, "learning_rate": 5.971452814071338e-06, "loss": 0.7129, "step": 9436 }, { "epoch": 0.64, "learning_rate": 5.969432687068227e-06, "loss": 0.7783, "step": 9437 }, { "epoch": 0.64, "learning_rate": 5.9674127564341585e-06, "loss": 0.8525, "step": 9438 }, { "epoch": 0.64, "learning_rate": 5.965393022267545e-06, "loss": 0.7539, "step": 9439 }, { "epoch": 0.64, "learning_rate": 5.963373484666785e-06, "loss": 0.7383, "step": 9440 }, { "epoch": 0.64, "learning_rate": 5.961354143730269e-06, "loss": 0.8291, "step": 9441 }, { "epoch": 0.64, "learning_rate": 5.959334999556387e-06, "loss": 0.7119, "step": 9442 }, { "epoch": 0.64, "learning_rate": 5.957316052243505e-06, "loss": 0.7812, "step": 9443 }, { "epoch": 0.64, "learning_rate": 5.955297301889988e-06, "loss": 0.7793, "step": 9444 }, { "epoch": 0.64, "learning_rate": 5.953278748594191e-06, "loss": 0.8457, "step": 9445 }, { "epoch": 0.64, "learning_rate": 5.951260392454454e-06, "loss": 0.7666, "step": 9446 }, { "epoch": 0.64, "learning_rate": 5.94924223356911e-06, "loss": 0.7061, "step": 9447 }, { "epoch": 0.64, "learning_rate": 5.947224272036492e-06, "loss": 0.8057, "step": 9448 }, { "epoch": 0.64, "learning_rate": 5.945206507954908e-06, "loss": 0.7139, "step": 9449 }, { "epoch": 0.64, "learning_rate": 5.943188941422667e-06, "loss": 0.8125, "step": 9450 }, { "epoch": 0.64, "learning_rate": 5.9411715725380605e-06, "loss": 0.7822, "step": 9451 }, { "epoch": 0.64, "learning_rate": 5.9391544013993785e-06, "loss": 0.7705, "step": 9452 }, { "epoch": 0.64, "learning_rate": 5.937137428104893e-06, "loss": 0.7705, "step": 9453 }, { "epoch": 0.64, "learning_rate": 5.935120652752875e-06, "loss": 0.8252, "step": 9454 }, { "epoch": 0.64, "learning_rate": 5.933104075441583e-06, "loss": 0.7705, "step": 9455 }, { "epoch": 0.64, "learning_rate": 5.931087696269261e-06, "loss": 0.75, "step": 9456 }, { "epoch": 0.64, "learning_rate": 5.929071515334149e-06, "loss": 0.7559, "step": 9457 }, { "epoch": 0.64, "learning_rate": 5.927055532734473e-06, "loss": 0.8281, "step": 9458 }, { "epoch": 0.64, "learning_rate": 5.92503974856845e-06, "loss": 0.7773, "step": 9459 }, { "epoch": 0.64, "learning_rate": 5.923024162934297e-06, "loss": 0.8086, "step": 9460 }, { "epoch": 0.64, "learning_rate": 5.9210087759302055e-06, "loss": 0.7754, "step": 9461 }, { "epoch": 0.64, "learning_rate": 5.918993587654367e-06, "loss": 0.7764, "step": 9462 }, { "epoch": 0.64, "learning_rate": 5.916978598204964e-06, "loss": 0.7754, "step": 9463 }, { "epoch": 0.64, "learning_rate": 5.914963807680163e-06, "loss": 0.7393, "step": 9464 }, { "epoch": 0.65, "learning_rate": 5.912949216178123e-06, "loss": 0.7793, "step": 9465 }, { "epoch": 0.65, "learning_rate": 5.910934823797003e-06, "loss": 0.748, "step": 9466 }, { "epoch": 0.65, "learning_rate": 5.908920630634937e-06, "loss": 0.7832, "step": 9467 }, { "epoch": 0.65, "learning_rate": 5.90690663679006e-06, "loss": 0.7754, "step": 9468 }, { "epoch": 0.65, "learning_rate": 5.90489284236049e-06, "loss": 0.8193, "step": 9469 }, { "epoch": 0.65, "learning_rate": 5.902879247444342e-06, "loss": 0.7373, "step": 9470 }, { "epoch": 0.65, "learning_rate": 5.900865852139715e-06, "loss": 0.7383, "step": 9471 }, { "epoch": 0.65, "learning_rate": 5.898852656544705e-06, "loss": 0.6523, "step": 9472 }, { "epoch": 0.65, "learning_rate": 5.896839660757394e-06, "loss": 0.752, "step": 9473 }, { "epoch": 0.65, "learning_rate": 5.894826864875856e-06, "loss": 0.7383, "step": 9474 }, { "epoch": 0.65, "learning_rate": 5.892814268998152e-06, "loss": 0.8037, "step": 9475 }, { "epoch": 0.65, "learning_rate": 5.890801873222336e-06, "loss": 0.7324, "step": 9476 }, { "epoch": 0.65, "learning_rate": 5.88878967764645e-06, "loss": 0.8174, "step": 9477 }, { "epoch": 0.65, "learning_rate": 5.886777682368534e-06, "loss": 0.748, "step": 9478 }, { "epoch": 0.65, "learning_rate": 5.884765887486609e-06, "loss": 0.7441, "step": 9479 }, { "epoch": 0.65, "learning_rate": 5.882754293098687e-06, "loss": 0.7871, "step": 9480 }, { "epoch": 0.65, "learning_rate": 5.880742899302778e-06, "loss": 0.7793, "step": 9481 }, { "epoch": 0.65, "learning_rate": 5.878731706196872e-06, "loss": 0.7393, "step": 9482 }, { "epoch": 0.65, "learning_rate": 5.876720713878953e-06, "loss": 0.751, "step": 9483 }, { "epoch": 0.65, "learning_rate": 5.874709922447004e-06, "loss": 0.7812, "step": 9484 }, { "epoch": 0.65, "learning_rate": 5.8726993319989855e-06, "loss": 0.7988, "step": 9485 }, { "epoch": 0.65, "learning_rate": 5.870688942632856e-06, "loss": 0.7451, "step": 9486 }, { "epoch": 0.65, "learning_rate": 5.8686787544465575e-06, "loss": 0.7764, "step": 9487 }, { "epoch": 0.65, "learning_rate": 5.866668767538031e-06, "loss": 0.8037, "step": 9488 }, { "epoch": 0.65, "learning_rate": 5.864658982005196e-06, "loss": 0.6982, "step": 9489 }, { "epoch": 0.65, "learning_rate": 5.862649397945976e-06, "loss": 0.8086, "step": 9490 }, { "epoch": 0.65, "learning_rate": 5.8606400154582764e-06, "loss": 0.7617, "step": 9491 }, { "epoch": 0.65, "learning_rate": 5.8586308346399935e-06, "loss": 0.7236, "step": 9492 }, { "epoch": 0.65, "learning_rate": 5.856621855589015e-06, "loss": 0.7266, "step": 9493 }, { "epoch": 0.65, "learning_rate": 5.854613078403215e-06, "loss": 0.7979, "step": 9494 }, { "epoch": 0.65, "learning_rate": 5.852604503180463e-06, "loss": 0.791, "step": 9495 }, { "epoch": 0.65, "learning_rate": 5.850596130018622e-06, "loss": 0.7402, "step": 9496 }, { "epoch": 0.65, "learning_rate": 5.848587959015534e-06, "loss": 0.7773, "step": 9497 }, { "epoch": 0.65, "learning_rate": 5.846579990269037e-06, "loss": 0.6865, "step": 9498 }, { "epoch": 0.65, "learning_rate": 5.844572223876961e-06, "loss": 0.7881, "step": 9499 }, { "epoch": 0.65, "learning_rate": 5.842564659937122e-06, "loss": 0.8086, "step": 9500 }, { "epoch": 0.65, "learning_rate": 5.840557298547329e-06, "loss": 0.7197, "step": 9501 }, { "epoch": 0.65, "learning_rate": 5.838550139805384e-06, "loss": 0.7715, "step": 9502 }, { "epoch": 0.65, "learning_rate": 5.8365431838090744e-06, "loss": 0.749, "step": 9503 }, { "epoch": 0.65, "learning_rate": 5.834536430656176e-06, "loss": 0.748, "step": 9504 }, { "epoch": 0.65, "learning_rate": 5.83252988044446e-06, "loss": 0.751, "step": 9505 }, { "epoch": 0.65, "learning_rate": 5.830523533271683e-06, "loss": 0.751, "step": 9506 }, { "epoch": 0.65, "learning_rate": 5.828517389235598e-06, "loss": 0.7441, "step": 9507 }, { "epoch": 0.65, "learning_rate": 5.826511448433941e-06, "loss": 0.7402, "step": 9508 }, { "epoch": 0.65, "learning_rate": 5.824505710964443e-06, "loss": 0.8457, "step": 9509 }, { "epoch": 0.65, "learning_rate": 5.822500176924828e-06, "loss": 0.8311, "step": 9510 }, { "epoch": 0.65, "learning_rate": 5.820494846412796e-06, "loss": 0.7881, "step": 9511 }, { "epoch": 0.65, "learning_rate": 5.8184897195260514e-06, "loss": 0.7627, "step": 9512 }, { "epoch": 0.65, "learning_rate": 5.816484796362284e-06, "loss": 0.793, "step": 9513 }, { "epoch": 0.65, "learning_rate": 5.814480077019173e-06, "loss": 0.7109, "step": 9514 }, { "epoch": 0.65, "learning_rate": 5.812475561594388e-06, "loss": 0.6836, "step": 9515 }, { "epoch": 0.65, "learning_rate": 5.8104712501855944e-06, "loss": 0.8115, "step": 9516 }, { "epoch": 0.65, "learning_rate": 5.808467142890432e-06, "loss": 0.8096, "step": 9517 }, { "epoch": 0.65, "learning_rate": 5.806463239806548e-06, "loss": 0.7129, "step": 9518 }, { "epoch": 0.65, "learning_rate": 5.804459541031569e-06, "loss": 0.874, "step": 9519 }, { "epoch": 0.65, "learning_rate": 5.802456046663117e-06, "loss": 0.7656, "step": 9520 }, { "epoch": 0.65, "learning_rate": 5.800452756798802e-06, "loss": 0.8008, "step": 9521 }, { "epoch": 0.65, "learning_rate": 5.798449671536224e-06, "loss": 0.7764, "step": 9522 }, { "epoch": 0.65, "learning_rate": 5.796446790972976e-06, "loss": 0.7676, "step": 9523 }, { "epoch": 0.65, "learning_rate": 5.794444115206632e-06, "loss": 0.752, "step": 9524 }, { "epoch": 0.65, "learning_rate": 5.792441644334761e-06, "loss": 0.8359, "step": 9525 }, { "epoch": 0.65, "learning_rate": 5.790439378454936e-06, "loss": 0.8486, "step": 9526 }, { "epoch": 0.65, "learning_rate": 5.7884373176646965e-06, "loss": 0.7666, "step": 9527 }, { "epoch": 0.65, "learning_rate": 5.786435462061584e-06, "loss": 0.8145, "step": 9528 }, { "epoch": 0.65, "learning_rate": 5.784433811743131e-06, "loss": 0.79, "step": 9529 }, { "epoch": 0.65, "learning_rate": 5.7824323668068605e-06, "loss": 0.8623, "step": 9530 }, { "epoch": 0.65, "learning_rate": 5.780431127350272e-06, "loss": 0.7734, "step": 9531 }, { "epoch": 0.65, "learning_rate": 5.778430093470881e-06, "loss": 0.748, "step": 9532 }, { "epoch": 0.65, "learning_rate": 5.776429265266167e-06, "loss": 0.7627, "step": 9533 }, { "epoch": 0.65, "learning_rate": 5.774428642833611e-06, "loss": 0.7861, "step": 9534 }, { "epoch": 0.65, "learning_rate": 5.772428226270688e-06, "loss": 0.8223, "step": 9535 }, { "epoch": 0.65, "learning_rate": 5.7704280156748535e-06, "loss": 0.7988, "step": 9536 }, { "epoch": 0.65, "learning_rate": 5.768428011143561e-06, "loss": 0.7998, "step": 9537 }, { "epoch": 0.65, "learning_rate": 5.76642821277425e-06, "loss": 0.8252, "step": 9538 }, { "epoch": 0.65, "learning_rate": 5.764428620664353e-06, "loss": 0.8291, "step": 9539 }, { "epoch": 0.65, "learning_rate": 5.762429234911283e-06, "loss": 0.6738, "step": 9540 }, { "epoch": 0.65, "learning_rate": 5.760430055612453e-06, "loss": 0.8477, "step": 9541 }, { "epoch": 0.65, "learning_rate": 5.758431082865267e-06, "loss": 0.7891, "step": 9542 }, { "epoch": 0.65, "learning_rate": 5.75643231676711e-06, "loss": 0.7666, "step": 9543 }, { "epoch": 0.65, "learning_rate": 5.754433757415363e-06, "loss": 0.8301, "step": 9544 }, { "epoch": 0.65, "learning_rate": 5.752435404907397e-06, "loss": 0.791, "step": 9545 }, { "epoch": 0.65, "learning_rate": 5.750437259340576e-06, "loss": 0.7451, "step": 9546 }, { "epoch": 0.65, "learning_rate": 5.748439320812238e-06, "loss": 0.791, "step": 9547 }, { "epoch": 0.65, "learning_rate": 5.7464415894197266e-06, "loss": 0.7773, "step": 9548 }, { "epoch": 0.65, "learning_rate": 5.744444065260382e-06, "loss": 0.7832, "step": 9549 }, { "epoch": 0.65, "learning_rate": 5.742446748431509e-06, "loss": 0.7656, "step": 9550 }, { "epoch": 0.65, "learning_rate": 5.740449639030424e-06, "loss": 0.7324, "step": 9551 }, { "epoch": 0.65, "learning_rate": 5.7384527371544295e-06, "loss": 0.7695, "step": 9552 }, { "epoch": 0.65, "learning_rate": 5.736456042900804e-06, "loss": 0.8389, "step": 9553 }, { "epoch": 0.65, "learning_rate": 5.734459556366831e-06, "loss": 0.7334, "step": 9554 }, { "epoch": 0.65, "learning_rate": 5.732463277649787e-06, "loss": 0.7031, "step": 9555 }, { "epoch": 0.65, "learning_rate": 5.730467206846919e-06, "loss": 0.6846, "step": 9556 }, { "epoch": 0.65, "learning_rate": 5.728471344055482e-06, "loss": 0.8154, "step": 9557 }, { "epoch": 0.65, "learning_rate": 5.726475689372711e-06, "loss": 0.8037, "step": 9558 }, { "epoch": 0.65, "learning_rate": 5.724480242895842e-06, "loss": 0.8457, "step": 9559 }, { "epoch": 0.65, "learning_rate": 5.722485004722078e-06, "loss": 0.6318, "step": 9560 }, { "epoch": 0.65, "learning_rate": 5.72048997494864e-06, "loss": 0.7988, "step": 9561 }, { "epoch": 0.65, "learning_rate": 5.7184951536727255e-06, "loss": 0.7373, "step": 9562 }, { "epoch": 0.65, "learning_rate": 5.716500540991514e-06, "loss": 0.834, "step": 9563 }, { "epoch": 0.65, "learning_rate": 5.7145061370021885e-06, "loss": 0.8389, "step": 9564 }, { "epoch": 0.65, "learning_rate": 5.712511941801918e-06, "loss": 0.71, "step": 9565 }, { "epoch": 0.65, "learning_rate": 5.7105179554878484e-06, "loss": 0.793, "step": 9566 }, { "epoch": 0.65, "learning_rate": 5.70852417815714e-06, "loss": 0.7471, "step": 9567 }, { "epoch": 0.65, "learning_rate": 5.706530609906928e-06, "loss": 0.709, "step": 9568 }, { "epoch": 0.65, "learning_rate": 5.704537250834331e-06, "loss": 0.8066, "step": 9569 }, { "epoch": 0.65, "learning_rate": 5.702544101036469e-06, "loss": 0.7266, "step": 9570 }, { "epoch": 0.65, "learning_rate": 5.70055116061045e-06, "loss": 0.7422, "step": 9571 }, { "epoch": 0.65, "learning_rate": 5.698558429653369e-06, "loss": 0.7412, "step": 9572 }, { "epoch": 0.65, "learning_rate": 5.69656590826231e-06, "loss": 0.8369, "step": 9573 }, { "epoch": 0.65, "learning_rate": 5.694573596534352e-06, "loss": 0.8916, "step": 9574 }, { "epoch": 0.65, "learning_rate": 5.69258149456656e-06, "loss": 0.6924, "step": 9575 }, { "epoch": 0.65, "learning_rate": 5.690589602455986e-06, "loss": 0.7783, "step": 9576 }, { "epoch": 0.65, "learning_rate": 5.688597920299675e-06, "loss": 0.7939, "step": 9577 }, { "epoch": 0.65, "learning_rate": 5.686606448194664e-06, "loss": 0.7646, "step": 9578 }, { "epoch": 0.65, "learning_rate": 5.684615186237976e-06, "loss": 0.8496, "step": 9579 }, { "epoch": 0.65, "learning_rate": 5.682624134526625e-06, "loss": 0.7979, "step": 9580 }, { "epoch": 0.65, "learning_rate": 5.680633293157616e-06, "loss": 0.8125, "step": 9581 }, { "epoch": 0.65, "learning_rate": 5.678642662227947e-06, "loss": 0.7773, "step": 9582 }, { "epoch": 0.65, "learning_rate": 5.676652241834593e-06, "loss": 0.793, "step": 9583 }, { "epoch": 0.65, "learning_rate": 5.674662032074529e-06, "loss": 0.7158, "step": 9584 }, { "epoch": 0.65, "learning_rate": 5.672672033044721e-06, "loss": 0.709, "step": 9585 }, { "epoch": 0.65, "learning_rate": 5.67068224484212e-06, "loss": 0.6973, "step": 9586 }, { "epoch": 0.65, "learning_rate": 5.668692667563671e-06, "loss": 0.7432, "step": 9587 }, { "epoch": 0.65, "learning_rate": 5.666703301306307e-06, "loss": 0.7676, "step": 9588 }, { "epoch": 0.65, "learning_rate": 5.664714146166942e-06, "loss": 0.7363, "step": 9589 }, { "epoch": 0.65, "learning_rate": 5.662725202242488e-06, "loss": 0.7598, "step": 9590 }, { "epoch": 0.65, "learning_rate": 5.6607364696298595e-06, "loss": 0.7656, "step": 9591 }, { "epoch": 0.65, "learning_rate": 5.658747948425935e-06, "loss": 0.7627, "step": 9592 }, { "epoch": 0.65, "learning_rate": 5.656759638727598e-06, "loss": 0.7559, "step": 9593 }, { "epoch": 0.65, "learning_rate": 5.654771540631721e-06, "loss": 0.8154, "step": 9594 }, { "epoch": 0.65, "learning_rate": 5.652783654235164e-06, "loss": 0.7773, "step": 9595 }, { "epoch": 0.65, "learning_rate": 5.650795979634769e-06, "loss": 0.8066, "step": 9596 }, { "epoch": 0.65, "learning_rate": 5.648808516927387e-06, "loss": 0.7822, "step": 9597 }, { "epoch": 0.65, "learning_rate": 5.646821266209843e-06, "loss": 0.7969, "step": 9598 }, { "epoch": 0.65, "learning_rate": 5.644834227578952e-06, "loss": 0.7285, "step": 9599 }, { "epoch": 0.65, "learning_rate": 5.642847401131526e-06, "loss": 0.8408, "step": 9600 }, { "epoch": 0.65, "learning_rate": 5.640860786964364e-06, "loss": 0.792, "step": 9601 }, { "epoch": 0.65, "learning_rate": 5.638874385174246e-06, "loss": 0.7266, "step": 9602 }, { "epoch": 0.65, "learning_rate": 5.636888195857958e-06, "loss": 0.8213, "step": 9603 }, { "epoch": 0.65, "learning_rate": 5.634902219112268e-06, "loss": 0.7881, "step": 9604 }, { "epoch": 0.65, "learning_rate": 5.632916455033926e-06, "loss": 0.7559, "step": 9605 }, { "epoch": 0.65, "learning_rate": 5.630930903719682e-06, "loss": 0.7725, "step": 9606 }, { "epoch": 0.65, "learning_rate": 5.62894556526627e-06, "loss": 0.8584, "step": 9607 }, { "epoch": 0.65, "learning_rate": 5.626960439770417e-06, "loss": 0.7725, "step": 9608 }, { "epoch": 0.65, "learning_rate": 5.624975527328839e-06, "loss": 0.7119, "step": 9609 }, { "epoch": 0.65, "learning_rate": 5.62299082803824e-06, "loss": 0.8301, "step": 9610 }, { "epoch": 0.65, "learning_rate": 5.621006341995316e-06, "loss": 0.752, "step": 9611 }, { "epoch": 0.66, "learning_rate": 5.619022069296749e-06, "loss": 0.873, "step": 9612 }, { "epoch": 0.66, "learning_rate": 5.617038010039211e-06, "loss": 0.7881, "step": 9613 }, { "epoch": 0.66, "learning_rate": 5.615054164319367e-06, "loss": 0.7881, "step": 9614 }, { "epoch": 0.66, "learning_rate": 5.613070532233871e-06, "loss": 0.7686, "step": 9615 }, { "epoch": 0.66, "learning_rate": 5.6110871138793656e-06, "loss": 0.7607, "step": 9616 }, { "epoch": 0.66, "learning_rate": 5.609103909352485e-06, "loss": 0.7007, "step": 9617 }, { "epoch": 0.66, "learning_rate": 5.607120918749844e-06, "loss": 0.6826, "step": 9618 }, { "epoch": 0.66, "learning_rate": 5.605138142168058e-06, "loss": 0.6738, "step": 9619 }, { "epoch": 0.66, "learning_rate": 5.603155579703726e-06, "loss": 0.7461, "step": 9620 }, { "epoch": 0.66, "learning_rate": 5.60117323145344e-06, "loss": 0.7402, "step": 9621 }, { "epoch": 0.66, "learning_rate": 5.599191097513781e-06, "loss": 0.7373, "step": 9622 }, { "epoch": 0.66, "learning_rate": 5.5972091779813174e-06, "loss": 0.7783, "step": 9623 }, { "epoch": 0.66, "learning_rate": 5.595227472952611e-06, "loss": 0.7959, "step": 9624 }, { "epoch": 0.66, "learning_rate": 5.593245982524203e-06, "loss": 0.8721, "step": 9625 }, { "epoch": 0.66, "learning_rate": 5.591264706792632e-06, "loss": 0.7207, "step": 9626 }, { "epoch": 0.66, "learning_rate": 5.5892836458544376e-06, "loss": 0.8174, "step": 9627 }, { "epoch": 0.66, "learning_rate": 5.587302799806125e-06, "loss": 0.7598, "step": 9628 }, { "epoch": 0.66, "learning_rate": 5.585322168744205e-06, "loss": 0.8721, "step": 9629 }, { "epoch": 0.66, "learning_rate": 5.583341752765173e-06, "loss": 0.7617, "step": 9630 }, { "epoch": 0.66, "learning_rate": 5.581361551965521e-06, "loss": 0.8164, "step": 9631 }, { "epoch": 0.66, "learning_rate": 5.579381566441709e-06, "loss": 0.7285, "step": 9632 }, { "epoch": 0.66, "learning_rate": 5.577401796290216e-06, "loss": 0.6523, "step": 9633 }, { "epoch": 0.66, "learning_rate": 5.575422241607495e-06, "loss": 0.7852, "step": 9634 }, { "epoch": 0.66, "learning_rate": 5.573442902489984e-06, "loss": 0.8096, "step": 9635 }, { "epoch": 0.66, "learning_rate": 5.5714637790341184e-06, "loss": 0.7549, "step": 9636 }, { "epoch": 0.66, "learning_rate": 5.569484871336326e-06, "loss": 0.748, "step": 9637 }, { "epoch": 0.66, "learning_rate": 5.5675061794930055e-06, "loss": 0.7695, "step": 9638 }, { "epoch": 0.66, "learning_rate": 5.565527703600573e-06, "loss": 0.7744, "step": 9639 }, { "epoch": 0.66, "learning_rate": 5.563549443755417e-06, "loss": 0.7256, "step": 9640 }, { "epoch": 0.66, "learning_rate": 5.5615714000539135e-06, "loss": 0.8242, "step": 9641 }, { "epoch": 0.66, "learning_rate": 5.559593572592434e-06, "loss": 0.7607, "step": 9642 }, { "epoch": 0.66, "learning_rate": 5.557615961467338e-06, "loss": 0.751, "step": 9643 }, { "epoch": 0.66, "learning_rate": 5.555638566774978e-06, "loss": 0.8066, "step": 9644 }, { "epoch": 0.66, "learning_rate": 5.553661388611688e-06, "loss": 0.7998, "step": 9645 }, { "epoch": 0.66, "learning_rate": 5.5516844270738e-06, "loss": 0.7783, "step": 9646 }, { "epoch": 0.66, "learning_rate": 5.549707682257634e-06, "loss": 0.793, "step": 9647 }, { "epoch": 0.66, "learning_rate": 5.547731154259488e-06, "loss": 0.874, "step": 9648 }, { "epoch": 0.66, "learning_rate": 5.545754843175663e-06, "loss": 0.7559, "step": 9649 }, { "epoch": 0.66, "learning_rate": 5.5437787491024445e-06, "loss": 0.7725, "step": 9650 }, { "epoch": 0.66, "learning_rate": 5.541802872136108e-06, "loss": 0.7686, "step": 9651 }, { "epoch": 0.66, "learning_rate": 5.539827212372919e-06, "loss": 0.7422, "step": 9652 }, { "epoch": 0.66, "learning_rate": 5.537851769909135e-06, "loss": 0.7285, "step": 9653 }, { "epoch": 0.66, "learning_rate": 5.5358765448409905e-06, "loss": 0.6914, "step": 9654 }, { "epoch": 0.66, "learning_rate": 5.533901537264719e-06, "loss": 0.8408, "step": 9655 }, { "epoch": 0.66, "learning_rate": 5.531926747276554e-06, "loss": 0.7861, "step": 9656 }, { "epoch": 0.66, "learning_rate": 5.529952174972697e-06, "loss": 0.8701, "step": 9657 }, { "epoch": 0.66, "learning_rate": 5.527977820449351e-06, "loss": 0.7881, "step": 9658 }, { "epoch": 0.66, "learning_rate": 5.526003683802709e-06, "loss": 0.8623, "step": 9659 }, { "epoch": 0.66, "learning_rate": 5.524029765128952e-06, "loss": 0.7939, "step": 9660 }, { "epoch": 0.66, "learning_rate": 5.52205606452424e-06, "loss": 0.8115, "step": 9661 }, { "epoch": 0.66, "learning_rate": 5.52008258208474e-06, "loss": 0.79, "step": 9662 }, { "epoch": 0.66, "learning_rate": 5.5181093179066035e-06, "loss": 0.7227, "step": 9663 }, { "epoch": 0.66, "learning_rate": 5.516136272085959e-06, "loss": 0.7529, "step": 9664 }, { "epoch": 0.66, "learning_rate": 5.514163444718937e-06, "loss": 0.751, "step": 9665 }, { "epoch": 0.66, "learning_rate": 5.5121908359016516e-06, "loss": 0.751, "step": 9666 }, { "epoch": 0.66, "learning_rate": 5.510218445730211e-06, "loss": 0.8311, "step": 9667 }, { "epoch": 0.66, "learning_rate": 5.5082462743007085e-06, "loss": 0.7656, "step": 9668 }, { "epoch": 0.66, "learning_rate": 5.506274321709229e-06, "loss": 0.7314, "step": 9669 }, { "epoch": 0.66, "learning_rate": 5.504302588051847e-06, "loss": 0.7246, "step": 9670 }, { "epoch": 0.66, "learning_rate": 5.502331073424621e-06, "loss": 0.7139, "step": 9671 }, { "epoch": 0.66, "learning_rate": 5.500359777923607e-06, "loss": 0.8174, "step": 9672 }, { "epoch": 0.66, "learning_rate": 5.498388701644845e-06, "loss": 0.7422, "step": 9673 }, { "epoch": 0.66, "learning_rate": 5.496417844684365e-06, "loss": 0.709, "step": 9674 }, { "epoch": 0.66, "learning_rate": 5.494447207138187e-06, "loss": 0.792, "step": 9675 }, { "epoch": 0.66, "learning_rate": 5.492476789102328e-06, "loss": 0.6934, "step": 9676 }, { "epoch": 0.66, "learning_rate": 5.490506590672774e-06, "loss": 0.7393, "step": 9677 }, { "epoch": 0.66, "learning_rate": 5.48853661194552e-06, "loss": 0.7734, "step": 9678 }, { "epoch": 0.66, "learning_rate": 5.486566853016542e-06, "loss": 0.707, "step": 9679 }, { "epoch": 0.66, "learning_rate": 5.484597313981805e-06, "loss": 0.7949, "step": 9680 }, { "epoch": 0.66, "learning_rate": 5.4826279949372686e-06, "loss": 0.7852, "step": 9681 }, { "epoch": 0.66, "learning_rate": 5.4806588959788766e-06, "loss": 0.668, "step": 9682 }, { "epoch": 0.66, "learning_rate": 5.478690017202566e-06, "loss": 0.7803, "step": 9683 }, { "epoch": 0.66, "learning_rate": 5.476721358704253e-06, "loss": 0.7314, "step": 9684 }, { "epoch": 0.66, "learning_rate": 5.474752920579851e-06, "loss": 0.7266, "step": 9685 }, { "epoch": 0.66, "learning_rate": 5.4727847029252735e-06, "loss": 0.8008, "step": 9686 }, { "epoch": 0.66, "learning_rate": 5.470816705836401e-06, "loss": 0.7412, "step": 9687 }, { "epoch": 0.66, "learning_rate": 5.468848929409119e-06, "loss": 0.7686, "step": 9688 }, { "epoch": 0.66, "learning_rate": 5.466881373739298e-06, "loss": 0.7715, "step": 9689 }, { "epoch": 0.66, "learning_rate": 5.464914038922793e-06, "loss": 0.748, "step": 9690 }, { "epoch": 0.66, "learning_rate": 5.46294692505545e-06, "loss": 0.7207, "step": 9691 }, { "epoch": 0.66, "learning_rate": 5.460980032233118e-06, "loss": 0.8545, "step": 9692 }, { "epoch": 0.66, "learning_rate": 5.4590133605516174e-06, "loss": 0.7686, "step": 9693 }, { "epoch": 0.66, "learning_rate": 5.4570469101067614e-06, "loss": 0.7627, "step": 9694 }, { "epoch": 0.66, "learning_rate": 5.455080680994359e-06, "loss": 0.7295, "step": 9695 }, { "epoch": 0.66, "learning_rate": 5.453114673310209e-06, "loss": 0.8037, "step": 9696 }, { "epoch": 0.66, "learning_rate": 5.451148887150082e-06, "loss": 0.8232, "step": 9697 }, { "epoch": 0.66, "learning_rate": 5.449183322609763e-06, "loss": 0.7881, "step": 9698 }, { "epoch": 0.66, "learning_rate": 5.447217979785014e-06, "loss": 0.7158, "step": 9699 }, { "epoch": 0.66, "learning_rate": 5.44525285877158e-06, "loss": 0.8311, "step": 9700 }, { "epoch": 0.66, "learning_rate": 5.443287959665205e-06, "loss": 0.7725, "step": 9701 }, { "epoch": 0.66, "learning_rate": 5.441323282561617e-06, "loss": 0.7588, "step": 9702 }, { "epoch": 0.66, "learning_rate": 5.439358827556538e-06, "loss": 0.7979, "step": 9703 }, { "epoch": 0.66, "learning_rate": 5.437394594745673e-06, "loss": 0.7754, "step": 9704 }, { "epoch": 0.66, "learning_rate": 5.435430584224726e-06, "loss": 0.7822, "step": 9705 }, { "epoch": 0.66, "learning_rate": 5.433466796089373e-06, "loss": 0.7441, "step": 9706 }, { "epoch": 0.66, "learning_rate": 5.431503230435296e-06, "loss": 0.7021, "step": 9707 }, { "epoch": 0.66, "learning_rate": 5.429539887358159e-06, "loss": 0.7754, "step": 9708 }, { "epoch": 0.66, "learning_rate": 5.427576766953615e-06, "loss": 0.8057, "step": 9709 }, { "epoch": 0.66, "learning_rate": 5.425613869317309e-06, "loss": 0.8066, "step": 9710 }, { "epoch": 0.66, "learning_rate": 5.423651194544871e-06, "loss": 0.8232, "step": 9711 }, { "epoch": 0.66, "learning_rate": 5.421688742731929e-06, "loss": 0.8066, "step": 9712 }, { "epoch": 0.66, "learning_rate": 5.419726513974083e-06, "loss": 0.8086, "step": 9713 }, { "epoch": 0.66, "learning_rate": 5.4177645083669385e-06, "loss": 0.8486, "step": 9714 }, { "epoch": 0.66, "learning_rate": 5.415802726006083e-06, "loss": 0.7852, "step": 9715 }, { "epoch": 0.66, "learning_rate": 5.413841166987096e-06, "loss": 0.7373, "step": 9716 }, { "epoch": 0.66, "learning_rate": 5.411879831405543e-06, "loss": 0.7656, "step": 9717 }, { "epoch": 0.66, "learning_rate": 5.4099187193569815e-06, "loss": 0.8027, "step": 9718 }, { "epoch": 0.66, "learning_rate": 5.407957830936959e-06, "loss": 0.8164, "step": 9719 }, { "epoch": 0.66, "learning_rate": 5.405997166241003e-06, "loss": 0.7266, "step": 9720 }, { "epoch": 0.66, "learning_rate": 5.40403672536464e-06, "loss": 0.7559, "step": 9721 }, { "epoch": 0.66, "learning_rate": 5.402076508403389e-06, "loss": 0.7422, "step": 9722 }, { "epoch": 0.66, "learning_rate": 5.4001165154527426e-06, "loss": 0.7627, "step": 9723 }, { "epoch": 0.66, "learning_rate": 5.398156746608197e-06, "loss": 0.709, "step": 9724 }, { "epoch": 0.66, "learning_rate": 5.396197201965232e-06, "loss": 0.8008, "step": 9725 }, { "epoch": 0.66, "learning_rate": 5.394237881619311e-06, "loss": 0.7393, "step": 9726 }, { "epoch": 0.66, "learning_rate": 5.392278785665892e-06, "loss": 0.8633, "step": 9727 }, { "epoch": 0.66, "learning_rate": 5.390319914200435e-06, "loss": 0.6787, "step": 9728 }, { "epoch": 0.66, "learning_rate": 5.388361267318362e-06, "loss": 0.7734, "step": 9729 }, { "epoch": 0.66, "learning_rate": 5.386402845115103e-06, "loss": 0.8125, "step": 9730 }, { "epoch": 0.66, "learning_rate": 5.3844446476860725e-06, "loss": 0.7764, "step": 9731 }, { "epoch": 0.66, "learning_rate": 5.382486675126678e-06, "loss": 0.7314, "step": 9732 }, { "epoch": 0.66, "learning_rate": 5.380528927532299e-06, "loss": 0.8271, "step": 9733 }, { "epoch": 0.66, "learning_rate": 5.37857140499833e-06, "loss": 0.75, "step": 9734 }, { "epoch": 0.66, "learning_rate": 5.376614107620141e-06, "loss": 0.7617, "step": 9735 }, { "epoch": 0.66, "learning_rate": 5.374657035493083e-06, "loss": 0.8125, "step": 9736 }, { "epoch": 0.66, "learning_rate": 5.372700188712508e-06, "loss": 0.7822, "step": 9737 }, { "epoch": 0.66, "learning_rate": 5.370743567373759e-06, "loss": 0.7383, "step": 9738 }, { "epoch": 0.66, "learning_rate": 5.36878717157215e-06, "loss": 0.751, "step": 9739 }, { "epoch": 0.66, "learning_rate": 5.366831001403006e-06, "loss": 0.7861, "step": 9740 }, { "epoch": 0.66, "learning_rate": 5.364875056961636e-06, "loss": 0.8037, "step": 9741 }, { "epoch": 0.66, "learning_rate": 5.362919338343322e-06, "loss": 0.7539, "step": 9742 }, { "epoch": 0.66, "learning_rate": 5.360963845643352e-06, "loss": 0.7793, "step": 9743 }, { "epoch": 0.66, "learning_rate": 5.359008578956997e-06, "loss": 0.8398, "step": 9744 }, { "epoch": 0.66, "learning_rate": 5.357053538379517e-06, "loss": 0.6572, "step": 9745 }, { "epoch": 0.66, "learning_rate": 5.355098724006164e-06, "loss": 0.7285, "step": 9746 }, { "epoch": 0.66, "learning_rate": 5.3531441359321735e-06, "loss": 0.8242, "step": 9747 }, { "epoch": 0.66, "learning_rate": 5.3511897742527784e-06, "loss": 0.8096, "step": 9748 }, { "epoch": 0.66, "learning_rate": 5.349235639063186e-06, "loss": 0.7461, "step": 9749 }, { "epoch": 0.66, "learning_rate": 5.3472817304586065e-06, "loss": 0.7588, "step": 9750 }, { "epoch": 0.66, "learning_rate": 5.345328048534235e-06, "loss": 0.749, "step": 9751 }, { "epoch": 0.66, "learning_rate": 5.343374593385254e-06, "loss": 0.7715, "step": 9752 }, { "epoch": 0.66, "learning_rate": 5.341421365106836e-06, "loss": 0.7373, "step": 9753 }, { "epoch": 0.66, "learning_rate": 5.339468363794142e-06, "loss": 0.7236, "step": 9754 }, { "epoch": 0.66, "learning_rate": 5.3375155895423245e-06, "loss": 0.8096, "step": 9755 }, { "epoch": 0.66, "learning_rate": 5.335563042446517e-06, "loss": 0.7568, "step": 9756 }, { "epoch": 0.66, "learning_rate": 5.333610722601852e-06, "loss": 0.6719, "step": 9757 }, { "epoch": 0.66, "learning_rate": 5.331658630103442e-06, "loss": 0.7529, "step": 9758 }, { "epoch": 0.67, "learning_rate": 5.329706765046399e-06, "loss": 0.7178, "step": 9759 }, { "epoch": 0.67, "learning_rate": 5.327755127525813e-06, "loss": 0.8301, "step": 9760 }, { "epoch": 0.67, "learning_rate": 5.325803717636773e-06, "loss": 0.7686, "step": 9761 }, { "epoch": 0.67, "learning_rate": 5.3238525354743455e-06, "loss": 0.8525, "step": 9762 }, { "epoch": 0.67, "learning_rate": 5.3219015811335885e-06, "loss": 0.7686, "step": 9763 }, { "epoch": 0.67, "learning_rate": 5.319950854709568e-06, "loss": 0.7295, "step": 9764 }, { "epoch": 0.67, "learning_rate": 5.318000356297308e-06, "loss": 0.7959, "step": 9765 }, { "epoch": 0.67, "learning_rate": 5.316050085991844e-06, "loss": 0.7197, "step": 9766 }, { "epoch": 0.67, "learning_rate": 5.314100043888191e-06, "loss": 0.6934, "step": 9767 }, { "epoch": 0.67, "learning_rate": 5.312150230081359e-06, "loss": 0.6992, "step": 9768 }, { "epoch": 0.67, "learning_rate": 5.31020064466633e-06, "loss": 0.832, "step": 9769 }, { "epoch": 0.67, "learning_rate": 5.3082512877381025e-06, "loss": 0.834, "step": 9770 }, { "epoch": 0.67, "learning_rate": 5.306302159391647e-06, "loss": 0.7607, "step": 9771 }, { "epoch": 0.67, "learning_rate": 5.304353259721917e-06, "loss": 0.7539, "step": 9772 }, { "epoch": 0.67, "learning_rate": 5.302404588823869e-06, "loss": 0.791, "step": 9773 }, { "epoch": 0.67, "learning_rate": 5.3004561467924386e-06, "loss": 0.7676, "step": 9774 }, { "epoch": 0.67, "learning_rate": 5.2985079337225556e-06, "loss": 0.8203, "step": 9775 }, { "epoch": 0.67, "learning_rate": 5.2965599497091365e-06, "loss": 0.7764, "step": 9776 }, { "epoch": 0.67, "learning_rate": 5.2946121948470915e-06, "loss": 0.748, "step": 9777 }, { "epoch": 0.67, "learning_rate": 5.2926646692313076e-06, "loss": 0.7363, "step": 9778 }, { "epoch": 0.67, "learning_rate": 5.290717372956671e-06, "loss": 0.7148, "step": 9779 }, { "epoch": 0.67, "learning_rate": 5.288770306118055e-06, "loss": 0.8018, "step": 9780 }, { "epoch": 0.67, "learning_rate": 5.286823468810319e-06, "loss": 0.6572, "step": 9781 }, { "epoch": 0.67, "learning_rate": 5.284876861128314e-06, "loss": 0.7383, "step": 9782 }, { "epoch": 0.67, "learning_rate": 5.2829304831668795e-06, "loss": 0.8633, "step": 9783 }, { "epoch": 0.67, "learning_rate": 5.280984335020844e-06, "loss": 0.8037, "step": 9784 }, { "epoch": 0.67, "learning_rate": 5.2790384167850185e-06, "loss": 0.7998, "step": 9785 }, { "epoch": 0.67, "learning_rate": 5.2770927285542074e-06, "loss": 0.7812, "step": 9786 }, { "epoch": 0.67, "learning_rate": 5.275147270423215e-06, "loss": 0.8369, "step": 9787 }, { "epoch": 0.67, "learning_rate": 5.2732020424868146e-06, "loss": 0.749, "step": 9788 }, { "epoch": 0.67, "learning_rate": 5.271257044839779e-06, "loss": 0.7383, "step": 9789 }, { "epoch": 0.67, "learning_rate": 5.26931227757687e-06, "loss": 0.7324, "step": 9790 }, { "epoch": 0.67, "learning_rate": 5.2673677407928415e-06, "loss": 0.7666, "step": 9791 }, { "epoch": 0.67, "learning_rate": 5.265423434582416e-06, "loss": 0.7842, "step": 9792 }, { "epoch": 0.67, "learning_rate": 5.263479359040339e-06, "loss": 0.7744, "step": 9793 }, { "epoch": 0.67, "learning_rate": 5.2615355142613124e-06, "loss": 0.7861, "step": 9794 }, { "epoch": 0.67, "learning_rate": 5.259591900340044e-06, "loss": 0.7217, "step": 9795 }, { "epoch": 0.67, "learning_rate": 5.257648517371227e-06, "loss": 0.8301, "step": 9796 }, { "epoch": 0.67, "learning_rate": 5.2557053654495486e-06, "loss": 0.7812, "step": 9797 }, { "epoch": 0.67, "learning_rate": 5.2537624446696635e-06, "loss": 0.8184, "step": 9798 }, { "epoch": 0.67, "learning_rate": 5.251819755126245e-06, "loss": 0.8271, "step": 9799 }, { "epoch": 0.67, "learning_rate": 5.249877296913941e-06, "loss": 0.7412, "step": 9800 }, { "epoch": 0.67, "learning_rate": 5.247935070127379e-06, "loss": 0.7061, "step": 9801 }, { "epoch": 0.67, "learning_rate": 5.245993074861189e-06, "loss": 0.7754, "step": 9802 }, { "epoch": 0.67, "learning_rate": 5.244051311209983e-06, "loss": 0.7734, "step": 9803 }, { "epoch": 0.67, "learning_rate": 5.242109779268367e-06, "loss": 0.8057, "step": 9804 }, { "epoch": 0.67, "learning_rate": 5.240168479130932e-06, "loss": 0.7393, "step": 9805 }, { "epoch": 0.67, "learning_rate": 5.238227410892254e-06, "loss": 0.8428, "step": 9806 }, { "epoch": 0.67, "learning_rate": 5.236286574646909e-06, "loss": 0.8047, "step": 9807 }, { "epoch": 0.67, "learning_rate": 5.234345970489445e-06, "loss": 0.7275, "step": 9808 }, { "epoch": 0.67, "learning_rate": 5.232405598514414e-06, "loss": 0.7861, "step": 9809 }, { "epoch": 0.67, "learning_rate": 5.230465458816349e-06, "loss": 0.7588, "step": 9810 }, { "epoch": 0.67, "learning_rate": 5.228525551489775e-06, "loss": 0.7393, "step": 9811 }, { "epoch": 0.67, "learning_rate": 5.226585876629203e-06, "loss": 0.7832, "step": 9812 }, { "epoch": 0.67, "learning_rate": 5.224646434329139e-06, "loss": 0.708, "step": 9813 }, { "epoch": 0.67, "learning_rate": 5.222707224684063e-06, "loss": 0.793, "step": 9814 }, { "epoch": 0.67, "learning_rate": 5.220768247788458e-06, "loss": 0.7144, "step": 9815 }, { "epoch": 0.67, "learning_rate": 5.218829503736791e-06, "loss": 0.7412, "step": 9816 }, { "epoch": 0.67, "learning_rate": 5.216890992623518e-06, "loss": 0.7295, "step": 9817 }, { "epoch": 0.67, "learning_rate": 5.214952714543082e-06, "loss": 0.6709, "step": 9818 }, { "epoch": 0.67, "learning_rate": 5.2130146695899174e-06, "loss": 0.7871, "step": 9819 }, { "epoch": 0.67, "learning_rate": 5.211076857858447e-06, "loss": 0.7783, "step": 9820 }, { "epoch": 0.67, "learning_rate": 5.209139279443076e-06, "loss": 0.8428, "step": 9821 }, { "epoch": 0.67, "learning_rate": 5.207201934438201e-06, "loss": 0.7783, "step": 9822 }, { "epoch": 0.67, "learning_rate": 5.205264822938222e-06, "loss": 0.7432, "step": 9823 }, { "epoch": 0.67, "learning_rate": 5.203327945037503e-06, "loss": 0.7295, "step": 9824 }, { "epoch": 0.67, "learning_rate": 5.2013913008304125e-06, "loss": 0.7686, "step": 9825 }, { "epoch": 0.67, "learning_rate": 5.199454890411309e-06, "loss": 0.6582, "step": 9826 }, { "epoch": 0.67, "learning_rate": 5.197518713874523e-06, "loss": 0.7754, "step": 9827 }, { "epoch": 0.67, "learning_rate": 5.195582771314389e-06, "loss": 0.7422, "step": 9828 }, { "epoch": 0.67, "learning_rate": 5.193647062825236e-06, "loss": 0.7168, "step": 9829 }, { "epoch": 0.67, "learning_rate": 5.191711588501358e-06, "loss": 0.8564, "step": 9830 }, { "epoch": 0.67, "learning_rate": 5.189776348437058e-06, "loss": 0.6729, "step": 9831 }, { "epoch": 0.67, "learning_rate": 5.1878413427266195e-06, "loss": 0.8223, "step": 9832 }, { "epoch": 0.67, "learning_rate": 5.185906571464321e-06, "loss": 0.791, "step": 9833 }, { "epoch": 0.67, "learning_rate": 5.18397203474441e-06, "loss": 0.8037, "step": 9834 }, { "epoch": 0.67, "learning_rate": 5.182037732661151e-06, "loss": 0.7949, "step": 9835 }, { "epoch": 0.67, "learning_rate": 5.180103665308783e-06, "loss": 0.7344, "step": 9836 }, { "epoch": 0.67, "learning_rate": 5.178169832781526e-06, "loss": 0.8398, "step": 9837 }, { "epoch": 0.67, "learning_rate": 5.176236235173599e-06, "loss": 0.7549, "step": 9838 }, { "epoch": 0.67, "learning_rate": 5.174302872579208e-06, "loss": 0.7871, "step": 9839 }, { "epoch": 0.67, "learning_rate": 5.172369745092545e-06, "loss": 0.7812, "step": 9840 }, { "epoch": 0.67, "learning_rate": 5.170436852807793e-06, "loss": 0.7744, "step": 9841 }, { "epoch": 0.67, "learning_rate": 5.168504195819122e-06, "loss": 0.7285, "step": 9842 }, { "epoch": 0.67, "learning_rate": 5.1665717742206945e-06, "loss": 0.8809, "step": 9843 }, { "epoch": 0.67, "learning_rate": 5.1646395881066504e-06, "loss": 0.7578, "step": 9844 }, { "epoch": 0.67, "learning_rate": 5.162707637571131e-06, "loss": 0.8369, "step": 9845 }, { "epoch": 0.67, "learning_rate": 5.160775922708259e-06, "loss": 0.7197, "step": 9846 }, { "epoch": 0.67, "learning_rate": 5.1588444436121465e-06, "loss": 0.7412, "step": 9847 }, { "epoch": 0.67, "learning_rate": 5.1569132003768985e-06, "loss": 0.7734, "step": 9848 }, { "epoch": 0.67, "learning_rate": 5.154982193096606e-06, "loss": 0.7305, "step": 9849 }, { "epoch": 0.67, "learning_rate": 5.153051421865341e-06, "loss": 0.7891, "step": 9850 }, { "epoch": 0.67, "learning_rate": 5.151120886777174e-06, "loss": 0.7773, "step": 9851 }, { "epoch": 0.67, "learning_rate": 5.149190587926162e-06, "loss": 0.7197, "step": 9852 }, { "epoch": 0.67, "learning_rate": 5.147260525406348e-06, "loss": 0.8438, "step": 9853 }, { "epoch": 0.67, "learning_rate": 5.145330699311765e-06, "loss": 0.7725, "step": 9854 }, { "epoch": 0.67, "learning_rate": 5.143401109736432e-06, "loss": 0.7881, "step": 9855 }, { "epoch": 0.67, "learning_rate": 5.141471756774365e-06, "loss": 0.8135, "step": 9856 }, { "epoch": 0.67, "learning_rate": 5.139542640519552e-06, "loss": 0.8066, "step": 9857 }, { "epoch": 0.67, "learning_rate": 5.137613761065983e-06, "loss": 0.752, "step": 9858 }, { "epoch": 0.67, "learning_rate": 5.135685118507641e-06, "loss": 0.6885, "step": 9859 }, { "epoch": 0.67, "learning_rate": 5.133756712938478e-06, "loss": 0.7812, "step": 9860 }, { "epoch": 0.67, "learning_rate": 5.131828544452452e-06, "loss": 0.8027, "step": 9861 }, { "epoch": 0.67, "learning_rate": 5.1299006131435045e-06, "loss": 0.7412, "step": 9862 }, { "epoch": 0.67, "learning_rate": 5.127972919105559e-06, "loss": 0.7236, "step": 9863 }, { "epoch": 0.67, "learning_rate": 5.12604546243253e-06, "loss": 0.6719, "step": 9864 }, { "epoch": 0.67, "learning_rate": 5.124118243218338e-06, "loss": 0.7754, "step": 9865 }, { "epoch": 0.67, "learning_rate": 5.122191261556862e-06, "loss": 0.751, "step": 9866 }, { "epoch": 0.67, "learning_rate": 5.120264517541991e-06, "loss": 0.7754, "step": 9867 }, { "epoch": 0.67, "learning_rate": 5.118338011267594e-06, "loss": 0.7676, "step": 9868 }, { "epoch": 0.67, "learning_rate": 5.116411742827534e-06, "loss": 0.7197, "step": 9869 }, { "epoch": 0.67, "learning_rate": 5.114485712315649e-06, "loss": 0.7559, "step": 9870 }, { "epoch": 0.67, "learning_rate": 5.112559919825786e-06, "loss": 0.8252, "step": 9871 }, { "epoch": 0.67, "learning_rate": 5.11063436545177e-06, "loss": 0.7686, "step": 9872 }, { "epoch": 0.67, "learning_rate": 5.108709049287403e-06, "loss": 0.7334, "step": 9873 }, { "epoch": 0.67, "learning_rate": 5.106783971426494e-06, "loss": 0.8203, "step": 9874 }, { "epoch": 0.67, "learning_rate": 5.104859131962832e-06, "loss": 0.7344, "step": 9875 }, { "epoch": 0.67, "learning_rate": 5.102934530990194e-06, "loss": 0.7812, "step": 9876 }, { "epoch": 0.67, "learning_rate": 5.101010168602345e-06, "loss": 0.7227, "step": 9877 }, { "epoch": 0.67, "learning_rate": 5.099086044893048e-06, "loss": 0.8359, "step": 9878 }, { "epoch": 0.67, "learning_rate": 5.097162159956035e-06, "loss": 0.7471, "step": 9879 }, { "epoch": 0.67, "learning_rate": 5.095238513885041e-06, "loss": 0.8506, "step": 9880 }, { "epoch": 0.67, "learning_rate": 5.09331510677379e-06, "loss": 0.6943, "step": 9881 }, { "epoch": 0.67, "learning_rate": 5.091391938715986e-06, "loss": 0.7725, "step": 9882 }, { "epoch": 0.67, "learning_rate": 5.089469009805328e-06, "loss": 0.7803, "step": 9883 }, { "epoch": 0.67, "learning_rate": 5.087546320135501e-06, "loss": 0.7764, "step": 9884 }, { "epoch": 0.67, "learning_rate": 5.08562386980018e-06, "loss": 0.8506, "step": 9885 }, { "epoch": 0.67, "learning_rate": 5.083701658893022e-06, "loss": 0.7539, "step": 9886 }, { "epoch": 0.67, "learning_rate": 5.08177968750768e-06, "loss": 0.8271, "step": 9887 }, { "epoch": 0.67, "learning_rate": 5.079857955737791e-06, "loss": 0.7314, "step": 9888 }, { "epoch": 0.67, "learning_rate": 5.077936463676981e-06, "loss": 0.7861, "step": 9889 }, { "epoch": 0.67, "learning_rate": 5.0760152114188675e-06, "loss": 0.7402, "step": 9890 }, { "epoch": 0.67, "learning_rate": 5.074094199057054e-06, "loss": 0.8252, "step": 9891 }, { "epoch": 0.67, "learning_rate": 5.072173426685132e-06, "loss": 0.8271, "step": 9892 }, { "epoch": 0.67, "learning_rate": 5.070252894396675e-06, "loss": 0.8213, "step": 9893 }, { "epoch": 0.67, "learning_rate": 5.06833260228526e-06, "loss": 0.7998, "step": 9894 }, { "epoch": 0.67, "learning_rate": 5.066412550444444e-06, "loss": 0.7734, "step": 9895 }, { "epoch": 0.67, "learning_rate": 5.064492738967763e-06, "loss": 0.7363, "step": 9896 }, { "epoch": 0.67, "learning_rate": 5.062573167948756e-06, "loss": 0.8242, "step": 9897 }, { "epoch": 0.67, "learning_rate": 5.060653837480947e-06, "loss": 0.748, "step": 9898 }, { "epoch": 0.67, "learning_rate": 5.058734747657834e-06, "loss": 0.7148, "step": 9899 }, { "epoch": 0.67, "learning_rate": 5.056815898572929e-06, "loss": 0.79, "step": 9900 }, { "epoch": 0.67, "learning_rate": 5.054897290319713e-06, "loss": 0.8262, "step": 9901 }, { "epoch": 0.67, "learning_rate": 5.052978922991658e-06, "loss": 0.7734, "step": 9902 }, { "epoch": 0.67, "learning_rate": 5.051060796682229e-06, "loss": 0.6113, "step": 9903 }, { "epoch": 0.67, "learning_rate": 5.049142911484876e-06, "loss": 0.748, "step": 9904 }, { "epoch": 0.68, "learning_rate": 5.047225267493039e-06, "loss": 0.8262, "step": 9905 }, { "epoch": 0.68, "learning_rate": 5.045307864800145e-06, "loss": 0.7588, "step": 9906 }, { "epoch": 0.68, "learning_rate": 5.043390703499611e-06, "loss": 0.7744, "step": 9907 }, { "epoch": 0.68, "learning_rate": 5.041473783684844e-06, "loss": 0.7158, "step": 9908 }, { "epoch": 0.68, "learning_rate": 5.039557105449229e-06, "loss": 0.8135, "step": 9909 }, { "epoch": 0.68, "learning_rate": 5.037640668886148e-06, "loss": 0.7891, "step": 9910 }, { "epoch": 0.68, "learning_rate": 5.035724474088972e-06, "loss": 0.6836, "step": 9911 }, { "epoch": 0.68, "learning_rate": 5.033808521151059e-06, "loss": 0.8018, "step": 9912 }, { "epoch": 0.68, "learning_rate": 5.0318928101657525e-06, "loss": 0.7617, "step": 9913 }, { "epoch": 0.68, "learning_rate": 5.029977341226388e-06, "loss": 0.8154, "step": 9914 }, { "epoch": 0.68, "learning_rate": 5.028062114426284e-06, "loss": 0.752, "step": 9915 }, { "epoch": 0.68, "learning_rate": 5.026147129858749e-06, "loss": 0.8018, "step": 9916 }, { "epoch": 0.68, "learning_rate": 5.0242323876170855e-06, "loss": 0.7793, "step": 9917 }, { "epoch": 0.68, "learning_rate": 5.022317887794576e-06, "loss": 0.7422, "step": 9918 }, { "epoch": 0.68, "learning_rate": 5.020403630484496e-06, "loss": 0.7686, "step": 9919 }, { "epoch": 0.68, "learning_rate": 5.0184896157801085e-06, "loss": 0.8584, "step": 9920 }, { "epoch": 0.68, "learning_rate": 5.0165758437746685e-06, "loss": 0.7676, "step": 9921 }, { "epoch": 0.68, "learning_rate": 5.014662314561405e-06, "loss": 0.8115, "step": 9922 }, { "epoch": 0.68, "learning_rate": 5.012749028233548e-06, "loss": 0.8076, "step": 9923 }, { "epoch": 0.68, "learning_rate": 5.010835984884322e-06, "loss": 0.8037, "step": 9924 }, { "epoch": 0.68, "learning_rate": 5.00892318460692e-06, "loss": 0.7939, "step": 9925 }, { "epoch": 0.68, "learning_rate": 5.007010627494537e-06, "loss": 0.7188, "step": 9926 }, { "epoch": 0.68, "learning_rate": 5.005098313640353e-06, "loss": 0.7793, "step": 9927 }, { "epoch": 0.68, "learning_rate": 5.003186243137539e-06, "loss": 0.8076, "step": 9928 }, { "epoch": 0.68, "learning_rate": 5.00127441607924e-06, "loss": 0.7793, "step": 9929 }, { "epoch": 0.68, "learning_rate": 4.999362832558612e-06, "loss": 0.7764, "step": 9930 }, { "epoch": 0.68, "learning_rate": 4.9974514926687865e-06, "loss": 0.8018, "step": 9931 }, { "epoch": 0.68, "learning_rate": 4.995540396502877e-06, "loss": 0.6992, "step": 9932 }, { "epoch": 0.68, "learning_rate": 4.9936295441539935e-06, "loss": 0.8691, "step": 9933 }, { "epoch": 0.68, "learning_rate": 4.99171893571524e-06, "loss": 0.7598, "step": 9934 }, { "epoch": 0.68, "learning_rate": 4.9898085712796885e-06, "loss": 0.7139, "step": 9935 }, { "epoch": 0.68, "learning_rate": 4.987898450940422e-06, "loss": 0.7773, "step": 9936 }, { "epoch": 0.68, "learning_rate": 4.9859885747905024e-06, "loss": 0.8213, "step": 9937 }, { "epoch": 0.68, "learning_rate": 4.984078942922971e-06, "loss": 0.7012, "step": 9938 }, { "epoch": 0.68, "learning_rate": 4.982169555430868e-06, "loss": 0.7197, "step": 9939 }, { "epoch": 0.68, "learning_rate": 4.980260412407221e-06, "loss": 0.7461, "step": 9940 }, { "epoch": 0.68, "learning_rate": 4.978351513945041e-06, "loss": 0.7959, "step": 9941 }, { "epoch": 0.68, "learning_rate": 4.9764428601373315e-06, "loss": 0.7236, "step": 9942 }, { "epoch": 0.68, "learning_rate": 4.97453445107708e-06, "loss": 0.6836, "step": 9943 }, { "epoch": 0.68, "learning_rate": 4.972626286857268e-06, "loss": 0.7744, "step": 9944 }, { "epoch": 0.68, "learning_rate": 4.970718367570856e-06, "loss": 0.7051, "step": 9945 }, { "epoch": 0.68, "learning_rate": 4.9688106933108e-06, "loss": 0.7334, "step": 9946 }, { "epoch": 0.68, "learning_rate": 4.96690326417004e-06, "loss": 0.8496, "step": 9947 }, { "epoch": 0.68, "learning_rate": 4.964996080241509e-06, "loss": 0.7949, "step": 9948 }, { "epoch": 0.68, "learning_rate": 4.963089141618122e-06, "loss": 0.791, "step": 9949 }, { "epoch": 0.68, "learning_rate": 4.96118244839279e-06, "loss": 0.8271, "step": 9950 }, { "epoch": 0.68, "learning_rate": 4.9592760006584015e-06, "loss": 0.8232, "step": 9951 }, { "epoch": 0.68, "learning_rate": 4.9573697985078395e-06, "loss": 0.7227, "step": 9952 }, { "epoch": 0.68, "learning_rate": 4.9554638420339755e-06, "loss": 0.8203, "step": 9953 }, { "epoch": 0.68, "learning_rate": 4.953558131329665e-06, "loss": 0.7988, "step": 9954 }, { "epoch": 0.68, "learning_rate": 4.951652666487758e-06, "loss": 0.833, "step": 9955 }, { "epoch": 0.68, "learning_rate": 4.949747447601088e-06, "loss": 0.7441, "step": 9956 }, { "epoch": 0.68, "learning_rate": 4.947842474762478e-06, "loss": 0.75, "step": 9957 }, { "epoch": 0.68, "learning_rate": 4.945937748064733e-06, "loss": 0.7598, "step": 9958 }, { "epoch": 0.68, "learning_rate": 4.944033267600651e-06, "loss": 0.7627, "step": 9959 }, { "epoch": 0.68, "learning_rate": 4.942129033463029e-06, "loss": 0.7158, "step": 9960 }, { "epoch": 0.68, "learning_rate": 4.94022504574463e-06, "loss": 0.7021, "step": 9961 }, { "epoch": 0.68, "learning_rate": 4.938321304538219e-06, "loss": 0.7451, "step": 9962 }, { "epoch": 0.68, "learning_rate": 4.936417809936549e-06, "loss": 0.8076, "step": 9963 }, { "epoch": 0.68, "learning_rate": 4.934514562032358e-06, "loss": 0.8145, "step": 9964 }, { "epoch": 0.68, "learning_rate": 4.932611560918365e-06, "loss": 0.7803, "step": 9965 }, { "epoch": 0.68, "learning_rate": 4.930708806687297e-06, "loss": 0.7744, "step": 9966 }, { "epoch": 0.68, "learning_rate": 4.928806299431844e-06, "loss": 0.7891, "step": 9967 }, { "epoch": 0.68, "learning_rate": 4.926904039244701e-06, "loss": 0.7471, "step": 9968 }, { "epoch": 0.68, "learning_rate": 4.925002026218546e-06, "loss": 0.7305, "step": 9969 }, { "epoch": 0.68, "learning_rate": 4.923100260446048e-06, "loss": 0.792, "step": 9970 }, { "epoch": 0.68, "learning_rate": 4.921198742019851e-06, "loss": 0.7861, "step": 9971 }, { "epoch": 0.68, "learning_rate": 4.919297471032608e-06, "loss": 0.7812, "step": 9972 }, { "epoch": 0.68, "learning_rate": 4.917396447576947e-06, "loss": 0.7363, "step": 9973 }, { "epoch": 0.68, "learning_rate": 4.91549567174548e-06, "loss": 0.7559, "step": 9974 }, { "epoch": 0.68, "learning_rate": 4.913595143630816e-06, "loss": 0.7588, "step": 9975 }, { "epoch": 0.68, "learning_rate": 4.911694863325548e-06, "loss": 0.7842, "step": 9976 }, { "epoch": 0.68, "learning_rate": 4.909794830922259e-06, "loss": 0.8135, "step": 9977 }, { "epoch": 0.68, "learning_rate": 4.907895046513516e-06, "loss": 0.8027, "step": 9978 }, { "epoch": 0.68, "learning_rate": 4.90599551019188e-06, "loss": 0.7002, "step": 9979 }, { "epoch": 0.68, "learning_rate": 4.904096222049896e-06, "loss": 0.8125, "step": 9980 }, { "epoch": 0.68, "learning_rate": 4.902197182180093e-06, "loss": 0.7285, "step": 9981 }, { "epoch": 0.68, "learning_rate": 4.900298390674994e-06, "loss": 0.7832, "step": 9982 }, { "epoch": 0.68, "learning_rate": 4.89839984762711e-06, "loss": 0.7393, "step": 9983 }, { "epoch": 0.68, "learning_rate": 4.896501553128936e-06, "loss": 0.6904, "step": 9984 }, { "epoch": 0.68, "learning_rate": 4.894603507272957e-06, "loss": 0.6924, "step": 9985 }, { "epoch": 0.68, "learning_rate": 4.892705710151651e-06, "loss": 0.7363, "step": 9986 }, { "epoch": 0.68, "learning_rate": 4.8908081618574685e-06, "loss": 0.8232, "step": 9987 }, { "epoch": 0.68, "learning_rate": 4.888910862482864e-06, "loss": 0.8408, "step": 9988 }, { "epoch": 0.68, "learning_rate": 4.887013812120274e-06, "loss": 0.8594, "step": 9989 }, { "epoch": 0.68, "learning_rate": 4.885117010862121e-06, "loss": 0.7119, "step": 9990 }, { "epoch": 0.68, "learning_rate": 4.883220458800817e-06, "loss": 0.7393, "step": 9991 }, { "epoch": 0.68, "learning_rate": 4.881324156028763e-06, "loss": 0.7305, "step": 9992 }, { "epoch": 0.68, "learning_rate": 4.87942810263835e-06, "loss": 0.7744, "step": 9993 }, { "epoch": 0.68, "learning_rate": 4.877532298721948e-06, "loss": 0.7861, "step": 9994 }, { "epoch": 0.68, "learning_rate": 4.875636744371917e-06, "loss": 0.7764, "step": 9995 }, { "epoch": 0.68, "learning_rate": 4.873741439680621e-06, "loss": 0.7588, "step": 9996 }, { "epoch": 0.68, "learning_rate": 4.871846384740391e-06, "loss": 0.6943, "step": 9997 }, { "epoch": 0.68, "learning_rate": 4.8699515796435525e-06, "loss": 0.7861, "step": 9998 }, { "epoch": 0.68, "learning_rate": 4.868057024482428e-06, "loss": 0.7461, "step": 9999 }, { "epoch": 0.68, "learning_rate": 4.866162719349311e-06, "loss": 0.7959, "step": 10000 }, { "epoch": 0.68, "learning_rate": 4.864268664336492e-06, "loss": 0.792, "step": 10001 }, { "epoch": 0.68, "learning_rate": 4.8623748595362606e-06, "loss": 0.7197, "step": 10002 }, { "epoch": 0.68, "learning_rate": 4.860481305040872e-06, "loss": 0.7988, "step": 10003 }, { "epoch": 0.68, "learning_rate": 4.858588000942583e-06, "loss": 0.7793, "step": 10004 }, { "epoch": 0.68, "learning_rate": 4.856694947333637e-06, "loss": 0.8076, "step": 10005 }, { "epoch": 0.68, "learning_rate": 4.854802144306266e-06, "loss": 0.7793, "step": 10006 }, { "epoch": 0.68, "learning_rate": 4.852909591952674e-06, "loss": 0.7471, "step": 10007 }, { "epoch": 0.68, "learning_rate": 4.851017290365082e-06, "loss": 0.7383, "step": 10008 }, { "epoch": 0.68, "learning_rate": 4.849125239635679e-06, "loss": 0.6807, "step": 10009 }, { "epoch": 0.68, "learning_rate": 4.84723343985664e-06, "loss": 0.8389, "step": 10010 }, { "epoch": 0.68, "learning_rate": 4.845341891120135e-06, "loss": 0.7783, "step": 10011 }, { "epoch": 0.68, "learning_rate": 4.843450593518324e-06, "loss": 0.7422, "step": 10012 }, { "epoch": 0.68, "learning_rate": 4.841559547143347e-06, "loss": 0.7979, "step": 10013 }, { "epoch": 0.68, "learning_rate": 4.839668752087339e-06, "loss": 0.8037, "step": 10014 }, { "epoch": 0.68, "learning_rate": 4.837778208442415e-06, "loss": 0.749, "step": 10015 }, { "epoch": 0.68, "learning_rate": 4.835887916300691e-06, "loss": 0.7891, "step": 10016 }, { "epoch": 0.68, "learning_rate": 4.833997875754251e-06, "loss": 0.7129, "step": 10017 }, { "epoch": 0.68, "learning_rate": 4.832108086895183e-06, "loss": 0.7363, "step": 10018 }, { "epoch": 0.68, "learning_rate": 4.830218549815557e-06, "loss": 0.668, "step": 10019 }, { "epoch": 0.68, "learning_rate": 4.828329264607431e-06, "loss": 0.8164, "step": 10020 }, { "epoch": 0.68, "learning_rate": 4.826440231362851e-06, "loss": 0.6934, "step": 10021 }, { "epoch": 0.68, "learning_rate": 4.8245514501738546e-06, "loss": 0.8105, "step": 10022 }, { "epoch": 0.68, "learning_rate": 4.822662921132455e-06, "loss": 0.7656, "step": 10023 }, { "epoch": 0.68, "learning_rate": 4.820774644330663e-06, "loss": 0.8047, "step": 10024 }, { "epoch": 0.68, "learning_rate": 4.818886619860483e-06, "loss": 0.7256, "step": 10025 }, { "epoch": 0.68, "learning_rate": 4.8169988478138915e-06, "loss": 0.7266, "step": 10026 }, { "epoch": 0.68, "learning_rate": 4.815111328282864e-06, "loss": 0.8164, "step": 10027 }, { "epoch": 0.68, "learning_rate": 4.8132240613593595e-06, "loss": 0.7451, "step": 10028 }, { "epoch": 0.68, "learning_rate": 4.811337047135329e-06, "loss": 0.7686, "step": 10029 }, { "epoch": 0.68, "learning_rate": 4.809450285702697e-06, "loss": 0.7949, "step": 10030 }, { "epoch": 0.68, "learning_rate": 4.807563777153399e-06, "loss": 0.709, "step": 10031 }, { "epoch": 0.68, "learning_rate": 4.805677521579343e-06, "loss": 0.7422, "step": 10032 }, { "epoch": 0.68, "learning_rate": 4.803791519072421e-06, "loss": 0.792, "step": 10033 }, { "epoch": 0.68, "learning_rate": 4.801905769724523e-06, "loss": 0.8076, "step": 10034 }, { "epoch": 0.68, "learning_rate": 4.800020273627527e-06, "loss": 0.8115, "step": 10035 }, { "epoch": 0.68, "learning_rate": 4.798135030873281e-06, "loss": 0.7949, "step": 10036 }, { "epoch": 0.68, "learning_rate": 4.7962500415536475e-06, "loss": 0.8105, "step": 10037 }, { "epoch": 0.68, "learning_rate": 4.794365305760461e-06, "loss": 0.7578, "step": 10038 }, { "epoch": 0.68, "learning_rate": 4.792480823585539e-06, "loss": 0.751, "step": 10039 }, { "epoch": 0.68, "learning_rate": 4.790596595120699e-06, "loss": 0.7803, "step": 10040 }, { "epoch": 0.68, "learning_rate": 4.7887126204577375e-06, "loss": 0.7041, "step": 10041 }, { "epoch": 0.68, "learning_rate": 4.7868288996884425e-06, "loss": 0.749, "step": 10042 }, { "epoch": 0.68, "learning_rate": 4.784945432904591e-06, "loss": 0.7627, "step": 10043 }, { "epoch": 0.68, "learning_rate": 4.783062220197943e-06, "loss": 0.7656, "step": 10044 }, { "epoch": 0.68, "learning_rate": 4.781179261660251e-06, "loss": 0.8203, "step": 10045 }, { "epoch": 0.68, "learning_rate": 4.77929655738325e-06, "loss": 0.7568, "step": 10046 }, { "epoch": 0.68, "learning_rate": 4.777414107458665e-06, "loss": 0.7334, "step": 10047 }, { "epoch": 0.68, "learning_rate": 4.775531911978209e-06, "loss": 0.7881, "step": 10048 }, { "epoch": 0.68, "learning_rate": 4.7736499710335845e-06, "loss": 0.748, "step": 10049 }, { "epoch": 0.68, "learning_rate": 4.771768284716478e-06, "loss": 0.707, "step": 10050 }, { "epoch": 0.68, "learning_rate": 4.769886853118567e-06, "loss": 0.7529, "step": 10051 }, { "epoch": 0.69, "learning_rate": 4.768005676331517e-06, "loss": 0.7959, "step": 10052 }, { "epoch": 0.69, "learning_rate": 4.766124754446971e-06, "loss": 0.8076, "step": 10053 }, { "epoch": 0.69, "learning_rate": 4.764244087556571e-06, "loss": 0.7695, "step": 10054 }, { "epoch": 0.69, "learning_rate": 4.762363675751944e-06, "loss": 0.7764, "step": 10055 }, { "epoch": 0.69, "learning_rate": 4.760483519124703e-06, "loss": 0.7246, "step": 10056 }, { "epoch": 0.69, "learning_rate": 4.758603617766451e-06, "loss": 0.7803, "step": 10057 }, { "epoch": 0.69, "learning_rate": 4.756723971768778e-06, "loss": 0.793, "step": 10058 }, { "epoch": 0.69, "learning_rate": 4.754844581223254e-06, "loss": 0.7861, "step": 10059 }, { "epoch": 0.69, "learning_rate": 4.752965446221442e-06, "loss": 0.7559, "step": 10060 }, { "epoch": 0.69, "learning_rate": 4.751086566854904e-06, "loss": 0.7324, "step": 10061 }, { "epoch": 0.69, "learning_rate": 4.749207943215171e-06, "loss": 0.8789, "step": 10062 }, { "epoch": 0.69, "learning_rate": 4.747329575393768e-06, "loss": 0.709, "step": 10063 }, { "epoch": 0.69, "learning_rate": 4.7454514634822145e-06, "loss": 0.8291, "step": 10064 }, { "epoch": 0.69, "learning_rate": 4.743573607572013e-06, "loss": 0.7168, "step": 10065 }, { "epoch": 0.69, "learning_rate": 4.741696007754641e-06, "loss": 0.8262, "step": 10066 }, { "epoch": 0.69, "learning_rate": 4.739818664121586e-06, "loss": 0.8008, "step": 10067 }, { "epoch": 0.69, "learning_rate": 4.737941576764314e-06, "loss": 0.6787, "step": 10068 }, { "epoch": 0.69, "learning_rate": 4.736064745774268e-06, "loss": 0.7793, "step": 10069 }, { "epoch": 0.69, "learning_rate": 4.734188171242891e-06, "loss": 0.7451, "step": 10070 }, { "epoch": 0.69, "learning_rate": 4.732311853261612e-06, "loss": 0.6699, "step": 10071 }, { "epoch": 0.69, "learning_rate": 4.730435791921836e-06, "loss": 0.7324, "step": 10072 }, { "epoch": 0.69, "learning_rate": 4.728559987314975e-06, "loss": 0.7598, "step": 10073 }, { "epoch": 0.69, "learning_rate": 4.726684439532419e-06, "loss": 0.7627, "step": 10074 }, { "epoch": 0.69, "learning_rate": 4.724809148665535e-06, "loss": 0.8447, "step": 10075 }, { "epoch": 0.69, "learning_rate": 4.722934114805692e-06, "loss": 0.7363, "step": 10076 }, { "epoch": 0.69, "learning_rate": 4.7210593380442415e-06, "loss": 0.7646, "step": 10077 }, { "epoch": 0.69, "learning_rate": 4.719184818472523e-06, "loss": 0.8262, "step": 10078 }, { "epoch": 0.69, "learning_rate": 4.7173105561818625e-06, "loss": 0.7461, "step": 10079 }, { "epoch": 0.69, "learning_rate": 4.715436551263574e-06, "loss": 0.8047, "step": 10080 }, { "epoch": 0.69, "learning_rate": 4.713562803808963e-06, "loss": 0.7695, "step": 10081 }, { "epoch": 0.69, "learning_rate": 4.71168931390931e-06, "loss": 0.7646, "step": 10082 }, { "epoch": 0.69, "learning_rate": 4.709816081655897e-06, "loss": 0.8086, "step": 10083 }, { "epoch": 0.69, "learning_rate": 4.707943107139986e-06, "loss": 0.7344, "step": 10084 }, { "epoch": 0.69, "learning_rate": 4.706070390452828e-06, "loss": 0.877, "step": 10085 }, { "epoch": 0.69, "learning_rate": 4.704197931685663e-06, "loss": 0.7832, "step": 10086 }, { "epoch": 0.69, "learning_rate": 4.702325730929721e-06, "loss": 0.8096, "step": 10087 }, { "epoch": 0.69, "learning_rate": 4.700453788276205e-06, "loss": 0.7686, "step": 10088 }, { "epoch": 0.69, "learning_rate": 4.698582103816325e-06, "loss": 0.7568, "step": 10089 }, { "epoch": 0.69, "learning_rate": 4.696710677641264e-06, "loss": 0.7979, "step": 10090 }, { "epoch": 0.69, "learning_rate": 4.694839509842202e-06, "loss": 0.7178, "step": 10091 }, { "epoch": 0.69, "learning_rate": 4.6929686005102995e-06, "loss": 0.7881, "step": 10092 }, { "epoch": 0.69, "learning_rate": 4.691097949736707e-06, "loss": 0.7432, "step": 10093 }, { "epoch": 0.69, "learning_rate": 4.689227557612568e-06, "loss": 0.6992, "step": 10094 }, { "epoch": 0.69, "learning_rate": 4.6873574242289995e-06, "loss": 0.791, "step": 10095 }, { "epoch": 0.69, "learning_rate": 4.6854875496771155e-06, "loss": 0.7471, "step": 10096 }, { "epoch": 0.69, "learning_rate": 4.6836179340480255e-06, "loss": 0.7988, "step": 10097 }, { "epoch": 0.69, "learning_rate": 4.681748577432807e-06, "loss": 0.8232, "step": 10098 }, { "epoch": 0.69, "learning_rate": 4.679879479922538e-06, "loss": 0.7715, "step": 10099 }, { "epoch": 0.69, "learning_rate": 4.678010641608281e-06, "loss": 0.791, "step": 10100 }, { "epoch": 0.69, "learning_rate": 4.676142062581091e-06, "loss": 0.7266, "step": 10101 }, { "epoch": 0.69, "learning_rate": 4.674273742931992e-06, "loss": 0.7793, "step": 10102 }, { "epoch": 0.69, "learning_rate": 4.67240568275202e-06, "loss": 0.7744, "step": 10103 }, { "epoch": 0.69, "learning_rate": 4.6705378821321875e-06, "loss": 0.7002, "step": 10104 }, { "epoch": 0.69, "learning_rate": 4.668670341163486e-06, "loss": 0.8262, "step": 10105 }, { "epoch": 0.69, "learning_rate": 4.666803059936905e-06, "loss": 0.6338, "step": 10106 }, { "epoch": 0.69, "learning_rate": 4.664936038543423e-06, "loss": 0.8301, "step": 10107 }, { "epoch": 0.69, "learning_rate": 4.66306927707399e-06, "loss": 0.7607, "step": 10108 }, { "epoch": 0.69, "learning_rate": 4.661202775619563e-06, "loss": 0.6709, "step": 10109 }, { "epoch": 0.69, "learning_rate": 4.659336534271082e-06, "loss": 0.7246, "step": 10110 }, { "epoch": 0.69, "learning_rate": 4.6574705531194605e-06, "loss": 0.7646, "step": 10111 }, { "epoch": 0.69, "learning_rate": 4.655604832255614e-06, "loss": 0.6953, "step": 10112 }, { "epoch": 0.69, "learning_rate": 4.653739371770438e-06, "loss": 0.7666, "step": 10113 }, { "epoch": 0.69, "learning_rate": 4.651874171754819e-06, "loss": 0.752, "step": 10114 }, { "epoch": 0.69, "learning_rate": 4.65000923229963e-06, "loss": 0.6895, "step": 10115 }, { "epoch": 0.69, "learning_rate": 4.648144553495732e-06, "loss": 0.6992, "step": 10116 }, { "epoch": 0.69, "learning_rate": 4.646280135433972e-06, "loss": 0.7607, "step": 10117 }, { "epoch": 0.69, "learning_rate": 4.644415978205179e-06, "loss": 0.8027, "step": 10118 }, { "epoch": 0.69, "learning_rate": 4.642552081900179e-06, "loss": 0.7393, "step": 10119 }, { "epoch": 0.69, "learning_rate": 4.64068844660978e-06, "loss": 0.8477, "step": 10120 }, { "epoch": 0.69, "learning_rate": 4.638825072424779e-06, "loss": 0.8125, "step": 10121 }, { "epoch": 0.69, "learning_rate": 4.63696195943596e-06, "loss": 0.751, "step": 10122 }, { "epoch": 0.69, "learning_rate": 4.635099107734095e-06, "loss": 0.7549, "step": 10123 }, { "epoch": 0.69, "learning_rate": 4.633236517409936e-06, "loss": 0.7744, "step": 10124 }, { "epoch": 0.69, "learning_rate": 4.631374188554232e-06, "loss": 0.7715, "step": 10125 }, { "epoch": 0.69, "learning_rate": 4.629512121257716e-06, "loss": 0.8262, "step": 10126 }, { "epoch": 0.69, "learning_rate": 4.627650315611109e-06, "loss": 0.8145, "step": 10127 }, { "epoch": 0.69, "learning_rate": 4.625788771705115e-06, "loss": 0.7295, "step": 10128 }, { "epoch": 0.69, "learning_rate": 4.6239274896304305e-06, "loss": 0.8037, "step": 10129 }, { "epoch": 0.69, "learning_rate": 4.6220664694777405e-06, "loss": 0.7627, "step": 10130 }, { "epoch": 0.69, "learning_rate": 4.620205711337702e-06, "loss": 0.709, "step": 10131 }, { "epoch": 0.69, "learning_rate": 4.618345215300982e-06, "loss": 0.7227, "step": 10132 }, { "epoch": 0.69, "learning_rate": 4.6164849814582256e-06, "loss": 0.7959, "step": 10133 }, { "epoch": 0.69, "learning_rate": 4.614625009900054e-06, "loss": 0.7578, "step": 10134 }, { "epoch": 0.69, "learning_rate": 4.612765300717089e-06, "loss": 0.7969, "step": 10135 }, { "epoch": 0.69, "learning_rate": 4.610905853999938e-06, "loss": 0.7871, "step": 10136 }, { "epoch": 0.69, "learning_rate": 4.609046669839188e-06, "loss": 0.7393, "step": 10137 }, { "epoch": 0.69, "learning_rate": 4.607187748325422e-06, "loss": 0.7461, "step": 10138 }, { "epoch": 0.69, "learning_rate": 4.605329089549211e-06, "loss": 0.7373, "step": 10139 }, { "epoch": 0.69, "learning_rate": 4.6034706936011e-06, "loss": 0.8438, "step": 10140 }, { "epoch": 0.69, "learning_rate": 4.601612560571632e-06, "loss": 0.7939, "step": 10141 }, { "epoch": 0.69, "learning_rate": 4.599754690551338e-06, "loss": 0.7227, "step": 10142 }, { "epoch": 0.69, "learning_rate": 4.597897083630731e-06, "loss": 0.8438, "step": 10143 }, { "epoch": 0.69, "learning_rate": 4.596039739900316e-06, "loss": 0.71, "step": 10144 }, { "epoch": 0.69, "learning_rate": 4.594182659450582e-06, "loss": 0.6768, "step": 10145 }, { "epoch": 0.69, "learning_rate": 4.592325842372006e-06, "loss": 0.752, "step": 10146 }, { "epoch": 0.69, "learning_rate": 4.590469288755049e-06, "loss": 0.7705, "step": 10147 }, { "epoch": 0.69, "learning_rate": 4.588612998690165e-06, "loss": 0.752, "step": 10148 }, { "epoch": 0.69, "learning_rate": 4.586756972267792e-06, "loss": 0.7529, "step": 10149 }, { "epoch": 0.69, "learning_rate": 4.584901209578354e-06, "loss": 0.8076, "step": 10150 }, { "epoch": 0.69, "learning_rate": 4.583045710712266e-06, "loss": 0.7881, "step": 10151 }, { "epoch": 0.69, "learning_rate": 4.581190475759927e-06, "loss": 0.7168, "step": 10152 }, { "epoch": 0.69, "learning_rate": 4.579335504811727e-06, "loss": 0.7793, "step": 10153 }, { "epoch": 0.69, "learning_rate": 4.577480797958033e-06, "loss": 0.7764, "step": 10154 }, { "epoch": 0.69, "learning_rate": 4.5756263552892066e-06, "loss": 0.7998, "step": 10155 }, { "epoch": 0.69, "learning_rate": 4.573772176895607e-06, "loss": 0.8213, "step": 10156 }, { "epoch": 0.69, "learning_rate": 4.571918262867559e-06, "loss": 0.6973, "step": 10157 }, { "epoch": 0.69, "learning_rate": 4.5700646132953874e-06, "loss": 0.7197, "step": 10158 }, { "epoch": 0.69, "learning_rate": 4.568211228269408e-06, "loss": 0.7451, "step": 10159 }, { "epoch": 0.69, "learning_rate": 4.566358107879908e-06, "loss": 0.6934, "step": 10160 }, { "epoch": 0.69, "learning_rate": 4.5645052522171726e-06, "loss": 0.7539, "step": 10161 }, { "epoch": 0.69, "learning_rate": 4.562652661371485e-06, "loss": 0.7188, "step": 10162 }, { "epoch": 0.69, "learning_rate": 4.5608003354330884e-06, "loss": 0.7402, "step": 10163 }, { "epoch": 0.69, "learning_rate": 4.558948274492236e-06, "loss": 0.7402, "step": 10164 }, { "epoch": 0.69, "learning_rate": 4.5570964786391585e-06, "loss": 0.7227, "step": 10165 }, { "epoch": 0.69, "learning_rate": 4.555244947964078e-06, "loss": 0.7627, "step": 10166 }, { "epoch": 0.69, "learning_rate": 4.553393682557191e-06, "loss": 0.7803, "step": 10167 }, { "epoch": 0.69, "learning_rate": 4.551542682508702e-06, "loss": 0.7295, "step": 10168 }, { "epoch": 0.69, "learning_rate": 4.5496919479087905e-06, "loss": 0.7578, "step": 10169 }, { "epoch": 0.69, "learning_rate": 4.547841478847619e-06, "loss": 0.8164, "step": 10170 }, { "epoch": 0.69, "learning_rate": 4.545991275415344e-06, "loss": 0.8682, "step": 10171 }, { "epoch": 0.69, "learning_rate": 4.544141337702113e-06, "loss": 0.7988, "step": 10172 }, { "epoch": 0.69, "learning_rate": 4.542291665798041e-06, "loss": 0.8037, "step": 10173 }, { "epoch": 0.69, "learning_rate": 4.540442259793257e-06, "loss": 0.7617, "step": 10174 }, { "epoch": 0.69, "learning_rate": 4.538593119777864e-06, "loss": 0.8086, "step": 10175 }, { "epoch": 0.69, "learning_rate": 4.536744245841944e-06, "loss": 0.7598, "step": 10176 }, { "epoch": 0.69, "learning_rate": 4.534895638075578e-06, "loss": 0.7754, "step": 10177 }, { "epoch": 0.69, "learning_rate": 4.53304729656883e-06, "loss": 0.793, "step": 10178 }, { "epoch": 0.69, "learning_rate": 4.531199221411751e-06, "loss": 0.8145, "step": 10179 }, { "epoch": 0.69, "learning_rate": 4.5293514126943795e-06, "loss": 0.79, "step": 10180 }, { "epoch": 0.69, "learning_rate": 4.52750387050674e-06, "loss": 0.71, "step": 10181 }, { "epoch": 0.69, "learning_rate": 4.525656594938848e-06, "loss": 0.748, "step": 10182 }, { "epoch": 0.69, "learning_rate": 4.523809586080697e-06, "loss": 0.7715, "step": 10183 }, { "epoch": 0.69, "learning_rate": 4.5219628440222765e-06, "loss": 0.8057, "step": 10184 }, { "epoch": 0.69, "learning_rate": 4.520116368853559e-06, "loss": 0.8076, "step": 10185 }, { "epoch": 0.69, "learning_rate": 4.518270160664503e-06, "loss": 0.7988, "step": 10186 }, { "epoch": 0.69, "learning_rate": 4.516424219545059e-06, "loss": 0.7549, "step": 10187 }, { "epoch": 0.69, "learning_rate": 4.5145785455851595e-06, "loss": 0.7461, "step": 10188 }, { "epoch": 0.69, "learning_rate": 4.512733138874729e-06, "loss": 0.7891, "step": 10189 }, { "epoch": 0.69, "learning_rate": 4.510887999503669e-06, "loss": 0.7803, "step": 10190 }, { "epoch": 0.69, "learning_rate": 4.509043127561874e-06, "loss": 0.7549, "step": 10191 }, { "epoch": 0.69, "learning_rate": 4.507198523139238e-06, "loss": 0.6709, "step": 10192 }, { "epoch": 0.69, "learning_rate": 4.505354186325618e-06, "loss": 0.7666, "step": 10193 }, { "epoch": 0.69, "learning_rate": 4.503510117210874e-06, "loss": 0.8779, "step": 10194 }, { "epoch": 0.69, "learning_rate": 4.5016663158848525e-06, "loss": 0.8428, "step": 10195 }, { "epoch": 0.69, "learning_rate": 4.499822782437376e-06, "loss": 0.7695, "step": 10196 }, { "epoch": 0.69, "learning_rate": 4.4979795169582625e-06, "loss": 0.7568, "step": 10197 }, { "epoch": 0.69, "learning_rate": 4.496136519537326e-06, "loss": 0.8135, "step": 10198 }, { "epoch": 0.7, "learning_rate": 4.4942937902643455e-06, "loss": 0.8867, "step": 10199 }, { "epoch": 0.7, "learning_rate": 4.4924513292291035e-06, "loss": 0.7666, "step": 10200 }, { "epoch": 0.7, "learning_rate": 4.490609136521365e-06, "loss": 0.7734, "step": 10201 }, { "epoch": 0.7, "learning_rate": 4.488767212230884e-06, "loss": 0.7549, "step": 10202 }, { "epoch": 0.7, "learning_rate": 4.486925556447387e-06, "loss": 0.832, "step": 10203 }, { "epoch": 0.7, "learning_rate": 4.485084169260613e-06, "loss": 0.8193, "step": 10204 }, { "epoch": 0.7, "learning_rate": 4.483243050760272e-06, "loss": 0.7598, "step": 10205 }, { "epoch": 0.7, "learning_rate": 4.481402201036057e-06, "loss": 0.7881, "step": 10206 }, { "epoch": 0.7, "learning_rate": 4.479561620177658e-06, "loss": 0.7012, "step": 10207 }, { "epoch": 0.7, "learning_rate": 4.477721308274751e-06, "loss": 0.8057, "step": 10208 }, { "epoch": 0.7, "learning_rate": 4.475881265416986e-06, "loss": 0.7959, "step": 10209 }, { "epoch": 0.7, "learning_rate": 4.47404149169402e-06, "loss": 0.7646, "step": 10210 }, { "epoch": 0.7, "learning_rate": 4.472201987195486e-06, "loss": 0.751, "step": 10211 }, { "epoch": 0.7, "learning_rate": 4.470362752010998e-06, "loss": 0.7334, "step": 10212 }, { "epoch": 0.7, "learning_rate": 4.468523786230168e-06, "loss": 0.7158, "step": 10213 }, { "epoch": 0.7, "learning_rate": 4.466685089942589e-06, "loss": 0.7891, "step": 10214 }, { "epoch": 0.7, "learning_rate": 4.4648466632378405e-06, "loss": 0.7881, "step": 10215 }, { "epoch": 0.7, "learning_rate": 4.463008506205495e-06, "loss": 0.7598, "step": 10216 }, { "epoch": 0.7, "learning_rate": 4.4611706189351046e-06, "loss": 0.7998, "step": 10217 }, { "epoch": 0.7, "learning_rate": 4.459333001516215e-06, "loss": 0.749, "step": 10218 }, { "epoch": 0.7, "learning_rate": 4.4574956540383475e-06, "loss": 0.8037, "step": 10219 }, { "epoch": 0.7, "learning_rate": 4.455658576591022e-06, "loss": 0.7383, "step": 10220 }, { "epoch": 0.7, "learning_rate": 4.45382176926374e-06, "loss": 0.8184, "step": 10221 }, { "epoch": 0.7, "learning_rate": 4.451985232145991e-06, "loss": 0.7207, "step": 10222 }, { "epoch": 0.7, "learning_rate": 4.45014896532725e-06, "loss": 0.6973, "step": 10223 }, { "epoch": 0.7, "learning_rate": 4.4483129688969815e-06, "loss": 0.7871, "step": 10224 }, { "epoch": 0.7, "learning_rate": 4.446477242944639e-06, "loss": 0.8086, "step": 10225 }, { "epoch": 0.7, "learning_rate": 4.444641787559649e-06, "loss": 0.6777, "step": 10226 }, { "epoch": 0.7, "learning_rate": 4.442806602831442e-06, "loss": 0.7783, "step": 10227 }, { "epoch": 0.7, "learning_rate": 4.440971688849425e-06, "loss": 0.8125, "step": 10228 }, { "epoch": 0.7, "learning_rate": 4.439137045702997e-06, "loss": 0.8379, "step": 10229 }, { "epoch": 0.7, "learning_rate": 4.4373026734815405e-06, "loss": 0.7842, "step": 10230 }, { "epoch": 0.7, "learning_rate": 4.435468572274429e-06, "loss": 0.7344, "step": 10231 }, { "epoch": 0.7, "learning_rate": 4.433634742171015e-06, "loss": 0.7637, "step": 10232 }, { "epoch": 0.7, "learning_rate": 4.431801183260641e-06, "loss": 0.8496, "step": 10233 }, { "epoch": 0.7, "learning_rate": 4.42996789563265e-06, "loss": 0.8184, "step": 10234 }, { "epoch": 0.7, "learning_rate": 4.428134879376347e-06, "loss": 0.7754, "step": 10235 }, { "epoch": 0.7, "learning_rate": 4.426302134581041e-06, "loss": 0.748, "step": 10236 }, { "epoch": 0.7, "learning_rate": 4.424469661336023e-06, "loss": 0.791, "step": 10237 }, { "epoch": 0.7, "learning_rate": 4.4226374597305755e-06, "loss": 0.7842, "step": 10238 }, { "epoch": 0.7, "learning_rate": 4.420805529853951e-06, "loss": 0.6665, "step": 10239 }, { "epoch": 0.7, "learning_rate": 4.418973871795412e-06, "loss": 0.8154, "step": 10240 }, { "epoch": 0.7, "learning_rate": 4.417142485644199e-06, "loss": 0.7734, "step": 10241 }, { "epoch": 0.7, "learning_rate": 4.415311371489528e-06, "loss": 0.7715, "step": 10242 }, { "epoch": 0.7, "learning_rate": 4.413480529420614e-06, "loss": 0.7168, "step": 10243 }, { "epoch": 0.7, "learning_rate": 4.4116499595266596e-06, "loss": 0.7432, "step": 10244 }, { "epoch": 0.7, "learning_rate": 4.409819661896839e-06, "loss": 0.6885, "step": 10245 }, { "epoch": 0.7, "learning_rate": 4.4079896366203365e-06, "loss": 0.7959, "step": 10246 }, { "epoch": 0.7, "learning_rate": 4.40615988378631e-06, "loss": 0.7344, "step": 10247 }, { "epoch": 0.7, "learning_rate": 4.404330403483897e-06, "loss": 0.7783, "step": 10248 }, { "epoch": 0.7, "learning_rate": 4.402501195802233e-06, "loss": 0.8018, "step": 10249 }, { "epoch": 0.7, "learning_rate": 4.400672260830439e-06, "loss": 0.7314, "step": 10250 }, { "epoch": 0.7, "learning_rate": 4.3988435986576195e-06, "loss": 0.7705, "step": 10251 }, { "epoch": 0.7, "learning_rate": 4.3970152093728665e-06, "loss": 0.7656, "step": 10252 }, { "epoch": 0.7, "learning_rate": 4.395187093065259e-06, "loss": 0.7422, "step": 10253 }, { "epoch": 0.7, "learning_rate": 4.393359249823867e-06, "loss": 0.7529, "step": 10254 }, { "epoch": 0.7, "learning_rate": 4.391531679737735e-06, "loss": 0.75, "step": 10255 }, { "epoch": 0.7, "learning_rate": 4.389704382895902e-06, "loss": 0.7451, "step": 10256 }, { "epoch": 0.7, "learning_rate": 4.3878773593874054e-06, "loss": 0.8418, "step": 10257 }, { "epoch": 0.7, "learning_rate": 4.3860506093012465e-06, "loss": 0.793, "step": 10258 }, { "epoch": 0.7, "learning_rate": 4.384224132726429e-06, "loss": 0.7471, "step": 10259 }, { "epoch": 0.7, "learning_rate": 4.382397929751942e-06, "loss": 0.7988, "step": 10260 }, { "epoch": 0.7, "learning_rate": 4.380572000466748e-06, "loss": 0.7676, "step": 10261 }, { "epoch": 0.7, "learning_rate": 4.37874634495981e-06, "loss": 0.6611, "step": 10262 }, { "epoch": 0.7, "learning_rate": 4.376920963320083e-06, "loss": 0.8291, "step": 10263 }, { "epoch": 0.7, "learning_rate": 4.375095855636488e-06, "loss": 0.792, "step": 10264 }, { "epoch": 0.7, "learning_rate": 4.373271021997949e-06, "loss": 0.7334, "step": 10265 }, { "epoch": 0.7, "learning_rate": 4.371446462493372e-06, "loss": 0.792, "step": 10266 }, { "epoch": 0.7, "learning_rate": 4.369622177211652e-06, "loss": 0.8057, "step": 10267 }, { "epoch": 0.7, "learning_rate": 4.367798166241658e-06, "loss": 0.7373, "step": 10268 }, { "epoch": 0.7, "learning_rate": 4.365974429672266e-06, "loss": 0.7949, "step": 10269 }, { "epoch": 0.7, "learning_rate": 4.364150967592329e-06, "loss": 0.7842, "step": 10270 }, { "epoch": 0.7, "learning_rate": 4.362327780090678e-06, "loss": 0.7734, "step": 10271 }, { "epoch": 0.7, "learning_rate": 4.360504867256144e-06, "loss": 0.8066, "step": 10272 }, { "epoch": 0.7, "learning_rate": 4.358682229177536e-06, "loss": 0.8613, "step": 10273 }, { "epoch": 0.7, "learning_rate": 4.356859865943656e-06, "loss": 0.833, "step": 10274 }, { "epoch": 0.7, "learning_rate": 4.355037777643286e-06, "loss": 0.8008, "step": 10275 }, { "epoch": 0.7, "learning_rate": 4.3532159643652025e-06, "loss": 0.7773, "step": 10276 }, { "epoch": 0.7, "learning_rate": 4.3513944261981645e-06, "loss": 0.708, "step": 10277 }, { "epoch": 0.7, "learning_rate": 4.349573163230911e-06, "loss": 0.8369, "step": 10278 }, { "epoch": 0.7, "learning_rate": 4.347752175552178e-06, "loss": 0.8174, "step": 10279 }, { "epoch": 0.7, "learning_rate": 4.3459314632506824e-06, "loss": 0.7783, "step": 10280 }, { "epoch": 0.7, "learning_rate": 4.344111026415131e-06, "loss": 0.7822, "step": 10281 }, { "epoch": 0.7, "learning_rate": 4.342290865134214e-06, "loss": 0.7422, "step": 10282 }, { "epoch": 0.7, "learning_rate": 4.340470979496614e-06, "loss": 0.7021, "step": 10283 }, { "epoch": 0.7, "learning_rate": 4.338651369590988e-06, "loss": 0.7725, "step": 10284 }, { "epoch": 0.7, "learning_rate": 4.336832035505992e-06, "loss": 0.7246, "step": 10285 }, { "epoch": 0.7, "learning_rate": 4.335012977330263e-06, "loss": 0.7861, "step": 10286 }, { "epoch": 0.7, "learning_rate": 4.333194195152425e-06, "loss": 0.7686, "step": 10287 }, { "epoch": 0.7, "learning_rate": 4.331375689061089e-06, "loss": 0.7002, "step": 10288 }, { "epoch": 0.7, "learning_rate": 4.329557459144853e-06, "loss": 0.7812, "step": 10289 }, { "epoch": 0.7, "learning_rate": 4.3277395054923054e-06, "loss": 0.7627, "step": 10290 }, { "epoch": 0.7, "learning_rate": 4.325921828192009e-06, "loss": 0.7178, "step": 10291 }, { "epoch": 0.7, "learning_rate": 4.3241044273325205e-06, "loss": 0.7549, "step": 10292 }, { "epoch": 0.7, "learning_rate": 4.322287303002395e-06, "loss": 0.7588, "step": 10293 }, { "epoch": 0.7, "learning_rate": 4.320470455290151e-06, "loss": 0.7754, "step": 10294 }, { "epoch": 0.7, "learning_rate": 4.31865388428431e-06, "loss": 0.7451, "step": 10295 }, { "epoch": 0.7, "learning_rate": 4.316837590073377e-06, "loss": 0.8379, "step": 10296 }, { "epoch": 0.7, "learning_rate": 4.315021572745838e-06, "loss": 0.8564, "step": 10297 }, { "epoch": 0.7, "learning_rate": 4.313205832390165e-06, "loss": 0.7227, "step": 10298 }, { "epoch": 0.7, "learning_rate": 4.3113903690948355e-06, "loss": 0.7334, "step": 10299 }, { "epoch": 0.7, "learning_rate": 4.309575182948285e-06, "loss": 0.6816, "step": 10300 }, { "epoch": 0.7, "learning_rate": 4.307760274038954e-06, "loss": 0.793, "step": 10301 }, { "epoch": 0.7, "learning_rate": 4.305945642455266e-06, "loss": 0.7412, "step": 10302 }, { "epoch": 0.7, "learning_rate": 4.304131288285631e-06, "loss": 0.7637, "step": 10303 }, { "epoch": 0.7, "learning_rate": 4.302317211618435e-06, "loss": 0.8223, "step": 10304 }, { "epoch": 0.7, "learning_rate": 4.3005034125420704e-06, "loss": 0.7822, "step": 10305 }, { "epoch": 0.7, "learning_rate": 4.298689891144906e-06, "loss": 0.7705, "step": 10306 }, { "epoch": 0.7, "learning_rate": 4.296876647515288e-06, "loss": 0.833, "step": 10307 }, { "epoch": 0.7, "learning_rate": 4.295063681741562e-06, "loss": 0.7705, "step": 10308 }, { "epoch": 0.7, "learning_rate": 4.293250993912053e-06, "loss": 0.7559, "step": 10309 }, { "epoch": 0.7, "learning_rate": 4.29143858411508e-06, "loss": 0.7041, "step": 10310 }, { "epoch": 0.7, "learning_rate": 4.289626452438939e-06, "loss": 0.7471, "step": 10311 }, { "epoch": 0.7, "learning_rate": 4.28781459897192e-06, "loss": 0.79, "step": 10312 }, { "epoch": 0.7, "learning_rate": 4.2860030238022975e-06, "loss": 0.7852, "step": 10313 }, { "epoch": 0.7, "learning_rate": 4.284191727018326e-06, "loss": 0.7129, "step": 10314 }, { "epoch": 0.7, "learning_rate": 4.282380708708255e-06, "loss": 0.7549, "step": 10315 }, { "epoch": 0.7, "learning_rate": 4.280569968960317e-06, "loss": 0.7178, "step": 10316 }, { "epoch": 0.7, "learning_rate": 4.278759507862731e-06, "loss": 0.7275, "step": 10317 }, { "epoch": 0.7, "learning_rate": 4.276949325503703e-06, "loss": 0.7227, "step": 10318 }, { "epoch": 0.7, "learning_rate": 4.275139421971428e-06, "loss": 0.7832, "step": 10319 }, { "epoch": 0.7, "learning_rate": 4.273329797354079e-06, "loss": 0.7695, "step": 10320 }, { "epoch": 0.7, "learning_rate": 4.271520451739821e-06, "loss": 0.7744, "step": 10321 }, { "epoch": 0.7, "learning_rate": 4.269711385216808e-06, "loss": 0.7559, "step": 10322 }, { "epoch": 0.7, "learning_rate": 4.267902597873177e-06, "loss": 0.7256, "step": 10323 }, { "epoch": 0.7, "learning_rate": 4.266094089797052e-06, "loss": 0.6934, "step": 10324 }, { "epoch": 0.7, "learning_rate": 4.264285861076543e-06, "loss": 0.7881, "step": 10325 }, { "epoch": 0.7, "learning_rate": 4.262477911799752e-06, "loss": 0.6953, "step": 10326 }, { "epoch": 0.7, "learning_rate": 4.260670242054752e-06, "loss": 0.708, "step": 10327 }, { "epoch": 0.7, "learning_rate": 4.258862851929615e-06, "loss": 0.7471, "step": 10328 }, { "epoch": 0.7, "learning_rate": 4.257055741512407e-06, "loss": 0.7783, "step": 10329 }, { "epoch": 0.7, "learning_rate": 4.25524891089116e-06, "loss": 0.7285, "step": 10330 }, { "epoch": 0.7, "learning_rate": 4.253442360153905e-06, "loss": 0.7568, "step": 10331 }, { "epoch": 0.7, "learning_rate": 4.251636089388662e-06, "loss": 0.7705, "step": 10332 }, { "epoch": 0.7, "learning_rate": 4.249830098683425e-06, "loss": 0.8174, "step": 10333 }, { "epoch": 0.7, "learning_rate": 4.248024388126181e-06, "loss": 0.7803, "step": 10334 }, { "epoch": 0.7, "learning_rate": 4.246218957804916e-06, "loss": 0.7627, "step": 10335 }, { "epoch": 0.7, "learning_rate": 4.24441380780758e-06, "loss": 0.7783, "step": 10336 }, { "epoch": 0.7, "learning_rate": 4.2426089382221215e-06, "loss": 0.8633, "step": 10337 }, { "epoch": 0.7, "learning_rate": 4.2408043491364745e-06, "loss": 0.7852, "step": 10338 }, { "epoch": 0.7, "learning_rate": 4.2390000406385634e-06, "loss": 0.8008, "step": 10339 }, { "epoch": 0.7, "learning_rate": 4.237196012816282e-06, "loss": 0.8252, "step": 10340 }, { "epoch": 0.7, "learning_rate": 4.235392265757533e-06, "loss": 0.7334, "step": 10341 }, { "epoch": 0.7, "learning_rate": 4.2335887995501955e-06, "loss": 0.8408, "step": 10342 }, { "epoch": 0.7, "learning_rate": 4.231785614282127e-06, "loss": 0.7734, "step": 10343 }, { "epoch": 0.7, "learning_rate": 4.229982710041181e-06, "loss": 0.8477, "step": 10344 }, { "epoch": 0.7, "learning_rate": 4.2281800869151975e-06, "loss": 0.8057, "step": 10345 }, { "epoch": 0.71, "learning_rate": 4.226377744991999e-06, "loss": 0.7988, "step": 10346 }, { "epoch": 0.71, "learning_rate": 4.224575684359393e-06, "loss": 0.7793, "step": 10347 }, { "epoch": 0.71, "learning_rate": 4.222773905105183e-06, "loss": 0.7275, "step": 10348 }, { "epoch": 0.71, "learning_rate": 4.220972407317143e-06, "loss": 0.7432, "step": 10349 }, { "epoch": 0.71, "learning_rate": 4.219171191083046e-06, "loss": 0.8369, "step": 10350 }, { "epoch": 0.71, "learning_rate": 4.217370256490645e-06, "loss": 0.7412, "step": 10351 }, { "epoch": 0.71, "learning_rate": 4.2155696036276835e-06, "loss": 0.8311, "step": 10352 }, { "epoch": 0.71, "learning_rate": 4.21376923258189e-06, "loss": 0.7695, "step": 10353 }, { "epoch": 0.71, "learning_rate": 4.211969143440977e-06, "loss": 0.6768, "step": 10354 }, { "epoch": 0.71, "learning_rate": 4.210169336292649e-06, "loss": 0.8105, "step": 10355 }, { "epoch": 0.71, "learning_rate": 4.208369811224584e-06, "loss": 0.7441, "step": 10356 }, { "epoch": 0.71, "learning_rate": 4.20657056832446e-06, "loss": 0.7832, "step": 10357 }, { "epoch": 0.71, "learning_rate": 4.204771607679935e-06, "loss": 0.7529, "step": 10358 }, { "epoch": 0.71, "learning_rate": 4.202972929378655e-06, "loss": 0.7529, "step": 10359 }, { "epoch": 0.71, "learning_rate": 4.201174533508251e-06, "loss": 0.7646, "step": 10360 }, { "epoch": 0.71, "learning_rate": 4.199376420156341e-06, "loss": 0.7441, "step": 10361 }, { "epoch": 0.71, "learning_rate": 4.197578589410533e-06, "loss": 0.7559, "step": 10362 }, { "epoch": 0.71, "learning_rate": 4.1957810413584075e-06, "loss": 0.7686, "step": 10363 }, { "epoch": 0.71, "learning_rate": 4.193983776087545e-06, "loss": 0.792, "step": 10364 }, { "epoch": 0.71, "learning_rate": 4.192186793685517e-06, "loss": 0.7832, "step": 10365 }, { "epoch": 0.71, "learning_rate": 4.1903900942398615e-06, "loss": 0.7617, "step": 10366 }, { "epoch": 0.71, "learning_rate": 4.188593677838116e-06, "loss": 0.8027, "step": 10367 }, { "epoch": 0.71, "learning_rate": 4.1867975445678076e-06, "loss": 0.75, "step": 10368 }, { "epoch": 0.71, "learning_rate": 4.185001694516432e-06, "loss": 0.7822, "step": 10369 }, { "epoch": 0.71, "learning_rate": 4.1832061277714945e-06, "loss": 0.7275, "step": 10370 }, { "epoch": 0.71, "learning_rate": 4.181410844420473e-06, "loss": 0.7783, "step": 10371 }, { "epoch": 0.71, "learning_rate": 4.17961584455083e-06, "loss": 0.7568, "step": 10372 }, { "epoch": 0.71, "learning_rate": 4.177821128250017e-06, "loss": 0.7314, "step": 10373 }, { "epoch": 0.71, "learning_rate": 4.176026695605476e-06, "loss": 0.8018, "step": 10374 }, { "epoch": 0.71, "learning_rate": 4.17423254670463e-06, "loss": 0.8145, "step": 10375 }, { "epoch": 0.71, "learning_rate": 4.17243868163489e-06, "loss": 0.7842, "step": 10376 }, { "epoch": 0.71, "learning_rate": 4.170645100483653e-06, "loss": 0.749, "step": 10377 }, { "epoch": 0.71, "learning_rate": 4.168851803338307e-06, "loss": 0.7773, "step": 10378 }, { "epoch": 0.71, "learning_rate": 4.1670587902862125e-06, "loss": 0.707, "step": 10379 }, { "epoch": 0.71, "learning_rate": 4.16526606141473e-06, "loss": 0.7197, "step": 10380 }, { "epoch": 0.71, "learning_rate": 4.1634736168112e-06, "loss": 0.7324, "step": 10381 }, { "epoch": 0.71, "learning_rate": 4.161681456562951e-06, "loss": 0.7109, "step": 10382 }, { "epoch": 0.71, "learning_rate": 4.159889580757296e-06, "loss": 0.7949, "step": 10383 }, { "epoch": 0.71, "learning_rate": 4.15809798948154e-06, "loss": 0.7676, "step": 10384 }, { "epoch": 0.71, "learning_rate": 4.15630668282296e-06, "loss": 0.6963, "step": 10385 }, { "epoch": 0.71, "learning_rate": 4.154515660868835e-06, "loss": 0.6855, "step": 10386 }, { "epoch": 0.71, "learning_rate": 4.152724923706421e-06, "loss": 0.8203, "step": 10387 }, { "epoch": 0.71, "learning_rate": 4.150934471422965e-06, "loss": 0.7617, "step": 10388 }, { "epoch": 0.71, "learning_rate": 4.149144304105696e-06, "loss": 0.7451, "step": 10389 }, { "epoch": 0.71, "learning_rate": 4.1473544218418305e-06, "loss": 0.7627, "step": 10390 }, { "epoch": 0.71, "learning_rate": 4.145564824718576e-06, "loss": 0.7832, "step": 10391 }, { "epoch": 0.71, "learning_rate": 4.143775512823114e-06, "loss": 0.7637, "step": 10392 }, { "epoch": 0.71, "learning_rate": 4.14198648624262e-06, "loss": 0.8008, "step": 10393 }, { "epoch": 0.71, "learning_rate": 4.1401977450642665e-06, "loss": 0.7461, "step": 10394 }, { "epoch": 0.71, "learning_rate": 4.138409289375188e-06, "loss": 0.7646, "step": 10395 }, { "epoch": 0.71, "learning_rate": 4.136621119262524e-06, "loss": 0.7598, "step": 10396 }, { "epoch": 0.71, "learning_rate": 4.134833234813394e-06, "loss": 0.7266, "step": 10397 }, { "epoch": 0.71, "learning_rate": 4.133045636114904e-06, "loss": 0.7139, "step": 10398 }, { "epoch": 0.71, "learning_rate": 4.131258323254139e-06, "loss": 0.7637, "step": 10399 }, { "epoch": 0.71, "learning_rate": 4.12947129631819e-06, "loss": 0.7793, "step": 10400 }, { "epoch": 0.71, "learning_rate": 4.127684555394108e-06, "loss": 0.7471, "step": 10401 }, { "epoch": 0.71, "learning_rate": 4.1258981005689495e-06, "loss": 0.75, "step": 10402 }, { "epoch": 0.71, "learning_rate": 4.124111931929748e-06, "loss": 0.7842, "step": 10403 }, { "epoch": 0.71, "learning_rate": 4.122326049563531e-06, "loss": 0.7891, "step": 10404 }, { "epoch": 0.71, "learning_rate": 4.120540453557294e-06, "loss": 0.7939, "step": 10405 }, { "epoch": 0.71, "learning_rate": 4.1187551439980435e-06, "loss": 0.7559, "step": 10406 }, { "epoch": 0.71, "learning_rate": 4.1169701209727595e-06, "loss": 0.7451, "step": 10407 }, { "epoch": 0.71, "learning_rate": 4.115185384568401e-06, "loss": 0.7646, "step": 10408 }, { "epoch": 0.71, "learning_rate": 4.113400934871923e-06, "loss": 0.7773, "step": 10409 }, { "epoch": 0.71, "learning_rate": 4.111616771970265e-06, "loss": 0.7725, "step": 10410 }, { "epoch": 0.71, "learning_rate": 4.109832895950349e-06, "loss": 0.7559, "step": 10411 }, { "epoch": 0.71, "learning_rate": 4.108049306899089e-06, "loss": 0.7656, "step": 10412 }, { "epoch": 0.71, "learning_rate": 4.106266004903378e-06, "loss": 0.751, "step": 10413 }, { "epoch": 0.71, "learning_rate": 4.104482990050105e-06, "loss": 0.7861, "step": 10414 }, { "epoch": 0.71, "learning_rate": 4.102700262426128e-06, "loss": 0.7939, "step": 10415 }, { "epoch": 0.71, "learning_rate": 4.100917822118308e-06, "loss": 0.749, "step": 10416 }, { "epoch": 0.71, "learning_rate": 4.099135669213483e-06, "loss": 0.8809, "step": 10417 }, { "epoch": 0.71, "learning_rate": 4.097353803798482e-06, "loss": 0.7676, "step": 10418 }, { "epoch": 0.71, "learning_rate": 4.095572225960114e-06, "loss": 0.8262, "step": 10419 }, { "epoch": 0.71, "learning_rate": 4.093790935785184e-06, "loss": 0.8018, "step": 10420 }, { "epoch": 0.71, "learning_rate": 4.092009933360467e-06, "loss": 0.748, "step": 10421 }, { "epoch": 0.71, "learning_rate": 4.090229218772739e-06, "loss": 0.7021, "step": 10422 }, { "epoch": 0.71, "learning_rate": 4.088448792108754e-06, "loss": 0.792, "step": 10423 }, { "epoch": 0.71, "learning_rate": 4.0866686534552555e-06, "loss": 0.8154, "step": 10424 }, { "epoch": 0.71, "learning_rate": 4.084888802898973e-06, "loss": 0.708, "step": 10425 }, { "epoch": 0.71, "learning_rate": 4.083109240526619e-06, "loss": 0.7773, "step": 10426 }, { "epoch": 0.71, "learning_rate": 4.081329966424899e-06, "loss": 0.6846, "step": 10427 }, { "epoch": 0.71, "learning_rate": 4.079550980680489e-06, "loss": 0.7168, "step": 10428 }, { "epoch": 0.71, "learning_rate": 4.077772283380063e-06, "loss": 0.7783, "step": 10429 }, { "epoch": 0.71, "learning_rate": 4.0759938746102915e-06, "loss": 0.7676, "step": 10430 }, { "epoch": 0.71, "learning_rate": 4.0742157544578044e-06, "loss": 0.7637, "step": 10431 }, { "epoch": 0.71, "learning_rate": 4.072437923009237e-06, "loss": 0.7793, "step": 10432 }, { "epoch": 0.71, "learning_rate": 4.070660380351206e-06, "loss": 0.8096, "step": 10433 }, { "epoch": 0.71, "learning_rate": 4.068883126570314e-06, "loss": 0.708, "step": 10434 }, { "epoch": 0.71, "learning_rate": 4.067106161753141e-06, "loss": 0.7646, "step": 10435 }, { "epoch": 0.71, "learning_rate": 4.065329485986273e-06, "loss": 0.8477, "step": 10436 }, { "epoch": 0.71, "learning_rate": 4.06355309935626e-06, "loss": 0.7568, "step": 10437 }, { "epoch": 0.71, "learning_rate": 4.061777001949649e-06, "loss": 0.7373, "step": 10438 }, { "epoch": 0.71, "learning_rate": 4.0600011938529745e-06, "loss": 0.7588, "step": 10439 }, { "epoch": 0.71, "learning_rate": 4.058225675152756e-06, "loss": 0.8037, "step": 10440 }, { "epoch": 0.71, "learning_rate": 4.056450445935485e-06, "loss": 0.752, "step": 10441 }, { "epoch": 0.71, "learning_rate": 4.054675506287662e-06, "loss": 0.708, "step": 10442 }, { "epoch": 0.71, "learning_rate": 4.052900856295761e-06, "loss": 0.752, "step": 10443 }, { "epoch": 0.71, "learning_rate": 4.051126496046238e-06, "loss": 0.8047, "step": 10444 }, { "epoch": 0.71, "learning_rate": 4.049352425625541e-06, "loss": 0.7979, "step": 10445 }, { "epoch": 0.71, "learning_rate": 4.0475786451201046e-06, "loss": 0.7881, "step": 10446 }, { "epoch": 0.71, "learning_rate": 4.045805154616345e-06, "loss": 0.8281, "step": 10447 }, { "epoch": 0.71, "learning_rate": 4.04403195420067e-06, "loss": 0.7891, "step": 10448 }, { "epoch": 0.71, "learning_rate": 4.042259043959466e-06, "loss": 0.7344, "step": 10449 }, { "epoch": 0.71, "learning_rate": 4.040486423979115e-06, "loss": 0.6934, "step": 10450 }, { "epoch": 0.71, "learning_rate": 4.038714094345971e-06, "loss": 0.708, "step": 10451 }, { "epoch": 0.71, "learning_rate": 4.036942055146387e-06, "loss": 0.75, "step": 10452 }, { "epoch": 0.71, "learning_rate": 4.0351703064666935e-06, "loss": 0.7783, "step": 10453 }, { "epoch": 0.71, "learning_rate": 4.033398848393213e-06, "loss": 0.8125, "step": 10454 }, { "epoch": 0.71, "learning_rate": 4.031627681012249e-06, "loss": 0.7305, "step": 10455 }, { "epoch": 0.71, "learning_rate": 4.029856804410096e-06, "loss": 0.8271, "step": 10456 }, { "epoch": 0.71, "learning_rate": 4.028086218673026e-06, "loss": 0.7666, "step": 10457 }, { "epoch": 0.71, "learning_rate": 4.026315923887304e-06, "loss": 0.8633, "step": 10458 }, { "epoch": 0.71, "learning_rate": 4.024545920139179e-06, "loss": 0.8145, "step": 10459 }, { "epoch": 0.71, "learning_rate": 4.022776207514885e-06, "loss": 0.7627, "step": 10460 }, { "epoch": 0.71, "learning_rate": 4.021006786100643e-06, "loss": 0.8008, "step": 10461 }, { "epoch": 0.71, "learning_rate": 4.0192376559826585e-06, "loss": 0.7637, "step": 10462 }, { "epoch": 0.71, "learning_rate": 4.017468817247128e-06, "loss": 0.7295, "step": 10463 }, { "epoch": 0.71, "learning_rate": 4.015700269980221e-06, "loss": 0.7295, "step": 10464 }, { "epoch": 0.71, "learning_rate": 4.0139320142681004e-06, "loss": 0.7646, "step": 10465 }, { "epoch": 0.71, "learning_rate": 4.0121640501969285e-06, "loss": 0.7988, "step": 10466 }, { "epoch": 0.71, "learning_rate": 4.010396377852828e-06, "loss": 0.7959, "step": 10467 }, { "epoch": 0.71, "learning_rate": 4.008628997321924e-06, "loss": 0.7773, "step": 10468 }, { "epoch": 0.71, "learning_rate": 4.006861908690327e-06, "loss": 0.8066, "step": 10469 }, { "epoch": 0.71, "learning_rate": 4.005095112044122e-06, "loss": 0.7178, "step": 10470 }, { "epoch": 0.71, "learning_rate": 4.003328607469387e-06, "loss": 0.7842, "step": 10471 }, { "epoch": 0.71, "learning_rate": 4.001562395052197e-06, "loss": 0.7725, "step": 10472 }, { "epoch": 0.71, "learning_rate": 3.99979647487859e-06, "loss": 0.7695, "step": 10473 }, { "epoch": 0.71, "learning_rate": 3.998030847034607e-06, "loss": 0.7666, "step": 10474 }, { "epoch": 0.71, "learning_rate": 3.996265511606269e-06, "loss": 0.793, "step": 10475 }, { "epoch": 0.71, "learning_rate": 3.994500468679586e-06, "loss": 0.8184, "step": 10476 }, { "epoch": 0.71, "learning_rate": 3.992735718340538e-06, "loss": 0.79, "step": 10477 }, { "epoch": 0.71, "learning_rate": 3.990971260675118e-06, "loss": 0.8174, "step": 10478 }, { "epoch": 0.71, "learning_rate": 3.98920709576929e-06, "loss": 0.751, "step": 10479 }, { "epoch": 0.71, "learning_rate": 3.987443223708994e-06, "loss": 0.7656, "step": 10480 }, { "epoch": 0.71, "learning_rate": 3.98567964458017e-06, "loss": 0.6426, "step": 10481 }, { "epoch": 0.71, "learning_rate": 3.9839163584687425e-06, "loss": 0.75, "step": 10482 }, { "epoch": 0.71, "learning_rate": 3.9821533654606156e-06, "loss": 0.7451, "step": 10483 }, { "epoch": 0.71, "learning_rate": 3.980390665641684e-06, "loss": 0.7256, "step": 10484 }, { "epoch": 0.71, "learning_rate": 3.978628259097825e-06, "loss": 0.7783, "step": 10485 }, { "epoch": 0.71, "learning_rate": 3.976866145914907e-06, "loss": 0.7773, "step": 10486 }, { "epoch": 0.71, "learning_rate": 3.975104326178774e-06, "loss": 0.7715, "step": 10487 }, { "epoch": 0.71, "learning_rate": 3.973342799975262e-06, "loss": 0.8389, "step": 10488 }, { "epoch": 0.71, "learning_rate": 3.971581567390198e-06, "loss": 0.7549, "step": 10489 }, { "epoch": 0.71, "learning_rate": 3.969820628509384e-06, "loss": 0.8203, "step": 10490 }, { "epoch": 0.71, "learning_rate": 3.968059983418616e-06, "loss": 0.7803, "step": 10491 }, { "epoch": 0.72, "learning_rate": 3.966299632203675e-06, "loss": 0.793, "step": 10492 }, { "epoch": 0.72, "learning_rate": 3.964539574950318e-06, "loss": 0.6748, "step": 10493 }, { "epoch": 0.72, "learning_rate": 3.962779811744294e-06, "loss": 0.7295, "step": 10494 }, { "epoch": 0.72, "learning_rate": 3.961020342671351e-06, "loss": 0.7764, "step": 10495 }, { "epoch": 0.72, "learning_rate": 3.9592611678171985e-06, "loss": 0.8037, "step": 10496 }, { "epoch": 0.72, "learning_rate": 3.957502287267548e-06, "loss": 0.7891, "step": 10497 }, { "epoch": 0.72, "learning_rate": 3.955743701108091e-06, "loss": 0.79, "step": 10498 }, { "epoch": 0.72, "learning_rate": 3.95398540942451e-06, "loss": 0.7754, "step": 10499 }, { "epoch": 0.72, "learning_rate": 3.952227412302458e-06, "loss": 0.6484, "step": 10500 }, { "epoch": 0.72, "learning_rate": 3.950469709827594e-06, "loss": 0.7686, "step": 10501 }, { "epoch": 0.72, "learning_rate": 3.948712302085555e-06, "loss": 0.8789, "step": 10502 }, { "epoch": 0.72, "learning_rate": 3.946955189161954e-06, "loss": 0.7246, "step": 10503 }, { "epoch": 0.72, "learning_rate": 3.9451983711424015e-06, "loss": 0.7686, "step": 10504 }, { "epoch": 0.72, "learning_rate": 3.943441848112492e-06, "loss": 0.8369, "step": 10505 }, { "epoch": 0.72, "learning_rate": 3.941685620157794e-06, "loss": 0.8047, "step": 10506 }, { "epoch": 0.72, "learning_rate": 3.939929687363879e-06, "loss": 0.7725, "step": 10507 }, { "epoch": 0.72, "learning_rate": 3.938174049816299e-06, "loss": 0.751, "step": 10508 }, { "epoch": 0.72, "learning_rate": 3.93641870760058e-06, "loss": 0.6621, "step": 10509 }, { "epoch": 0.72, "learning_rate": 3.934663660802246e-06, "loss": 0.7773, "step": 10510 }, { "epoch": 0.72, "learning_rate": 3.932908909506802e-06, "loss": 0.8018, "step": 10511 }, { "epoch": 0.72, "learning_rate": 3.93115445379974e-06, "loss": 0.8457, "step": 10512 }, { "epoch": 0.72, "learning_rate": 3.929400293766538e-06, "loss": 0.7764, "step": 10513 }, { "epoch": 0.72, "learning_rate": 3.927646429492657e-06, "loss": 0.7031, "step": 10514 }, { "epoch": 0.72, "learning_rate": 3.92589286106355e-06, "loss": 0.8535, "step": 10515 }, { "epoch": 0.72, "learning_rate": 3.924139588564642e-06, "loss": 0.6846, "step": 10516 }, { "epoch": 0.72, "learning_rate": 3.922386612081357e-06, "loss": 0.7012, "step": 10517 }, { "epoch": 0.72, "learning_rate": 3.9206339316991e-06, "loss": 0.7246, "step": 10518 }, { "epoch": 0.72, "learning_rate": 3.918881547503263e-06, "loss": 0.7305, "step": 10519 }, { "epoch": 0.72, "learning_rate": 3.9171294595792185e-06, "loss": 0.7578, "step": 10520 }, { "epoch": 0.72, "learning_rate": 3.915377668012334e-06, "loss": 0.8066, "step": 10521 }, { "epoch": 0.72, "learning_rate": 3.9136261728879495e-06, "loss": 0.8154, "step": 10522 }, { "epoch": 0.72, "learning_rate": 3.911874974291402e-06, "loss": 0.6934, "step": 10523 }, { "epoch": 0.72, "learning_rate": 3.910124072308008e-06, "loss": 0.8613, "step": 10524 }, { "epoch": 0.72, "learning_rate": 3.9083734670230725e-06, "loss": 0.7422, "step": 10525 }, { "epoch": 0.72, "learning_rate": 3.906623158521884e-06, "loss": 0.7666, "step": 10526 }, { "epoch": 0.72, "learning_rate": 3.904873146889719e-06, "loss": 0.749, "step": 10527 }, { "epoch": 0.72, "learning_rate": 3.903123432211838e-06, "loss": 0.7471, "step": 10528 }, { "epoch": 0.72, "learning_rate": 3.901374014573485e-06, "loss": 0.8154, "step": 10529 }, { "epoch": 0.72, "learning_rate": 3.899624894059889e-06, "loss": 0.8262, "step": 10530 }, { "epoch": 0.72, "learning_rate": 3.897876070756277e-06, "loss": 0.7939, "step": 10531 }, { "epoch": 0.72, "learning_rate": 3.896127544747842e-06, "loss": 0.8584, "step": 10532 }, { "epoch": 0.72, "learning_rate": 3.894379316119775e-06, "loss": 0.7588, "step": 10533 }, { "epoch": 0.72, "learning_rate": 3.892631384957251e-06, "loss": 0.7314, "step": 10534 }, { "epoch": 0.72, "learning_rate": 3.89088375134543e-06, "loss": 0.7578, "step": 10535 }, { "epoch": 0.72, "learning_rate": 3.889136415369449e-06, "loss": 0.7764, "step": 10536 }, { "epoch": 0.72, "learning_rate": 3.887389377114447e-06, "loss": 0.7598, "step": 10537 }, { "epoch": 0.72, "learning_rate": 3.88564263666554e-06, "loss": 0.751, "step": 10538 }, { "epoch": 0.72, "learning_rate": 3.883896194107821e-06, "loss": 0.792, "step": 10539 }, { "epoch": 0.72, "learning_rate": 3.882150049526383e-06, "loss": 0.7793, "step": 10540 }, { "epoch": 0.72, "learning_rate": 3.880404203006298e-06, "loss": 0.7578, "step": 10541 }, { "epoch": 0.72, "learning_rate": 3.878658654632617e-06, "loss": 0.7334, "step": 10542 }, { "epoch": 0.72, "learning_rate": 3.876913404490389e-06, "loss": 0.7725, "step": 10543 }, { "epoch": 0.72, "learning_rate": 3.875168452664646e-06, "loss": 0.7686, "step": 10544 }, { "epoch": 0.72, "learning_rate": 3.8734237992403935e-06, "loss": 0.7666, "step": 10545 }, { "epoch": 0.72, "learning_rate": 3.871679444302635e-06, "loss": 0.7979, "step": 10546 }, { "epoch": 0.72, "learning_rate": 3.869935387936356e-06, "loss": 0.793, "step": 10547 }, { "epoch": 0.72, "learning_rate": 3.8681916302265246e-06, "loss": 0.8184, "step": 10548 }, { "epoch": 0.72, "learning_rate": 3.866448171258098e-06, "loss": 0.6963, "step": 10549 }, { "epoch": 0.72, "learning_rate": 3.864705011116018e-06, "loss": 0.7666, "step": 10550 }, { "epoch": 0.72, "learning_rate": 3.862962149885213e-06, "loss": 0.8076, "step": 10551 }, { "epoch": 0.72, "learning_rate": 3.8612195876505895e-06, "loss": 0.75, "step": 10552 }, { "epoch": 0.72, "learning_rate": 3.8594773244970495e-06, "loss": 0.6865, "step": 10553 }, { "epoch": 0.72, "learning_rate": 3.857735360509475e-06, "loss": 0.7744, "step": 10554 }, { "epoch": 0.72, "learning_rate": 3.855993695772733e-06, "loss": 0.6973, "step": 10555 }, { "epoch": 0.72, "learning_rate": 3.854252330371678e-06, "loss": 0.7783, "step": 10556 }, { "epoch": 0.72, "learning_rate": 3.852511264391154e-06, "loss": 0.8066, "step": 10557 }, { "epoch": 0.72, "learning_rate": 3.8507704979159785e-06, "loss": 0.8223, "step": 10558 }, { "epoch": 0.72, "learning_rate": 3.849030031030965e-06, "loss": 0.7607, "step": 10559 }, { "epoch": 0.72, "learning_rate": 3.847289863820907e-06, "loss": 0.6865, "step": 10560 }, { "epoch": 0.72, "learning_rate": 3.845549996370587e-06, "loss": 0.7227, "step": 10561 }, { "epoch": 0.72, "learning_rate": 3.843810428764771e-06, "loss": 0.8271, "step": 10562 }, { "epoch": 0.72, "learning_rate": 3.842071161088211e-06, "loss": 0.7178, "step": 10563 }, { "epoch": 0.72, "learning_rate": 3.840332193425647e-06, "loss": 0.8018, "step": 10564 }, { "epoch": 0.72, "learning_rate": 3.838593525861796e-06, "loss": 0.7236, "step": 10565 }, { "epoch": 0.72, "learning_rate": 3.836855158481363e-06, "loss": 0.7354, "step": 10566 }, { "epoch": 0.72, "learning_rate": 3.835117091369054e-06, "loss": 0.8145, "step": 10567 }, { "epoch": 0.72, "learning_rate": 3.8333793246095355e-06, "loss": 0.6895, "step": 10568 }, { "epoch": 0.72, "learning_rate": 3.831641858287474e-06, "loss": 0.7236, "step": 10569 }, { "epoch": 0.72, "learning_rate": 3.8299046924875226e-06, "loss": 0.7109, "step": 10570 }, { "epoch": 0.72, "learning_rate": 3.828167827294317e-06, "loss": 0.6631, "step": 10571 }, { "epoch": 0.72, "learning_rate": 3.8264312627924675e-06, "loss": 0.7197, "step": 10572 }, { "epoch": 0.72, "learning_rate": 3.824694999066587e-06, "loss": 0.7646, "step": 10573 }, { "epoch": 0.72, "learning_rate": 3.82295903620127e-06, "loss": 0.7969, "step": 10574 }, { "epoch": 0.72, "learning_rate": 3.821223374281085e-06, "loss": 0.8359, "step": 10575 }, { "epoch": 0.72, "learning_rate": 3.819488013390594e-06, "loss": 0.8135, "step": 10576 }, { "epoch": 0.72, "learning_rate": 3.81775295361435e-06, "loss": 0.791, "step": 10577 }, { "epoch": 0.72, "learning_rate": 3.8160181950368735e-06, "loss": 0.7705, "step": 10578 }, { "epoch": 0.72, "learning_rate": 3.8142837377426923e-06, "loss": 0.7393, "step": 10579 }, { "epoch": 0.72, "learning_rate": 3.8125495818163095e-06, "loss": 0.7324, "step": 10580 }, { "epoch": 0.72, "learning_rate": 3.810815727342205e-06, "loss": 0.8027, "step": 10581 }, { "epoch": 0.72, "learning_rate": 3.809082174404858e-06, "loss": 0.835, "step": 10582 }, { "epoch": 0.72, "learning_rate": 3.807348923088724e-06, "loss": 0.7725, "step": 10583 }, { "epoch": 0.72, "learning_rate": 3.8056159734782495e-06, "loss": 0.7471, "step": 10584 }, { "epoch": 0.72, "learning_rate": 3.803883325657862e-06, "loss": 0.6973, "step": 10585 }, { "epoch": 0.72, "learning_rate": 3.8021509797119773e-06, "loss": 0.7158, "step": 10586 }, { "epoch": 0.72, "learning_rate": 3.8004189357249978e-06, "loss": 0.8262, "step": 10587 }, { "epoch": 0.72, "learning_rate": 3.798687193781302e-06, "loss": 0.832, "step": 10588 }, { "epoch": 0.72, "learning_rate": 3.7969557539652636e-06, "loss": 0.8203, "step": 10589 }, { "epoch": 0.72, "learning_rate": 3.7952246163612384e-06, "loss": 0.7363, "step": 10590 }, { "epoch": 0.72, "learning_rate": 3.7934937810535676e-06, "loss": 0.7715, "step": 10591 }, { "epoch": 0.72, "learning_rate": 3.7917632481265763e-06, "loss": 0.791, "step": 10592 }, { "epoch": 0.72, "learning_rate": 3.7900330176645816e-06, "loss": 0.8047, "step": 10593 }, { "epoch": 0.72, "learning_rate": 3.7883030897518704e-06, "loss": 0.752, "step": 10594 }, { "epoch": 0.72, "learning_rate": 3.7865734644727305e-06, "loss": 0.79, "step": 10595 }, { "epoch": 0.72, "learning_rate": 3.784844141911429e-06, "loss": 0.8223, "step": 10596 }, { "epoch": 0.72, "learning_rate": 3.7831151221522167e-06, "loss": 0.6982, "step": 10597 }, { "epoch": 0.72, "learning_rate": 3.7813864052793337e-06, "loss": 0.7139, "step": 10598 }, { "epoch": 0.72, "learning_rate": 3.7796579913770006e-06, "loss": 0.7744, "step": 10599 }, { "epoch": 0.72, "learning_rate": 3.7779298805294306e-06, "loss": 0.7246, "step": 10600 }, { "epoch": 0.72, "learning_rate": 3.7762020728208103e-06, "loss": 0.793, "step": 10601 }, { "epoch": 0.72, "learning_rate": 3.774474568335318e-06, "loss": 0.749, "step": 10602 }, { "epoch": 0.72, "learning_rate": 3.772747367157128e-06, "loss": 0.7119, "step": 10603 }, { "epoch": 0.72, "learning_rate": 3.7710204693703787e-06, "loss": 0.7812, "step": 10604 }, { "epoch": 0.72, "learning_rate": 3.769293875059209e-06, "loss": 0.7119, "step": 10605 }, { "epoch": 0.72, "learning_rate": 3.7675675843077375e-06, "loss": 0.6709, "step": 10606 }, { "epoch": 0.72, "learning_rate": 3.7658415972000726e-06, "loss": 0.791, "step": 10607 }, { "epoch": 0.72, "learning_rate": 3.7641159138202944e-06, "loss": 0.7236, "step": 10608 }, { "epoch": 0.72, "learning_rate": 3.7623905342524924e-06, "loss": 0.7881, "step": 10609 }, { "epoch": 0.72, "learning_rate": 3.7606654585807145e-06, "loss": 0.8271, "step": 10610 }, { "epoch": 0.72, "learning_rate": 3.758940686889012e-06, "loss": 0.7617, "step": 10611 }, { "epoch": 0.72, "learning_rate": 3.757216219261415e-06, "loss": 0.8096, "step": 10612 }, { "epoch": 0.72, "learning_rate": 3.7554920557819397e-06, "loss": 0.7637, "step": 10613 }, { "epoch": 0.72, "learning_rate": 3.7537681965345864e-06, "loss": 0.7021, "step": 10614 }, { "epoch": 0.72, "learning_rate": 3.752044641603342e-06, "loss": 0.7305, "step": 10615 }, { "epoch": 0.72, "learning_rate": 3.7503213910721813e-06, "loss": 0.7734, "step": 10616 }, { "epoch": 0.72, "learning_rate": 3.7485984450250533e-06, "loss": 0.6826, "step": 10617 }, { "epoch": 0.72, "learning_rate": 3.7468758035459065e-06, "loss": 0.7627, "step": 10618 }, { "epoch": 0.72, "learning_rate": 3.745153466718664e-06, "loss": 0.6758, "step": 10619 }, { "epoch": 0.72, "learning_rate": 3.7434314346272392e-06, "loss": 0.7129, "step": 10620 }, { "epoch": 0.72, "learning_rate": 3.741709707355531e-06, "loss": 0.749, "step": 10621 }, { "epoch": 0.72, "learning_rate": 3.7399882849874202e-06, "loss": 0.7812, "step": 10622 }, { "epoch": 0.72, "learning_rate": 3.7382671676067783e-06, "loss": 0.8027, "step": 10623 }, { "epoch": 0.72, "learning_rate": 3.7365463552974503e-06, "loss": 0.7773, "step": 10624 }, { "epoch": 0.72, "learning_rate": 3.7348258481432764e-06, "loss": 0.7588, "step": 10625 }, { "epoch": 0.72, "learning_rate": 3.733105646228088e-06, "loss": 0.7393, "step": 10626 }, { "epoch": 0.72, "learning_rate": 3.7313857496356832e-06, "loss": 0.8008, "step": 10627 }, { "epoch": 0.72, "learning_rate": 3.7296661584498595e-06, "loss": 0.7021, "step": 10628 }, { "epoch": 0.72, "learning_rate": 3.7279468727543977e-06, "loss": 0.7607, "step": 10629 }, { "epoch": 0.72, "learning_rate": 3.7262278926330554e-06, "loss": 0.8076, "step": 10630 }, { "epoch": 0.72, "learning_rate": 3.7245092181695797e-06, "loss": 0.7305, "step": 10631 }, { "epoch": 0.72, "learning_rate": 3.7227908494477174e-06, "loss": 0.7705, "step": 10632 }, { "epoch": 0.72, "learning_rate": 3.721072786551174e-06, "loss": 0.7822, "step": 10633 }, { "epoch": 0.72, "learning_rate": 3.7193550295636582e-06, "loss": 0.7969, "step": 10634 }, { "epoch": 0.72, "learning_rate": 3.71763757856886e-06, "loss": 0.7559, "step": 10635 }, { "epoch": 0.72, "learning_rate": 3.715920433650455e-06, "loss": 0.7539, "step": 10636 }, { "epoch": 0.72, "learning_rate": 3.714203594892094e-06, "loss": 0.793, "step": 10637 }, { "epoch": 0.72, "learning_rate": 3.712487062377431e-06, "loss": 0.7598, "step": 10638 }, { "epoch": 0.73, "learning_rate": 3.710770836190095e-06, "loss": 0.8184, "step": 10639 }, { "epoch": 0.73, "learning_rate": 3.7090549164136936e-06, "loss": 0.7471, "step": 10640 }, { "epoch": 0.73, "learning_rate": 3.7073393031318293e-06, "loss": 0.7988, "step": 10641 }, { "epoch": 0.73, "learning_rate": 3.7056239964280904e-06, "loss": 0.7705, "step": 10642 }, { "epoch": 0.73, "learning_rate": 3.7039089963860376e-06, "loss": 0.708, "step": 10643 }, { "epoch": 0.73, "learning_rate": 3.702194303089235e-06, "loss": 0.667, "step": 10644 }, { "epoch": 0.73, "learning_rate": 3.700479916621221e-06, "loss": 0.7373, "step": 10645 }, { "epoch": 0.73, "learning_rate": 3.6987658370655164e-06, "loss": 0.7373, "step": 10646 }, { "epoch": 0.73, "learning_rate": 3.697052064505632e-06, "loss": 0.6904, "step": 10647 }, { "epoch": 0.73, "learning_rate": 3.6953385990250632e-06, "loss": 0.749, "step": 10648 }, { "epoch": 0.73, "learning_rate": 3.693625440707291e-06, "loss": 0.792, "step": 10649 }, { "epoch": 0.73, "learning_rate": 3.6919125896357812e-06, "loss": 0.7793, "step": 10650 }, { "epoch": 0.73, "learning_rate": 3.69020004589398e-06, "loss": 0.8203, "step": 10651 }, { "epoch": 0.73, "learning_rate": 3.6884878095653298e-06, "loss": 0.6621, "step": 10652 }, { "epoch": 0.73, "learning_rate": 3.6867758807332423e-06, "loss": 0.7969, "step": 10653 }, { "epoch": 0.73, "learning_rate": 3.6850642594811246e-06, "loss": 0.8145, "step": 10654 }, { "epoch": 0.73, "learning_rate": 3.6833529458923687e-06, "loss": 0.7598, "step": 10655 }, { "epoch": 0.73, "learning_rate": 3.68164194005035e-06, "loss": 0.7979, "step": 10656 }, { "epoch": 0.73, "learning_rate": 3.679931242038428e-06, "loss": 0.7295, "step": 10657 }, { "epoch": 0.73, "learning_rate": 3.6782208519399475e-06, "loss": 0.7295, "step": 10658 }, { "epoch": 0.73, "learning_rate": 3.676510769838242e-06, "loss": 0.8398, "step": 10659 }, { "epoch": 0.73, "learning_rate": 3.6748009958166197e-06, "loss": 0.8496, "step": 10660 }, { "epoch": 0.73, "learning_rate": 3.673091529958385e-06, "loss": 0.7822, "step": 10661 }, { "epoch": 0.73, "learning_rate": 3.671382372346821e-06, "loss": 0.7832, "step": 10662 }, { "epoch": 0.73, "learning_rate": 3.6696735230652003e-06, "loss": 0.8057, "step": 10663 }, { "epoch": 0.73, "learning_rate": 3.6679649821967777e-06, "loss": 0.7676, "step": 10664 }, { "epoch": 0.73, "learning_rate": 3.6662567498247946e-06, "loss": 0.749, "step": 10665 }, { "epoch": 0.73, "learning_rate": 3.6645488260324703e-06, "loss": 0.7871, "step": 10666 }, { "epoch": 0.73, "learning_rate": 3.6628412109030156e-06, "loss": 0.7666, "step": 10667 }, { "epoch": 0.73, "learning_rate": 3.661133904519635e-06, "loss": 0.8135, "step": 10668 }, { "epoch": 0.73, "learning_rate": 3.6594269069654965e-06, "loss": 0.7627, "step": 10669 }, { "epoch": 0.73, "learning_rate": 3.6577202183237716e-06, "loss": 0.7783, "step": 10670 }, { "epoch": 0.73, "learning_rate": 3.656013838677608e-06, "loss": 0.7861, "step": 10671 }, { "epoch": 0.73, "learning_rate": 3.6543077681101436e-06, "loss": 0.7065, "step": 10672 }, { "epoch": 0.73, "learning_rate": 3.6526020067044886e-06, "loss": 0.7891, "step": 10673 }, { "epoch": 0.73, "learning_rate": 3.650896554543758e-06, "loss": 0.6934, "step": 10674 }, { "epoch": 0.73, "learning_rate": 3.6491914117110405e-06, "loss": 0.7998, "step": 10675 }, { "epoch": 0.73, "learning_rate": 3.647486578289404e-06, "loss": 0.8105, "step": 10676 }, { "epoch": 0.73, "learning_rate": 3.645782054361913e-06, "loss": 0.7578, "step": 10677 }, { "epoch": 0.73, "learning_rate": 3.644077840011613e-06, "loss": 0.7363, "step": 10678 }, { "epoch": 0.73, "learning_rate": 3.6423739353215236e-06, "loss": 0.7549, "step": 10679 }, { "epoch": 0.73, "learning_rate": 3.6406703403746703e-06, "loss": 0.8223, "step": 10680 }, { "epoch": 0.73, "learning_rate": 3.6389670552540513e-06, "loss": 0.7139, "step": 10681 }, { "epoch": 0.73, "learning_rate": 3.637264080042643e-06, "loss": 0.7363, "step": 10682 }, { "epoch": 0.73, "learning_rate": 3.6355614148234185e-06, "loss": 0.8057, "step": 10683 }, { "epoch": 0.73, "learning_rate": 3.633859059679332e-06, "loss": 0.7197, "step": 10684 }, { "epoch": 0.73, "learning_rate": 3.6321570146933217e-06, "loss": 0.7539, "step": 10685 }, { "epoch": 0.73, "learning_rate": 3.6304552799483104e-06, "loss": 0.7246, "step": 10686 }, { "epoch": 0.73, "learning_rate": 3.6287538555272084e-06, "loss": 0.7881, "step": 10687 }, { "epoch": 0.73, "learning_rate": 3.6270527415129097e-06, "loss": 0.8037, "step": 10688 }, { "epoch": 0.73, "learning_rate": 3.6253519379882885e-06, "loss": 0.7949, "step": 10689 }, { "epoch": 0.73, "learning_rate": 3.623651445036209e-06, "loss": 0.7695, "step": 10690 }, { "epoch": 0.73, "learning_rate": 3.6219512627395214e-06, "loss": 0.7988, "step": 10691 }, { "epoch": 0.73, "learning_rate": 3.6202513911810565e-06, "loss": 0.7383, "step": 10692 }, { "epoch": 0.73, "learning_rate": 3.618551830443633e-06, "loss": 0.7695, "step": 10693 }, { "epoch": 0.73, "learning_rate": 3.6168525806100517e-06, "loss": 0.7363, "step": 10694 }, { "epoch": 0.73, "learning_rate": 3.615153641763106e-06, "loss": 0.79, "step": 10695 }, { "epoch": 0.73, "learning_rate": 3.6134550139855605e-06, "loss": 0.7725, "step": 10696 }, { "epoch": 0.73, "learning_rate": 3.6117566973601747e-06, "loss": 0.7363, "step": 10697 }, { "epoch": 0.73, "learning_rate": 3.610058691969691e-06, "loss": 0.7773, "step": 10698 }, { "epoch": 0.73, "learning_rate": 3.608360997896837e-06, "loss": 0.7266, "step": 10699 }, { "epoch": 0.73, "learning_rate": 3.6066636152243227e-06, "loss": 0.6787, "step": 10700 }, { "epoch": 0.73, "learning_rate": 3.604966544034849e-06, "loss": 0.7139, "step": 10701 }, { "epoch": 0.73, "learning_rate": 3.6032697844110896e-06, "loss": 0.6826, "step": 10702 }, { "epoch": 0.73, "learning_rate": 3.601573336435712e-06, "loss": 0.7373, "step": 10703 }, { "epoch": 0.73, "learning_rate": 3.599877200191375e-06, "loss": 0.7656, "step": 10704 }, { "epoch": 0.73, "learning_rate": 3.5981813757607055e-06, "loss": 0.7646, "step": 10705 }, { "epoch": 0.73, "learning_rate": 3.596485863226328e-06, "loss": 0.8008, "step": 10706 }, { "epoch": 0.73, "learning_rate": 3.5947906626708464e-06, "loss": 0.8008, "step": 10707 }, { "epoch": 0.73, "learning_rate": 3.5930957741768546e-06, "loss": 0.7549, "step": 10708 }, { "epoch": 0.73, "learning_rate": 3.591401197826917e-06, "loss": 0.8555, "step": 10709 }, { "epoch": 0.73, "learning_rate": 3.589706933703605e-06, "loss": 0.7549, "step": 10710 }, { "epoch": 0.73, "learning_rate": 3.5880129818894614e-06, "loss": 0.7686, "step": 10711 }, { "epoch": 0.73, "learning_rate": 3.5863193424670094e-06, "loss": 0.7373, "step": 10712 }, { "epoch": 0.73, "learning_rate": 3.584626015518766e-06, "loss": 0.7979, "step": 10713 }, { "epoch": 0.73, "learning_rate": 3.5829330011272347e-06, "loss": 0.8477, "step": 10714 }, { "epoch": 0.73, "learning_rate": 3.581240299374886e-06, "loss": 0.833, "step": 10715 }, { "epoch": 0.73, "learning_rate": 3.579547910344202e-06, "loss": 0.7207, "step": 10716 }, { "epoch": 0.73, "learning_rate": 3.5778558341176327e-06, "loss": 0.6704, "step": 10717 }, { "epoch": 0.73, "learning_rate": 3.5761640707776115e-06, "loss": 0.7461, "step": 10718 }, { "epoch": 0.73, "learning_rate": 3.574472620406564e-06, "loss": 0.8486, "step": 10719 }, { "epoch": 0.73, "learning_rate": 3.5727814830868956e-06, "loss": 0.7939, "step": 10720 }, { "epoch": 0.73, "learning_rate": 3.571090658901001e-06, "loss": 0.6963, "step": 10721 }, { "epoch": 0.73, "learning_rate": 3.569400147931256e-06, "loss": 0.8662, "step": 10722 }, { "epoch": 0.73, "learning_rate": 3.567709950260021e-06, "loss": 0.7334, "step": 10723 }, { "epoch": 0.73, "learning_rate": 3.5660200659696487e-06, "loss": 0.8027, "step": 10724 }, { "epoch": 0.73, "learning_rate": 3.5643304951424605e-06, "loss": 0.7695, "step": 10725 }, { "epoch": 0.73, "learning_rate": 3.5626412378607765e-06, "loss": 0.7744, "step": 10726 }, { "epoch": 0.73, "learning_rate": 3.5609522942068986e-06, "loss": 0.6963, "step": 10727 }, { "epoch": 0.73, "learning_rate": 3.5592636642631095e-06, "loss": 0.8008, "step": 10728 }, { "epoch": 0.73, "learning_rate": 3.5575753481116813e-06, "loss": 0.7529, "step": 10729 }, { "epoch": 0.73, "learning_rate": 3.555887345834872e-06, "loss": 0.7021, "step": 10730 }, { "epoch": 0.73, "learning_rate": 3.5541996575149127e-06, "loss": 0.7002, "step": 10731 }, { "epoch": 0.73, "learning_rate": 3.5525122832340285e-06, "loss": 0.7939, "step": 10732 }, { "epoch": 0.73, "learning_rate": 3.5508252230744378e-06, "loss": 0.6875, "step": 10733 }, { "epoch": 0.73, "learning_rate": 3.5491384771183256e-06, "loss": 0.7383, "step": 10734 }, { "epoch": 0.73, "learning_rate": 3.547452045447871e-06, "loss": 0.75, "step": 10735 }, { "epoch": 0.73, "learning_rate": 3.5457659281452383e-06, "loss": 0.7441, "step": 10736 }, { "epoch": 0.73, "learning_rate": 3.544080125292578e-06, "loss": 0.7539, "step": 10737 }, { "epoch": 0.73, "learning_rate": 3.542394636972013e-06, "loss": 0.7441, "step": 10738 }, { "epoch": 0.73, "learning_rate": 3.54070946326567e-06, "loss": 0.75, "step": 10739 }, { "epoch": 0.73, "learning_rate": 3.5390246042556496e-06, "loss": 0.7637, "step": 10740 }, { "epoch": 0.73, "learning_rate": 3.5373400600240325e-06, "loss": 0.7803, "step": 10741 }, { "epoch": 0.73, "learning_rate": 3.5356558306528934e-06, "loss": 0.8457, "step": 10742 }, { "epoch": 0.73, "learning_rate": 3.5339719162242847e-06, "loss": 0.6826, "step": 10743 }, { "epoch": 0.73, "learning_rate": 3.5322883168202506e-06, "loss": 0.7451, "step": 10744 }, { "epoch": 0.73, "learning_rate": 3.5306050325228135e-06, "loss": 0.7012, "step": 10745 }, { "epoch": 0.73, "learning_rate": 3.5289220634139843e-06, "loss": 0.8223, "step": 10746 }, { "epoch": 0.73, "learning_rate": 3.52723940957576e-06, "loss": 0.7744, "step": 10747 }, { "epoch": 0.73, "learning_rate": 3.525557071090112e-06, "loss": 0.7197, "step": 10748 }, { "epoch": 0.73, "learning_rate": 3.5238750480390084e-06, "loss": 0.6943, "step": 10749 }, { "epoch": 0.73, "learning_rate": 3.522193340504396e-06, "loss": 0.6729, "step": 10750 }, { "epoch": 0.73, "learning_rate": 3.5205119485682093e-06, "loss": 0.835, "step": 10751 }, { "epoch": 0.73, "learning_rate": 3.518830872312363e-06, "loss": 0.8369, "step": 10752 }, { "epoch": 0.73, "learning_rate": 3.5171501118187644e-06, "loss": 0.7334, "step": 10753 }, { "epoch": 0.73, "learning_rate": 3.5154696671692933e-06, "loss": 0.6904, "step": 10754 }, { "epoch": 0.73, "learning_rate": 3.5137895384458244e-06, "loss": 0.7383, "step": 10755 }, { "epoch": 0.73, "learning_rate": 3.5121097257302117e-06, "loss": 0.7686, "step": 10756 }, { "epoch": 0.73, "learning_rate": 3.510430229104297e-06, "loss": 0.8027, "step": 10757 }, { "epoch": 0.73, "learning_rate": 3.5087510486499056e-06, "loss": 0.7812, "step": 10758 }, { "epoch": 0.73, "learning_rate": 3.5070721844488455e-06, "loss": 0.7549, "step": 10759 }, { "epoch": 0.73, "learning_rate": 3.5053936365829155e-06, "loss": 0.7197, "step": 10760 }, { "epoch": 0.73, "learning_rate": 3.5037154051338883e-06, "loss": 0.7285, "step": 10761 }, { "epoch": 0.73, "learning_rate": 3.502037490183526e-06, "loss": 0.7979, "step": 10762 }, { "epoch": 0.73, "learning_rate": 3.5003598918135873e-06, "loss": 0.6553, "step": 10763 }, { "epoch": 0.73, "learning_rate": 3.4986826101057934e-06, "loss": 0.8164, "step": 10764 }, { "epoch": 0.73, "learning_rate": 3.4970056451418668e-06, "loss": 0.7871, "step": 10765 }, { "epoch": 0.73, "learning_rate": 3.495328997003511e-06, "loss": 0.8096, "step": 10766 }, { "epoch": 0.73, "learning_rate": 3.4936526657724058e-06, "loss": 0.7998, "step": 10767 }, { "epoch": 0.73, "learning_rate": 3.491976651530222e-06, "loss": 0.7998, "step": 10768 }, { "epoch": 0.73, "learning_rate": 3.4903009543586254e-06, "loss": 0.7471, "step": 10769 }, { "epoch": 0.73, "learning_rate": 3.488625574339245e-06, "loss": 0.7266, "step": 10770 }, { "epoch": 0.73, "learning_rate": 3.4869505115537096e-06, "loss": 0.7158, "step": 10771 }, { "epoch": 0.73, "learning_rate": 3.4852757660836266e-06, "loss": 0.7666, "step": 10772 }, { "epoch": 0.73, "learning_rate": 3.4836013380105947e-06, "loss": 0.748, "step": 10773 }, { "epoch": 0.73, "learning_rate": 3.481927227416182e-06, "loss": 0.7627, "step": 10774 }, { "epoch": 0.73, "learning_rate": 3.4802534343819583e-06, "loss": 0.7373, "step": 10775 }, { "epoch": 0.73, "learning_rate": 3.478579958989474e-06, "loss": 0.7119, "step": 10776 }, { "epoch": 0.73, "learning_rate": 3.4769068013202523e-06, "loss": 0.7324, "step": 10777 }, { "epoch": 0.73, "learning_rate": 3.475233961455814e-06, "loss": 0.7939, "step": 10778 }, { "epoch": 0.73, "learning_rate": 3.4735614394776585e-06, "loss": 0.7617, "step": 10779 }, { "epoch": 0.73, "learning_rate": 3.4718892354672706e-06, "loss": 0.833, "step": 10780 }, { "epoch": 0.73, "learning_rate": 3.470217349506121e-06, "loss": 0.8262, "step": 10781 }, { "epoch": 0.73, "learning_rate": 3.4685457816756675e-06, "loss": 0.7422, "step": 10782 }, { "epoch": 0.73, "learning_rate": 3.4668745320573417e-06, "loss": 0.7979, "step": 10783 }, { "epoch": 0.73, "learning_rate": 3.4652036007325694e-06, "loss": 0.8047, "step": 10784 }, { "epoch": 0.73, "learning_rate": 3.463532987782761e-06, "loss": 0.7686, "step": 10785 }, { "epoch": 0.74, "learning_rate": 3.461862693289304e-06, "loss": 0.7969, "step": 10786 }, { "epoch": 0.74, "learning_rate": 3.460192717333579e-06, "loss": 0.8623, "step": 10787 }, { "epoch": 0.74, "learning_rate": 3.4585230599969467e-06, "loss": 0.791, "step": 10788 }, { "epoch": 0.74, "learning_rate": 3.4568537213607535e-06, "loss": 0.8076, "step": 10789 }, { "epoch": 0.74, "learning_rate": 3.4551847015063257e-06, "loss": 0.7119, "step": 10790 }, { "epoch": 0.74, "learning_rate": 3.453516000514979e-06, "loss": 0.749, "step": 10791 }, { "epoch": 0.74, "learning_rate": 3.451847618468015e-06, "loss": 0.79, "step": 10792 }, { "epoch": 0.74, "learning_rate": 3.4501795554467155e-06, "loss": 0.7764, "step": 10793 }, { "epoch": 0.74, "learning_rate": 3.4485118115323478e-06, "loss": 0.7979, "step": 10794 }, { "epoch": 0.74, "learning_rate": 3.4468443868061653e-06, "loss": 0.8105, "step": 10795 }, { "epoch": 0.74, "learning_rate": 3.445177281349409e-06, "loss": 0.7109, "step": 10796 }, { "epoch": 0.74, "learning_rate": 3.4435104952432905e-06, "loss": 0.7715, "step": 10797 }, { "epoch": 0.74, "learning_rate": 3.4418440285690192e-06, "loss": 0.8203, "step": 10798 }, { "epoch": 0.74, "learning_rate": 3.4401778814077937e-06, "loss": 0.8027, "step": 10799 }, { "epoch": 0.74, "learning_rate": 3.438512053840778e-06, "loss": 0.7412, "step": 10800 }, { "epoch": 0.74, "learning_rate": 3.436846545949135e-06, "loss": 0.793, "step": 10801 }, { "epoch": 0.74, "learning_rate": 3.4351813578140124e-06, "loss": 0.7773, "step": 10802 }, { "epoch": 0.74, "learning_rate": 3.4335164895165307e-06, "loss": 0.7471, "step": 10803 }, { "epoch": 0.74, "learning_rate": 3.4318519411378006e-06, "loss": 0.7871, "step": 10804 }, { "epoch": 0.74, "learning_rate": 3.430187712758931e-06, "loss": 0.8535, "step": 10805 }, { "epoch": 0.74, "learning_rate": 3.4285238044609924e-06, "loss": 0.8018, "step": 10806 }, { "epoch": 0.74, "learning_rate": 3.4268602163250543e-06, "loss": 0.7588, "step": 10807 }, { "epoch": 0.74, "learning_rate": 3.4251969484321645e-06, "loss": 0.7402, "step": 10808 }, { "epoch": 0.74, "learning_rate": 3.4235340008633633e-06, "loss": 0.7842, "step": 10809 }, { "epoch": 0.74, "learning_rate": 3.4218713736996577e-06, "loss": 0.71, "step": 10810 }, { "epoch": 0.74, "learning_rate": 3.4202090670220612e-06, "loss": 0.8311, "step": 10811 }, { "epoch": 0.74, "learning_rate": 3.4185470809115617e-06, "loss": 0.8066, "step": 10812 }, { "epoch": 0.74, "learning_rate": 3.416885415449124e-06, "loss": 0.8359, "step": 10813 }, { "epoch": 0.74, "learning_rate": 3.415224070715707e-06, "loss": 0.8242, "step": 10814 }, { "epoch": 0.74, "learning_rate": 3.4135630467922564e-06, "loss": 0.7373, "step": 10815 }, { "epoch": 0.74, "learning_rate": 3.4119023437596865e-06, "loss": 0.7637, "step": 10816 }, { "epoch": 0.74, "learning_rate": 3.4102419616989157e-06, "loss": 0.8076, "step": 10817 }, { "epoch": 0.74, "learning_rate": 3.4085819006908395e-06, "loss": 0.7441, "step": 10818 }, { "epoch": 0.74, "learning_rate": 3.406922160816327e-06, "loss": 0.7891, "step": 10819 }, { "epoch": 0.74, "learning_rate": 3.4052627421562466e-06, "loss": 0.749, "step": 10820 }, { "epoch": 0.74, "learning_rate": 3.4036036447914434e-06, "loss": 0.7432, "step": 10821 }, { "epoch": 0.74, "learning_rate": 3.401944868802749e-06, "loss": 0.6875, "step": 10822 }, { "epoch": 0.74, "learning_rate": 3.400286414270978e-06, "loss": 0.6885, "step": 10823 }, { "epoch": 0.74, "learning_rate": 3.3986282812769323e-06, "loss": 0.6758, "step": 10824 }, { "epoch": 0.74, "learning_rate": 3.3969704699013974e-06, "loss": 0.7637, "step": 10825 }, { "epoch": 0.74, "learning_rate": 3.395312980225135e-06, "loss": 0.7988, "step": 10826 }, { "epoch": 0.74, "learning_rate": 3.3936558123289033e-06, "loss": 0.8066, "step": 10827 }, { "epoch": 0.74, "learning_rate": 3.391998966293438e-06, "loss": 0.7607, "step": 10828 }, { "epoch": 0.74, "learning_rate": 3.3903424421994614e-06, "loss": 0.7197, "step": 10829 }, { "epoch": 0.74, "learning_rate": 3.388686240127678e-06, "loss": 0.791, "step": 10830 }, { "epoch": 0.74, "learning_rate": 3.3870303601587784e-06, "loss": 0.7051, "step": 10831 }, { "epoch": 0.74, "learning_rate": 3.3853748023734413e-06, "loss": 0.7207, "step": 10832 }, { "epoch": 0.74, "learning_rate": 3.383719566852317e-06, "loss": 0.79, "step": 10833 }, { "epoch": 0.74, "learning_rate": 3.3820646536760502e-06, "loss": 0.8359, "step": 10834 }, { "epoch": 0.74, "learning_rate": 3.380410062925277e-06, "loss": 0.6543, "step": 10835 }, { "epoch": 0.74, "learning_rate": 3.378755794680599e-06, "loss": 0.7119, "step": 10836 }, { "epoch": 0.74, "learning_rate": 3.377101849022616e-06, "loss": 0.7754, "step": 10837 }, { "epoch": 0.74, "learning_rate": 3.375448226031912e-06, "loss": 0.6895, "step": 10838 }, { "epoch": 0.74, "learning_rate": 3.3737949257890433e-06, "loss": 0.7363, "step": 10839 }, { "epoch": 0.74, "learning_rate": 3.37214194837456e-06, "loss": 0.6904, "step": 10840 }, { "epoch": 0.74, "learning_rate": 3.370489293869004e-06, "loss": 0.6924, "step": 10841 }, { "epoch": 0.74, "learning_rate": 3.3688369623528827e-06, "loss": 0.7979, "step": 10842 }, { "epoch": 0.74, "learning_rate": 3.3671849539067014e-06, "loss": 0.7725, "step": 10843 }, { "epoch": 0.74, "learning_rate": 3.3655332686109456e-06, "loss": 0.7617, "step": 10844 }, { "epoch": 0.74, "learning_rate": 3.3638819065460892e-06, "loss": 0.7949, "step": 10845 }, { "epoch": 0.74, "learning_rate": 3.362230867792575e-06, "loss": 0.7744, "step": 10846 }, { "epoch": 0.74, "learning_rate": 3.3605801524308535e-06, "loss": 0.7285, "step": 10847 }, { "epoch": 0.74, "learning_rate": 3.358929760541346e-06, "loss": 0.8066, "step": 10848 }, { "epoch": 0.74, "learning_rate": 3.357279692204454e-06, "loss": 0.7754, "step": 10849 }, { "epoch": 0.74, "learning_rate": 3.3556299475005715e-06, "loss": 0.7793, "step": 10850 }, { "epoch": 0.74, "learning_rate": 3.3539805265100734e-06, "loss": 0.7598, "step": 10851 }, { "epoch": 0.74, "learning_rate": 3.35233142931332e-06, "loss": 0.7168, "step": 10852 }, { "epoch": 0.74, "learning_rate": 3.3506826559906557e-06, "loss": 0.8174, "step": 10853 }, { "epoch": 0.74, "learning_rate": 3.3490342066224102e-06, "loss": 0.7354, "step": 10854 }, { "epoch": 0.74, "learning_rate": 3.3473860812888913e-06, "loss": 0.7041, "step": 10855 }, { "epoch": 0.74, "learning_rate": 3.3457382800703986e-06, "loss": 0.7471, "step": 10856 }, { "epoch": 0.74, "learning_rate": 3.344090803047212e-06, "loss": 0.7998, "step": 10857 }, { "epoch": 0.74, "learning_rate": 3.3424436502995974e-06, "loss": 0.7158, "step": 10858 }, { "epoch": 0.74, "learning_rate": 3.3407968219078025e-06, "loss": 0.7715, "step": 10859 }, { "epoch": 0.74, "learning_rate": 3.3391503179520623e-06, "loss": 0.7686, "step": 10860 }, { "epoch": 0.74, "learning_rate": 3.337504138512596e-06, "loss": 0.7832, "step": 10861 }, { "epoch": 0.74, "learning_rate": 3.335858283669601e-06, "loss": 0.7764, "step": 10862 }, { "epoch": 0.74, "learning_rate": 3.334212753503262e-06, "loss": 0.7324, "step": 10863 }, { "epoch": 0.74, "learning_rate": 3.332567548093759e-06, "loss": 0.6885, "step": 10864 }, { "epoch": 0.74, "learning_rate": 3.330922667521237e-06, "loss": 0.71, "step": 10865 }, { "epoch": 0.74, "learning_rate": 3.329278111865837e-06, "loss": 0.793, "step": 10866 }, { "epoch": 0.74, "learning_rate": 3.3276338812076824e-06, "loss": 0.8066, "step": 10867 }, { "epoch": 0.74, "learning_rate": 3.325989975626882e-06, "loss": 0.7637, "step": 10868 }, { "epoch": 0.74, "learning_rate": 3.3243463952035195e-06, "loss": 0.7305, "step": 10869 }, { "epoch": 0.74, "learning_rate": 3.32270314001768e-06, "loss": 0.8262, "step": 10870 }, { "epoch": 0.74, "learning_rate": 3.321060210149416e-06, "loss": 0.7734, "step": 10871 }, { "epoch": 0.74, "learning_rate": 3.3194176056787717e-06, "loss": 0.7285, "step": 10872 }, { "epoch": 0.74, "learning_rate": 3.3177753266857772e-06, "loss": 0.752, "step": 10873 }, { "epoch": 0.74, "learning_rate": 3.3161333732504453e-06, "loss": 0.7969, "step": 10874 }, { "epoch": 0.74, "learning_rate": 3.3144917454527626e-06, "loss": 0.7334, "step": 10875 }, { "epoch": 0.74, "learning_rate": 3.3128504433727203e-06, "loss": 0.7529, "step": 10876 }, { "epoch": 0.74, "learning_rate": 3.3112094670902805e-06, "loss": 0.7715, "step": 10877 }, { "epoch": 0.74, "learning_rate": 3.309568816685387e-06, "loss": 0.7314, "step": 10878 }, { "epoch": 0.74, "learning_rate": 3.307928492237974e-06, "loss": 0.7275, "step": 10879 }, { "epoch": 0.74, "learning_rate": 3.3062884938279583e-06, "loss": 0.8242, "step": 10880 }, { "epoch": 0.74, "learning_rate": 3.3046488215352414e-06, "loss": 0.7764, "step": 10881 }, { "epoch": 0.74, "learning_rate": 3.303009475439707e-06, "loss": 0.748, "step": 10882 }, { "epoch": 0.74, "learning_rate": 3.3013704556212245e-06, "loss": 0.7012, "step": 10883 }, { "epoch": 0.74, "learning_rate": 3.29973176215965e-06, "loss": 0.709, "step": 10884 }, { "epoch": 0.74, "learning_rate": 3.298093395134814e-06, "loss": 0.7285, "step": 10885 }, { "epoch": 0.74, "learning_rate": 3.296455354626541e-06, "loss": 0.7949, "step": 10886 }, { "epoch": 0.74, "learning_rate": 3.294817640714636e-06, "loss": 0.7178, "step": 10887 }, { "epoch": 0.74, "learning_rate": 3.293180253478888e-06, "loss": 0.7422, "step": 10888 }, { "epoch": 0.74, "learning_rate": 3.2915431929990717e-06, "loss": 0.7334, "step": 10889 }, { "epoch": 0.74, "learning_rate": 3.2899064593549477e-06, "loss": 0.8301, "step": 10890 }, { "epoch": 0.74, "learning_rate": 3.28827005262625e-06, "loss": 0.7705, "step": 10891 }, { "epoch": 0.74, "learning_rate": 3.2866339728927075e-06, "loss": 0.7422, "step": 10892 }, { "epoch": 0.74, "learning_rate": 3.284998220234031e-06, "loss": 0.7275, "step": 10893 }, { "epoch": 0.74, "learning_rate": 3.283362794729913e-06, "loss": 0.7734, "step": 10894 }, { "epoch": 0.74, "learning_rate": 3.2817276964600333e-06, "loss": 0.7822, "step": 10895 }, { "epoch": 0.74, "learning_rate": 3.2800929255040513e-06, "loss": 0.7598, "step": 10896 }, { "epoch": 0.74, "learning_rate": 3.2784584819416187e-06, "loss": 0.7686, "step": 10897 }, { "epoch": 0.74, "learning_rate": 3.276824365852358e-06, "loss": 0.7754, "step": 10898 }, { "epoch": 0.74, "learning_rate": 3.275190577315882e-06, "loss": 0.7979, "step": 10899 }, { "epoch": 0.74, "learning_rate": 3.2735571164117996e-06, "loss": 0.7959, "step": 10900 }, { "epoch": 0.74, "learning_rate": 3.2719239832196837e-06, "loss": 0.791, "step": 10901 }, { "epoch": 0.74, "learning_rate": 3.2702911778191036e-06, "loss": 0.7285, "step": 10902 }, { "epoch": 0.74, "learning_rate": 3.268658700289612e-06, "loss": 0.7461, "step": 10903 }, { "epoch": 0.74, "learning_rate": 3.2670265507107366e-06, "loss": 0.7598, "step": 10904 }, { "epoch": 0.74, "learning_rate": 3.265394729161997e-06, "loss": 0.6846, "step": 10905 }, { "epoch": 0.74, "learning_rate": 3.2637632357229034e-06, "loss": 0.7568, "step": 10906 }, { "epoch": 0.74, "learning_rate": 3.262132070472933e-06, "loss": 0.7246, "step": 10907 }, { "epoch": 0.74, "learning_rate": 3.260501233491561e-06, "loss": 0.7725, "step": 10908 }, { "epoch": 0.74, "learning_rate": 3.2588707248582387e-06, "loss": 0.7891, "step": 10909 }, { "epoch": 0.74, "learning_rate": 3.2572405446524102e-06, "loss": 0.7197, "step": 10910 }, { "epoch": 0.74, "learning_rate": 3.255610692953486e-06, "loss": 0.8291, "step": 10911 }, { "epoch": 0.74, "learning_rate": 3.253981169840884e-06, "loss": 0.709, "step": 10912 }, { "epoch": 0.74, "learning_rate": 3.2523519753939935e-06, "loss": 0.7861, "step": 10913 }, { "epoch": 0.74, "learning_rate": 3.2507231096921834e-06, "loss": 0.7285, "step": 10914 }, { "epoch": 0.74, "learning_rate": 3.249094572814813e-06, "loss": 0.7637, "step": 10915 }, { "epoch": 0.74, "learning_rate": 3.247466364841225e-06, "loss": 0.8398, "step": 10916 }, { "epoch": 0.74, "learning_rate": 3.2458384858507485e-06, "loss": 0.8086, "step": 10917 }, { "epoch": 0.74, "learning_rate": 3.2442109359226905e-06, "loss": 0.7246, "step": 10918 }, { "epoch": 0.74, "learning_rate": 3.242583715136346e-06, "loss": 0.8398, "step": 10919 }, { "epoch": 0.74, "learning_rate": 3.2409568235709965e-06, "loss": 0.7568, "step": 10920 }, { "epoch": 0.74, "learning_rate": 3.2393302613058984e-06, "loss": 0.7188, "step": 10921 }, { "epoch": 0.74, "learning_rate": 3.2377040284203e-06, "loss": 0.7197, "step": 10922 }, { "epoch": 0.74, "learning_rate": 3.2360781249934312e-06, "loss": 0.7568, "step": 10923 }, { "epoch": 0.74, "learning_rate": 3.234452551104508e-06, "loss": 0.6846, "step": 10924 }, { "epoch": 0.74, "learning_rate": 3.2328273068327244e-06, "loss": 0.7979, "step": 10925 }, { "epoch": 0.74, "learning_rate": 3.2312023922572688e-06, "loss": 0.79, "step": 10926 }, { "epoch": 0.74, "learning_rate": 3.229577807457299e-06, "loss": 0.7578, "step": 10927 }, { "epoch": 0.74, "learning_rate": 3.227953552511968e-06, "loss": 0.7832, "step": 10928 }, { "epoch": 0.74, "learning_rate": 3.2263296275004096e-06, "loss": 0.7842, "step": 10929 }, { "epoch": 0.74, "learning_rate": 3.224706032501742e-06, "loss": 0.6826, "step": 10930 }, { "epoch": 0.74, "learning_rate": 3.223082767595066e-06, "loss": 0.7207, "step": 10931 }, { "epoch": 0.74, "learning_rate": 3.221459832859467e-06, "loss": 0.7207, "step": 10932 }, { "epoch": 0.75, "learning_rate": 3.2198372283740176e-06, "loss": 0.7471, "step": 10933 }, { "epoch": 0.75, "learning_rate": 3.2182149542177643e-06, "loss": 0.7051, "step": 10934 }, { "epoch": 0.75, "learning_rate": 3.216593010469745e-06, "loss": 0.7256, "step": 10935 }, { "epoch": 0.75, "learning_rate": 3.214971397208989e-06, "loss": 0.7734, "step": 10936 }, { "epoch": 0.75, "learning_rate": 3.213350114514493e-06, "loss": 0.7148, "step": 10937 }, { "epoch": 0.75, "learning_rate": 3.211729162465249e-06, "loss": 0.8584, "step": 10938 }, { "epoch": 0.75, "learning_rate": 3.210108541140231e-06, "loss": 0.8389, "step": 10939 }, { "epoch": 0.75, "learning_rate": 3.208488250618391e-06, "loss": 0.7852, "step": 10940 }, { "epoch": 0.75, "learning_rate": 3.2068682909786696e-06, "loss": 0.791, "step": 10941 }, { "epoch": 0.75, "learning_rate": 3.2052486623e-06, "loss": 0.79, "step": 10942 }, { "epoch": 0.75, "learning_rate": 3.2036293646612815e-06, "loss": 0.7217, "step": 10943 }, { "epoch": 0.75, "learning_rate": 3.2020103981414086e-06, "loss": 0.7803, "step": 10944 }, { "epoch": 0.75, "learning_rate": 3.2003917628192573e-06, "loss": 0.7549, "step": 10945 }, { "epoch": 0.75, "learning_rate": 3.1987734587736907e-06, "loss": 0.752, "step": 10946 }, { "epoch": 0.75, "learning_rate": 3.197155486083543e-06, "loss": 0.8193, "step": 10947 }, { "epoch": 0.75, "learning_rate": 3.1955378448276518e-06, "loss": 0.6748, "step": 10948 }, { "epoch": 0.75, "learning_rate": 3.193920535084829e-06, "loss": 0.8057, "step": 10949 }, { "epoch": 0.75, "learning_rate": 3.192303556933861e-06, "loss": 0.7998, "step": 10950 }, { "epoch": 0.75, "learning_rate": 3.190686910453533e-06, "loss": 0.8027, "step": 10951 }, { "epoch": 0.75, "learning_rate": 3.1890705957226066e-06, "loss": 0.709, "step": 10952 }, { "epoch": 0.75, "learning_rate": 3.187454612819828e-06, "loss": 0.7988, "step": 10953 }, { "epoch": 0.75, "learning_rate": 3.1858389618239295e-06, "loss": 0.7617, "step": 10954 }, { "epoch": 0.75, "learning_rate": 3.184223642813623e-06, "loss": 0.8594, "step": 10955 }, { "epoch": 0.75, "learning_rate": 3.1826086558676116e-06, "loss": 0.7568, "step": 10956 }, { "epoch": 0.75, "learning_rate": 3.180994001064572e-06, "loss": 0.7539, "step": 10957 }, { "epoch": 0.75, "learning_rate": 3.179379678483171e-06, "loss": 0.7295, "step": 10958 }, { "epoch": 0.75, "learning_rate": 3.17776568820206e-06, "loss": 0.7891, "step": 10959 }, { "epoch": 0.75, "learning_rate": 3.1761520302998726e-06, "loss": 0.6943, "step": 10960 }, { "epoch": 0.75, "learning_rate": 3.1745387048552247e-06, "loss": 0.708, "step": 10961 }, { "epoch": 0.75, "learning_rate": 3.1729257119467214e-06, "loss": 0.7969, "step": 10962 }, { "epoch": 0.75, "learning_rate": 3.1713130516529413e-06, "loss": 0.7266, "step": 10963 }, { "epoch": 0.75, "learning_rate": 3.1697007240524567e-06, "loss": 0.7188, "step": 10964 }, { "epoch": 0.75, "learning_rate": 3.1680887292238194e-06, "loss": 0.7598, "step": 10965 }, { "epoch": 0.75, "learning_rate": 3.166477067245566e-06, "loss": 0.8086, "step": 10966 }, { "epoch": 0.75, "learning_rate": 3.164865738196217e-06, "loss": 0.7725, "step": 10967 }, { "epoch": 0.75, "learning_rate": 3.1632547421542746e-06, "loss": 0.7422, "step": 10968 }, { "epoch": 0.75, "learning_rate": 3.1616440791982327e-06, "loss": 0.7168, "step": 10969 }, { "epoch": 0.75, "learning_rate": 3.16003374940655e-06, "loss": 0.7578, "step": 10970 }, { "epoch": 0.75, "learning_rate": 3.1584237528576944e-06, "loss": 0.6943, "step": 10971 }, { "epoch": 0.75, "learning_rate": 3.156814089630101e-06, "loss": 0.7324, "step": 10972 }, { "epoch": 0.75, "learning_rate": 3.1552047598021896e-06, "loss": 0.7744, "step": 10973 }, { "epoch": 0.75, "learning_rate": 3.1535957634523683e-06, "loss": 0.7236, "step": 10974 }, { "epoch": 0.75, "learning_rate": 3.151987100659031e-06, "loss": 0.8125, "step": 10975 }, { "epoch": 0.75, "learning_rate": 3.150378771500542e-06, "loss": 0.7734, "step": 10976 }, { "epoch": 0.75, "learning_rate": 3.1487707760552677e-06, "loss": 0.6592, "step": 10977 }, { "epoch": 0.75, "learning_rate": 3.1471631144015503e-06, "loss": 0.8008, "step": 10978 }, { "epoch": 0.75, "learning_rate": 3.145555786617709e-06, "loss": 0.7871, "step": 10979 }, { "epoch": 0.75, "learning_rate": 3.1439487927820546e-06, "loss": 0.7461, "step": 10980 }, { "epoch": 0.75, "learning_rate": 3.142342132972882e-06, "loss": 0.709, "step": 10981 }, { "epoch": 0.75, "learning_rate": 3.140735807268465e-06, "loss": 0.7617, "step": 10982 }, { "epoch": 0.75, "learning_rate": 3.1391298157470653e-06, "loss": 0.7295, "step": 10983 }, { "epoch": 0.75, "learning_rate": 3.1375241584869264e-06, "loss": 0.75, "step": 10984 }, { "epoch": 0.75, "learning_rate": 3.1359188355662794e-06, "loss": 0.7451, "step": 10985 }, { "epoch": 0.75, "learning_rate": 3.1343138470633294e-06, "loss": 0.7246, "step": 10986 }, { "epoch": 0.75, "learning_rate": 3.1327091930562725e-06, "loss": 0.6973, "step": 10987 }, { "epoch": 0.75, "learning_rate": 3.13110487362329e-06, "loss": 0.7305, "step": 10988 }, { "epoch": 0.75, "learning_rate": 3.1295008888425425e-06, "loss": 0.8301, "step": 10989 }, { "epoch": 0.75, "learning_rate": 3.127897238792177e-06, "loss": 0.7334, "step": 10990 }, { "epoch": 0.75, "learning_rate": 3.1262939235503255e-06, "loss": 0.7891, "step": 10991 }, { "epoch": 0.75, "learning_rate": 3.1246909431950956e-06, "loss": 0.7891, "step": 10992 }, { "epoch": 0.75, "learning_rate": 3.1230882978045886e-06, "loss": 0.6934, "step": 10993 }, { "epoch": 0.75, "learning_rate": 3.121485987456884e-06, "loss": 0.7539, "step": 10994 }, { "epoch": 0.75, "learning_rate": 3.1198840122300465e-06, "loss": 0.7627, "step": 10995 }, { "epoch": 0.75, "learning_rate": 3.118282372202124e-06, "loss": 0.6982, "step": 10996 }, { "epoch": 0.75, "learning_rate": 3.1166810674511494e-06, "loss": 0.7754, "step": 10997 }, { "epoch": 0.75, "learning_rate": 3.1150800980551398e-06, "loss": 0.7197, "step": 10998 }, { "epoch": 0.75, "learning_rate": 3.1134794640920894e-06, "loss": 0.7617, "step": 10999 }, { "epoch": 0.75, "learning_rate": 3.1118791656399816e-06, "loss": 0.71, "step": 11000 }, { "epoch": 0.75, "learning_rate": 3.1102792027767905e-06, "loss": 0.8164, "step": 11001 }, { "epoch": 0.75, "learning_rate": 3.1086795755804565e-06, "loss": 0.7822, "step": 11002 }, { "epoch": 0.75, "learning_rate": 3.1070802841289183e-06, "loss": 0.7119, "step": 11003 }, { "epoch": 0.75, "learning_rate": 3.1054813285000927e-06, "loss": 0.6973, "step": 11004 }, { "epoch": 0.75, "learning_rate": 3.1038827087718838e-06, "loss": 0.7871, "step": 11005 }, { "epoch": 0.75, "learning_rate": 3.102284425022166e-06, "loss": 0.7412, "step": 11006 }, { "epoch": 0.75, "learning_rate": 3.100686477328818e-06, "loss": 0.7715, "step": 11007 }, { "epoch": 0.75, "learning_rate": 3.0990888657696915e-06, "loss": 0.7432, "step": 11008 }, { "epoch": 0.75, "learning_rate": 3.0974915904226167e-06, "loss": 0.7559, "step": 11009 }, { "epoch": 0.75, "learning_rate": 3.0958946513654143e-06, "loss": 0.7236, "step": 11010 }, { "epoch": 0.75, "learning_rate": 3.094298048675891e-06, "loss": 0.7246, "step": 11011 }, { "epoch": 0.75, "learning_rate": 3.092701782431823e-06, "loss": 0.7744, "step": 11012 }, { "epoch": 0.75, "learning_rate": 3.091105852710992e-06, "loss": 0.7441, "step": 11013 }, { "epoch": 0.75, "learning_rate": 3.0895102595911484e-06, "loss": 0.7119, "step": 11014 }, { "epoch": 0.75, "learning_rate": 3.087915003150026e-06, "loss": 0.7324, "step": 11015 }, { "epoch": 0.75, "learning_rate": 3.0863200834653473e-06, "loss": 0.7461, "step": 11016 }, { "epoch": 0.75, "learning_rate": 3.084725500614817e-06, "loss": 0.8594, "step": 11017 }, { "epoch": 0.75, "learning_rate": 3.0831312546761227e-06, "loss": 0.7793, "step": 11018 }, { "epoch": 0.75, "learning_rate": 3.081537345726936e-06, "loss": 0.7842, "step": 11019 }, { "epoch": 0.75, "learning_rate": 3.0799437738449135e-06, "loss": 0.6582, "step": 11020 }, { "epoch": 0.75, "learning_rate": 3.078350539107695e-06, "loss": 0.8174, "step": 11021 }, { "epoch": 0.75, "learning_rate": 3.076757641592898e-06, "loss": 0.7324, "step": 11022 }, { "epoch": 0.75, "learning_rate": 3.075165081378131e-06, "loss": 0.8281, "step": 11023 }, { "epoch": 0.75, "learning_rate": 3.073572858540984e-06, "loss": 0.7041, "step": 11024 }, { "epoch": 0.75, "learning_rate": 3.071980973159029e-06, "loss": 0.75, "step": 11025 }, { "epoch": 0.75, "learning_rate": 3.0703894253098234e-06, "loss": 0.7988, "step": 11026 }, { "epoch": 0.75, "learning_rate": 3.0687982150709108e-06, "loss": 0.7656, "step": 11027 }, { "epoch": 0.75, "learning_rate": 3.067207342519807e-06, "loss": 0.7305, "step": 11028 }, { "epoch": 0.75, "learning_rate": 3.0656168077340244e-06, "loss": 0.8359, "step": 11029 }, { "epoch": 0.75, "learning_rate": 3.064026610791051e-06, "loss": 0.7725, "step": 11030 }, { "epoch": 0.75, "learning_rate": 3.062436751768364e-06, "loss": 0.8076, "step": 11031 }, { "epoch": 0.75, "learning_rate": 3.06084723074342e-06, "loss": 0.7119, "step": 11032 }, { "epoch": 0.75, "learning_rate": 3.0592580477936606e-06, "loss": 0.7861, "step": 11033 }, { "epoch": 0.75, "learning_rate": 3.057669202996515e-06, "loss": 0.751, "step": 11034 }, { "epoch": 0.75, "learning_rate": 3.0560806964293823e-06, "loss": 0.752, "step": 11035 }, { "epoch": 0.75, "learning_rate": 3.054492528169657e-06, "loss": 0.8359, "step": 11036 }, { "epoch": 0.75, "learning_rate": 3.052904698294723e-06, "loss": 0.7354, "step": 11037 }, { "epoch": 0.75, "learning_rate": 3.051317206881931e-06, "loss": 0.8008, "step": 11038 }, { "epoch": 0.75, "learning_rate": 3.049730054008625e-06, "loss": 0.8203, "step": 11039 }, { "epoch": 0.75, "learning_rate": 3.0481432397521317e-06, "loss": 0.835, "step": 11040 }, { "epoch": 0.75, "learning_rate": 3.0465567641897642e-06, "loss": 0.748, "step": 11041 }, { "epoch": 0.75, "learning_rate": 3.0449706273988068e-06, "loss": 0.7793, "step": 11042 }, { "epoch": 0.75, "learning_rate": 3.043384829456546e-06, "loss": 0.7461, "step": 11043 }, { "epoch": 0.75, "learning_rate": 3.041799370440235e-06, "loss": 0.7217, "step": 11044 }, { "epoch": 0.75, "learning_rate": 3.040214250427118e-06, "loss": 0.7422, "step": 11045 }, { "epoch": 0.75, "learning_rate": 3.0386294694944242e-06, "loss": 0.7383, "step": 11046 }, { "epoch": 0.75, "learning_rate": 3.0370450277193663e-06, "loss": 0.748, "step": 11047 }, { "epoch": 0.75, "learning_rate": 3.035460925179129e-06, "loss": 0.7412, "step": 11048 }, { "epoch": 0.75, "learning_rate": 3.033877161950899e-06, "loss": 0.6816, "step": 11049 }, { "epoch": 0.75, "learning_rate": 3.032293738111837e-06, "loss": 0.7295, "step": 11050 }, { "epoch": 0.75, "learning_rate": 3.0307106537390808e-06, "loss": 0.7461, "step": 11051 }, { "epoch": 0.75, "learning_rate": 3.029127908909761e-06, "loss": 0.75, "step": 11052 }, { "epoch": 0.75, "learning_rate": 3.0275455037009903e-06, "loss": 0.7578, "step": 11053 }, { "epoch": 0.75, "learning_rate": 3.025963438189863e-06, "loss": 0.7793, "step": 11054 }, { "epoch": 0.75, "learning_rate": 3.024381712453457e-06, "loss": 0.752, "step": 11055 }, { "epoch": 0.75, "learning_rate": 3.0228003265688332e-06, "loss": 0.7266, "step": 11056 }, { "epoch": 0.75, "learning_rate": 3.02121928061304e-06, "loss": 0.8008, "step": 11057 }, { "epoch": 0.75, "learning_rate": 3.019638574663101e-06, "loss": 0.7256, "step": 11058 }, { "epoch": 0.75, "learning_rate": 3.0180582087960297e-06, "loss": 0.7324, "step": 11059 }, { "epoch": 0.75, "learning_rate": 3.0164781830888224e-06, "loss": 0.7949, "step": 11060 }, { "epoch": 0.75, "learning_rate": 3.014898497618457e-06, "loss": 0.7246, "step": 11061 }, { "epoch": 0.75, "learning_rate": 3.0133191524618956e-06, "loss": 0.8066, "step": 11062 }, { "epoch": 0.75, "learning_rate": 3.0117401476960882e-06, "loss": 0.7158, "step": 11063 }, { "epoch": 0.75, "learning_rate": 3.0101614833979565e-06, "loss": 0.7012, "step": 11064 }, { "epoch": 0.75, "learning_rate": 3.008583159644417e-06, "loss": 0.7637, "step": 11065 }, { "epoch": 0.75, "learning_rate": 3.0070051765123655e-06, "loss": 0.749, "step": 11066 }, { "epoch": 0.75, "learning_rate": 3.00542753407868e-06, "loss": 0.79, "step": 11067 }, { "epoch": 0.75, "learning_rate": 3.0038502324202233e-06, "loss": 0.7324, "step": 11068 }, { "epoch": 0.75, "learning_rate": 3.0022732716138437e-06, "loss": 0.8232, "step": 11069 }, { "epoch": 0.75, "learning_rate": 3.0006966517363712e-06, "loss": 0.707, "step": 11070 }, { "epoch": 0.75, "learning_rate": 2.9991203728646135e-06, "loss": 0.7676, "step": 11071 }, { "epoch": 0.75, "learning_rate": 2.9975444350753656e-06, "loss": 0.7881, "step": 11072 }, { "epoch": 0.75, "learning_rate": 2.9959688384454187e-06, "loss": 0.7217, "step": 11073 }, { "epoch": 0.75, "learning_rate": 2.9943935830515256e-06, "loss": 0.7461, "step": 11074 }, { "epoch": 0.75, "learning_rate": 2.9928186689704354e-06, "loss": 0.7998, "step": 11075 }, { "epoch": 0.75, "learning_rate": 2.9912440962788802e-06, "loss": 0.7754, "step": 11076 }, { "epoch": 0.75, "learning_rate": 2.9896698650535683e-06, "loss": 0.6309, "step": 11077 }, { "epoch": 0.75, "learning_rate": 2.988095975371196e-06, "loss": 0.7139, "step": 11078 }, { "epoch": 0.76, "learning_rate": 2.9865224273084515e-06, "loss": 0.7041, "step": 11079 }, { "epoch": 0.76, "learning_rate": 2.9849492209419894e-06, "loss": 0.7617, "step": 11080 }, { "epoch": 0.76, "learning_rate": 2.9833763563484595e-06, "loss": 0.7549, "step": 11081 }, { "epoch": 0.76, "learning_rate": 2.981803833604491e-06, "loss": 0.752, "step": 11082 }, { "epoch": 0.76, "learning_rate": 2.9802316527867004e-06, "loss": 0.6934, "step": 11083 }, { "epoch": 0.76, "learning_rate": 2.978659813971675e-06, "loss": 0.751, "step": 11084 }, { "epoch": 0.76, "learning_rate": 2.9770883172360043e-06, "loss": 0.7412, "step": 11085 }, { "epoch": 0.76, "learning_rate": 2.975517162656252e-06, "loss": 0.749, "step": 11086 }, { "epoch": 0.76, "learning_rate": 2.973946350308957e-06, "loss": 0.6904, "step": 11087 }, { "epoch": 0.76, "learning_rate": 2.9723758802706536e-06, "loss": 0.7402, "step": 11088 }, { "epoch": 0.76, "learning_rate": 2.9708057526178547e-06, "loss": 0.7969, "step": 11089 }, { "epoch": 0.76, "learning_rate": 2.9692359674270567e-06, "loss": 0.7432, "step": 11090 }, { "epoch": 0.76, "learning_rate": 2.967666524774739e-06, "loss": 0.7725, "step": 11091 }, { "epoch": 0.76, "learning_rate": 2.9660974247373666e-06, "loss": 0.7461, "step": 11092 }, { "epoch": 0.76, "learning_rate": 2.9645286673913865e-06, "loss": 0.8301, "step": 11093 }, { "epoch": 0.76, "learning_rate": 2.962960252813224e-06, "loss": 0.7725, "step": 11094 }, { "epoch": 0.76, "learning_rate": 2.9613921810792912e-06, "loss": 0.8193, "step": 11095 }, { "epoch": 0.76, "learning_rate": 2.959824452265995e-06, "loss": 0.7695, "step": 11096 }, { "epoch": 0.76, "learning_rate": 2.9582570664497046e-06, "loss": 0.7021, "step": 11097 }, { "epoch": 0.76, "learning_rate": 2.9566900237067862e-06, "loss": 0.7568, "step": 11098 }, { "epoch": 0.76, "learning_rate": 2.9551233241135903e-06, "loss": 0.7461, "step": 11099 }, { "epoch": 0.76, "learning_rate": 2.953556967746439e-06, "loss": 0.6777, "step": 11100 }, { "epoch": 0.76, "learning_rate": 2.951990954681645e-06, "loss": 0.7812, "step": 11101 }, { "epoch": 0.76, "learning_rate": 2.9504252849955153e-06, "loss": 0.8027, "step": 11102 }, { "epoch": 0.76, "learning_rate": 2.9488599587643185e-06, "loss": 0.6758, "step": 11103 }, { "epoch": 0.76, "learning_rate": 2.94729497606432e-06, "loss": 0.6592, "step": 11104 }, { "epoch": 0.76, "learning_rate": 2.945730336971767e-06, "loss": 0.7451, "step": 11105 }, { "epoch": 0.76, "learning_rate": 2.9441660415628903e-06, "loss": 0.8105, "step": 11106 }, { "epoch": 0.76, "learning_rate": 2.942602089913894e-06, "loss": 0.7871, "step": 11107 }, { "epoch": 0.76, "learning_rate": 2.9410384821009828e-06, "loss": 0.7715, "step": 11108 }, { "epoch": 0.76, "learning_rate": 2.939475218200336e-06, "loss": 0.7607, "step": 11109 }, { "epoch": 0.76, "learning_rate": 2.937912298288109e-06, "loss": 0.7412, "step": 11110 }, { "epoch": 0.76, "learning_rate": 2.9363497224404515e-06, "loss": 0.6924, "step": 11111 }, { "epoch": 0.76, "learning_rate": 2.934787490733493e-06, "loss": 0.7588, "step": 11112 }, { "epoch": 0.76, "learning_rate": 2.933225603243337e-06, "loss": 0.7754, "step": 11113 }, { "epoch": 0.76, "learning_rate": 2.9316640600460886e-06, "loss": 0.7354, "step": 11114 }, { "epoch": 0.76, "learning_rate": 2.930102861217825e-06, "loss": 0.7979, "step": 11115 }, { "epoch": 0.76, "learning_rate": 2.928542006834603e-06, "loss": 0.7275, "step": 11116 }, { "epoch": 0.76, "learning_rate": 2.9269814969724687e-06, "loss": 0.7568, "step": 11117 }, { "epoch": 0.76, "learning_rate": 2.9254213317074508e-06, "loss": 0.7422, "step": 11118 }, { "epoch": 0.76, "learning_rate": 2.9238615111155623e-06, "loss": 0.834, "step": 11119 }, { "epoch": 0.76, "learning_rate": 2.9223020352727936e-06, "loss": 0.7754, "step": 11120 }, { "epoch": 0.76, "learning_rate": 2.920742904255126e-06, "loss": 0.7988, "step": 11121 }, { "epoch": 0.76, "learning_rate": 2.9191841181385218e-06, "loss": 0.7334, "step": 11122 }, { "epoch": 0.76, "learning_rate": 2.9176256769989184e-06, "loss": 0.7598, "step": 11123 }, { "epoch": 0.76, "learning_rate": 2.9160675809122473e-06, "loss": 0.6953, "step": 11124 }, { "epoch": 0.76, "learning_rate": 2.9145098299544183e-06, "loss": 0.7979, "step": 11125 }, { "epoch": 0.76, "learning_rate": 2.912952424201325e-06, "loss": 0.7197, "step": 11126 }, { "epoch": 0.76, "learning_rate": 2.9113953637288426e-06, "loss": 0.79, "step": 11127 }, { "epoch": 0.76, "learning_rate": 2.909838648612834e-06, "loss": 0.6943, "step": 11128 }, { "epoch": 0.76, "learning_rate": 2.908282278929143e-06, "loss": 0.7627, "step": 11129 }, { "epoch": 0.76, "learning_rate": 2.90672625475359e-06, "loss": 0.7754, "step": 11130 }, { "epoch": 0.76, "learning_rate": 2.9051705761619884e-06, "loss": 0.7275, "step": 11131 }, { "epoch": 0.76, "learning_rate": 2.903615243230131e-06, "loss": 0.8037, "step": 11132 }, { "epoch": 0.76, "learning_rate": 2.902060256033792e-06, "loss": 0.7393, "step": 11133 }, { "epoch": 0.76, "learning_rate": 2.900505614648732e-06, "loss": 0.8184, "step": 11134 }, { "epoch": 0.76, "learning_rate": 2.8989513191506946e-06, "loss": 0.8135, "step": 11135 }, { "epoch": 0.76, "learning_rate": 2.8973973696154e-06, "loss": 0.7285, "step": 11136 }, { "epoch": 0.76, "learning_rate": 2.895843766118556e-06, "loss": 0.7227, "step": 11137 }, { "epoch": 0.76, "learning_rate": 2.894290508735863e-06, "loss": 0.7617, "step": 11138 }, { "epoch": 0.76, "learning_rate": 2.8927375975429873e-06, "loss": 0.75, "step": 11139 }, { "epoch": 0.76, "learning_rate": 2.8911850326155887e-06, "loss": 0.751, "step": 11140 }, { "epoch": 0.76, "learning_rate": 2.8896328140293095e-06, "loss": 0.7617, "step": 11141 }, { "epoch": 0.76, "learning_rate": 2.8880809418597754e-06, "loss": 0.7998, "step": 11142 }, { "epoch": 0.76, "learning_rate": 2.886529416182584e-06, "loss": 0.8047, "step": 11143 }, { "epoch": 0.76, "learning_rate": 2.884978237073337e-06, "loss": 0.7852, "step": 11144 }, { "epoch": 0.76, "learning_rate": 2.883427404607606e-06, "loss": 0.8242, "step": 11145 }, { "epoch": 0.76, "learning_rate": 2.8818769188609406e-06, "loss": 0.7227, "step": 11146 }, { "epoch": 0.76, "learning_rate": 2.8803267799088863e-06, "loss": 0.8135, "step": 11147 }, { "epoch": 0.76, "learning_rate": 2.8787769878269667e-06, "loss": 0.7354, "step": 11148 }, { "epoch": 0.76, "learning_rate": 2.877227542690678e-06, "loss": 0.7471, "step": 11149 }, { "epoch": 0.76, "learning_rate": 2.8756784445755203e-06, "loss": 0.7285, "step": 11150 }, { "epoch": 0.76, "learning_rate": 2.874129693556964e-06, "loss": 0.6855, "step": 11151 }, { "epoch": 0.76, "learning_rate": 2.872581289710458e-06, "loss": 0.8174, "step": 11152 }, { "epoch": 0.76, "learning_rate": 2.8710332331114444e-06, "loss": 0.8584, "step": 11153 }, { "epoch": 0.76, "learning_rate": 2.869485523835344e-06, "loss": 0.8008, "step": 11154 }, { "epoch": 0.76, "learning_rate": 2.867938161957561e-06, "loss": 0.7119, "step": 11155 }, { "epoch": 0.76, "learning_rate": 2.866391147553482e-06, "loss": 0.8076, "step": 11156 }, { "epoch": 0.76, "learning_rate": 2.86484448069848e-06, "loss": 0.7803, "step": 11157 }, { "epoch": 0.76, "learning_rate": 2.863298161467909e-06, "loss": 0.7646, "step": 11158 }, { "epoch": 0.76, "learning_rate": 2.8617521899371013e-06, "loss": 0.791, "step": 11159 }, { "epoch": 0.76, "learning_rate": 2.860206566181378e-06, "loss": 0.751, "step": 11160 }, { "epoch": 0.76, "learning_rate": 2.8586612902760436e-06, "loss": 0.7197, "step": 11161 }, { "epoch": 0.76, "learning_rate": 2.8571163622963815e-06, "loss": 0.6265, "step": 11162 }, { "epoch": 0.76, "learning_rate": 2.8555717823176633e-06, "loss": 0.7295, "step": 11163 }, { "epoch": 0.76, "learning_rate": 2.8540275504151418e-06, "loss": 0.7549, "step": 11164 }, { "epoch": 0.76, "learning_rate": 2.8524836666640463e-06, "loss": 0.7539, "step": 11165 }, { "epoch": 0.76, "learning_rate": 2.850940131139598e-06, "loss": 0.6973, "step": 11166 }, { "epoch": 0.76, "learning_rate": 2.849396943916999e-06, "loss": 0.7842, "step": 11167 }, { "epoch": 0.76, "learning_rate": 2.8478541050714304e-06, "loss": 0.7441, "step": 11168 }, { "epoch": 0.76, "learning_rate": 2.8463116146780623e-06, "loss": 0.7256, "step": 11169 }, { "epoch": 0.76, "learning_rate": 2.8447694728120434e-06, "loss": 0.7324, "step": 11170 }, { "epoch": 0.76, "learning_rate": 2.843227679548509e-06, "loss": 0.8486, "step": 11171 }, { "epoch": 0.76, "learning_rate": 2.841686234962571e-06, "loss": 0.7471, "step": 11172 }, { "epoch": 0.76, "learning_rate": 2.8401451391293268e-06, "loss": 0.7354, "step": 11173 }, { "epoch": 0.76, "learning_rate": 2.8386043921238693e-06, "loss": 0.7578, "step": 11174 }, { "epoch": 0.76, "learning_rate": 2.837063994021252e-06, "loss": 0.832, "step": 11175 }, { "epoch": 0.76, "learning_rate": 2.8355239448965287e-06, "loss": 0.7314, "step": 11176 }, { "epoch": 0.76, "learning_rate": 2.833984244824729e-06, "loss": 0.7461, "step": 11177 }, { "epoch": 0.76, "learning_rate": 2.8324448938808714e-06, "loss": 0.7197, "step": 11178 }, { "epoch": 0.76, "learning_rate": 2.8309058921399413e-06, "loss": 0.8154, "step": 11179 }, { "epoch": 0.76, "learning_rate": 2.829367239676931e-06, "loss": 0.7412, "step": 11180 }, { "epoch": 0.76, "learning_rate": 2.827828936566802e-06, "loss": 0.7041, "step": 11181 }, { "epoch": 0.76, "learning_rate": 2.826290982884493e-06, "loss": 0.7451, "step": 11182 }, { "epoch": 0.76, "learning_rate": 2.8247533787049386e-06, "loss": 0.7334, "step": 11183 }, { "epoch": 0.76, "learning_rate": 2.823216124103053e-06, "loss": 0.8047, "step": 11184 }, { "epoch": 0.76, "learning_rate": 2.8216792191537214e-06, "loss": 0.7656, "step": 11185 }, { "epoch": 0.76, "learning_rate": 2.820142663931831e-06, "loss": 0.7549, "step": 11186 }, { "epoch": 0.76, "learning_rate": 2.818606458512243e-06, "loss": 0.7314, "step": 11187 }, { "epoch": 0.76, "learning_rate": 2.817070602969796e-06, "loss": 0.7266, "step": 11188 }, { "epoch": 0.76, "learning_rate": 2.8155350973793184e-06, "loss": 0.7012, "step": 11189 }, { "epoch": 0.76, "learning_rate": 2.8139999418156192e-06, "loss": 0.7402, "step": 11190 }, { "epoch": 0.76, "learning_rate": 2.812465136353494e-06, "loss": 0.7588, "step": 11191 }, { "epoch": 0.76, "learning_rate": 2.8109306810677163e-06, "loss": 0.7637, "step": 11192 }, { "epoch": 0.76, "learning_rate": 2.8093965760330453e-06, "loss": 0.6904, "step": 11193 }, { "epoch": 0.76, "learning_rate": 2.8078628213242255e-06, "loss": 0.7666, "step": 11194 }, { "epoch": 0.76, "learning_rate": 2.806329417015975e-06, "loss": 0.7998, "step": 11195 }, { "epoch": 0.76, "learning_rate": 2.8047963631830043e-06, "loss": 0.7109, "step": 11196 }, { "epoch": 0.76, "learning_rate": 2.803263659900004e-06, "loss": 0.7422, "step": 11197 }, { "epoch": 0.76, "learning_rate": 2.8017313072416487e-06, "loss": 0.7344, "step": 11198 }, { "epoch": 0.76, "learning_rate": 2.8001993052825916e-06, "loss": 0.7754, "step": 11199 }, { "epoch": 0.76, "learning_rate": 2.7986676540974767e-06, "loss": 0.7559, "step": 11200 }, { "epoch": 0.76, "learning_rate": 2.797136353760919e-06, "loss": 0.7949, "step": 11201 }, { "epoch": 0.76, "learning_rate": 2.7956054043475267e-06, "loss": 0.7354, "step": 11202 }, { "epoch": 0.76, "learning_rate": 2.7940748059318888e-06, "loss": 0.7363, "step": 11203 }, { "epoch": 0.76, "learning_rate": 2.792544558588575e-06, "loss": 0.752, "step": 11204 }, { "epoch": 0.76, "learning_rate": 2.7910146623921374e-06, "loss": 0.8398, "step": 11205 }, { "epoch": 0.76, "learning_rate": 2.7894851174171144e-06, "loss": 0.7578, "step": 11206 }, { "epoch": 0.76, "learning_rate": 2.7879559237380284e-06, "loss": 0.7529, "step": 11207 }, { "epoch": 0.76, "learning_rate": 2.7864270814293716e-06, "loss": 0.7725, "step": 11208 }, { "epoch": 0.76, "learning_rate": 2.784898590565639e-06, "loss": 0.8447, "step": 11209 }, { "epoch": 0.76, "learning_rate": 2.783370451221298e-06, "loss": 0.7666, "step": 11210 }, { "epoch": 0.76, "learning_rate": 2.781842663470794e-06, "loss": 0.7617, "step": 11211 }, { "epoch": 0.76, "learning_rate": 2.780315227388564e-06, "loss": 0.7695, "step": 11212 }, { "epoch": 0.76, "learning_rate": 2.7787881430490227e-06, "loss": 0.7949, "step": 11213 }, { "epoch": 0.76, "learning_rate": 2.7772614105265716e-06, "loss": 0.71, "step": 11214 }, { "epoch": 0.76, "learning_rate": 2.775735029895592e-06, "loss": 0.7148, "step": 11215 }, { "epoch": 0.76, "learning_rate": 2.774209001230449e-06, "loss": 0.7451, "step": 11216 }, { "epoch": 0.76, "learning_rate": 2.7726833246054954e-06, "loss": 0.6631, "step": 11217 }, { "epoch": 0.76, "learning_rate": 2.7711580000950544e-06, "loss": 0.7803, "step": 11218 }, { "epoch": 0.76, "learning_rate": 2.769633027773443e-06, "loss": 0.7148, "step": 11219 }, { "epoch": 0.76, "learning_rate": 2.7681084077149567e-06, "loss": 0.751, "step": 11220 }, { "epoch": 0.76, "learning_rate": 2.7665841399938776e-06, "loss": 0.6777, "step": 11221 }, { "epoch": 0.76, "learning_rate": 2.765060224684466e-06, "loss": 0.6904, "step": 11222 }, { "epoch": 0.76, "learning_rate": 2.7635366618609707e-06, "loss": 0.7764, "step": 11223 }, { "epoch": 0.76, "learning_rate": 2.762013451597613e-06, "loss": 0.6963, "step": 11224 }, { "epoch": 0.76, "learning_rate": 2.7604905939686065e-06, "loss": 0.6924, "step": 11225 }, { "epoch": 0.77, "learning_rate": 2.758968089048146e-06, "loss": 0.7568, "step": 11226 }, { "epoch": 0.77, "learning_rate": 2.757445936910407e-06, "loss": 0.7725, "step": 11227 }, { "epoch": 0.77, "learning_rate": 2.7559241376295487e-06, "loss": 0.7998, "step": 11228 }, { "epoch": 0.77, "learning_rate": 2.7544026912797127e-06, "loss": 0.7959, "step": 11229 }, { "epoch": 0.77, "learning_rate": 2.752881597935028e-06, "loss": 0.6787, "step": 11230 }, { "epoch": 0.77, "learning_rate": 2.7513608576695938e-06, "loss": 0.8066, "step": 11231 }, { "epoch": 0.77, "learning_rate": 2.749840470557503e-06, "loss": 0.7822, "step": 11232 }, { "epoch": 0.77, "learning_rate": 2.7483204366728377e-06, "loss": 0.7383, "step": 11233 }, { "epoch": 0.77, "learning_rate": 2.7468007560896435e-06, "loss": 0.7627, "step": 11234 }, { "epoch": 0.77, "learning_rate": 2.745281428881963e-06, "loss": 0.8057, "step": 11235 }, { "epoch": 0.77, "learning_rate": 2.7437624551238207e-06, "loss": 0.7188, "step": 11236 }, { "epoch": 0.77, "learning_rate": 2.7422438348892145e-06, "loss": 0.7207, "step": 11237 }, { "epoch": 0.77, "learning_rate": 2.7407255682521315e-06, "loss": 0.7939, "step": 11238 }, { "epoch": 0.77, "learning_rate": 2.739207655286551e-06, "loss": 0.7588, "step": 11239 }, { "epoch": 0.77, "learning_rate": 2.7376900960664156e-06, "loss": 0.6953, "step": 11240 }, { "epoch": 0.77, "learning_rate": 2.736172890665666e-06, "loss": 0.8398, "step": 11241 }, { "epoch": 0.77, "learning_rate": 2.734656039158218e-06, "loss": 0.7217, "step": 11242 }, { "epoch": 0.77, "learning_rate": 2.733139541617976e-06, "loss": 0.7344, "step": 11243 }, { "epoch": 0.77, "learning_rate": 2.731623398118817e-06, "loss": 0.7627, "step": 11244 }, { "epoch": 0.77, "learning_rate": 2.730107608734612e-06, "loss": 0.7246, "step": 11245 }, { "epoch": 0.77, "learning_rate": 2.728592173539215e-06, "loss": 0.7754, "step": 11246 }, { "epoch": 0.77, "learning_rate": 2.7270770926064494e-06, "loss": 0.748, "step": 11247 }, { "epoch": 0.77, "learning_rate": 2.7255623660101316e-06, "loss": 0.7031, "step": 11248 }, { "epoch": 0.77, "learning_rate": 2.7240479938240627e-06, "loss": 0.7148, "step": 11249 }, { "epoch": 0.77, "learning_rate": 2.722533976122019e-06, "loss": 0.7568, "step": 11250 }, { "epoch": 0.77, "learning_rate": 2.7210203129777656e-06, "loss": 0.707, "step": 11251 }, { "epoch": 0.77, "learning_rate": 2.7195070044650507e-06, "loss": 0.7256, "step": 11252 }, { "epoch": 0.77, "learning_rate": 2.7179940506575964e-06, "loss": 0.7295, "step": 11253 }, { "epoch": 0.77, "learning_rate": 2.716481451629117e-06, "loss": 0.792, "step": 11254 }, { "epoch": 0.77, "learning_rate": 2.7149692074533063e-06, "loss": 0.7998, "step": 11255 }, { "epoch": 0.77, "learning_rate": 2.7134573182038405e-06, "loss": 0.7158, "step": 11256 }, { "epoch": 0.77, "learning_rate": 2.7119457839543783e-06, "loss": 0.752, "step": 11257 }, { "epoch": 0.77, "learning_rate": 2.7104346047785623e-06, "loss": 0.6914, "step": 11258 }, { "epoch": 0.77, "learning_rate": 2.70892378075002e-06, "loss": 0.7383, "step": 11259 }, { "epoch": 0.77, "learning_rate": 2.7074133119423528e-06, "loss": 0.7041, "step": 11260 }, { "epoch": 0.77, "learning_rate": 2.705903198429153e-06, "loss": 0.7139, "step": 11261 }, { "epoch": 0.77, "learning_rate": 2.7043934402839943e-06, "loss": 0.8193, "step": 11262 }, { "epoch": 0.77, "learning_rate": 2.702884037580431e-06, "loss": 0.7568, "step": 11263 }, { "epoch": 0.77, "learning_rate": 2.7013749903920007e-06, "loss": 0.8018, "step": 11264 }, { "epoch": 0.77, "learning_rate": 2.6998662987922262e-06, "loss": 0.7461, "step": 11265 }, { "epoch": 0.77, "learning_rate": 2.698357962854612e-06, "loss": 0.7666, "step": 11266 }, { "epoch": 0.77, "learning_rate": 2.6968499826526385e-06, "loss": 0.793, "step": 11267 }, { "epoch": 0.77, "learning_rate": 2.695342358259775e-06, "loss": 0.75, "step": 11268 }, { "epoch": 0.77, "learning_rate": 2.6938350897494823e-06, "loss": 0.7129, "step": 11269 }, { "epoch": 0.77, "learning_rate": 2.6923281771951836e-06, "loss": 0.7666, "step": 11270 }, { "epoch": 0.77, "learning_rate": 2.690821620670301e-06, "loss": 0.7227, "step": 11271 }, { "epoch": 0.77, "learning_rate": 2.6893154202482343e-06, "loss": 0.6816, "step": 11272 }, { "epoch": 0.77, "learning_rate": 2.6878095760023615e-06, "loss": 0.7842, "step": 11273 }, { "epoch": 0.77, "learning_rate": 2.6863040880060466e-06, "loss": 0.6572, "step": 11274 }, { "epoch": 0.77, "learning_rate": 2.684798956332645e-06, "loss": 0.6777, "step": 11275 }, { "epoch": 0.77, "learning_rate": 2.683294181055479e-06, "loss": 0.8301, "step": 11276 }, { "epoch": 0.77, "learning_rate": 2.681789762247864e-06, "loss": 0.7354, "step": 11277 }, { "epoch": 0.77, "learning_rate": 2.680285699983095e-06, "loss": 0.7617, "step": 11278 }, { "epoch": 0.77, "learning_rate": 2.678781994334453e-06, "loss": 0.7646, "step": 11279 }, { "epoch": 0.77, "learning_rate": 2.6772786453751874e-06, "loss": 0.708, "step": 11280 }, { "epoch": 0.77, "learning_rate": 2.675775653178554e-06, "loss": 0.7217, "step": 11281 }, { "epoch": 0.77, "learning_rate": 2.6742730178177754e-06, "loss": 0.8086, "step": 11282 }, { "epoch": 0.77, "learning_rate": 2.672770739366056e-06, "loss": 0.7988, "step": 11283 }, { "epoch": 0.77, "learning_rate": 2.6712688178965886e-06, "loss": 0.749, "step": 11284 }, { "epoch": 0.77, "learning_rate": 2.6697672534825504e-06, "loss": 0.7705, "step": 11285 }, { "epoch": 0.77, "learning_rate": 2.668266046197088e-06, "loss": 0.7666, "step": 11286 }, { "epoch": 0.77, "learning_rate": 2.666765196113349e-06, "loss": 0.792, "step": 11287 }, { "epoch": 0.77, "learning_rate": 2.6652647033044542e-06, "loss": 0.749, "step": 11288 }, { "epoch": 0.77, "learning_rate": 2.663764567843503e-06, "loss": 0.7207, "step": 11289 }, { "epoch": 0.77, "learning_rate": 2.662264789803585e-06, "loss": 0.7803, "step": 11290 }, { "epoch": 0.77, "learning_rate": 2.6607653692577683e-06, "loss": 0.7637, "step": 11291 }, { "epoch": 0.77, "learning_rate": 2.6592663062791046e-06, "loss": 0.7607, "step": 11292 }, { "epoch": 0.77, "learning_rate": 2.6577676009406284e-06, "loss": 0.7715, "step": 11293 }, { "epoch": 0.77, "learning_rate": 2.6562692533153568e-06, "loss": 0.7627, "step": 11294 }, { "epoch": 0.77, "learning_rate": 2.654771263476292e-06, "loss": 0.8213, "step": 11295 }, { "epoch": 0.77, "learning_rate": 2.6532736314964103e-06, "loss": 0.708, "step": 11296 }, { "epoch": 0.77, "learning_rate": 2.6517763574486787e-06, "loss": 0.6836, "step": 11297 }, { "epoch": 0.77, "learning_rate": 2.650279441406044e-06, "loss": 0.7178, "step": 11298 }, { "epoch": 0.77, "learning_rate": 2.6487828834414374e-06, "loss": 0.7656, "step": 11299 }, { "epoch": 0.77, "learning_rate": 2.64728668362777e-06, "loss": 0.6865, "step": 11300 }, { "epoch": 0.77, "learning_rate": 2.6457908420379362e-06, "loss": 0.7002, "step": 11301 }, { "epoch": 0.77, "learning_rate": 2.6442953587448182e-06, "loss": 0.7773, "step": 11302 }, { "epoch": 0.77, "learning_rate": 2.6428002338212677e-06, "loss": 0.8301, "step": 11303 }, { "epoch": 0.77, "learning_rate": 2.6413054673401316e-06, "loss": 0.7256, "step": 11304 }, { "epoch": 0.77, "learning_rate": 2.6398110593742345e-06, "loss": 0.7656, "step": 11305 }, { "epoch": 0.77, "learning_rate": 2.638317009996383e-06, "loss": 0.791, "step": 11306 }, { "epoch": 0.77, "learning_rate": 2.636823319279367e-06, "loss": 0.7803, "step": 11307 }, { "epoch": 0.77, "learning_rate": 2.6353299872959635e-06, "loss": 0.707, "step": 11308 }, { "epoch": 0.77, "learning_rate": 2.6338370141189216e-06, "loss": 0.8125, "step": 11309 }, { "epoch": 0.77, "learning_rate": 2.6323443998209774e-06, "loss": 0.7119, "step": 11310 }, { "epoch": 0.77, "learning_rate": 2.630852144474861e-06, "loss": 0.7568, "step": 11311 }, { "epoch": 0.77, "learning_rate": 2.6293602481532655e-06, "loss": 0.7178, "step": 11312 }, { "epoch": 0.77, "learning_rate": 2.6278687109288793e-06, "loss": 0.6943, "step": 11313 }, { "epoch": 0.77, "learning_rate": 2.6263775328743703e-06, "loss": 0.7256, "step": 11314 }, { "epoch": 0.77, "learning_rate": 2.624886714062391e-06, "loss": 0.7979, "step": 11315 }, { "epoch": 0.77, "learning_rate": 2.6233962545655655e-06, "loss": 0.7969, "step": 11316 }, { "epoch": 0.77, "learning_rate": 2.6219061544565185e-06, "loss": 0.7695, "step": 11317 }, { "epoch": 0.77, "learning_rate": 2.620416413807846e-06, "loss": 0.792, "step": 11318 }, { "epoch": 0.77, "learning_rate": 2.6189270326921223e-06, "loss": 0.7598, "step": 11319 }, { "epoch": 0.77, "learning_rate": 2.6174380111819144e-06, "loss": 0.7891, "step": 11320 }, { "epoch": 0.77, "learning_rate": 2.61594934934977e-06, "loss": 0.7617, "step": 11321 }, { "epoch": 0.77, "learning_rate": 2.614461047268206e-06, "loss": 0.8115, "step": 11322 }, { "epoch": 0.77, "learning_rate": 2.612973105009744e-06, "loss": 0.749, "step": 11323 }, { "epoch": 0.77, "learning_rate": 2.6114855226468737e-06, "loss": 0.8115, "step": 11324 }, { "epoch": 0.77, "learning_rate": 2.6099983002520666e-06, "loss": 0.8154, "step": 11325 }, { "epoch": 0.77, "learning_rate": 2.6085114378977816e-06, "loss": 0.792, "step": 11326 }, { "epoch": 0.77, "learning_rate": 2.6070249356564583e-06, "loss": 0.8203, "step": 11327 }, { "epoch": 0.77, "learning_rate": 2.6055387936005204e-06, "loss": 0.8008, "step": 11328 }, { "epoch": 0.77, "learning_rate": 2.604053011802371e-06, "loss": 0.8213, "step": 11329 }, { "epoch": 0.77, "learning_rate": 2.6025675903343995e-06, "loss": 0.6982, "step": 11330 }, { "epoch": 0.77, "learning_rate": 2.6010825292689757e-06, "loss": 0.8301, "step": 11331 }, { "epoch": 0.77, "learning_rate": 2.5995978286784486e-06, "loss": 0.8018, "step": 11332 }, { "epoch": 0.77, "learning_rate": 2.598113488635151e-06, "loss": 0.7314, "step": 11333 }, { "epoch": 0.77, "learning_rate": 2.5966295092114093e-06, "loss": 0.8496, "step": 11334 }, { "epoch": 0.77, "learning_rate": 2.5951458904795136e-06, "loss": 0.8418, "step": 11335 }, { "epoch": 0.77, "learning_rate": 2.5936626325117487e-06, "loss": 0.832, "step": 11336 }, { "epoch": 0.77, "learning_rate": 2.5921797353803824e-06, "loss": 0.6421, "step": 11337 }, { "epoch": 0.77, "learning_rate": 2.590697199157656e-06, "loss": 0.6768, "step": 11338 }, { "epoch": 0.77, "learning_rate": 2.5892150239157965e-06, "loss": 0.7744, "step": 11339 }, { "epoch": 0.77, "learning_rate": 2.5877332097270256e-06, "loss": 0.7061, "step": 11340 }, { "epoch": 0.77, "learning_rate": 2.5862517566635292e-06, "loss": 0.7852, "step": 11341 }, { "epoch": 0.77, "learning_rate": 2.5847706647974846e-06, "loss": 0.7598, "step": 11342 }, { "epoch": 0.77, "learning_rate": 2.583289934201053e-06, "loss": 0.7949, "step": 11343 }, { "epoch": 0.77, "learning_rate": 2.581809564946376e-06, "loss": 0.7969, "step": 11344 }, { "epoch": 0.77, "learning_rate": 2.5803295571055696e-06, "loss": 0.749, "step": 11345 }, { "epoch": 0.77, "learning_rate": 2.578849910750748e-06, "loss": 0.7988, "step": 11346 }, { "epoch": 0.77, "learning_rate": 2.577370625954001e-06, "loss": 0.7695, "step": 11347 }, { "epoch": 0.77, "learning_rate": 2.5758917027873908e-06, "loss": 0.7412, "step": 11348 }, { "epoch": 0.77, "learning_rate": 2.5744131413229758e-06, "loss": 0.6406, "step": 11349 }, { "epoch": 0.77, "learning_rate": 2.57293494163279e-06, "loss": 0.7773, "step": 11350 }, { "epoch": 0.77, "learning_rate": 2.5714571037888513e-06, "loss": 0.7246, "step": 11351 }, { "epoch": 0.77, "learning_rate": 2.5699796278631607e-06, "loss": 0.7656, "step": 11352 }, { "epoch": 0.77, "learning_rate": 2.5685025139277e-06, "loss": 0.7383, "step": 11353 }, { "epoch": 0.77, "learning_rate": 2.567025762054437e-06, "loss": 0.7686, "step": 11354 }, { "epoch": 0.77, "learning_rate": 2.5655493723153146e-06, "loss": 0.7285, "step": 11355 }, { "epoch": 0.77, "learning_rate": 2.564073344782263e-06, "loss": 0.7383, "step": 11356 }, { "epoch": 0.77, "learning_rate": 2.562597679527196e-06, "loss": 0.7461, "step": 11357 }, { "epoch": 0.77, "learning_rate": 2.5611223766220074e-06, "loss": 0.7305, "step": 11358 }, { "epoch": 0.77, "learning_rate": 2.559647436138574e-06, "loss": 0.7568, "step": 11359 }, { "epoch": 0.77, "learning_rate": 2.5581728581487575e-06, "loss": 0.7139, "step": 11360 }, { "epoch": 0.77, "learning_rate": 2.5566986427243935e-06, "loss": 0.7412, "step": 11361 }, { "epoch": 0.77, "learning_rate": 2.555224789937308e-06, "loss": 0.8125, "step": 11362 }, { "epoch": 0.77, "learning_rate": 2.553751299859308e-06, "loss": 0.7344, "step": 11363 }, { "epoch": 0.77, "learning_rate": 2.5522781725621814e-06, "loss": 0.7793, "step": 11364 }, { "epoch": 0.77, "learning_rate": 2.5508054081177002e-06, "loss": 0.8174, "step": 11365 }, { "epoch": 0.77, "learning_rate": 2.549333006597615e-06, "loss": 0.8047, "step": 11366 }, { "epoch": 0.77, "learning_rate": 2.5478609680736653e-06, "loss": 0.6826, "step": 11367 }, { "epoch": 0.77, "learning_rate": 2.5463892926175637e-06, "loss": 0.7227, "step": 11368 }, { "epoch": 0.77, "learning_rate": 2.5449179803010092e-06, "loss": 0.748, "step": 11369 }, { "epoch": 0.77, "learning_rate": 2.5434470311956927e-06, "loss": 0.7705, "step": 11370 }, { "epoch": 0.77, "learning_rate": 2.541976445373271e-06, "loss": 0.7715, "step": 11371 }, { "epoch": 0.77, "learning_rate": 2.5405062229053922e-06, "loss": 0.793, "step": 11372 }, { "epoch": 0.78, "learning_rate": 2.5390363638636895e-06, "loss": 0.7852, "step": 11373 }, { "epoch": 0.78, "learning_rate": 2.5375668683197686e-06, "loss": 0.748, "step": 11374 }, { "epoch": 0.78, "learning_rate": 2.536097736345223e-06, "loss": 0.6719, "step": 11375 }, { "epoch": 0.78, "learning_rate": 2.5346289680116377e-06, "loss": 0.7402, "step": 11376 }, { "epoch": 0.78, "learning_rate": 2.533160563390562e-06, "loss": 0.7646, "step": 11377 }, { "epoch": 0.78, "learning_rate": 2.5316925225535394e-06, "loss": 0.7129, "step": 11378 }, { "epoch": 0.78, "learning_rate": 2.530224845572092e-06, "loss": 0.6992, "step": 11379 }, { "epoch": 0.78, "learning_rate": 2.5287575325177306e-06, "loss": 0.7129, "step": 11380 }, { "epoch": 0.78, "learning_rate": 2.527290583461931e-06, "loss": 0.8096, "step": 11381 }, { "epoch": 0.78, "learning_rate": 2.5258239984761723e-06, "loss": 0.6963, "step": 11382 }, { "epoch": 0.78, "learning_rate": 2.5243577776319086e-06, "loss": 0.7129, "step": 11383 }, { "epoch": 0.78, "learning_rate": 2.5228919210005644e-06, "loss": 0.7324, "step": 11384 }, { "epoch": 0.78, "learning_rate": 2.5214264286535616e-06, "loss": 0.7441, "step": 11385 }, { "epoch": 0.78, "learning_rate": 2.519961300662299e-06, "loss": 0.7012, "step": 11386 }, { "epoch": 0.78, "learning_rate": 2.5184965370981573e-06, "loss": 0.7559, "step": 11387 }, { "epoch": 0.78, "learning_rate": 2.517032138032499e-06, "loss": 0.71, "step": 11388 }, { "epoch": 0.78, "learning_rate": 2.515568103536671e-06, "loss": 0.7979, "step": 11389 }, { "epoch": 0.78, "learning_rate": 2.514104433682002e-06, "loss": 0.7109, "step": 11390 }, { "epoch": 0.78, "learning_rate": 2.5126411285397967e-06, "loss": 0.7959, "step": 11391 }, { "epoch": 0.78, "learning_rate": 2.5111781881813513e-06, "loss": 0.6372, "step": 11392 }, { "epoch": 0.78, "learning_rate": 2.5097156126779387e-06, "loss": 0.7705, "step": 11393 }, { "epoch": 0.78, "learning_rate": 2.5082534021008163e-06, "loss": 0.8066, "step": 11394 }, { "epoch": 0.78, "learning_rate": 2.506791556521223e-06, "loss": 0.7158, "step": 11395 }, { "epoch": 0.78, "learning_rate": 2.5053300760103827e-06, "loss": 0.8057, "step": 11396 }, { "epoch": 0.78, "learning_rate": 2.5038689606394916e-06, "loss": 0.7314, "step": 11397 }, { "epoch": 0.78, "learning_rate": 2.5024082104797407e-06, "loss": 0.7236, "step": 11398 }, { "epoch": 0.78, "learning_rate": 2.5009478256022957e-06, "loss": 0.7676, "step": 11399 }, { "epoch": 0.78, "learning_rate": 2.499487806078307e-06, "loss": 0.8877, "step": 11400 }, { "epoch": 0.78, "learning_rate": 2.498028151978905e-06, "loss": 0.751, "step": 11401 }, { "epoch": 0.78, "learning_rate": 2.4965688633752074e-06, "loss": 0.7695, "step": 11402 }, { "epoch": 0.78, "learning_rate": 2.495109940338312e-06, "loss": 0.748, "step": 11403 }, { "epoch": 0.78, "learning_rate": 2.4936513829392905e-06, "loss": 0.8174, "step": 11404 }, { "epoch": 0.78, "learning_rate": 2.4921931912492047e-06, "loss": 0.7744, "step": 11405 }, { "epoch": 0.78, "learning_rate": 2.4907353653391062e-06, "loss": 0.7646, "step": 11406 }, { "epoch": 0.78, "learning_rate": 2.489277905280012e-06, "loss": 0.793, "step": 11407 }, { "epoch": 0.78, "learning_rate": 2.4878208111429312e-06, "loss": 0.7617, "step": 11408 }, { "epoch": 0.78, "learning_rate": 2.4863640829988576e-06, "loss": 0.7617, "step": 11409 }, { "epoch": 0.78, "learning_rate": 2.4849077209187578e-06, "loss": 0.7393, "step": 11410 }, { "epoch": 0.78, "learning_rate": 2.4834517249735824e-06, "loss": 0.8018, "step": 11411 }, { "epoch": 0.78, "learning_rate": 2.481996095234279e-06, "loss": 0.7344, "step": 11412 }, { "epoch": 0.78, "learning_rate": 2.4805408317717573e-06, "loss": 0.792, "step": 11413 }, { "epoch": 0.78, "learning_rate": 2.4790859346569186e-06, "loss": 0.7705, "step": 11414 }, { "epoch": 0.78, "learning_rate": 2.477631403960646e-06, "loss": 0.75, "step": 11415 }, { "epoch": 0.78, "learning_rate": 2.4761772397538087e-06, "loss": 0.7275, "step": 11416 }, { "epoch": 0.78, "learning_rate": 2.474723442107242e-06, "loss": 0.7627, "step": 11417 }, { "epoch": 0.78, "learning_rate": 2.473270011091786e-06, "loss": 0.6914, "step": 11418 }, { "epoch": 0.78, "learning_rate": 2.4718169467782514e-06, "loss": 0.7695, "step": 11419 }, { "epoch": 0.78, "learning_rate": 2.4703642492374245e-06, "loss": 0.7598, "step": 11420 }, { "epoch": 0.78, "learning_rate": 2.4689119185400843e-06, "loss": 0.8086, "step": 11421 }, { "epoch": 0.78, "learning_rate": 2.4674599547569877e-06, "loss": 0.7734, "step": 11422 }, { "epoch": 0.78, "learning_rate": 2.4660083579588755e-06, "loss": 0.7754, "step": 11423 }, { "epoch": 0.78, "learning_rate": 2.464557128216468e-06, "loss": 0.7148, "step": 11424 }, { "epoch": 0.78, "learning_rate": 2.4631062656004735e-06, "loss": 0.7119, "step": 11425 }, { "epoch": 0.78, "learning_rate": 2.4616557701815703e-06, "loss": 0.7529, "step": 11426 }, { "epoch": 0.78, "learning_rate": 2.460205642030431e-06, "loss": 0.7383, "step": 11427 }, { "epoch": 0.78, "learning_rate": 2.458755881217705e-06, "loss": 0.7686, "step": 11428 }, { "epoch": 0.78, "learning_rate": 2.457306487814025e-06, "loss": 0.7168, "step": 11429 }, { "epoch": 0.78, "learning_rate": 2.4558574618900044e-06, "loss": 0.8057, "step": 11430 }, { "epoch": 0.78, "learning_rate": 2.4544088035162408e-06, "loss": 0.7842, "step": 11431 }, { "epoch": 0.78, "learning_rate": 2.4529605127633147e-06, "loss": 0.7529, "step": 11432 }, { "epoch": 0.78, "learning_rate": 2.451512589701782e-06, "loss": 0.7354, "step": 11433 }, { "epoch": 0.78, "learning_rate": 2.4500650344021882e-06, "loss": 0.7617, "step": 11434 }, { "epoch": 0.78, "learning_rate": 2.4486178469350573e-06, "loss": 0.6582, "step": 11435 }, { "epoch": 0.78, "learning_rate": 2.447171027370896e-06, "loss": 0.7773, "step": 11436 }, { "epoch": 0.78, "learning_rate": 2.445724575780195e-06, "loss": 0.7441, "step": 11437 }, { "epoch": 0.78, "learning_rate": 2.444278492233424e-06, "loss": 0.7012, "step": 11438 }, { "epoch": 0.78, "learning_rate": 2.4428327768010387e-06, "loss": 0.7383, "step": 11439 }, { "epoch": 0.78, "learning_rate": 2.44138742955347e-06, "loss": 0.7852, "step": 11440 }, { "epoch": 0.78, "learning_rate": 2.4399424505611337e-06, "loss": 0.7568, "step": 11441 }, { "epoch": 0.78, "learning_rate": 2.438497839894438e-06, "loss": 0.8203, "step": 11442 }, { "epoch": 0.78, "learning_rate": 2.4370535976237564e-06, "loss": 0.7383, "step": 11443 }, { "epoch": 0.78, "learning_rate": 2.4356097238194542e-06, "loss": 0.7178, "step": 11444 }, { "epoch": 0.78, "learning_rate": 2.434166218551881e-06, "loss": 0.7275, "step": 11445 }, { "epoch": 0.78, "learning_rate": 2.4327230818913537e-06, "loss": 0.8076, "step": 11446 }, { "epoch": 0.78, "learning_rate": 2.431280313908193e-06, "loss": 0.6777, "step": 11447 }, { "epoch": 0.78, "learning_rate": 2.429837914672689e-06, "loss": 0.8027, "step": 11448 }, { "epoch": 0.78, "learning_rate": 2.428395884255109e-06, "loss": 0.7217, "step": 11449 }, { "epoch": 0.78, "learning_rate": 2.4269542227257124e-06, "loss": 0.7383, "step": 11450 }, { "epoch": 0.78, "learning_rate": 2.4255129301547377e-06, "loss": 0.7451, "step": 11451 }, { "epoch": 0.78, "learning_rate": 2.4240720066124024e-06, "loss": 0.7598, "step": 11452 }, { "epoch": 0.78, "learning_rate": 2.422631452168911e-06, "loss": 0.7549, "step": 11453 }, { "epoch": 0.78, "learning_rate": 2.421191266894445e-06, "loss": 0.7607, "step": 11454 }, { "epoch": 0.78, "learning_rate": 2.4197514508591726e-06, "loss": 0.7129, "step": 11455 }, { "epoch": 0.78, "learning_rate": 2.418312004133239e-06, "loss": 0.7617, "step": 11456 }, { "epoch": 0.78, "learning_rate": 2.416872926786773e-06, "loss": 0.7383, "step": 11457 }, { "epoch": 0.78, "learning_rate": 2.4154342188898895e-06, "loss": 0.7344, "step": 11458 }, { "epoch": 0.78, "learning_rate": 2.4139958805126794e-06, "loss": 0.792, "step": 11459 }, { "epoch": 0.78, "learning_rate": 2.412557911725222e-06, "loss": 0.7578, "step": 11460 }, { "epoch": 0.78, "learning_rate": 2.4111203125975746e-06, "loss": 0.7383, "step": 11461 }, { "epoch": 0.78, "learning_rate": 2.409683083199773e-06, "loss": 0.7881, "step": 11462 }, { "epoch": 0.78, "learning_rate": 2.408246223601842e-06, "loss": 0.7393, "step": 11463 }, { "epoch": 0.78, "learning_rate": 2.406809733873784e-06, "loss": 0.7354, "step": 11464 }, { "epoch": 0.78, "learning_rate": 2.4053736140855864e-06, "loss": 0.7334, "step": 11465 }, { "epoch": 0.78, "learning_rate": 2.403937864307215e-06, "loss": 0.6904, "step": 11466 }, { "epoch": 0.78, "learning_rate": 2.402502484608621e-06, "loss": 0.7793, "step": 11467 }, { "epoch": 0.78, "learning_rate": 2.4010674750597383e-06, "loss": 0.7686, "step": 11468 }, { "epoch": 0.78, "learning_rate": 2.3996328357304745e-06, "loss": 0.7549, "step": 11469 }, { "epoch": 0.78, "learning_rate": 2.3981985666907247e-06, "loss": 0.7695, "step": 11470 }, { "epoch": 0.78, "learning_rate": 2.3967646680103772e-06, "loss": 0.6816, "step": 11471 }, { "epoch": 0.78, "learning_rate": 2.3953311397592805e-06, "loss": 0.8066, "step": 11472 }, { "epoch": 0.78, "learning_rate": 2.3938979820072804e-06, "loss": 0.7217, "step": 11473 }, { "epoch": 0.78, "learning_rate": 2.3924651948241996e-06, "loss": 0.75, "step": 11474 }, { "epoch": 0.78, "learning_rate": 2.391032778279846e-06, "loss": 0.752, "step": 11475 }, { "epoch": 0.78, "learning_rate": 2.3896007324439986e-06, "loss": 0.7256, "step": 11476 }, { "epoch": 0.78, "learning_rate": 2.3881690573864356e-06, "loss": 0.7744, "step": 11477 }, { "epoch": 0.78, "learning_rate": 2.3867377531769075e-06, "loss": 0.6943, "step": 11478 }, { "epoch": 0.78, "learning_rate": 2.3853068198851428e-06, "loss": 0.7471, "step": 11479 }, { "epoch": 0.78, "learning_rate": 2.383876257580857e-06, "loss": 0.7007, "step": 11480 }, { "epoch": 0.78, "learning_rate": 2.3824460663337524e-06, "loss": 0.874, "step": 11481 }, { "epoch": 0.78, "learning_rate": 2.3810162462134976e-06, "loss": 0.7441, "step": 11482 }, { "epoch": 0.78, "learning_rate": 2.3795867972897635e-06, "loss": 0.792, "step": 11483 }, { "epoch": 0.78, "learning_rate": 2.3781577196321915e-06, "loss": 0.7295, "step": 11484 }, { "epoch": 0.78, "learning_rate": 2.3767290133104005e-06, "loss": 0.8203, "step": 11485 }, { "epoch": 0.78, "learning_rate": 2.3753006783940004e-06, "loss": 0.7988, "step": 11486 }, { "epoch": 0.78, "learning_rate": 2.3738727149525798e-06, "loss": 0.8477, "step": 11487 }, { "epoch": 0.78, "learning_rate": 2.372445123055708e-06, "loss": 0.7842, "step": 11488 }, { "epoch": 0.78, "learning_rate": 2.3710179027729372e-06, "loss": 0.7139, "step": 11489 }, { "epoch": 0.78, "learning_rate": 2.369591054173803e-06, "loss": 0.7715, "step": 11490 }, { "epoch": 0.78, "learning_rate": 2.368164577327824e-06, "loss": 0.7832, "step": 11491 }, { "epoch": 0.78, "learning_rate": 2.3667384723044918e-06, "loss": 0.751, "step": 11492 }, { "epoch": 0.78, "learning_rate": 2.365312739173288e-06, "loss": 0.7783, "step": 11493 }, { "epoch": 0.78, "learning_rate": 2.3638873780036754e-06, "loss": 0.7998, "step": 11494 }, { "epoch": 0.78, "learning_rate": 2.362462388865098e-06, "loss": 0.7178, "step": 11495 }, { "epoch": 0.78, "learning_rate": 2.3610377718269793e-06, "loss": 0.7666, "step": 11496 }, { "epoch": 0.78, "learning_rate": 2.3596135269587316e-06, "loss": 0.6904, "step": 11497 }, { "epoch": 0.78, "learning_rate": 2.3581896543297377e-06, "loss": 0.6797, "step": 11498 }, { "epoch": 0.78, "learning_rate": 2.35676615400937e-06, "loss": 0.7539, "step": 11499 }, { "epoch": 0.78, "learning_rate": 2.355343026066984e-06, "loss": 0.7119, "step": 11500 }, { "epoch": 0.78, "learning_rate": 2.353920270571912e-06, "loss": 0.792, "step": 11501 }, { "epoch": 0.78, "learning_rate": 2.3524978875934724e-06, "loss": 0.7227, "step": 11502 }, { "epoch": 0.78, "learning_rate": 2.3510758772009623e-06, "loss": 0.7822, "step": 11503 }, { "epoch": 0.78, "learning_rate": 2.3496542394636644e-06, "loss": 0.7627, "step": 11504 }, { "epoch": 0.78, "learning_rate": 2.348232974450837e-06, "loss": 0.7256, "step": 11505 }, { "epoch": 0.78, "learning_rate": 2.346812082231723e-06, "loss": 0.7324, "step": 11506 }, { "epoch": 0.78, "learning_rate": 2.3453915628755565e-06, "loss": 0.8516, "step": 11507 }, { "epoch": 0.78, "learning_rate": 2.343971416451537e-06, "loss": 0.7041, "step": 11508 }, { "epoch": 0.78, "learning_rate": 2.3425516430288574e-06, "loss": 0.7764, "step": 11509 }, { "epoch": 0.78, "learning_rate": 2.341132242676688e-06, "loss": 0.7773, "step": 11510 }, { "epoch": 0.78, "learning_rate": 2.3397132154641842e-06, "loss": 0.6943, "step": 11511 }, { "epoch": 0.78, "learning_rate": 2.3382945614604744e-06, "loss": 0.7588, "step": 11512 }, { "epoch": 0.78, "learning_rate": 2.336876280734686e-06, "loss": 0.7002, "step": 11513 }, { "epoch": 0.78, "learning_rate": 2.3354583733559067e-06, "loss": 0.7471, "step": 11514 }, { "epoch": 0.78, "learning_rate": 2.3340408393932236e-06, "loss": 0.6777, "step": 11515 }, { "epoch": 0.78, "learning_rate": 2.332623678915695e-06, "loss": 0.7266, "step": 11516 }, { "epoch": 0.78, "learning_rate": 2.3312068919923714e-06, "loss": 0.8242, "step": 11517 }, { "epoch": 0.78, "learning_rate": 2.3297904786922674e-06, "loss": 0.71, "step": 11518 }, { "epoch": 0.78, "learning_rate": 2.328374439084401e-06, "loss": 0.6807, "step": 11519 }, { "epoch": 0.79, "learning_rate": 2.3269587732377606e-06, "loss": 0.7461, "step": 11520 }, { "epoch": 0.79, "learning_rate": 2.3255434812213107e-06, "loss": 0.793, "step": 11521 }, { "epoch": 0.79, "learning_rate": 2.3241285631040087e-06, "loss": 0.7217, "step": 11522 }, { "epoch": 0.79, "learning_rate": 2.322714018954789e-06, "loss": 0.751, "step": 11523 }, { "epoch": 0.79, "learning_rate": 2.3212998488425674e-06, "loss": 0.6865, "step": 11524 }, { "epoch": 0.79, "learning_rate": 2.3198860528362433e-06, "loss": 0.752, "step": 11525 }, { "epoch": 0.79, "learning_rate": 2.3184726310046966e-06, "loss": 0.7969, "step": 11526 }, { "epoch": 0.79, "learning_rate": 2.317059583416791e-06, "loss": 0.79, "step": 11527 }, { "epoch": 0.79, "learning_rate": 2.3156469101413647e-06, "loss": 0.75, "step": 11528 }, { "epoch": 0.79, "learning_rate": 2.3142346112472456e-06, "loss": 0.7314, "step": 11529 }, { "epoch": 0.79, "learning_rate": 2.3128226868032422e-06, "loss": 0.7393, "step": 11530 }, { "epoch": 0.79, "learning_rate": 2.3114111368781434e-06, "loss": 0.8066, "step": 11531 }, { "epoch": 0.79, "learning_rate": 2.3099999615407175e-06, "loss": 0.7598, "step": 11532 }, { "epoch": 0.79, "learning_rate": 2.3085891608597222e-06, "loss": 0.7637, "step": 11533 }, { "epoch": 0.79, "learning_rate": 2.3071787349038856e-06, "loss": 0.8027, "step": 11534 }, { "epoch": 0.79, "learning_rate": 2.3057686837419246e-06, "loss": 0.7773, "step": 11535 }, { "epoch": 0.79, "learning_rate": 2.3043590074425383e-06, "loss": 0.7686, "step": 11536 }, { "epoch": 0.79, "learning_rate": 2.3029497060744064e-06, "loss": 0.7363, "step": 11537 }, { "epoch": 0.79, "learning_rate": 2.3015407797061897e-06, "loss": 0.709, "step": 11538 }, { "epoch": 0.79, "learning_rate": 2.3001322284065307e-06, "loss": 0.7373, "step": 11539 }, { "epoch": 0.79, "learning_rate": 2.2987240522440557e-06, "loss": 0.7666, "step": 11540 }, { "epoch": 0.79, "learning_rate": 2.297316251287368e-06, "loss": 0.8184, "step": 11541 }, { "epoch": 0.79, "learning_rate": 2.295908825605053e-06, "loss": 0.7334, "step": 11542 }, { "epoch": 0.79, "learning_rate": 2.2945017752656905e-06, "loss": 0.7051, "step": 11543 }, { "epoch": 0.79, "learning_rate": 2.293095100337823e-06, "loss": 0.7598, "step": 11544 }, { "epoch": 0.79, "learning_rate": 2.291688800889986e-06, "loss": 0.6309, "step": 11545 }, { "epoch": 0.79, "learning_rate": 2.2902828769906983e-06, "loss": 0.7441, "step": 11546 }, { "epoch": 0.79, "learning_rate": 2.2888773287084488e-06, "loss": 0.6914, "step": 11547 }, { "epoch": 0.79, "learning_rate": 2.2874721561117176e-06, "loss": 0.8721, "step": 11548 }, { "epoch": 0.79, "learning_rate": 2.286067359268973e-06, "loss": 0.7705, "step": 11549 }, { "epoch": 0.79, "learning_rate": 2.2846629382486473e-06, "loss": 0.7666, "step": 11550 }, { "epoch": 0.79, "learning_rate": 2.2832588931191666e-06, "loss": 0.7744, "step": 11551 }, { "epoch": 0.79, "learning_rate": 2.2818552239489365e-06, "loss": 0.7236, "step": 11552 }, { "epoch": 0.79, "learning_rate": 2.2804519308063465e-06, "loss": 0.7295, "step": 11553 }, { "epoch": 0.79, "learning_rate": 2.2790490137597567e-06, "loss": 0.707, "step": 11554 }, { "epoch": 0.79, "learning_rate": 2.2776464728775236e-06, "loss": 0.7012, "step": 11555 }, { "epoch": 0.79, "learning_rate": 2.276244308227983e-06, "loss": 0.7119, "step": 11556 }, { "epoch": 0.79, "learning_rate": 2.274842519879438e-06, "loss": 0.71, "step": 11557 }, { "epoch": 0.79, "learning_rate": 2.2734411079001896e-06, "loss": 0.7441, "step": 11558 }, { "epoch": 0.79, "learning_rate": 2.2720400723585136e-06, "loss": 0.7793, "step": 11559 }, { "epoch": 0.79, "learning_rate": 2.2706394133226684e-06, "loss": 0.6855, "step": 11560 }, { "epoch": 0.79, "learning_rate": 2.2692391308608943e-06, "loss": 0.8232, "step": 11561 }, { "epoch": 0.79, "learning_rate": 2.2678392250414127e-06, "loss": 0.7344, "step": 11562 }, { "epoch": 0.79, "learning_rate": 2.2664396959324297e-06, "loss": 0.7734, "step": 11563 }, { "epoch": 0.79, "learning_rate": 2.265040543602125e-06, "loss": 0.7822, "step": 11564 }, { "epoch": 0.79, "learning_rate": 2.2636417681186673e-06, "loss": 0.7725, "step": 11565 }, { "epoch": 0.79, "learning_rate": 2.2622433695502057e-06, "loss": 0.708, "step": 11566 }, { "epoch": 0.79, "learning_rate": 2.2608453479648695e-06, "loss": 0.6963, "step": 11567 }, { "epoch": 0.79, "learning_rate": 2.2594477034307716e-06, "loss": 0.7236, "step": 11568 }, { "epoch": 0.79, "learning_rate": 2.258050436016006e-06, "loss": 0.6924, "step": 11569 }, { "epoch": 0.79, "learning_rate": 2.256653545788643e-06, "loss": 0.75, "step": 11570 }, { "epoch": 0.79, "learning_rate": 2.2552570328167378e-06, "loss": 0.7754, "step": 11571 }, { "epoch": 0.79, "learning_rate": 2.2538608971683394e-06, "loss": 0.7236, "step": 11572 }, { "epoch": 0.79, "learning_rate": 2.252465138911457e-06, "loss": 0.7041, "step": 11573 }, { "epoch": 0.79, "learning_rate": 2.251069758114095e-06, "loss": 0.6729, "step": 11574 }, { "epoch": 0.79, "learning_rate": 2.2496747548442364e-06, "loss": 0.8027, "step": 11575 }, { "epoch": 0.79, "learning_rate": 2.2482801291698487e-06, "loss": 0.7334, "step": 11576 }, { "epoch": 0.79, "learning_rate": 2.24688588115887e-06, "loss": 0.7266, "step": 11577 }, { "epoch": 0.79, "learning_rate": 2.2454920108792354e-06, "loss": 0.7129, "step": 11578 }, { "epoch": 0.79, "learning_rate": 2.244098518398855e-06, "loss": 0.8301, "step": 11579 }, { "epoch": 0.79, "learning_rate": 2.2427054037856133e-06, "loss": 0.7119, "step": 11580 }, { "epoch": 0.79, "learning_rate": 2.241312667107386e-06, "loss": 0.625, "step": 11581 }, { "epoch": 0.79, "learning_rate": 2.23992030843203e-06, "loss": 0.7188, "step": 11582 }, { "epoch": 0.79, "learning_rate": 2.2385283278273727e-06, "loss": 0.7031, "step": 11583 }, { "epoch": 0.79, "learning_rate": 2.23713672536124e-06, "loss": 0.7949, "step": 11584 }, { "epoch": 0.79, "learning_rate": 2.2357455011014295e-06, "loss": 0.7275, "step": 11585 }, { "epoch": 0.79, "learning_rate": 2.234354655115717e-06, "loss": 0.8154, "step": 11586 }, { "epoch": 0.79, "learning_rate": 2.232964187471868e-06, "loss": 0.7656, "step": 11587 }, { "epoch": 0.79, "learning_rate": 2.2315740982376235e-06, "loss": 0.7334, "step": 11588 }, { "epoch": 0.79, "learning_rate": 2.2301843874807107e-06, "loss": 0.7637, "step": 11589 }, { "epoch": 0.79, "learning_rate": 2.2287950552688365e-06, "loss": 0.7773, "step": 11590 }, { "epoch": 0.79, "learning_rate": 2.2274061016696868e-06, "loss": 0.7568, "step": 11591 }, { "epoch": 0.79, "learning_rate": 2.2260175267509364e-06, "loss": 0.6885, "step": 11592 }, { "epoch": 0.79, "learning_rate": 2.2246293305802304e-06, "loss": 0.7949, "step": 11593 }, { "epoch": 0.79, "learning_rate": 2.223241513225204e-06, "loss": 0.8594, "step": 11594 }, { "epoch": 0.79, "learning_rate": 2.2218540747534713e-06, "loss": 0.6699, "step": 11595 }, { "epoch": 0.79, "learning_rate": 2.220467015232629e-06, "loss": 0.7002, "step": 11596 }, { "epoch": 0.79, "learning_rate": 2.2190803347302547e-06, "loss": 0.7529, "step": 11597 }, { "epoch": 0.79, "learning_rate": 2.21769403331391e-06, "loss": 0.7295, "step": 11598 }, { "epoch": 0.79, "learning_rate": 2.2163081110511288e-06, "loss": 0.7715, "step": 11599 }, { "epoch": 0.79, "learning_rate": 2.2149225680094367e-06, "loss": 0.7178, "step": 11600 }, { "epoch": 0.79, "learning_rate": 2.2135374042563387e-06, "loss": 0.749, "step": 11601 }, { "epoch": 0.79, "learning_rate": 2.212152619859318e-06, "loss": 0.8057, "step": 11602 }, { "epoch": 0.79, "learning_rate": 2.2107682148858412e-06, "loss": 0.7275, "step": 11603 }, { "epoch": 0.79, "learning_rate": 2.2093841894033585e-06, "loss": 0.792, "step": 11604 }, { "epoch": 0.79, "learning_rate": 2.2080005434792993e-06, "loss": 0.8496, "step": 11605 }, { "epoch": 0.79, "learning_rate": 2.2066172771810724e-06, "loss": 0.7598, "step": 11606 }, { "epoch": 0.79, "learning_rate": 2.205234390576069e-06, "loss": 0.7637, "step": 11607 }, { "epoch": 0.79, "learning_rate": 2.2038518837316703e-06, "loss": 0.7803, "step": 11608 }, { "epoch": 0.79, "learning_rate": 2.2024697567152254e-06, "loss": 0.7246, "step": 11609 }, { "epoch": 0.79, "learning_rate": 2.2010880095940733e-06, "loss": 0.7324, "step": 11610 }, { "epoch": 0.79, "learning_rate": 2.199706642435534e-06, "loss": 0.7207, "step": 11611 }, { "epoch": 0.79, "learning_rate": 2.1983256553069086e-06, "loss": 0.8252, "step": 11612 }, { "epoch": 0.79, "learning_rate": 2.1969450482754717e-06, "loss": 0.6943, "step": 11613 }, { "epoch": 0.79, "learning_rate": 2.1955648214084935e-06, "loss": 0.75, "step": 11614 }, { "epoch": 0.79, "learning_rate": 2.1941849747732204e-06, "loss": 0.7305, "step": 11615 }, { "epoch": 0.79, "learning_rate": 2.1928055084368717e-06, "loss": 0.6846, "step": 11616 }, { "epoch": 0.79, "learning_rate": 2.191426422466658e-06, "loss": 0.7373, "step": 11617 }, { "epoch": 0.79, "learning_rate": 2.1900477169297708e-06, "loss": 0.8115, "step": 11618 }, { "epoch": 0.79, "learning_rate": 2.188669391893372e-06, "loss": 0.7695, "step": 11619 }, { "epoch": 0.79, "learning_rate": 2.187291447424622e-06, "loss": 0.7754, "step": 11620 }, { "epoch": 0.79, "learning_rate": 2.1859138835906557e-06, "loss": 0.7324, "step": 11621 }, { "epoch": 0.79, "learning_rate": 2.1845367004585804e-06, "loss": 0.8125, "step": 11622 }, { "epoch": 0.79, "learning_rate": 2.183159898095496e-06, "loss": 0.8359, "step": 11623 }, { "epoch": 0.79, "learning_rate": 2.1817834765684796e-06, "loss": 0.8096, "step": 11624 }, { "epoch": 0.79, "learning_rate": 2.1804074359445924e-06, "loss": 0.7188, "step": 11625 }, { "epoch": 0.79, "learning_rate": 2.179031776290872e-06, "loss": 0.71, "step": 11626 }, { "epoch": 0.79, "learning_rate": 2.1776564976743432e-06, "loss": 0.6807, "step": 11627 }, { "epoch": 0.79, "learning_rate": 2.1762816001620103e-06, "loss": 0.7373, "step": 11628 }, { "epoch": 0.79, "learning_rate": 2.1749070838208542e-06, "loss": 0.707, "step": 11629 }, { "epoch": 0.79, "learning_rate": 2.1735329487178436e-06, "loss": 0.7051, "step": 11630 }, { "epoch": 0.79, "learning_rate": 2.172159194919925e-06, "loss": 0.6982, "step": 11631 }, { "epoch": 0.79, "learning_rate": 2.170785822494029e-06, "loss": 0.8184, "step": 11632 }, { "epoch": 0.79, "learning_rate": 2.169412831507066e-06, "loss": 0.8008, "step": 11633 }, { "epoch": 0.79, "learning_rate": 2.1680402220259313e-06, "loss": 0.7705, "step": 11634 }, { "epoch": 0.79, "learning_rate": 2.1666679941174916e-06, "loss": 0.7168, "step": 11635 }, { "epoch": 0.79, "learning_rate": 2.165296147848606e-06, "loss": 0.6729, "step": 11636 }, { "epoch": 0.79, "learning_rate": 2.1639246832861095e-06, "loss": 0.6885, "step": 11637 }, { "epoch": 0.79, "learning_rate": 2.1625536004968205e-06, "loss": 0.7637, "step": 11638 }, { "epoch": 0.79, "learning_rate": 2.1611828995475383e-06, "loss": 0.7139, "step": 11639 }, { "epoch": 0.79, "learning_rate": 2.1598125805050417e-06, "loss": 0.7646, "step": 11640 }, { "epoch": 0.79, "learning_rate": 2.158442643436097e-06, "loss": 0.7559, "step": 11641 }, { "epoch": 0.79, "learning_rate": 2.157073088407442e-06, "loss": 0.8076, "step": 11642 }, { "epoch": 0.79, "learning_rate": 2.155703915485801e-06, "loss": 0.7939, "step": 11643 }, { "epoch": 0.79, "learning_rate": 2.1543351247378875e-06, "loss": 0.7393, "step": 11644 }, { "epoch": 0.79, "learning_rate": 2.1529667162303823e-06, "loss": 0.7617, "step": 11645 }, { "epoch": 0.79, "learning_rate": 2.1515986900299557e-06, "loss": 0.7002, "step": 11646 }, { "epoch": 0.79, "learning_rate": 2.1502310462032573e-06, "loss": 0.7568, "step": 11647 }, { "epoch": 0.79, "learning_rate": 2.1488637848169237e-06, "loss": 0.7656, "step": 11648 }, { "epoch": 0.79, "learning_rate": 2.1474969059375573e-06, "loss": 0.7461, "step": 11649 }, { "epoch": 0.79, "learning_rate": 2.1461304096317614e-06, "loss": 0.7002, "step": 11650 }, { "epoch": 0.79, "learning_rate": 2.1447642959661118e-06, "loss": 0.833, "step": 11651 }, { "epoch": 0.79, "learning_rate": 2.14339856500716e-06, "loss": 0.7822, "step": 11652 }, { "epoch": 0.79, "learning_rate": 2.1420332168214464e-06, "loss": 0.7412, "step": 11653 }, { "epoch": 0.79, "learning_rate": 2.140668251475495e-06, "loss": 0.666, "step": 11654 }, { "epoch": 0.79, "learning_rate": 2.139303669035797e-06, "loss": 0.7373, "step": 11655 }, { "epoch": 0.79, "learning_rate": 2.137939469568844e-06, "loss": 0.7646, "step": 11656 }, { "epoch": 0.79, "learning_rate": 2.1365756531410984e-06, "loss": 0.7568, "step": 11657 }, { "epoch": 0.79, "learning_rate": 2.1352122198190015e-06, "loss": 0.8223, "step": 11658 }, { "epoch": 0.79, "learning_rate": 2.133849169668982e-06, "loss": 0.7832, "step": 11659 }, { "epoch": 0.79, "learning_rate": 2.1324865027574472e-06, "loss": 0.7246, "step": 11660 }, { "epoch": 0.79, "learning_rate": 2.1311242191507864e-06, "loss": 0.8096, "step": 11661 }, { "epoch": 0.79, "learning_rate": 2.1297623189153693e-06, "loss": 0.7695, "step": 11662 }, { "epoch": 0.79, "learning_rate": 2.1284008021175482e-06, "loss": 0.751, "step": 11663 }, { "epoch": 0.79, "learning_rate": 2.1270396688236595e-06, "loss": 0.791, "step": 11664 }, { "epoch": 0.79, "learning_rate": 2.1256789191000114e-06, "loss": 0.7627, "step": 11665 }, { "epoch": 0.8, "learning_rate": 2.124318553012902e-06, "loss": 0.8271, "step": 11666 }, { "epoch": 0.8, "learning_rate": 2.1229585706286095e-06, "loss": 0.7686, "step": 11667 }, { "epoch": 0.8, "learning_rate": 2.12159897201339e-06, "loss": 0.7207, "step": 11668 }, { "epoch": 0.8, "learning_rate": 2.1202397572334852e-06, "loss": 0.7812, "step": 11669 }, { "epoch": 0.8, "learning_rate": 2.118880926355118e-06, "loss": 0.7129, "step": 11670 }, { "epoch": 0.8, "learning_rate": 2.1175224794444847e-06, "loss": 0.7734, "step": 11671 }, { "epoch": 0.8, "learning_rate": 2.116164416567772e-06, "loss": 0.7988, "step": 11672 }, { "epoch": 0.8, "learning_rate": 2.1148067377911443e-06, "loss": 0.7236, "step": 11673 }, { "epoch": 0.8, "learning_rate": 2.1134494431807474e-06, "loss": 0.7578, "step": 11674 }, { "epoch": 0.8, "learning_rate": 2.11209253280271e-06, "loss": 0.7529, "step": 11675 }, { "epoch": 0.8, "learning_rate": 2.1107360067231386e-06, "loss": 0.6895, "step": 11676 }, { "epoch": 0.8, "learning_rate": 2.1093798650081275e-06, "loss": 0.7266, "step": 11677 }, { "epoch": 0.8, "learning_rate": 2.1080241077237417e-06, "loss": 0.7207, "step": 11678 }, { "epoch": 0.8, "learning_rate": 2.1066687349360336e-06, "loss": 0.7686, "step": 11679 }, { "epoch": 0.8, "learning_rate": 2.105313746711046e-06, "loss": 0.8594, "step": 11680 }, { "epoch": 0.8, "learning_rate": 2.103959143114784e-06, "loss": 0.6992, "step": 11681 }, { "epoch": 0.8, "learning_rate": 2.1026049242132487e-06, "loss": 0.7412, "step": 11682 }, { "epoch": 0.8, "learning_rate": 2.101251090072415e-06, "loss": 0.7402, "step": 11683 }, { "epoch": 0.8, "learning_rate": 2.099897640758244e-06, "loss": 0.7539, "step": 11684 }, { "epoch": 0.8, "learning_rate": 2.0985445763366742e-06, "loss": 0.7715, "step": 11685 }, { "epoch": 0.8, "learning_rate": 2.0971918968736305e-06, "loss": 0.7559, "step": 11686 }, { "epoch": 0.8, "learning_rate": 2.0958396024350092e-06, "loss": 0.75, "step": 11687 }, { "epoch": 0.8, "learning_rate": 2.0944876930866965e-06, "loss": 0.7314, "step": 11688 }, { "epoch": 0.8, "learning_rate": 2.0931361688945585e-06, "loss": 0.7256, "step": 11689 }, { "epoch": 0.8, "learning_rate": 2.09178502992444e-06, "loss": 0.7656, "step": 11690 }, { "epoch": 0.8, "learning_rate": 2.0904342762421703e-06, "loss": 0.7686, "step": 11691 }, { "epoch": 0.8, "learning_rate": 2.089083907913556e-06, "loss": 0.7139, "step": 11692 }, { "epoch": 0.8, "learning_rate": 2.0877339250043915e-06, "loss": 0.7764, "step": 11693 }, { "epoch": 0.8, "learning_rate": 2.086384327580441e-06, "loss": 0.7539, "step": 11694 }, { "epoch": 0.8, "learning_rate": 2.08503511570746e-06, "loss": 0.6836, "step": 11695 }, { "epoch": 0.8, "learning_rate": 2.083686289451182e-06, "loss": 0.7812, "step": 11696 }, { "epoch": 0.8, "learning_rate": 2.082337848877323e-06, "loss": 0.7109, "step": 11697 }, { "epoch": 0.8, "learning_rate": 2.0809897940515768e-06, "loss": 0.7354, "step": 11698 }, { "epoch": 0.8, "learning_rate": 2.0796421250396227e-06, "loss": 0.7549, "step": 11699 }, { "epoch": 0.8, "learning_rate": 2.07829484190712e-06, "loss": 0.7832, "step": 11700 }, { "epoch": 0.8, "learning_rate": 2.076947944719704e-06, "loss": 0.791, "step": 11701 }, { "epoch": 0.8, "learning_rate": 2.075601433542994e-06, "loss": 0.752, "step": 11702 }, { "epoch": 0.8, "learning_rate": 2.074255308442602e-06, "loss": 0.6934, "step": 11703 }, { "epoch": 0.8, "learning_rate": 2.0729095694841017e-06, "loss": 0.7803, "step": 11704 }, { "epoch": 0.8, "learning_rate": 2.0715642167330617e-06, "loss": 0.7539, "step": 11705 }, { "epoch": 0.8, "learning_rate": 2.070219250255028e-06, "loss": 0.7227, "step": 11706 }, { "epoch": 0.8, "learning_rate": 2.068874670115524e-06, "loss": 0.7754, "step": 11707 }, { "epoch": 0.8, "learning_rate": 2.0675304763800553e-06, "loss": 0.7607, "step": 11708 }, { "epoch": 0.8, "learning_rate": 2.066186669114121e-06, "loss": 0.7744, "step": 11709 }, { "epoch": 0.8, "learning_rate": 2.0648432483831828e-06, "loss": 0.7939, "step": 11710 }, { "epoch": 0.8, "learning_rate": 2.063500214252694e-06, "loss": 0.7686, "step": 11711 }, { "epoch": 0.8, "learning_rate": 2.0621575667880887e-06, "loss": 0.8389, "step": 11712 }, { "epoch": 0.8, "learning_rate": 2.060815306054782e-06, "loss": 0.8291, "step": 11713 }, { "epoch": 0.8, "learning_rate": 2.05947343211816e-06, "loss": 0.7744, "step": 11714 }, { "epoch": 0.8, "learning_rate": 2.0581319450436086e-06, "loss": 0.7246, "step": 11715 }, { "epoch": 0.8, "learning_rate": 2.0567908448964846e-06, "loss": 0.8379, "step": 11716 }, { "epoch": 0.8, "learning_rate": 2.0554501317421204e-06, "loss": 0.7988, "step": 11717 }, { "epoch": 0.8, "learning_rate": 2.0541098056458375e-06, "loss": 0.7783, "step": 11718 }, { "epoch": 0.8, "learning_rate": 2.0527698666729412e-06, "loss": 0.7803, "step": 11719 }, { "epoch": 0.8, "learning_rate": 2.0514303148887036e-06, "loss": 0.6904, "step": 11720 }, { "epoch": 0.8, "learning_rate": 2.0500911503583965e-06, "loss": 0.6885, "step": 11721 }, { "epoch": 0.8, "learning_rate": 2.0487523731472623e-06, "loss": 0.7207, "step": 11722 }, { "epoch": 0.8, "learning_rate": 2.0474139833205233e-06, "loss": 0.7705, "step": 11723 }, { "epoch": 0.8, "learning_rate": 2.046075980943387e-06, "loss": 0.7314, "step": 11724 }, { "epoch": 0.8, "learning_rate": 2.0447383660810404e-06, "loss": 0.7744, "step": 11725 }, { "epoch": 0.8, "learning_rate": 2.043401138798653e-06, "loss": 0.8311, "step": 11726 }, { "epoch": 0.8, "learning_rate": 2.0420642991613747e-06, "loss": 0.7344, "step": 11727 }, { "epoch": 0.8, "learning_rate": 2.040727847234335e-06, "loss": 0.7705, "step": 11728 }, { "epoch": 0.8, "learning_rate": 2.039391783082649e-06, "loss": 0.7236, "step": 11729 }, { "epoch": 0.8, "learning_rate": 2.0380561067714054e-06, "loss": 0.791, "step": 11730 }, { "epoch": 0.8, "learning_rate": 2.0367208183656784e-06, "loss": 0.7783, "step": 11731 }, { "epoch": 0.8, "learning_rate": 2.035385917930526e-06, "loss": 0.7969, "step": 11732 }, { "epoch": 0.8, "learning_rate": 2.0340514055309833e-06, "loss": 0.7939, "step": 11733 }, { "epoch": 0.8, "learning_rate": 2.032717281232067e-06, "loss": 0.7373, "step": 11734 }, { "epoch": 0.8, "learning_rate": 2.0313835450987764e-06, "loss": 0.7129, "step": 11735 }, { "epoch": 0.8, "learning_rate": 2.030050197196094e-06, "loss": 0.7744, "step": 11736 }, { "epoch": 0.8, "learning_rate": 2.028717237588974e-06, "loss": 0.8037, "step": 11737 }, { "epoch": 0.8, "learning_rate": 2.027384666342359e-06, "loss": 0.7529, "step": 11738 }, { "epoch": 0.8, "learning_rate": 2.0260524835211803e-06, "loss": 0.6631, "step": 11739 }, { "epoch": 0.8, "learning_rate": 2.024720689190333e-06, "loss": 0.8398, "step": 11740 }, { "epoch": 0.8, "learning_rate": 2.023389283414704e-06, "loss": 0.6846, "step": 11741 }, { "epoch": 0.8, "learning_rate": 2.0220582662591625e-06, "loss": 0.7163, "step": 11742 }, { "epoch": 0.8, "learning_rate": 2.020727637788551e-06, "loss": 0.7725, "step": 11743 }, { "epoch": 0.8, "learning_rate": 2.019397398067697e-06, "loss": 0.751, "step": 11744 }, { "epoch": 0.8, "learning_rate": 2.0180675471614186e-06, "loss": 0.7734, "step": 11745 }, { "epoch": 0.8, "learning_rate": 2.0167380851344975e-06, "loss": 0.7598, "step": 11746 }, { "epoch": 0.8, "learning_rate": 2.0154090120517066e-06, "loss": 0.7207, "step": 11747 }, { "epoch": 0.8, "learning_rate": 2.0140803279778e-06, "loss": 0.6709, "step": 11748 }, { "epoch": 0.8, "learning_rate": 2.012752032977513e-06, "loss": 0.7354, "step": 11749 }, { "epoch": 0.8, "learning_rate": 2.011424127115552e-06, "loss": 0.7285, "step": 11750 }, { "epoch": 0.8, "learning_rate": 2.01009661045662e-06, "loss": 0.6865, "step": 11751 }, { "epoch": 0.8, "learning_rate": 2.008769483065395e-06, "loss": 0.7627, "step": 11752 }, { "epoch": 0.8, "learning_rate": 2.007442745006528e-06, "loss": 0.7793, "step": 11753 }, { "epoch": 0.8, "learning_rate": 2.0061163963446606e-06, "loss": 0.7871, "step": 11754 }, { "epoch": 0.8, "learning_rate": 2.004790437144416e-06, "loss": 0.7852, "step": 11755 }, { "epoch": 0.8, "learning_rate": 2.003464867470385e-06, "loss": 0.8115, "step": 11756 }, { "epoch": 0.8, "learning_rate": 2.002139687387159e-06, "loss": 0.7686, "step": 11757 }, { "epoch": 0.8, "learning_rate": 2.0008148969593e-06, "loss": 0.7578, "step": 11758 }, { "epoch": 0.8, "learning_rate": 1.9994904962513464e-06, "loss": 0.6406, "step": 11759 }, { "epoch": 0.8, "learning_rate": 1.9981664853278247e-06, "loss": 0.8037, "step": 11760 }, { "epoch": 0.8, "learning_rate": 1.9968428642532435e-06, "loss": 0.8379, "step": 11761 }, { "epoch": 0.8, "learning_rate": 1.9955196330920866e-06, "loss": 0.749, "step": 11762 }, { "epoch": 0.8, "learning_rate": 1.9941967919088225e-06, "loss": 0.6846, "step": 11763 }, { "epoch": 0.8, "learning_rate": 1.9928743407679007e-06, "loss": 0.8223, "step": 11764 }, { "epoch": 0.8, "learning_rate": 1.991552279733754e-06, "loss": 0.8545, "step": 11765 }, { "epoch": 0.8, "learning_rate": 1.9902306088707855e-06, "loss": 0.7324, "step": 11766 }, { "epoch": 0.8, "learning_rate": 1.9889093282433925e-06, "loss": 0.6748, "step": 11767 }, { "epoch": 0.8, "learning_rate": 1.9875884379159447e-06, "loss": 0.6865, "step": 11768 }, { "epoch": 0.8, "learning_rate": 1.9862679379527994e-06, "loss": 0.751, "step": 11769 }, { "epoch": 0.8, "learning_rate": 1.984947828418288e-06, "loss": 0.748, "step": 11770 }, { "epoch": 0.8, "learning_rate": 1.9836281093767274e-06, "loss": 0.7617, "step": 11771 }, { "epoch": 0.8, "learning_rate": 1.982308780892418e-06, "loss": 0.792, "step": 11772 }, { "epoch": 0.8, "learning_rate": 1.9809898430296303e-06, "loss": 0.7979, "step": 11773 }, { "epoch": 0.8, "learning_rate": 1.9796712958526276e-06, "loss": 0.6572, "step": 11774 }, { "epoch": 0.8, "learning_rate": 1.978353139425647e-06, "loss": 0.7412, "step": 11775 }, { "epoch": 0.8, "learning_rate": 1.9770353738129113e-06, "loss": 0.7422, "step": 11776 }, { "epoch": 0.8, "learning_rate": 1.97571799907862e-06, "loss": 0.7168, "step": 11777 }, { "epoch": 0.8, "learning_rate": 1.9744010152869596e-06, "loss": 0.7822, "step": 11778 }, { "epoch": 0.8, "learning_rate": 1.9730844225020875e-06, "loss": 0.6431, "step": 11779 }, { "epoch": 0.8, "learning_rate": 1.9717682207881483e-06, "loss": 0.7119, "step": 11780 }, { "epoch": 0.8, "learning_rate": 1.9704524102092747e-06, "loss": 0.792, "step": 11781 }, { "epoch": 0.8, "learning_rate": 1.9691369908295668e-06, "loss": 0.79, "step": 11782 }, { "epoch": 0.8, "learning_rate": 1.9678219627131122e-06, "loss": 0.6904, "step": 11783 }, { "epoch": 0.8, "learning_rate": 1.96650732592398e-06, "loss": 0.7715, "step": 11784 }, { "epoch": 0.8, "learning_rate": 1.965193080526221e-06, "loss": 0.668, "step": 11785 }, { "epoch": 0.8, "learning_rate": 1.963879226583859e-06, "loss": 0.8818, "step": 11786 }, { "epoch": 0.8, "learning_rate": 1.962565764160911e-06, "loss": 0.7617, "step": 11787 }, { "epoch": 0.8, "learning_rate": 1.9612526933213706e-06, "loss": 0.8457, "step": 11788 }, { "epoch": 0.8, "learning_rate": 1.9599400141292036e-06, "loss": 0.75, "step": 11789 }, { "epoch": 0.8, "learning_rate": 1.958627726648368e-06, "loss": 0.7197, "step": 11790 }, { "epoch": 0.8, "learning_rate": 1.957315830942799e-06, "loss": 0.7002, "step": 11791 }, { "epoch": 0.8, "learning_rate": 1.956004327076405e-06, "loss": 0.7471, "step": 11792 }, { "epoch": 0.8, "learning_rate": 1.9546932151130913e-06, "loss": 0.7451, "step": 11793 }, { "epoch": 0.8, "learning_rate": 1.9533824951167346e-06, "loss": 0.7471, "step": 11794 }, { "epoch": 0.8, "learning_rate": 1.9520721671511868e-06, "loss": 0.748, "step": 11795 }, { "epoch": 0.8, "learning_rate": 1.950762231280291e-06, "loss": 0.7383, "step": 11796 }, { "epoch": 0.8, "learning_rate": 1.9494526875678667e-06, "loss": 0.7607, "step": 11797 }, { "epoch": 0.8, "learning_rate": 1.9481435360777157e-06, "loss": 0.7295, "step": 11798 }, { "epoch": 0.8, "learning_rate": 1.9468347768736184e-06, "loss": 0.8389, "step": 11799 }, { "epoch": 0.8, "learning_rate": 1.945526410019337e-06, "loss": 0.7822, "step": 11800 }, { "epoch": 0.8, "learning_rate": 1.9442184355786197e-06, "loss": 0.8359, "step": 11801 }, { "epoch": 0.8, "learning_rate": 1.942910853615185e-06, "loss": 0.7275, "step": 11802 }, { "epoch": 0.8, "learning_rate": 1.9416036641927406e-06, "loss": 0.7441, "step": 11803 }, { "epoch": 0.8, "learning_rate": 1.9402968673749722e-06, "loss": 0.7314, "step": 11804 }, { "epoch": 0.8, "learning_rate": 1.9389904632255473e-06, "loss": 0.7822, "step": 11805 }, { "epoch": 0.8, "learning_rate": 1.937684451808114e-06, "loss": 0.7666, "step": 11806 }, { "epoch": 0.8, "learning_rate": 1.9363788331863045e-06, "loss": 0.7598, "step": 11807 }, { "epoch": 0.8, "learning_rate": 1.935073607423722e-06, "loss": 0.7588, "step": 11808 }, { "epoch": 0.8, "learning_rate": 1.933768774583956e-06, "loss": 0.7451, "step": 11809 }, { "epoch": 0.8, "learning_rate": 1.9324643347305893e-06, "loss": 0.7227, "step": 11810 }, { "epoch": 0.8, "learning_rate": 1.931160287927163e-06, "loss": 0.7793, "step": 11811 }, { "epoch": 0.8, "learning_rate": 1.9298566342372137e-06, "loss": 0.6982, "step": 11812 }, { "epoch": 0.81, "learning_rate": 1.9285533737242566e-06, "loss": 0.7246, "step": 11813 }, { "epoch": 0.81, "learning_rate": 1.927250506451788e-06, "loss": 0.7314, "step": 11814 }, { "epoch": 0.81, "learning_rate": 1.9259480324832745e-06, "loss": 0.7119, "step": 11815 }, { "epoch": 0.81, "learning_rate": 1.9246459518821836e-06, "loss": 0.7529, "step": 11816 }, { "epoch": 0.81, "learning_rate": 1.9233442647119493e-06, "loss": 0.7607, "step": 11817 }, { "epoch": 0.81, "learning_rate": 1.9220429710359867e-06, "loss": 0.752, "step": 11818 }, { "epoch": 0.81, "learning_rate": 1.920742070917696e-06, "loss": 0.7344, "step": 11819 }, { "epoch": 0.81, "learning_rate": 1.9194415644204576e-06, "loss": 0.7363, "step": 11820 }, { "epoch": 0.81, "learning_rate": 1.9181414516076335e-06, "loss": 0.7959, "step": 11821 }, { "epoch": 0.81, "learning_rate": 1.9168417325425625e-06, "loss": 0.7988, "step": 11822 }, { "epoch": 0.81, "learning_rate": 1.9155424072885688e-06, "loss": 0.7744, "step": 11823 }, { "epoch": 0.81, "learning_rate": 1.9142434759089566e-06, "loss": 0.7705, "step": 11824 }, { "epoch": 0.81, "learning_rate": 1.912944938467005e-06, "loss": 0.7705, "step": 11825 }, { "epoch": 0.81, "learning_rate": 1.9116467950259832e-06, "loss": 0.7236, "step": 11826 }, { "epoch": 0.81, "learning_rate": 1.9103490456491335e-06, "loss": 0.7031, "step": 11827 }, { "epoch": 0.81, "learning_rate": 1.9090516903996847e-06, "loss": 0.7324, "step": 11828 }, { "epoch": 0.81, "learning_rate": 1.907754729340843e-06, "loss": 0.7656, "step": 11829 }, { "epoch": 0.81, "learning_rate": 1.906458162535798e-06, "loss": 0.7891, "step": 11830 }, { "epoch": 0.81, "learning_rate": 1.9051619900477148e-06, "loss": 0.7607, "step": 11831 }, { "epoch": 0.81, "learning_rate": 1.9038662119397443e-06, "loss": 0.7998, "step": 11832 }, { "epoch": 0.81, "learning_rate": 1.9025708282750177e-06, "loss": 0.7197, "step": 11833 }, { "epoch": 0.81, "learning_rate": 1.9012758391166454e-06, "loss": 0.7168, "step": 11834 }, { "epoch": 0.81, "learning_rate": 1.8999812445277188e-06, "loss": 0.7471, "step": 11835 }, { "epoch": 0.81, "learning_rate": 1.8986870445713112e-06, "loss": 0.7783, "step": 11836 }, { "epoch": 0.81, "learning_rate": 1.8973932393104778e-06, "loss": 0.7842, "step": 11837 }, { "epoch": 0.81, "learning_rate": 1.8960998288082487e-06, "loss": 0.7695, "step": 11838 }, { "epoch": 0.81, "learning_rate": 1.8948068131276376e-06, "loss": 0.7598, "step": 11839 }, { "epoch": 0.81, "learning_rate": 1.8935141923316492e-06, "loss": 0.7939, "step": 11840 }, { "epoch": 0.81, "learning_rate": 1.8922219664832508e-06, "loss": 0.7617, "step": 11841 }, { "epoch": 0.81, "learning_rate": 1.8909301356454034e-06, "loss": 0.8135, "step": 11842 }, { "epoch": 0.81, "learning_rate": 1.8896386998810468e-06, "loss": 0.7812, "step": 11843 }, { "epoch": 0.81, "learning_rate": 1.8883476592530936e-06, "loss": 0.7402, "step": 11844 }, { "epoch": 0.81, "learning_rate": 1.8870570138244459e-06, "loss": 0.7275, "step": 11845 }, { "epoch": 0.81, "learning_rate": 1.885766763657989e-06, "loss": 0.8213, "step": 11846 }, { "epoch": 0.81, "learning_rate": 1.884476908816577e-06, "loss": 0.7754, "step": 11847 }, { "epoch": 0.81, "learning_rate": 1.8831874493630554e-06, "loss": 0.7422, "step": 11848 }, { "epoch": 0.81, "learning_rate": 1.8818983853602434e-06, "loss": 0.7598, "step": 11849 }, { "epoch": 0.81, "learning_rate": 1.8806097168709503e-06, "loss": 0.7305, "step": 11850 }, { "epoch": 0.81, "learning_rate": 1.879321443957951e-06, "loss": 0.793, "step": 11851 }, { "epoch": 0.81, "learning_rate": 1.8780335666840166e-06, "loss": 0.7344, "step": 11852 }, { "epoch": 0.81, "learning_rate": 1.8767460851118934e-06, "loss": 0.7881, "step": 11853 }, { "epoch": 0.81, "learning_rate": 1.8754589993043026e-06, "loss": 0.7725, "step": 11854 }, { "epoch": 0.81, "learning_rate": 1.8741723093239529e-06, "loss": 0.7656, "step": 11855 }, { "epoch": 0.81, "learning_rate": 1.8728860152335315e-06, "loss": 0.7363, "step": 11856 }, { "epoch": 0.81, "learning_rate": 1.8716001170957076e-06, "loss": 0.8193, "step": 11857 }, { "epoch": 0.81, "learning_rate": 1.8703146149731299e-06, "loss": 0.7568, "step": 11858 }, { "epoch": 0.81, "learning_rate": 1.8690295089284304e-06, "loss": 0.6514, "step": 11859 }, { "epoch": 0.81, "learning_rate": 1.8677447990242136e-06, "loss": 0.7598, "step": 11860 }, { "epoch": 0.81, "learning_rate": 1.866460485323074e-06, "loss": 0.748, "step": 11861 }, { "epoch": 0.81, "learning_rate": 1.865176567887582e-06, "loss": 0.7578, "step": 11862 }, { "epoch": 0.81, "learning_rate": 1.8638930467802919e-06, "loss": 0.792, "step": 11863 }, { "epoch": 0.81, "learning_rate": 1.862609922063735e-06, "loss": 0.7686, "step": 11864 }, { "epoch": 0.81, "learning_rate": 1.8613271938004262e-06, "loss": 0.7549, "step": 11865 }, { "epoch": 0.81, "learning_rate": 1.8600448620528632e-06, "loss": 0.7686, "step": 11866 }, { "epoch": 0.81, "learning_rate": 1.8587629268835139e-06, "loss": 0.7119, "step": 11867 }, { "epoch": 0.81, "learning_rate": 1.8574813883548382e-06, "loss": 0.6631, "step": 11868 }, { "epoch": 0.81, "learning_rate": 1.8562002465292717e-06, "loss": 0.7256, "step": 11869 }, { "epoch": 0.81, "learning_rate": 1.8549195014692323e-06, "loss": 0.7852, "step": 11870 }, { "epoch": 0.81, "learning_rate": 1.853639153237118e-06, "loss": 0.6641, "step": 11871 }, { "epoch": 0.81, "learning_rate": 1.8523592018953064e-06, "loss": 0.7275, "step": 11872 }, { "epoch": 0.81, "learning_rate": 1.85107964750616e-06, "loss": 0.75, "step": 11873 }, { "epoch": 0.81, "learning_rate": 1.8498004901320121e-06, "loss": 0.7871, "step": 11874 }, { "epoch": 0.81, "learning_rate": 1.8485217298351854e-06, "loss": 0.7891, "step": 11875 }, { "epoch": 0.81, "learning_rate": 1.8472433666779877e-06, "loss": 0.7285, "step": 11876 }, { "epoch": 0.81, "learning_rate": 1.8459654007226924e-06, "loss": 0.7568, "step": 11877 }, { "epoch": 0.81, "learning_rate": 1.8446878320315653e-06, "loss": 0.7217, "step": 11878 }, { "epoch": 0.81, "learning_rate": 1.8434106606668522e-06, "loss": 0.8525, "step": 11879 }, { "epoch": 0.81, "learning_rate": 1.8421338866907713e-06, "loss": 0.7129, "step": 11880 }, { "epoch": 0.81, "learning_rate": 1.8408575101655268e-06, "loss": 0.7061, "step": 11881 }, { "epoch": 0.81, "learning_rate": 1.8395815311533127e-06, "loss": 0.7979, "step": 11882 }, { "epoch": 0.81, "learning_rate": 1.8383059497162846e-06, "loss": 0.707, "step": 11883 }, { "epoch": 0.81, "learning_rate": 1.837030765916593e-06, "loss": 0.7891, "step": 11884 }, { "epoch": 0.81, "learning_rate": 1.8357559798163648e-06, "loss": 0.8369, "step": 11885 }, { "epoch": 0.81, "learning_rate": 1.8344815914777092e-06, "loss": 0.7822, "step": 11886 }, { "epoch": 0.81, "learning_rate": 1.8332076009627075e-06, "loss": 0.8047, "step": 11887 }, { "epoch": 0.81, "learning_rate": 1.8319340083334346e-06, "loss": 0.7666, "step": 11888 }, { "epoch": 0.81, "learning_rate": 1.8306608136519421e-06, "loss": 0.7344, "step": 11889 }, { "epoch": 0.81, "learning_rate": 1.8293880169802547e-06, "loss": 0.7695, "step": 11890 }, { "epoch": 0.81, "learning_rate": 1.8281156183803828e-06, "loss": 0.7002, "step": 11891 }, { "epoch": 0.81, "learning_rate": 1.8268436179143201e-06, "loss": 0.749, "step": 11892 }, { "epoch": 0.81, "learning_rate": 1.8255720156440383e-06, "loss": 0.7207, "step": 11893 }, { "epoch": 0.81, "learning_rate": 1.8243008116314886e-06, "loss": 0.71, "step": 11894 }, { "epoch": 0.81, "learning_rate": 1.8230300059386085e-06, "loss": 0.7363, "step": 11895 }, { "epoch": 0.81, "learning_rate": 1.821759598627304e-06, "loss": 0.7793, "step": 11896 }, { "epoch": 0.81, "learning_rate": 1.8204895897594733e-06, "loss": 0.7803, "step": 11897 }, { "epoch": 0.81, "learning_rate": 1.81921997939699e-06, "loss": 0.7256, "step": 11898 }, { "epoch": 0.81, "learning_rate": 1.8179507676017117e-06, "loss": 0.7725, "step": 11899 }, { "epoch": 0.81, "learning_rate": 1.816681954435473e-06, "loss": 0.7422, "step": 11900 }, { "epoch": 0.81, "learning_rate": 1.815413539960089e-06, "loss": 0.8164, "step": 11901 }, { "epoch": 0.81, "learning_rate": 1.8141455242373618e-06, "loss": 0.7158, "step": 11902 }, { "epoch": 0.81, "learning_rate": 1.8128779073290626e-06, "loss": 0.7842, "step": 11903 }, { "epoch": 0.81, "learning_rate": 1.811610689296953e-06, "loss": 0.7295, "step": 11904 }, { "epoch": 0.81, "learning_rate": 1.810343870202771e-06, "loss": 0.7588, "step": 11905 }, { "epoch": 0.81, "learning_rate": 1.8090774501082365e-06, "loss": 0.7461, "step": 11906 }, { "epoch": 0.81, "learning_rate": 1.8078114290750492e-06, "loss": 0.8057, "step": 11907 }, { "epoch": 0.81, "learning_rate": 1.806545807164889e-06, "loss": 0.7373, "step": 11908 }, { "epoch": 0.81, "learning_rate": 1.8052805844394206e-06, "loss": 0.8125, "step": 11909 }, { "epoch": 0.81, "learning_rate": 1.8040157609602793e-06, "loss": 0.7852, "step": 11910 }, { "epoch": 0.81, "learning_rate": 1.802751336789088e-06, "loss": 0.7109, "step": 11911 }, { "epoch": 0.81, "learning_rate": 1.8014873119874577e-06, "loss": 0.7646, "step": 11912 }, { "epoch": 0.81, "learning_rate": 1.800223686616962e-06, "loss": 0.7393, "step": 11913 }, { "epoch": 0.81, "learning_rate": 1.7989604607391699e-06, "loss": 0.6973, "step": 11914 }, { "epoch": 0.81, "learning_rate": 1.797697634415626e-06, "loss": 0.791, "step": 11915 }, { "epoch": 0.81, "learning_rate": 1.7964352077078506e-06, "loss": 0.7822, "step": 11916 }, { "epoch": 0.81, "learning_rate": 1.7951731806773486e-06, "loss": 0.7471, "step": 11917 }, { "epoch": 0.81, "learning_rate": 1.7939115533856155e-06, "loss": 0.7051, "step": 11918 }, { "epoch": 0.81, "learning_rate": 1.7926503258941086e-06, "loss": 0.7168, "step": 11919 }, { "epoch": 0.81, "learning_rate": 1.7913894982642776e-06, "loss": 0.6963, "step": 11920 }, { "epoch": 0.81, "learning_rate": 1.790129070557549e-06, "loss": 0.748, "step": 11921 }, { "epoch": 0.81, "learning_rate": 1.788869042835335e-06, "loss": 0.833, "step": 11922 }, { "epoch": 0.81, "learning_rate": 1.7876094151590162e-06, "loss": 0.7314, "step": 11923 }, { "epoch": 0.81, "learning_rate": 1.786350187589968e-06, "loss": 0.7666, "step": 11924 }, { "epoch": 0.81, "learning_rate": 1.7850913601895404e-06, "loss": 0.8047, "step": 11925 }, { "epoch": 0.81, "learning_rate": 1.7838329330190596e-06, "loss": 0.7314, "step": 11926 }, { "epoch": 0.81, "learning_rate": 1.7825749061398368e-06, "loss": 0.6992, "step": 11927 }, { "epoch": 0.81, "learning_rate": 1.7813172796131639e-06, "loss": 0.7842, "step": 11928 }, { "epoch": 0.81, "learning_rate": 1.780060053500312e-06, "loss": 0.6875, "step": 11929 }, { "epoch": 0.81, "learning_rate": 1.7788032278625345e-06, "loss": 0.7734, "step": 11930 }, { "epoch": 0.81, "learning_rate": 1.7775468027610643e-06, "loss": 0.749, "step": 11931 }, { "epoch": 0.81, "learning_rate": 1.7762907782571114e-06, "loss": 0.7715, "step": 11932 }, { "epoch": 0.81, "learning_rate": 1.7750351544118704e-06, "loss": 0.7227, "step": 11933 }, { "epoch": 0.81, "learning_rate": 1.7737799312865157e-06, "loss": 0.7979, "step": 11934 }, { "epoch": 0.81, "learning_rate": 1.7725251089422003e-06, "loss": 0.6846, "step": 11935 }, { "epoch": 0.81, "learning_rate": 1.771270687440062e-06, "loss": 0.7686, "step": 11936 }, { "epoch": 0.81, "learning_rate": 1.7700166668412133e-06, "loss": 0.7803, "step": 11937 }, { "epoch": 0.81, "learning_rate": 1.768763047206754e-06, "loss": 0.7256, "step": 11938 }, { "epoch": 0.81, "learning_rate": 1.7675098285977555e-06, "loss": 0.7959, "step": 11939 }, { "epoch": 0.81, "learning_rate": 1.766257011075274e-06, "loss": 0.7451, "step": 11940 }, { "epoch": 0.81, "learning_rate": 1.7650045947003548e-06, "loss": 0.7803, "step": 11941 }, { "epoch": 0.81, "learning_rate": 1.763752579534007e-06, "loss": 0.7803, "step": 11942 }, { "epoch": 0.81, "learning_rate": 1.7625009656372327e-06, "loss": 0.7734, "step": 11943 }, { "epoch": 0.81, "learning_rate": 1.7612497530710092e-06, "loss": 0.752, "step": 11944 }, { "epoch": 0.81, "learning_rate": 1.7599989418962982e-06, "loss": 0.8027, "step": 11945 }, { "epoch": 0.81, "learning_rate": 1.7587485321740327e-06, "loss": 0.75, "step": 11946 }, { "epoch": 0.81, "learning_rate": 1.757498523965141e-06, "loss": 0.751, "step": 11947 }, { "epoch": 0.81, "learning_rate": 1.7562489173305164e-06, "loss": 0.7139, "step": 11948 }, { "epoch": 0.81, "learning_rate": 1.7549997123310437e-06, "loss": 0.6143, "step": 11949 }, { "epoch": 0.81, "learning_rate": 1.7537509090275817e-06, "loss": 0.7178, "step": 11950 }, { "epoch": 0.81, "learning_rate": 1.7525025074809765e-06, "loss": 0.7227, "step": 11951 }, { "epoch": 0.81, "learning_rate": 1.7512545077520425e-06, "loss": 0.7139, "step": 11952 }, { "epoch": 0.81, "learning_rate": 1.7500069099015882e-06, "loss": 0.7793, "step": 11953 }, { "epoch": 0.81, "learning_rate": 1.7487597139903979e-06, "loss": 0.7676, "step": 11954 }, { "epoch": 0.81, "learning_rate": 1.7475129200792286e-06, "loss": 0.835, "step": 11955 }, { "epoch": 0.81, "learning_rate": 1.7462665282288283e-06, "loss": 0.7637, "step": 11956 }, { "epoch": 0.81, "learning_rate": 1.7450205384999197e-06, "loss": 0.8145, "step": 11957 }, { "epoch": 0.81, "learning_rate": 1.7437749509532086e-06, "loss": 0.7959, "step": 11958 }, { "epoch": 0.81, "learning_rate": 1.742529765649379e-06, "loss": 0.6816, "step": 11959 }, { "epoch": 0.82, "learning_rate": 1.7412849826490963e-06, "loss": 0.7529, "step": 11960 }, { "epoch": 0.82, "learning_rate": 1.740040602013009e-06, "loss": 0.6865, "step": 11961 }, { "epoch": 0.82, "learning_rate": 1.7387966238017384e-06, "loss": 0.7656, "step": 11962 }, { "epoch": 0.82, "learning_rate": 1.737553048075893e-06, "loss": 0.7451, "step": 11963 }, { "epoch": 0.82, "learning_rate": 1.7363098748960605e-06, "loss": 0.793, "step": 11964 }, { "epoch": 0.82, "learning_rate": 1.7350671043228072e-06, "loss": 0.7773, "step": 11965 }, { "epoch": 0.82, "learning_rate": 1.7338247364166828e-06, "loss": 0.6865, "step": 11966 }, { "epoch": 0.82, "learning_rate": 1.732582771238216e-06, "loss": 0.708, "step": 11967 }, { "epoch": 0.82, "learning_rate": 1.731341208847911e-06, "loss": 0.7637, "step": 11968 }, { "epoch": 0.82, "learning_rate": 1.7301000493062592e-06, "loss": 0.7148, "step": 11969 }, { "epoch": 0.82, "learning_rate": 1.7288592926737292e-06, "loss": 0.7637, "step": 11970 }, { "epoch": 0.82, "learning_rate": 1.727618939010771e-06, "loss": 0.7363, "step": 11971 }, { "epoch": 0.82, "learning_rate": 1.726378988377816e-06, "loss": 0.6357, "step": 11972 }, { "epoch": 0.82, "learning_rate": 1.7251394408352718e-06, "loss": 0.7402, "step": 11973 }, { "epoch": 0.82, "learning_rate": 1.7239002964435337e-06, "loss": 0.8057, "step": 11974 }, { "epoch": 0.82, "learning_rate": 1.7226615552629667e-06, "loss": 0.6943, "step": 11975 }, { "epoch": 0.82, "learning_rate": 1.7214232173539236e-06, "loss": 0.7695, "step": 11976 }, { "epoch": 0.82, "learning_rate": 1.7201852827767417e-06, "loss": 0.7832, "step": 11977 }, { "epoch": 0.82, "learning_rate": 1.7189477515917263e-06, "loss": 0.7852, "step": 11978 }, { "epoch": 0.82, "learning_rate": 1.7177106238591724e-06, "loss": 0.7686, "step": 11979 }, { "epoch": 0.82, "learning_rate": 1.716473899639356e-06, "loss": 0.8018, "step": 11980 }, { "epoch": 0.82, "learning_rate": 1.7152375789925257e-06, "loss": 0.7324, "step": 11981 }, { "epoch": 0.82, "learning_rate": 1.7140016619789124e-06, "loss": 0.7051, "step": 11982 }, { "epoch": 0.82, "learning_rate": 1.71276614865874e-06, "loss": 0.6553, "step": 11983 }, { "epoch": 0.82, "learning_rate": 1.7115310390921935e-06, "loss": 0.7793, "step": 11984 }, { "epoch": 0.82, "learning_rate": 1.7102963333394517e-06, "loss": 0.7422, "step": 11985 }, { "epoch": 0.82, "learning_rate": 1.7090620314606676e-06, "loss": 0.7188, "step": 11986 }, { "epoch": 0.82, "learning_rate": 1.7078281335159797e-06, "loss": 0.7207, "step": 11987 }, { "epoch": 0.82, "learning_rate": 1.7065946395654953e-06, "loss": 0.7803, "step": 11988 }, { "epoch": 0.82, "learning_rate": 1.7053615496693188e-06, "loss": 0.7939, "step": 11989 }, { "epoch": 0.82, "learning_rate": 1.7041288638875253e-06, "loss": 0.7168, "step": 11990 }, { "epoch": 0.82, "learning_rate": 1.7028965822801658e-06, "loss": 0.7373, "step": 11991 }, { "epoch": 0.82, "learning_rate": 1.701664704907281e-06, "loss": 0.6826, "step": 11992 }, { "epoch": 0.82, "learning_rate": 1.7004332318288863e-06, "loss": 0.6641, "step": 11993 }, { "epoch": 0.82, "learning_rate": 1.6992021631049805e-06, "loss": 0.7227, "step": 11994 }, { "epoch": 0.82, "learning_rate": 1.697971498795541e-06, "loss": 0.7588, "step": 11995 }, { "epoch": 0.82, "learning_rate": 1.6967412389605242e-06, "loss": 0.8193, "step": 11996 }, { "epoch": 0.82, "learning_rate": 1.6955113836598723e-06, "loss": 0.6523, "step": 11997 }, { "epoch": 0.82, "learning_rate": 1.6942819329534977e-06, "loss": 0.7607, "step": 11998 }, { "epoch": 0.82, "learning_rate": 1.693052886901303e-06, "loss": 0.7441, "step": 11999 }, { "epoch": 0.82, "learning_rate": 1.6918242455631662e-06, "loss": 0.7529, "step": 12000 }, { "epoch": 0.82, "learning_rate": 1.6905960089989482e-06, "loss": 0.7266, "step": 12001 }, { "epoch": 0.82, "learning_rate": 1.6893681772684855e-06, "loss": 0.7412, "step": 12002 }, { "epoch": 0.82, "learning_rate": 1.688140750431604e-06, "loss": 0.7783, "step": 12003 }, { "epoch": 0.82, "learning_rate": 1.6869137285480963e-06, "loss": 0.6816, "step": 12004 }, { "epoch": 0.82, "learning_rate": 1.6856871116777462e-06, "loss": 0.7871, "step": 12005 }, { "epoch": 0.82, "learning_rate": 1.684460899880316e-06, "loss": 0.8076, "step": 12006 }, { "epoch": 0.82, "learning_rate": 1.6832350932155438e-06, "loss": 0.7275, "step": 12007 }, { "epoch": 0.82, "learning_rate": 1.6820096917431527e-06, "loss": 0.8281, "step": 12008 }, { "epoch": 0.82, "learning_rate": 1.6807846955228435e-06, "loss": 0.6826, "step": 12009 }, { "epoch": 0.82, "learning_rate": 1.6795601046143006e-06, "loss": 0.7939, "step": 12010 }, { "epoch": 0.82, "learning_rate": 1.678335919077182e-06, "loss": 0.7402, "step": 12011 }, { "epoch": 0.82, "learning_rate": 1.6771121389711288e-06, "loss": 0.7412, "step": 12012 }, { "epoch": 0.82, "learning_rate": 1.6758887643557708e-06, "loss": 0.752, "step": 12013 }, { "epoch": 0.82, "learning_rate": 1.6746657952907042e-06, "loss": 0.7676, "step": 12014 }, { "epoch": 0.82, "learning_rate": 1.6734432318355143e-06, "loss": 0.7334, "step": 12015 }, { "epoch": 0.82, "learning_rate": 1.6722210740497658e-06, "loss": 0.7275, "step": 12016 }, { "epoch": 0.82, "learning_rate": 1.6709993219929987e-06, "loss": 0.709, "step": 12017 }, { "epoch": 0.82, "learning_rate": 1.6697779757247357e-06, "loss": 0.751, "step": 12018 }, { "epoch": 0.82, "learning_rate": 1.668557035304489e-06, "loss": 0.7188, "step": 12019 }, { "epoch": 0.82, "learning_rate": 1.6673365007917341e-06, "loss": 0.7451, "step": 12020 }, { "epoch": 0.82, "learning_rate": 1.6661163722459385e-06, "loss": 0.8193, "step": 12021 }, { "epoch": 0.82, "learning_rate": 1.6648966497265473e-06, "loss": 0.7803, "step": 12022 }, { "epoch": 0.82, "learning_rate": 1.6636773332929867e-06, "loss": 0.7578, "step": 12023 }, { "epoch": 0.82, "learning_rate": 1.6624584230046547e-06, "loss": 0.8047, "step": 12024 }, { "epoch": 0.82, "learning_rate": 1.6612399189209449e-06, "loss": 0.7812, "step": 12025 }, { "epoch": 0.82, "learning_rate": 1.660021821101222e-06, "loss": 0.791, "step": 12026 }, { "epoch": 0.82, "learning_rate": 1.6588041296048264e-06, "loss": 0.7793, "step": 12027 }, { "epoch": 0.82, "learning_rate": 1.657586844491088e-06, "loss": 0.7666, "step": 12028 }, { "epoch": 0.82, "learning_rate": 1.65636996581931e-06, "loss": 0.8398, "step": 12029 }, { "epoch": 0.82, "learning_rate": 1.6551534936487813e-06, "loss": 0.833, "step": 12030 }, { "epoch": 0.82, "learning_rate": 1.6539374280387676e-06, "loss": 0.6602, "step": 12031 }, { "epoch": 0.82, "learning_rate": 1.6527217690485152e-06, "loss": 0.7461, "step": 12032 }, { "epoch": 0.82, "learning_rate": 1.6515065167372536e-06, "loss": 0.7207, "step": 12033 }, { "epoch": 0.82, "learning_rate": 1.6502916711641847e-06, "loss": 0.7021, "step": 12034 }, { "epoch": 0.82, "learning_rate": 1.6490772323884984e-06, "loss": 0.7695, "step": 12035 }, { "epoch": 0.82, "learning_rate": 1.6478632004693628e-06, "loss": 0.75, "step": 12036 }, { "epoch": 0.82, "learning_rate": 1.646649575465924e-06, "loss": 0.7051, "step": 12037 }, { "epoch": 0.82, "learning_rate": 1.645436357437311e-06, "loss": 0.7197, "step": 12038 }, { "epoch": 0.82, "learning_rate": 1.6442235464426337e-06, "loss": 0.748, "step": 12039 }, { "epoch": 0.82, "learning_rate": 1.6430111425409745e-06, "loss": 0.7314, "step": 12040 }, { "epoch": 0.82, "learning_rate": 1.6417991457914052e-06, "loss": 0.751, "step": 12041 }, { "epoch": 0.82, "learning_rate": 1.640587556252975e-06, "loss": 0.7559, "step": 12042 }, { "epoch": 0.82, "learning_rate": 1.6393763739847102e-06, "loss": 0.79, "step": 12043 }, { "epoch": 0.82, "learning_rate": 1.6381655990456213e-06, "loss": 0.8096, "step": 12044 }, { "epoch": 0.82, "learning_rate": 1.6369552314946957e-06, "loss": 0.7188, "step": 12045 }, { "epoch": 0.82, "learning_rate": 1.6357452713909073e-06, "loss": 0.7598, "step": 12046 }, { "epoch": 0.82, "learning_rate": 1.6345357187931955e-06, "loss": 0.7578, "step": 12047 }, { "epoch": 0.82, "learning_rate": 1.6333265737604976e-06, "loss": 0.7754, "step": 12048 }, { "epoch": 0.82, "learning_rate": 1.6321178363517242e-06, "loss": 0.6235, "step": 12049 }, { "epoch": 0.82, "learning_rate": 1.6309095066257597e-06, "loss": 0.7148, "step": 12050 }, { "epoch": 0.82, "learning_rate": 1.6297015846414755e-06, "loss": 0.7168, "step": 12051 }, { "epoch": 0.82, "learning_rate": 1.6284940704577235e-06, "loss": 0.7539, "step": 12052 }, { "epoch": 0.82, "learning_rate": 1.6272869641333279e-06, "loss": 0.7588, "step": 12053 }, { "epoch": 0.82, "learning_rate": 1.6260802657271056e-06, "loss": 0.7646, "step": 12054 }, { "epoch": 0.82, "learning_rate": 1.624873975297847e-06, "loss": 0.79, "step": 12055 }, { "epoch": 0.82, "learning_rate": 1.623668092904318e-06, "loss": 0.71, "step": 12056 }, { "epoch": 0.82, "learning_rate": 1.6224626186052695e-06, "loss": 0.7969, "step": 12057 }, { "epoch": 0.82, "learning_rate": 1.6212575524594343e-06, "loss": 0.6533, "step": 12058 }, { "epoch": 0.82, "learning_rate": 1.6200528945255233e-06, "loss": 0.7451, "step": 12059 }, { "epoch": 0.82, "learning_rate": 1.6188486448622265e-06, "loss": 0.7314, "step": 12060 }, { "epoch": 0.82, "learning_rate": 1.6176448035282144e-06, "loss": 0.7207, "step": 12061 }, { "epoch": 0.82, "learning_rate": 1.6164413705821414e-06, "loss": 0.7666, "step": 12062 }, { "epoch": 0.82, "learning_rate": 1.6152383460826327e-06, "loss": 0.7705, "step": 12063 }, { "epoch": 0.82, "learning_rate": 1.6140357300883035e-06, "loss": 0.7607, "step": 12064 }, { "epoch": 0.82, "learning_rate": 1.6128335226577451e-06, "loss": 0.7705, "step": 12065 }, { "epoch": 0.82, "learning_rate": 1.6116317238495282e-06, "loss": 0.7295, "step": 12066 }, { "epoch": 0.82, "learning_rate": 1.6104303337222039e-06, "loss": 0.7676, "step": 12067 }, { "epoch": 0.82, "learning_rate": 1.6092293523343084e-06, "loss": 0.7734, "step": 12068 }, { "epoch": 0.82, "learning_rate": 1.608028779744346e-06, "loss": 0.7949, "step": 12069 }, { "epoch": 0.82, "learning_rate": 1.6068286160108126e-06, "loss": 0.8271, "step": 12070 }, { "epoch": 0.82, "learning_rate": 1.60562886119218e-06, "loss": 0.7734, "step": 12071 }, { "epoch": 0.82, "learning_rate": 1.6044295153468992e-06, "loss": 0.7578, "step": 12072 }, { "epoch": 0.82, "learning_rate": 1.6032305785334035e-06, "loss": 0.7812, "step": 12073 }, { "epoch": 0.82, "learning_rate": 1.6020320508101051e-06, "loss": 0.7344, "step": 12074 }, { "epoch": 0.82, "learning_rate": 1.6008339322353973e-06, "loss": 0.7246, "step": 12075 }, { "epoch": 0.82, "learning_rate": 1.5996362228676487e-06, "loss": 0.7246, "step": 12076 }, { "epoch": 0.82, "learning_rate": 1.5984389227652108e-06, "loss": 0.8438, "step": 12077 }, { "epoch": 0.82, "learning_rate": 1.5972420319864245e-06, "loss": 0.7559, "step": 12078 }, { "epoch": 0.82, "learning_rate": 1.5960455505895933e-06, "loss": 0.833, "step": 12079 }, { "epoch": 0.82, "learning_rate": 1.5948494786330139e-06, "loss": 0.7891, "step": 12080 }, { "epoch": 0.82, "learning_rate": 1.593653816174957e-06, "loss": 0.7451, "step": 12081 }, { "epoch": 0.82, "learning_rate": 1.5924585632736788e-06, "loss": 0.7148, "step": 12082 }, { "epoch": 0.82, "learning_rate": 1.5912637199874048e-06, "loss": 0.7705, "step": 12083 }, { "epoch": 0.82, "learning_rate": 1.5900692863743549e-06, "loss": 0.7383, "step": 12084 }, { "epoch": 0.82, "learning_rate": 1.5888752624927218e-06, "loss": 0.7051, "step": 12085 }, { "epoch": 0.82, "learning_rate": 1.587681648400673e-06, "loss": 0.7646, "step": 12086 }, { "epoch": 0.82, "learning_rate": 1.5864884441563644e-06, "loss": 0.7715, "step": 12087 }, { "epoch": 0.82, "learning_rate": 1.5852956498179307e-06, "loss": 0.7832, "step": 12088 }, { "epoch": 0.82, "learning_rate": 1.5841032654434773e-06, "loss": 0.7422, "step": 12089 }, { "epoch": 0.82, "learning_rate": 1.582911291091106e-06, "loss": 0.75, "step": 12090 }, { "epoch": 0.82, "learning_rate": 1.5817197268188878e-06, "loss": 0.7412, "step": 12091 }, { "epoch": 0.82, "learning_rate": 1.5805285726848706e-06, "loss": 0.793, "step": 12092 }, { "epoch": 0.82, "learning_rate": 1.5793378287470918e-06, "loss": 0.666, "step": 12093 }, { "epoch": 0.82, "learning_rate": 1.5781474950635633e-06, "loss": 0.6758, "step": 12094 }, { "epoch": 0.82, "learning_rate": 1.576957571692278e-06, "loss": 0.7588, "step": 12095 }, { "epoch": 0.82, "learning_rate": 1.5757680586912094e-06, "loss": 0.7793, "step": 12096 }, { "epoch": 0.82, "learning_rate": 1.57457895611831e-06, "loss": 0.7773, "step": 12097 }, { "epoch": 0.82, "learning_rate": 1.5733902640315146e-06, "loss": 0.7412, "step": 12098 }, { "epoch": 0.82, "learning_rate": 1.5722019824887335e-06, "loss": 0.7041, "step": 12099 }, { "epoch": 0.82, "learning_rate": 1.5710141115478593e-06, "loss": 0.7764, "step": 12100 }, { "epoch": 0.82, "learning_rate": 1.5698266512667682e-06, "loss": 0.7578, "step": 12101 }, { "epoch": 0.82, "learning_rate": 1.5686396017033102e-06, "loss": 0.7949, "step": 12102 }, { "epoch": 0.82, "learning_rate": 1.5674529629153202e-06, "loss": 0.75, "step": 12103 }, { "epoch": 0.82, "learning_rate": 1.566266734960613e-06, "loss": 0.8066, "step": 12104 }, { "epoch": 0.82, "learning_rate": 1.5650809178969772e-06, "loss": 0.751, "step": 12105 }, { "epoch": 0.82, "learning_rate": 1.5638955117821874e-06, "loss": 0.7227, "step": 12106 }, { "epoch": 0.83, "learning_rate": 1.5627105166739965e-06, "loss": 0.7627, "step": 12107 }, { "epoch": 0.83, "learning_rate": 1.561525932630138e-06, "loss": 0.7891, "step": 12108 }, { "epoch": 0.83, "learning_rate": 1.5603417597083248e-06, "loss": 0.8135, "step": 12109 }, { "epoch": 0.83, "learning_rate": 1.5591579979662497e-06, "loss": 0.7178, "step": 12110 }, { "epoch": 0.83, "learning_rate": 1.5579746474615864e-06, "loss": 0.7461, "step": 12111 }, { "epoch": 0.83, "learning_rate": 1.5567917082519856e-06, "loss": 0.7402, "step": 12112 }, { "epoch": 0.83, "learning_rate": 1.555609180395078e-06, "loss": 0.7139, "step": 12113 }, { "epoch": 0.83, "learning_rate": 1.5544270639484837e-06, "loss": 0.7275, "step": 12114 }, { "epoch": 0.83, "learning_rate": 1.5532453589697894e-06, "loss": 0.7852, "step": 12115 }, { "epoch": 0.83, "learning_rate": 1.5520640655165687e-06, "loss": 0.7148, "step": 12116 }, { "epoch": 0.83, "learning_rate": 1.5508831836463756e-06, "loss": 0.7529, "step": 12117 }, { "epoch": 0.83, "learning_rate": 1.5497027134167431e-06, "loss": 0.7725, "step": 12118 }, { "epoch": 0.83, "learning_rate": 1.5485226548851783e-06, "loss": 0.8379, "step": 12119 }, { "epoch": 0.83, "learning_rate": 1.5473430081091823e-06, "loss": 0.8184, "step": 12120 }, { "epoch": 0.83, "learning_rate": 1.5461637731462198e-06, "loss": 0.6963, "step": 12121 }, { "epoch": 0.83, "learning_rate": 1.5449849500537462e-06, "loss": 0.8164, "step": 12122 }, { "epoch": 0.83, "learning_rate": 1.5438065388891944e-06, "loss": 0.748, "step": 12123 }, { "epoch": 0.83, "learning_rate": 1.5426285397099772e-06, "loss": 0.7158, "step": 12124 }, { "epoch": 0.83, "learning_rate": 1.54145095257348e-06, "loss": 0.6582, "step": 12125 }, { "epoch": 0.83, "learning_rate": 1.5402737775370834e-06, "loss": 0.7588, "step": 12126 }, { "epoch": 0.83, "learning_rate": 1.5390970146581374e-06, "loss": 0.7461, "step": 12127 }, { "epoch": 0.83, "learning_rate": 1.5379206639939693e-06, "loss": 0.7109, "step": 12128 }, { "epoch": 0.83, "learning_rate": 1.5367447256018952e-06, "loss": 0.7188, "step": 12129 }, { "epoch": 0.83, "learning_rate": 1.5355691995392042e-06, "loss": 0.7148, "step": 12130 }, { "epoch": 0.83, "learning_rate": 1.534394085863169e-06, "loss": 0.7158, "step": 12131 }, { "epoch": 0.83, "learning_rate": 1.5332193846310417e-06, "loss": 0.7334, "step": 12132 }, { "epoch": 0.83, "learning_rate": 1.5320450959000533e-06, "loss": 0.7637, "step": 12133 }, { "epoch": 0.83, "learning_rate": 1.5308712197274168e-06, "loss": 0.7891, "step": 12134 }, { "epoch": 0.83, "learning_rate": 1.5296977561703185e-06, "loss": 0.7598, "step": 12135 }, { "epoch": 0.83, "learning_rate": 1.5285247052859331e-06, "loss": 0.7021, "step": 12136 }, { "epoch": 0.83, "learning_rate": 1.5273520671314113e-06, "loss": 0.7998, "step": 12137 }, { "epoch": 0.83, "learning_rate": 1.5261798417638828e-06, "loss": 0.7705, "step": 12138 }, { "epoch": 0.83, "learning_rate": 1.5250080292404602e-06, "loss": 0.7148, "step": 12139 }, { "epoch": 0.83, "learning_rate": 1.523836629618235e-06, "loss": 0.6875, "step": 12140 }, { "epoch": 0.83, "learning_rate": 1.522665642954273e-06, "loss": 0.8018, "step": 12141 }, { "epoch": 0.83, "learning_rate": 1.5214950693056285e-06, "loss": 0.709, "step": 12142 }, { "epoch": 0.83, "learning_rate": 1.5203249087293293e-06, "loss": 0.7236, "step": 12143 }, { "epoch": 0.83, "learning_rate": 1.5191551612823886e-06, "loss": 0.7051, "step": 12144 }, { "epoch": 0.83, "learning_rate": 1.517985827021794e-06, "loss": 0.7617, "step": 12145 }, { "epoch": 0.83, "learning_rate": 1.5168169060045157e-06, "loss": 0.7363, "step": 12146 }, { "epoch": 0.83, "learning_rate": 1.515648398287507e-06, "loss": 0.6846, "step": 12147 }, { "epoch": 0.83, "learning_rate": 1.5144803039276924e-06, "loss": 0.7852, "step": 12148 }, { "epoch": 0.83, "learning_rate": 1.5133126229819816e-06, "loss": 0.7256, "step": 12149 }, { "epoch": 0.83, "learning_rate": 1.5121453555072696e-06, "loss": 0.7119, "step": 12150 }, { "epoch": 0.83, "learning_rate": 1.5109785015604206e-06, "loss": 0.7354, "step": 12151 }, { "epoch": 0.83, "learning_rate": 1.5098120611982846e-06, "loss": 0.7393, "step": 12152 }, { "epoch": 0.83, "learning_rate": 1.508646034477691e-06, "loss": 0.7617, "step": 12153 }, { "epoch": 0.83, "learning_rate": 1.5074804214554507e-06, "loss": 0.7598, "step": 12154 }, { "epoch": 0.83, "learning_rate": 1.5063152221883448e-06, "loss": 0.8154, "step": 12155 }, { "epoch": 0.83, "learning_rate": 1.5051504367331525e-06, "loss": 0.7207, "step": 12156 }, { "epoch": 0.83, "learning_rate": 1.5039860651466143e-06, "loss": 0.7568, "step": 12157 }, { "epoch": 0.83, "learning_rate": 1.502822107485461e-06, "loss": 0.7422, "step": 12158 }, { "epoch": 0.83, "learning_rate": 1.5016585638063996e-06, "loss": 0.7168, "step": 12159 }, { "epoch": 0.83, "learning_rate": 1.5004954341661216e-06, "loss": 0.6973, "step": 12160 }, { "epoch": 0.83, "learning_rate": 1.4993327186212858e-06, "loss": 0.8164, "step": 12161 }, { "epoch": 0.83, "learning_rate": 1.4981704172285482e-06, "loss": 0.7363, "step": 12162 }, { "epoch": 0.83, "learning_rate": 1.4970085300445358e-06, "loss": 0.7871, "step": 12163 }, { "epoch": 0.83, "learning_rate": 1.495847057125851e-06, "loss": 0.7617, "step": 12164 }, { "epoch": 0.83, "learning_rate": 1.494685998529083e-06, "loss": 0.8867, "step": 12165 }, { "epoch": 0.83, "learning_rate": 1.4935253543107974e-06, "loss": 0.7139, "step": 12166 }, { "epoch": 0.83, "learning_rate": 1.4923651245275427e-06, "loss": 0.7422, "step": 12167 }, { "epoch": 0.83, "learning_rate": 1.4912053092358435e-06, "loss": 0.748, "step": 12168 }, { "epoch": 0.83, "learning_rate": 1.490045908492207e-06, "loss": 0.7725, "step": 12169 }, { "epoch": 0.83, "learning_rate": 1.4888869223531222e-06, "loss": 0.7383, "step": 12170 }, { "epoch": 0.83, "learning_rate": 1.4877283508750474e-06, "loss": 0.7881, "step": 12171 }, { "epoch": 0.83, "learning_rate": 1.4865701941144305e-06, "loss": 0.7891, "step": 12172 }, { "epoch": 0.83, "learning_rate": 1.4854124521277036e-06, "loss": 0.7725, "step": 12173 }, { "epoch": 0.83, "learning_rate": 1.4842551249712645e-06, "loss": 0.8232, "step": 12174 }, { "epoch": 0.83, "learning_rate": 1.4830982127015003e-06, "loss": 0.7168, "step": 12175 }, { "epoch": 0.83, "learning_rate": 1.4819417153747784e-06, "loss": 0.7383, "step": 12176 }, { "epoch": 0.83, "learning_rate": 1.480785633047438e-06, "loss": 0.8164, "step": 12177 }, { "epoch": 0.83, "learning_rate": 1.479629965775804e-06, "loss": 0.8145, "step": 12178 }, { "epoch": 0.83, "learning_rate": 1.478474713616187e-06, "loss": 0.7461, "step": 12179 }, { "epoch": 0.83, "learning_rate": 1.4773198766248642e-06, "loss": 0.7236, "step": 12180 }, { "epoch": 0.83, "learning_rate": 1.4761654548581007e-06, "loss": 0.7256, "step": 12181 }, { "epoch": 0.83, "learning_rate": 1.4750114483721413e-06, "loss": 0.8174, "step": 12182 }, { "epoch": 0.83, "learning_rate": 1.4738578572232109e-06, "loss": 0.8193, "step": 12183 }, { "epoch": 0.83, "learning_rate": 1.472704681467505e-06, "loss": 0.8057, "step": 12184 }, { "epoch": 0.83, "learning_rate": 1.4715519211612128e-06, "loss": 0.7979, "step": 12185 }, { "epoch": 0.83, "learning_rate": 1.4703995763604984e-06, "loss": 0.8301, "step": 12186 }, { "epoch": 0.83, "learning_rate": 1.4692476471214978e-06, "loss": 0.7588, "step": 12187 }, { "epoch": 0.83, "learning_rate": 1.4680961335003362e-06, "loss": 0.8193, "step": 12188 }, { "epoch": 0.83, "learning_rate": 1.4669450355531179e-06, "loss": 0.7588, "step": 12189 }, { "epoch": 0.83, "learning_rate": 1.4657943533359154e-06, "loss": 0.7725, "step": 12190 }, { "epoch": 0.83, "learning_rate": 1.4646440869047984e-06, "loss": 0.7725, "step": 12191 }, { "epoch": 0.83, "learning_rate": 1.4634942363158079e-06, "loss": 0.7715, "step": 12192 }, { "epoch": 0.83, "learning_rate": 1.4623448016249597e-06, "loss": 0.7373, "step": 12193 }, { "epoch": 0.83, "learning_rate": 1.4611957828882562e-06, "loss": 0.7236, "step": 12194 }, { "epoch": 0.83, "learning_rate": 1.4600471801616779e-06, "loss": 0.7031, "step": 12195 }, { "epoch": 0.83, "learning_rate": 1.4588989935011843e-06, "loss": 0.8398, "step": 12196 }, { "epoch": 0.83, "learning_rate": 1.4577512229627145e-06, "loss": 0.7461, "step": 12197 }, { "epoch": 0.83, "learning_rate": 1.45660386860219e-06, "loss": 0.7686, "step": 12198 }, { "epoch": 0.83, "learning_rate": 1.4554569304755096e-06, "loss": 0.6973, "step": 12199 }, { "epoch": 0.83, "learning_rate": 1.4543104086385496e-06, "loss": 0.6699, "step": 12200 }, { "epoch": 0.83, "learning_rate": 1.4531643031471687e-06, "loss": 0.7383, "step": 12201 }, { "epoch": 0.83, "learning_rate": 1.4520186140572067e-06, "loss": 0.6875, "step": 12202 }, { "epoch": 0.83, "learning_rate": 1.4508733414244803e-06, "loss": 0.6875, "step": 12203 }, { "epoch": 0.83, "learning_rate": 1.4497284853047889e-06, "loss": 0.7891, "step": 12204 }, { "epoch": 0.83, "learning_rate": 1.448584045753908e-06, "loss": 0.708, "step": 12205 }, { "epoch": 0.83, "learning_rate": 1.4474400228275976e-06, "loss": 0.6914, "step": 12206 }, { "epoch": 0.83, "learning_rate": 1.4462964165815908e-06, "loss": 0.7148, "step": 12207 }, { "epoch": 0.83, "learning_rate": 1.445153227071604e-06, "loss": 0.7227, "step": 12208 }, { "epoch": 0.83, "learning_rate": 1.4440104543533363e-06, "loss": 0.7295, "step": 12209 }, { "epoch": 0.83, "learning_rate": 1.4428680984824605e-06, "loss": 0.7559, "step": 12210 }, { "epoch": 0.83, "learning_rate": 1.4417261595146348e-06, "loss": 0.7812, "step": 12211 }, { "epoch": 0.83, "learning_rate": 1.4405846375054956e-06, "loss": 0.7656, "step": 12212 }, { "epoch": 0.83, "learning_rate": 1.4394435325106525e-06, "loss": 0.6885, "step": 12213 }, { "epoch": 0.83, "learning_rate": 1.4383028445857006e-06, "loss": 0.7393, "step": 12214 }, { "epoch": 0.83, "learning_rate": 1.4371625737862215e-06, "loss": 0.7529, "step": 12215 }, { "epoch": 0.83, "learning_rate": 1.4360227201677624e-06, "loss": 0.7881, "step": 12216 }, { "epoch": 0.83, "learning_rate": 1.4348832837858573e-06, "loss": 0.8262, "step": 12217 }, { "epoch": 0.83, "learning_rate": 1.433744264696022e-06, "loss": 0.749, "step": 12218 }, { "epoch": 0.83, "learning_rate": 1.4326056629537511e-06, "loss": 0.8066, "step": 12219 }, { "epoch": 0.83, "learning_rate": 1.4314674786145088e-06, "loss": 0.7246, "step": 12220 }, { "epoch": 0.83, "learning_rate": 1.4303297117337567e-06, "loss": 0.8389, "step": 12221 }, { "epoch": 0.83, "learning_rate": 1.4291923623669246e-06, "loss": 0.6895, "step": 12222 }, { "epoch": 0.83, "learning_rate": 1.4280554305694205e-06, "loss": 0.7588, "step": 12223 }, { "epoch": 0.83, "learning_rate": 1.4269189163966378e-06, "loss": 0.7881, "step": 12224 }, { "epoch": 0.83, "learning_rate": 1.4257828199039491e-06, "loss": 0.8125, "step": 12225 }, { "epoch": 0.83, "learning_rate": 1.4246471411466988e-06, "loss": 0.666, "step": 12226 }, { "epoch": 0.83, "learning_rate": 1.423511880180225e-06, "loss": 0.7598, "step": 12227 }, { "epoch": 0.83, "learning_rate": 1.4223770370598356e-06, "loss": 0.8076, "step": 12228 }, { "epoch": 0.83, "learning_rate": 1.4212426118408163e-06, "loss": 0.7393, "step": 12229 }, { "epoch": 0.83, "learning_rate": 1.4201086045784395e-06, "loss": 0.7998, "step": 12230 }, { "epoch": 0.83, "learning_rate": 1.4189750153279525e-06, "loss": 0.7686, "step": 12231 }, { "epoch": 0.83, "learning_rate": 1.417841844144584e-06, "loss": 0.7529, "step": 12232 }, { "epoch": 0.83, "learning_rate": 1.4167090910835424e-06, "loss": 0.6738, "step": 12233 }, { "epoch": 0.83, "learning_rate": 1.4155767562000156e-06, "loss": 0.7188, "step": 12234 }, { "epoch": 0.83, "learning_rate": 1.4144448395491728e-06, "loss": 0.7734, "step": 12235 }, { "epoch": 0.83, "learning_rate": 1.4133133411861555e-06, "loss": 0.7646, "step": 12236 }, { "epoch": 0.83, "learning_rate": 1.412182261166095e-06, "loss": 0.7998, "step": 12237 }, { "epoch": 0.83, "learning_rate": 1.4110515995440954e-06, "loss": 0.6689, "step": 12238 }, { "epoch": 0.83, "learning_rate": 1.4099213563752424e-06, "loss": 0.7646, "step": 12239 }, { "epoch": 0.83, "learning_rate": 1.4087915317146028e-06, "loss": 0.7754, "step": 12240 }, { "epoch": 0.83, "learning_rate": 1.407662125617222e-06, "loss": 0.7568, "step": 12241 }, { "epoch": 0.83, "learning_rate": 1.406533138138122e-06, "loss": 0.7803, "step": 12242 }, { "epoch": 0.83, "learning_rate": 1.4054045693323083e-06, "loss": 0.707, "step": 12243 }, { "epoch": 0.83, "learning_rate": 1.4042764192547652e-06, "loss": 0.7578, "step": 12244 }, { "epoch": 0.83, "learning_rate": 1.403148687960455e-06, "loss": 0.7568, "step": 12245 }, { "epoch": 0.83, "learning_rate": 1.4020213755043222e-06, "loss": 0.708, "step": 12246 }, { "epoch": 0.83, "learning_rate": 1.4008944819412884e-06, "loss": 0.8105, "step": 12247 }, { "epoch": 0.83, "learning_rate": 1.3997680073262587e-06, "loss": 0.7139, "step": 12248 }, { "epoch": 0.83, "learning_rate": 1.3986419517141092e-06, "loss": 0.6875, "step": 12249 }, { "epoch": 0.83, "learning_rate": 1.3975163151597027e-06, "loss": 0.7373, "step": 12250 }, { "epoch": 0.83, "learning_rate": 1.3963910977178863e-06, "loss": 0.7002, "step": 12251 }, { "epoch": 0.83, "learning_rate": 1.395266299443474e-06, "loss": 0.7471, "step": 12252 }, { "epoch": 0.84, "learning_rate": 1.3941419203912675e-06, "loss": 0.7344, "step": 12253 }, { "epoch": 0.84, "learning_rate": 1.3930179606160477e-06, "loss": 0.7529, "step": 12254 }, { "epoch": 0.84, "learning_rate": 1.3918944201725748e-06, "loss": 0.667, "step": 12255 }, { "epoch": 0.84, "learning_rate": 1.3907712991155809e-06, "loss": 0.8105, "step": 12256 }, { "epoch": 0.84, "learning_rate": 1.389648597499793e-06, "loss": 0.7334, "step": 12257 }, { "epoch": 0.84, "learning_rate": 1.3885263153799068e-06, "loss": 0.6982, "step": 12258 }, { "epoch": 0.84, "learning_rate": 1.3874044528105969e-06, "loss": 0.7588, "step": 12259 }, { "epoch": 0.84, "learning_rate": 1.3862830098465208e-06, "loss": 0.7314, "step": 12260 }, { "epoch": 0.84, "learning_rate": 1.3851619865423205e-06, "loss": 0.7188, "step": 12261 }, { "epoch": 0.84, "learning_rate": 1.3840413829526022e-06, "loss": 0.7334, "step": 12262 }, { "epoch": 0.84, "learning_rate": 1.3829211991319701e-06, "loss": 0.6797, "step": 12263 }, { "epoch": 0.84, "learning_rate": 1.3818014351349995e-06, "loss": 0.7031, "step": 12264 }, { "epoch": 0.84, "learning_rate": 1.3806820910162399e-06, "loss": 0.6855, "step": 12265 }, { "epoch": 0.84, "learning_rate": 1.37956316683023e-06, "loss": 0.7832, "step": 12266 }, { "epoch": 0.84, "learning_rate": 1.3784446626314807e-06, "loss": 0.7021, "step": 12267 }, { "epoch": 0.84, "learning_rate": 1.377326578474487e-06, "loss": 0.7412, "step": 12268 }, { "epoch": 0.84, "learning_rate": 1.3762089144137224e-06, "loss": 0.709, "step": 12269 }, { "epoch": 0.84, "learning_rate": 1.3750916705036388e-06, "loss": 0.7314, "step": 12270 }, { "epoch": 0.84, "learning_rate": 1.3739748467986713e-06, "loss": 0.7051, "step": 12271 }, { "epoch": 0.84, "learning_rate": 1.3728584433532256e-06, "loss": 0.7676, "step": 12272 }, { "epoch": 0.84, "learning_rate": 1.3717424602216967e-06, "loss": 0.7539, "step": 12273 }, { "epoch": 0.84, "learning_rate": 1.3706268974584535e-06, "loss": 0.8379, "step": 12274 }, { "epoch": 0.84, "learning_rate": 1.3695117551178472e-06, "loss": 0.7207, "step": 12275 }, { "epoch": 0.84, "learning_rate": 1.3683970332542073e-06, "loss": 0.709, "step": 12276 }, { "epoch": 0.84, "learning_rate": 1.3672827319218452e-06, "loss": 0.7139, "step": 12277 }, { "epoch": 0.84, "learning_rate": 1.3661688511750448e-06, "loss": 0.7549, "step": 12278 }, { "epoch": 0.84, "learning_rate": 1.3650553910680774e-06, "loss": 0.7549, "step": 12279 }, { "epoch": 0.84, "learning_rate": 1.3639423516551908e-06, "loss": 0.7734, "step": 12280 }, { "epoch": 0.84, "learning_rate": 1.3628297329906103e-06, "loss": 0.6992, "step": 12281 }, { "epoch": 0.84, "learning_rate": 1.361717535128545e-06, "loss": 0.7227, "step": 12282 }, { "epoch": 0.84, "learning_rate": 1.3606057581231803e-06, "loss": 0.7373, "step": 12283 }, { "epoch": 0.84, "learning_rate": 1.3594944020286838e-06, "loss": 0.7334, "step": 12284 }, { "epoch": 0.84, "learning_rate": 1.3583834668991936e-06, "loss": 0.7803, "step": 12285 }, { "epoch": 0.84, "learning_rate": 1.3572729527888418e-06, "loss": 0.8018, "step": 12286 }, { "epoch": 0.84, "learning_rate": 1.356162859751733e-06, "loss": 0.7334, "step": 12287 }, { "epoch": 0.84, "learning_rate": 1.355053187841946e-06, "loss": 0.79, "step": 12288 }, { "epoch": 0.84, "learning_rate": 1.3539439371135455e-06, "loss": 0.7842, "step": 12289 }, { "epoch": 0.84, "learning_rate": 1.3528351076205748e-06, "loss": 0.6992, "step": 12290 }, { "epoch": 0.84, "learning_rate": 1.3517266994170565e-06, "loss": 0.7109, "step": 12291 }, { "epoch": 0.84, "learning_rate": 1.3506187125569914e-06, "loss": 0.6621, "step": 12292 }, { "epoch": 0.84, "learning_rate": 1.3495111470943612e-06, "loss": 0.7568, "step": 12293 }, { "epoch": 0.84, "learning_rate": 1.3484040030831281e-06, "loss": 0.7373, "step": 12294 }, { "epoch": 0.84, "learning_rate": 1.3472972805772278e-06, "loss": 0.7188, "step": 12295 }, { "epoch": 0.84, "learning_rate": 1.3461909796305816e-06, "loss": 0.7578, "step": 12296 }, { "epoch": 0.84, "learning_rate": 1.3450851002970888e-06, "loss": 0.8076, "step": 12297 }, { "epoch": 0.84, "learning_rate": 1.3439796426306283e-06, "loss": 0.7012, "step": 12298 }, { "epoch": 0.84, "learning_rate": 1.3428746066850573e-06, "loss": 0.7471, "step": 12299 }, { "epoch": 0.84, "learning_rate": 1.3417699925142157e-06, "loss": 0.7197, "step": 12300 }, { "epoch": 0.84, "learning_rate": 1.3406658001719152e-06, "loss": 0.7549, "step": 12301 }, { "epoch": 0.84, "learning_rate": 1.339562029711955e-06, "loss": 0.7598, "step": 12302 }, { "epoch": 0.84, "learning_rate": 1.3384586811881107e-06, "loss": 0.7275, "step": 12303 }, { "epoch": 0.84, "learning_rate": 1.3373557546541361e-06, "loss": 0.7637, "step": 12304 }, { "epoch": 0.84, "learning_rate": 1.336253250163767e-06, "loss": 0.7139, "step": 12305 }, { "epoch": 0.84, "learning_rate": 1.3351511677707173e-06, "loss": 0.71, "step": 12306 }, { "epoch": 0.84, "learning_rate": 1.334049507528683e-06, "loss": 0.6816, "step": 12307 }, { "epoch": 0.84, "learning_rate": 1.3329482694913308e-06, "loss": 0.7871, "step": 12308 }, { "epoch": 0.84, "learning_rate": 1.3318474537123138e-06, "loss": 0.8037, "step": 12309 }, { "epoch": 0.84, "learning_rate": 1.3307470602452722e-06, "loss": 0.7578, "step": 12310 }, { "epoch": 0.84, "learning_rate": 1.3296470891438073e-06, "loss": 0.7725, "step": 12311 }, { "epoch": 0.84, "learning_rate": 1.3285475404615145e-06, "loss": 0.8057, "step": 12312 }, { "epoch": 0.84, "learning_rate": 1.327448414251964e-06, "loss": 0.7754, "step": 12313 }, { "epoch": 0.84, "learning_rate": 1.3263497105687018e-06, "loss": 0.7012, "step": 12314 }, { "epoch": 0.84, "learning_rate": 1.3252514294652563e-06, "loss": 0.7617, "step": 12315 }, { "epoch": 0.84, "learning_rate": 1.3241535709951425e-06, "loss": 0.751, "step": 12316 }, { "epoch": 0.84, "learning_rate": 1.323056135211842e-06, "loss": 0.792, "step": 12317 }, { "epoch": 0.84, "learning_rate": 1.3219591221688234e-06, "loss": 0.7578, "step": 12318 }, { "epoch": 0.84, "learning_rate": 1.3208625319195333e-06, "loss": 0.7207, "step": 12319 }, { "epoch": 0.84, "learning_rate": 1.3197663645173987e-06, "loss": 0.7412, "step": 12320 }, { "epoch": 0.84, "learning_rate": 1.3186706200158195e-06, "loss": 0.7598, "step": 12321 }, { "epoch": 0.84, "learning_rate": 1.3175752984681878e-06, "loss": 0.7412, "step": 12322 }, { "epoch": 0.84, "learning_rate": 1.3164803999278653e-06, "loss": 0.7666, "step": 12323 }, { "epoch": 0.84, "learning_rate": 1.3153859244481915e-06, "loss": 0.6807, "step": 12324 }, { "epoch": 0.84, "learning_rate": 1.3142918720824926e-06, "loss": 0.7598, "step": 12325 }, { "epoch": 0.84, "learning_rate": 1.3131982428840694e-06, "loss": 0.7725, "step": 12326 }, { "epoch": 0.84, "learning_rate": 1.312105036906205e-06, "loss": 0.752, "step": 12327 }, { "epoch": 0.84, "learning_rate": 1.3110122542021597e-06, "loss": 0.7881, "step": 12328 }, { "epoch": 0.84, "learning_rate": 1.3099198948251756e-06, "loss": 0.7119, "step": 12329 }, { "epoch": 0.84, "learning_rate": 1.308827958828468e-06, "loss": 0.7734, "step": 12330 }, { "epoch": 0.84, "learning_rate": 1.3077364462652376e-06, "loss": 0.7402, "step": 12331 }, { "epoch": 0.84, "learning_rate": 1.306645357188665e-06, "loss": 0.7559, "step": 12332 }, { "epoch": 0.84, "learning_rate": 1.3055546916519057e-06, "loss": 0.7363, "step": 12333 }, { "epoch": 0.84, "learning_rate": 1.3044644497080982e-06, "loss": 0.7812, "step": 12334 }, { "epoch": 0.84, "learning_rate": 1.303374631410359e-06, "loss": 0.8066, "step": 12335 }, { "epoch": 0.84, "learning_rate": 1.3022852368117856e-06, "loss": 0.7607, "step": 12336 }, { "epoch": 0.84, "learning_rate": 1.3011962659654499e-06, "loss": 0.748, "step": 12337 }, { "epoch": 0.84, "learning_rate": 1.3001077189244072e-06, "loss": 0.6953, "step": 12338 }, { "epoch": 0.84, "learning_rate": 1.2990195957416917e-06, "loss": 0.8018, "step": 12339 }, { "epoch": 0.84, "learning_rate": 1.297931896470317e-06, "loss": 0.7891, "step": 12340 }, { "epoch": 0.84, "learning_rate": 1.2968446211632768e-06, "loss": 0.7617, "step": 12341 }, { "epoch": 0.84, "learning_rate": 1.2957577698735425e-06, "loss": 0.7324, "step": 12342 }, { "epoch": 0.84, "learning_rate": 1.2946713426540658e-06, "loss": 0.7539, "step": 12343 }, { "epoch": 0.84, "learning_rate": 1.2935853395577757e-06, "loss": 0.793, "step": 12344 }, { "epoch": 0.84, "learning_rate": 1.292499760637581e-06, "loss": 0.7471, "step": 12345 }, { "epoch": 0.84, "learning_rate": 1.2914146059463784e-06, "loss": 0.6807, "step": 12346 }, { "epoch": 0.84, "learning_rate": 1.2903298755370286e-06, "loss": 0.7002, "step": 12347 }, { "epoch": 0.84, "learning_rate": 1.2892455694623818e-06, "loss": 0.792, "step": 12348 }, { "epoch": 0.84, "learning_rate": 1.288161687775269e-06, "loss": 0.7334, "step": 12349 }, { "epoch": 0.84, "learning_rate": 1.2870782305284924e-06, "loss": 0.7988, "step": 12350 }, { "epoch": 0.84, "learning_rate": 1.2859951977748364e-06, "loss": 0.7754, "step": 12351 }, { "epoch": 0.84, "learning_rate": 1.2849125895670733e-06, "loss": 0.6768, "step": 12352 }, { "epoch": 0.84, "learning_rate": 1.2838304059579432e-06, "loss": 0.7529, "step": 12353 }, { "epoch": 0.84, "learning_rate": 1.2827486470001694e-06, "loss": 0.7471, "step": 12354 }, { "epoch": 0.84, "learning_rate": 1.2816673127464562e-06, "loss": 0.8213, "step": 12355 }, { "epoch": 0.84, "learning_rate": 1.2805864032494897e-06, "loss": 0.708, "step": 12356 }, { "epoch": 0.84, "learning_rate": 1.279505918561923e-06, "loss": 0.7832, "step": 12357 }, { "epoch": 0.84, "learning_rate": 1.2784258587364063e-06, "loss": 0.7656, "step": 12358 }, { "epoch": 0.84, "learning_rate": 1.2773462238255574e-06, "loss": 0.7402, "step": 12359 }, { "epoch": 0.84, "learning_rate": 1.2762670138819733e-06, "loss": 0.8047, "step": 12360 }, { "epoch": 0.84, "learning_rate": 1.275188228958234e-06, "loss": 0.8125, "step": 12361 }, { "epoch": 0.84, "learning_rate": 1.274109869106902e-06, "loss": 0.7822, "step": 12362 }, { "epoch": 0.84, "learning_rate": 1.2730319343805075e-06, "loss": 0.7344, "step": 12363 }, { "epoch": 0.84, "learning_rate": 1.271954424831573e-06, "loss": 0.7754, "step": 12364 }, { "epoch": 0.84, "learning_rate": 1.270877340512595e-06, "loss": 0.7773, "step": 12365 }, { "epoch": 0.84, "learning_rate": 1.2698006814760466e-06, "loss": 0.7285, "step": 12366 }, { "epoch": 0.84, "learning_rate": 1.2687244477743822e-06, "loss": 0.7334, "step": 12367 }, { "epoch": 0.84, "learning_rate": 1.2676486394600374e-06, "loss": 0.792, "step": 12368 }, { "epoch": 0.84, "learning_rate": 1.266573256585424e-06, "loss": 0.7939, "step": 12369 }, { "epoch": 0.84, "learning_rate": 1.2654982992029362e-06, "loss": 0.7441, "step": 12370 }, { "epoch": 0.84, "learning_rate": 1.2644237673649463e-06, "loss": 0.8047, "step": 12371 }, { "epoch": 0.84, "learning_rate": 1.263349661123805e-06, "loss": 0.7295, "step": 12372 }, { "epoch": 0.84, "learning_rate": 1.2622759805318408e-06, "loss": 0.7686, "step": 12373 }, { "epoch": 0.84, "learning_rate": 1.261202725641365e-06, "loss": 0.7539, "step": 12374 }, { "epoch": 0.84, "learning_rate": 1.260129896504666e-06, "loss": 0.7139, "step": 12375 }, { "epoch": 0.84, "learning_rate": 1.259057493174012e-06, "loss": 0.7627, "step": 12376 }, { "epoch": 0.84, "learning_rate": 1.2579855157016507e-06, "loss": 0.7402, "step": 12377 }, { "epoch": 0.84, "learning_rate": 1.2569139641398098e-06, "loss": 0.749, "step": 12378 }, { "epoch": 0.84, "learning_rate": 1.255842838540695e-06, "loss": 0.7637, "step": 12379 }, { "epoch": 0.84, "learning_rate": 1.2547721389564893e-06, "loss": 0.7314, "step": 12380 }, { "epoch": 0.84, "learning_rate": 1.2537018654393584e-06, "loss": 0.792, "step": 12381 }, { "epoch": 0.84, "learning_rate": 1.2526320180414453e-06, "loss": 0.7217, "step": 12382 }, { "epoch": 0.84, "learning_rate": 1.2515625968148748e-06, "loss": 0.7578, "step": 12383 }, { "epoch": 0.84, "learning_rate": 1.2504936018117476e-06, "loss": 0.8359, "step": 12384 }, { "epoch": 0.84, "learning_rate": 1.2494250330841473e-06, "loss": 0.7441, "step": 12385 }, { "epoch": 0.84, "learning_rate": 1.2483568906841304e-06, "loss": 0.7158, "step": 12386 }, { "epoch": 0.84, "learning_rate": 1.2472891746637372e-06, "loss": 0.6807, "step": 12387 }, { "epoch": 0.84, "learning_rate": 1.246221885074993e-06, "loss": 0.7744, "step": 12388 }, { "epoch": 0.84, "learning_rate": 1.2451550219698893e-06, "loss": 0.7959, "step": 12389 }, { "epoch": 0.84, "learning_rate": 1.2440885854004059e-06, "loss": 0.7627, "step": 12390 }, { "epoch": 0.84, "learning_rate": 1.2430225754185e-06, "loss": 0.7441, "step": 12391 }, { "epoch": 0.84, "learning_rate": 1.2419569920761089e-06, "loss": 0.7129, "step": 12392 }, { "epoch": 0.84, "learning_rate": 1.2408918354251408e-06, "loss": 0.6973, "step": 12393 }, { "epoch": 0.84, "learning_rate": 1.2398271055174994e-06, "loss": 0.7373, "step": 12394 }, { "epoch": 0.84, "learning_rate": 1.2387628024050557e-06, "loss": 0.6924, "step": 12395 }, { "epoch": 0.84, "learning_rate": 1.2376989261396577e-06, "loss": 0.6816, "step": 12396 }, { "epoch": 0.84, "learning_rate": 1.2366354767731425e-06, "loss": 0.7139, "step": 12397 }, { "epoch": 0.84, "learning_rate": 1.23557245435732e-06, "loss": 0.7129, "step": 12398 }, { "epoch": 0.84, "learning_rate": 1.2345098589439775e-06, "loss": 0.7969, "step": 12399 }, { "epoch": 0.85, "learning_rate": 1.233447690584888e-06, "loss": 0.7109, "step": 12400 }, { "epoch": 0.85, "learning_rate": 1.2323859493318025e-06, "loss": 0.6377, "step": 12401 }, { "epoch": 0.85, "learning_rate": 1.2313246352364438e-06, "loss": 0.7393, "step": 12402 }, { "epoch": 0.85, "learning_rate": 1.230263748350521e-06, "loss": 0.8066, "step": 12403 }, { "epoch": 0.85, "learning_rate": 1.22920328872572e-06, "loss": 0.7031, "step": 12404 }, { "epoch": 0.85, "learning_rate": 1.2281432564137076e-06, "loss": 0.7607, "step": 12405 }, { "epoch": 0.85, "learning_rate": 1.2270836514661288e-06, "loss": 0.7412, "step": 12406 }, { "epoch": 0.85, "learning_rate": 1.226024473934605e-06, "loss": 0.7305, "step": 12407 }, { "epoch": 0.85, "learning_rate": 1.2249657238707446e-06, "loss": 0.7734, "step": 12408 }, { "epoch": 0.85, "learning_rate": 1.2239074013261232e-06, "loss": 0.7178, "step": 12409 }, { "epoch": 0.85, "learning_rate": 1.2228495063523038e-06, "loss": 0.7676, "step": 12410 }, { "epoch": 0.85, "learning_rate": 1.221792039000832e-06, "loss": 0.7783, "step": 12411 }, { "epoch": 0.85, "learning_rate": 1.220734999323222e-06, "loss": 0.6748, "step": 12412 }, { "epoch": 0.85, "learning_rate": 1.219678387370975e-06, "loss": 0.7578, "step": 12413 }, { "epoch": 0.85, "learning_rate": 1.2186222031955685e-06, "loss": 0.793, "step": 12414 }, { "epoch": 0.85, "learning_rate": 1.2175664468484628e-06, "loss": 0.6777, "step": 12415 }, { "epoch": 0.85, "learning_rate": 1.2165111183810863e-06, "loss": 0.7832, "step": 12416 }, { "epoch": 0.85, "learning_rate": 1.2154562178448647e-06, "loss": 0.7158, "step": 12417 }, { "epoch": 0.85, "learning_rate": 1.214401745291185e-06, "loss": 0.7812, "step": 12418 }, { "epoch": 0.85, "learning_rate": 1.2133477007714246e-06, "loss": 0.8428, "step": 12419 }, { "epoch": 0.85, "learning_rate": 1.2122940843369346e-06, "loss": 0.7793, "step": 12420 }, { "epoch": 0.85, "learning_rate": 1.211240896039052e-06, "loss": 0.7646, "step": 12421 }, { "epoch": 0.85, "learning_rate": 1.210188135929079e-06, "loss": 0.7754, "step": 12422 }, { "epoch": 0.85, "learning_rate": 1.2091358040583134e-06, "loss": 0.7109, "step": 12423 }, { "epoch": 0.85, "learning_rate": 1.2080839004780253e-06, "loss": 0.7461, "step": 12424 }, { "epoch": 0.85, "learning_rate": 1.2070324252394584e-06, "loss": 0.7627, "step": 12425 }, { "epoch": 0.85, "learning_rate": 1.2059813783938434e-06, "loss": 0.7998, "step": 12426 }, { "epoch": 0.85, "learning_rate": 1.2049307599923865e-06, "loss": 0.7812, "step": 12427 }, { "epoch": 0.85, "learning_rate": 1.2038805700862744e-06, "loss": 0.8086, "step": 12428 }, { "epoch": 0.85, "learning_rate": 1.2028308087266716e-06, "loss": 0.7129, "step": 12429 }, { "epoch": 0.85, "learning_rate": 1.2017814759647228e-06, "loss": 0.7695, "step": 12430 }, { "epoch": 0.85, "learning_rate": 1.2007325718515528e-06, "loss": 0.7451, "step": 12431 }, { "epoch": 0.85, "learning_rate": 1.1996840964382617e-06, "loss": 0.752, "step": 12432 }, { "epoch": 0.85, "learning_rate": 1.198636049775932e-06, "loss": 0.6885, "step": 12433 }, { "epoch": 0.85, "learning_rate": 1.197588431915625e-06, "loss": 0.7988, "step": 12434 }, { "epoch": 0.85, "learning_rate": 1.19654124290838e-06, "loss": 0.793, "step": 12435 }, { "epoch": 0.85, "learning_rate": 1.1954944828052161e-06, "loss": 0.7773, "step": 12436 }, { "epoch": 0.85, "learning_rate": 1.194448151657135e-06, "loss": 0.7539, "step": 12437 }, { "epoch": 0.85, "learning_rate": 1.1934022495151064e-06, "loss": 0.6924, "step": 12438 }, { "epoch": 0.85, "learning_rate": 1.1923567764300925e-06, "loss": 0.7812, "step": 12439 }, { "epoch": 0.85, "learning_rate": 1.1913117324530266e-06, "loss": 0.7373, "step": 12440 }, { "epoch": 0.85, "learning_rate": 1.1902671176348223e-06, "loss": 0.6494, "step": 12441 }, { "epoch": 0.85, "learning_rate": 1.189222932026376e-06, "loss": 0.7158, "step": 12442 }, { "epoch": 0.85, "learning_rate": 1.1881791756785577e-06, "loss": 0.8867, "step": 12443 }, { "epoch": 0.85, "learning_rate": 1.1871358486422223e-06, "loss": 0.8057, "step": 12444 }, { "epoch": 0.85, "learning_rate": 1.1860929509681974e-06, "loss": 0.7188, "step": 12445 }, { "epoch": 0.85, "learning_rate": 1.1850504827072918e-06, "loss": 0.7861, "step": 12446 }, { "epoch": 0.85, "learning_rate": 1.1840084439103006e-06, "loss": 0.7266, "step": 12447 }, { "epoch": 0.85, "learning_rate": 1.1829668346279855e-06, "loss": 0.6924, "step": 12448 }, { "epoch": 0.85, "learning_rate": 1.181925654911097e-06, "loss": 0.7695, "step": 12449 }, { "epoch": 0.85, "learning_rate": 1.180884904810362e-06, "loss": 0.7744, "step": 12450 }, { "epoch": 0.85, "learning_rate": 1.1798445843764827e-06, "loss": 0.7412, "step": 12451 }, { "epoch": 0.85, "learning_rate": 1.1788046936601438e-06, "loss": 0.7676, "step": 12452 }, { "epoch": 0.85, "learning_rate": 1.1777652327120136e-06, "loss": 0.8398, "step": 12453 }, { "epoch": 0.85, "learning_rate": 1.1767262015827286e-06, "loss": 0.7773, "step": 12454 }, { "epoch": 0.85, "learning_rate": 1.1756876003229135e-06, "loss": 0.7803, "step": 12455 }, { "epoch": 0.85, "learning_rate": 1.1746494289831667e-06, "loss": 0.7725, "step": 12456 }, { "epoch": 0.85, "learning_rate": 1.1736116876140724e-06, "loss": 0.7393, "step": 12457 }, { "epoch": 0.85, "learning_rate": 1.1725743762661822e-06, "loss": 0.7529, "step": 12458 }, { "epoch": 0.85, "learning_rate": 1.1715374949900405e-06, "loss": 0.7158, "step": 12459 }, { "epoch": 0.85, "learning_rate": 1.1705010438361631e-06, "loss": 0.7598, "step": 12460 }, { "epoch": 0.85, "learning_rate": 1.169465022855042e-06, "loss": 0.7109, "step": 12461 }, { "epoch": 0.85, "learning_rate": 1.1684294320971546e-06, "loss": 0.708, "step": 12462 }, { "epoch": 0.85, "learning_rate": 1.1673942716129538e-06, "loss": 0.7002, "step": 12463 }, { "epoch": 0.85, "learning_rate": 1.1663595414528738e-06, "loss": 0.7695, "step": 12464 }, { "epoch": 0.85, "learning_rate": 1.1653252416673267e-06, "loss": 0.6709, "step": 12465 }, { "epoch": 0.85, "learning_rate": 1.1642913723067029e-06, "loss": 0.7393, "step": 12466 }, { "epoch": 0.85, "learning_rate": 1.1632579334213734e-06, "loss": 0.7471, "step": 12467 }, { "epoch": 0.85, "learning_rate": 1.1622249250616858e-06, "loss": 0.6865, "step": 12468 }, { "epoch": 0.85, "learning_rate": 1.1611923472779686e-06, "loss": 0.7139, "step": 12469 }, { "epoch": 0.85, "learning_rate": 1.160160200120528e-06, "loss": 0.709, "step": 12470 }, { "epoch": 0.85, "learning_rate": 1.1591284836396532e-06, "loss": 0.709, "step": 12471 }, { "epoch": 0.85, "learning_rate": 1.1580971978856058e-06, "loss": 0.7656, "step": 12472 }, { "epoch": 0.85, "learning_rate": 1.1570663429086349e-06, "loss": 0.751, "step": 12473 }, { "epoch": 0.85, "learning_rate": 1.1560359187589588e-06, "loss": 0.6445, "step": 12474 }, { "epoch": 0.85, "learning_rate": 1.1550059254867807e-06, "loss": 0.7871, "step": 12475 }, { "epoch": 0.85, "learning_rate": 1.153976363142283e-06, "loss": 0.8018, "step": 12476 }, { "epoch": 0.85, "learning_rate": 1.1529472317756252e-06, "loss": 0.6445, "step": 12477 }, { "epoch": 0.85, "learning_rate": 1.1519185314369463e-06, "loss": 0.7725, "step": 12478 }, { "epoch": 0.85, "learning_rate": 1.150890262176365e-06, "loss": 0.7773, "step": 12479 }, { "epoch": 0.85, "learning_rate": 1.1498624240439816e-06, "loss": 0.7725, "step": 12480 }, { "epoch": 0.85, "learning_rate": 1.1488350170898676e-06, "loss": 0.7715, "step": 12481 }, { "epoch": 0.85, "learning_rate": 1.1478080413640769e-06, "loss": 0.7686, "step": 12482 }, { "epoch": 0.85, "learning_rate": 1.1467814969166514e-06, "loss": 0.7539, "step": 12483 }, { "epoch": 0.85, "learning_rate": 1.1457553837975964e-06, "loss": 0.7656, "step": 12484 }, { "epoch": 0.85, "learning_rate": 1.144729702056908e-06, "loss": 0.7061, "step": 12485 }, { "epoch": 0.85, "learning_rate": 1.1437044517445594e-06, "loss": 0.7402, "step": 12486 }, { "epoch": 0.85, "learning_rate": 1.1426796329104962e-06, "loss": 0.7666, "step": 12487 }, { "epoch": 0.85, "learning_rate": 1.141655245604646e-06, "loss": 0.7627, "step": 12488 }, { "epoch": 0.85, "learning_rate": 1.1406312898769246e-06, "loss": 0.7705, "step": 12489 }, { "epoch": 0.85, "learning_rate": 1.139607765777213e-06, "loss": 0.71, "step": 12490 }, { "epoch": 0.85, "learning_rate": 1.1385846733553796e-06, "loss": 0.7354, "step": 12491 }, { "epoch": 0.85, "learning_rate": 1.1375620126612674e-06, "loss": 0.7803, "step": 12492 }, { "epoch": 0.85, "learning_rate": 1.1365397837447044e-06, "loss": 0.7471, "step": 12493 }, { "epoch": 0.85, "learning_rate": 1.1355179866554877e-06, "loss": 0.8232, "step": 12494 }, { "epoch": 0.85, "learning_rate": 1.134496621443404e-06, "loss": 0.7852, "step": 12495 }, { "epoch": 0.85, "learning_rate": 1.1334756881582143e-06, "loss": 0.7295, "step": 12496 }, { "epoch": 0.85, "learning_rate": 1.1324551868496537e-06, "loss": 0.7617, "step": 12497 }, { "epoch": 0.85, "learning_rate": 1.1314351175674455e-06, "loss": 0.7471, "step": 12498 }, { "epoch": 0.85, "learning_rate": 1.1304154803612854e-06, "loss": 0.8086, "step": 12499 }, { "epoch": 0.85, "learning_rate": 1.1293962752808495e-06, "loss": 0.8174, "step": 12500 }, { "epoch": 0.85, "learning_rate": 1.128377502375796e-06, "loss": 0.6914, "step": 12501 }, { "epoch": 0.85, "learning_rate": 1.1273591616957592e-06, "loss": 0.707, "step": 12502 }, { "epoch": 0.85, "learning_rate": 1.1263412532903495e-06, "loss": 0.7236, "step": 12503 }, { "epoch": 0.85, "learning_rate": 1.1253237772091608e-06, "loss": 0.7412, "step": 12504 }, { "epoch": 0.85, "learning_rate": 1.1243067335017655e-06, "loss": 0.7324, "step": 12505 }, { "epoch": 0.85, "learning_rate": 1.1232901222177127e-06, "loss": 0.7803, "step": 12506 }, { "epoch": 0.85, "learning_rate": 1.1222739434065333e-06, "loss": 0.7979, "step": 12507 }, { "epoch": 0.85, "learning_rate": 1.1212581971177338e-06, "loss": 0.6934, "step": 12508 }, { "epoch": 0.85, "learning_rate": 1.1202428834008038e-06, "loss": 0.7158, "step": 12509 }, { "epoch": 0.85, "learning_rate": 1.119228002305206e-06, "loss": 0.7344, "step": 12510 }, { "epoch": 0.85, "learning_rate": 1.1182135538803862e-06, "loss": 0.7236, "step": 12511 }, { "epoch": 0.85, "learning_rate": 1.1171995381757694e-06, "loss": 0.7812, "step": 12512 }, { "epoch": 0.85, "learning_rate": 1.1161859552407572e-06, "loss": 0.7549, "step": 12513 }, { "epoch": 0.85, "learning_rate": 1.1151728051247324e-06, "loss": 0.6846, "step": 12514 }, { "epoch": 0.85, "learning_rate": 1.1141600878770554e-06, "loss": 0.7646, "step": 12515 }, { "epoch": 0.85, "learning_rate": 1.1131478035470677e-06, "loss": 0.8076, "step": 12516 }, { "epoch": 0.85, "learning_rate": 1.1121359521840836e-06, "loss": 0.7314, "step": 12517 }, { "epoch": 0.85, "learning_rate": 1.1111245338373998e-06, "loss": 0.7822, "step": 12518 }, { "epoch": 0.85, "learning_rate": 1.1101135485563007e-06, "loss": 0.833, "step": 12519 }, { "epoch": 0.85, "learning_rate": 1.1091029963900324e-06, "loss": 0.8428, "step": 12520 }, { "epoch": 0.85, "learning_rate": 1.108092877387834e-06, "loss": 0.7393, "step": 12521 }, { "epoch": 0.85, "learning_rate": 1.1070831915989178e-06, "loss": 0.7773, "step": 12522 }, { "epoch": 0.85, "learning_rate": 1.1060739390724718e-06, "loss": 0.7451, "step": 12523 }, { "epoch": 0.85, "learning_rate": 1.1050651198576713e-06, "loss": 0.7529, "step": 12524 }, { "epoch": 0.85, "learning_rate": 1.1040567340036657e-06, "loss": 0.8203, "step": 12525 }, { "epoch": 0.85, "learning_rate": 1.1030487815595803e-06, "loss": 0.7344, "step": 12526 }, { "epoch": 0.85, "learning_rate": 1.1020412625745259e-06, "loss": 0.7725, "step": 12527 }, { "epoch": 0.85, "learning_rate": 1.101034177097585e-06, "loss": 0.7402, "step": 12528 }, { "epoch": 0.85, "learning_rate": 1.100027525177827e-06, "loss": 0.7344, "step": 12529 }, { "epoch": 0.85, "learning_rate": 1.099021306864293e-06, "loss": 0.7998, "step": 12530 }, { "epoch": 0.85, "learning_rate": 1.0980155222060074e-06, "loss": 0.7617, "step": 12531 }, { "epoch": 0.85, "learning_rate": 1.0970101712519732e-06, "loss": 0.8623, "step": 12532 }, { "epoch": 0.85, "learning_rate": 1.0960052540511667e-06, "loss": 0.875, "step": 12533 }, { "epoch": 0.85, "learning_rate": 1.0950007706525512e-06, "loss": 0.7373, "step": 12534 }, { "epoch": 0.85, "learning_rate": 1.0939967211050629e-06, "loss": 0.8291, "step": 12535 }, { "epoch": 0.85, "learning_rate": 1.0929931054576204e-06, "loss": 0.7832, "step": 12536 }, { "epoch": 0.85, "learning_rate": 1.0919899237591193e-06, "loss": 0.7295, "step": 12537 }, { "epoch": 0.85, "learning_rate": 1.0909871760584367e-06, "loss": 0.7578, "step": 12538 }, { "epoch": 0.85, "learning_rate": 1.089984862404422e-06, "loss": 0.6885, "step": 12539 }, { "epoch": 0.85, "learning_rate": 1.0889829828459108e-06, "loss": 0.7734, "step": 12540 }, { "epoch": 0.85, "learning_rate": 1.0879815374317137e-06, "loss": 0.7568, "step": 12541 }, { "epoch": 0.85, "learning_rate": 1.0869805262106226e-06, "loss": 0.832, "step": 12542 }, { "epoch": 0.85, "learning_rate": 1.085979949231405e-06, "loss": 0.7002, "step": 12543 }, { "epoch": 0.85, "learning_rate": 1.0849798065428096e-06, "loss": 0.7344, "step": 12544 }, { "epoch": 0.85, "learning_rate": 1.0839800981935643e-06, "loss": 0.6973, "step": 12545 }, { "epoch": 0.85, "learning_rate": 1.0829808242323724e-06, "loss": 0.7832, "step": 12546 }, { "epoch": 0.86, "learning_rate": 1.0819819847079182e-06, "loss": 0.751, "step": 12547 }, { "epoch": 0.86, "learning_rate": 1.0809835796688718e-06, "loss": 0.7969, "step": 12548 }, { "epoch": 0.86, "learning_rate": 1.0799856091638672e-06, "loss": 0.7061, "step": 12549 }, { "epoch": 0.86, "learning_rate": 1.078988073241528e-06, "loss": 0.7354, "step": 12550 }, { "epoch": 0.86, "learning_rate": 1.0779909719504555e-06, "loss": 0.7939, "step": 12551 }, { "epoch": 0.86, "learning_rate": 1.0769943053392306e-06, "loss": 0.7412, "step": 12552 }, { "epoch": 0.86, "learning_rate": 1.0759980734564034e-06, "loss": 0.6777, "step": 12553 }, { "epoch": 0.86, "learning_rate": 1.0750022763505163e-06, "loss": 0.7627, "step": 12554 }, { "epoch": 0.86, "learning_rate": 1.074006914070086e-06, "loss": 0.7568, "step": 12555 }, { "epoch": 0.86, "learning_rate": 1.0730119866636012e-06, "loss": 0.7344, "step": 12556 }, { "epoch": 0.86, "learning_rate": 1.0720174941795369e-06, "loss": 0.7578, "step": 12557 }, { "epoch": 0.86, "learning_rate": 1.0710234366663474e-06, "loss": 0.7305, "step": 12558 }, { "epoch": 0.86, "learning_rate": 1.0700298141724564e-06, "loss": 0.8389, "step": 12559 }, { "epoch": 0.86, "learning_rate": 1.069036626746278e-06, "loss": 0.7861, "step": 12560 }, { "epoch": 0.86, "learning_rate": 1.0680438744362032e-06, "loss": 0.7598, "step": 12561 }, { "epoch": 0.86, "learning_rate": 1.0670515572905927e-06, "loss": 0.7207, "step": 12562 }, { "epoch": 0.86, "learning_rate": 1.0660596753577956e-06, "loss": 0.7236, "step": 12563 }, { "epoch": 0.86, "learning_rate": 1.0650682286861347e-06, "loss": 0.7275, "step": 12564 }, { "epoch": 0.86, "learning_rate": 1.0640772173239134e-06, "loss": 0.7129, "step": 12565 }, { "epoch": 0.86, "learning_rate": 1.0630866413194152e-06, "loss": 0.7812, "step": 12566 }, { "epoch": 0.86, "learning_rate": 1.0620965007208993e-06, "loss": 0.7461, "step": 12567 }, { "epoch": 0.86, "learning_rate": 1.0611067955766087e-06, "loss": 0.7109, "step": 12568 }, { "epoch": 0.86, "learning_rate": 1.0601175259347563e-06, "loss": 0.7764, "step": 12569 }, { "epoch": 0.86, "learning_rate": 1.059128691843543e-06, "loss": 0.6709, "step": 12570 }, { "epoch": 0.86, "learning_rate": 1.058140293351143e-06, "loss": 0.7373, "step": 12571 }, { "epoch": 0.86, "learning_rate": 1.057152330505713e-06, "loss": 0.7969, "step": 12572 }, { "epoch": 0.86, "learning_rate": 1.056164803355384e-06, "loss": 0.8262, "step": 12573 }, { "epoch": 0.86, "learning_rate": 1.055177711948272e-06, "loss": 0.7666, "step": 12574 }, { "epoch": 0.86, "learning_rate": 1.0541910563324642e-06, "loss": 0.7842, "step": 12575 }, { "epoch": 0.86, "learning_rate": 1.0532048365560321e-06, "loss": 0.7949, "step": 12576 }, { "epoch": 0.86, "learning_rate": 1.052219052667023e-06, "loss": 0.7305, "step": 12577 }, { "epoch": 0.86, "learning_rate": 1.0512337047134657e-06, "loss": 0.7725, "step": 12578 }, { "epoch": 0.86, "learning_rate": 1.0502487927433657e-06, "loss": 0.8115, "step": 12579 }, { "epoch": 0.86, "learning_rate": 1.049264316804709e-06, "loss": 0.7754, "step": 12580 }, { "epoch": 0.86, "learning_rate": 1.0482802769454592e-06, "loss": 0.7148, "step": 12581 }, { "epoch": 0.86, "learning_rate": 1.0472966732135559e-06, "loss": 0.832, "step": 12582 }, { "epoch": 0.86, "learning_rate": 1.0463135056569206e-06, "loss": 0.7119, "step": 12583 }, { "epoch": 0.86, "learning_rate": 1.0453307743234586e-06, "loss": 0.7568, "step": 12584 }, { "epoch": 0.86, "learning_rate": 1.0443484792610425e-06, "loss": 0.8125, "step": 12585 }, { "epoch": 0.86, "learning_rate": 1.043366620517532e-06, "loss": 0.7178, "step": 12586 }, { "epoch": 0.86, "learning_rate": 1.042385198140763e-06, "loss": 0.7969, "step": 12587 }, { "epoch": 0.86, "learning_rate": 1.0414042121785517e-06, "loss": 0.7324, "step": 12588 }, { "epoch": 0.86, "learning_rate": 1.0404236626786867e-06, "loss": 0.7852, "step": 12589 }, { "epoch": 0.86, "learning_rate": 1.0394435496889476e-06, "loss": 0.7168, "step": 12590 }, { "epoch": 0.86, "learning_rate": 1.0384638732570796e-06, "loss": 0.6934, "step": 12591 }, { "epoch": 0.86, "learning_rate": 1.0374846334308152e-06, "loss": 0.7412, "step": 12592 }, { "epoch": 0.86, "learning_rate": 1.0365058302578624e-06, "loss": 0.7725, "step": 12593 }, { "epoch": 0.86, "learning_rate": 1.0355274637859103e-06, "loss": 0.79, "step": 12594 }, { "epoch": 0.86, "learning_rate": 1.0345495340626187e-06, "loss": 0.6943, "step": 12595 }, { "epoch": 0.86, "learning_rate": 1.0335720411356386e-06, "loss": 0.7588, "step": 12596 }, { "epoch": 0.86, "learning_rate": 1.032594985052594e-06, "loss": 0.7646, "step": 12597 }, { "epoch": 0.86, "learning_rate": 1.0316183658610823e-06, "loss": 0.835, "step": 12598 }, { "epoch": 0.86, "learning_rate": 1.0306421836086867e-06, "loss": 0.7432, "step": 12599 }, { "epoch": 0.86, "learning_rate": 1.0296664383429656e-06, "loss": 0.7764, "step": 12600 }, { "epoch": 0.86, "learning_rate": 1.0286911301114587e-06, "loss": 0.7949, "step": 12601 }, { "epoch": 0.86, "learning_rate": 1.0277162589616818e-06, "loss": 0.7666, "step": 12602 }, { "epoch": 0.86, "learning_rate": 1.0267418249411321e-06, "loss": 0.7734, "step": 12603 }, { "epoch": 0.86, "learning_rate": 1.0257678280972849e-06, "loss": 0.7227, "step": 12604 }, { "epoch": 0.86, "learning_rate": 1.024794268477589e-06, "loss": 0.7773, "step": 12605 }, { "epoch": 0.86, "learning_rate": 1.0238211461294788e-06, "loss": 0.7793, "step": 12606 }, { "epoch": 0.86, "learning_rate": 1.0228484611003653e-06, "loss": 0.7051, "step": 12607 }, { "epoch": 0.86, "learning_rate": 1.0218762134376358e-06, "loss": 0.7588, "step": 12608 }, { "epoch": 0.86, "learning_rate": 1.0209044031886605e-06, "loss": 0.7783, "step": 12609 }, { "epoch": 0.86, "learning_rate": 1.0199330304007858e-06, "loss": 0.6982, "step": 12610 }, { "epoch": 0.86, "learning_rate": 1.0189620951213353e-06, "loss": 0.7227, "step": 12611 }, { "epoch": 0.86, "learning_rate": 1.0179915973976129e-06, "loss": 0.7822, "step": 12612 }, { "epoch": 0.86, "learning_rate": 1.017021537276901e-06, "loss": 0.708, "step": 12613 }, { "epoch": 0.86, "learning_rate": 1.016051914806463e-06, "loss": 0.7002, "step": 12614 }, { "epoch": 0.86, "learning_rate": 1.0150827300335364e-06, "loss": 0.6963, "step": 12615 }, { "epoch": 0.86, "learning_rate": 1.0141139830053426e-06, "loss": 0.8271, "step": 12616 }, { "epoch": 0.86, "learning_rate": 1.013145673769078e-06, "loss": 0.7559, "step": 12617 }, { "epoch": 0.86, "learning_rate": 1.0121778023719165e-06, "loss": 0.8125, "step": 12618 }, { "epoch": 0.86, "learning_rate": 1.011210368861012e-06, "loss": 0.7402, "step": 12619 }, { "epoch": 0.86, "learning_rate": 1.0102433732835038e-06, "loss": 0.749, "step": 12620 }, { "epoch": 0.86, "learning_rate": 1.0092768156864974e-06, "loss": 0.7676, "step": 12621 }, { "epoch": 0.86, "learning_rate": 1.0083106961170875e-06, "loss": 0.7354, "step": 12622 }, { "epoch": 0.86, "learning_rate": 1.007345014622343e-06, "loss": 0.7275, "step": 12623 }, { "epoch": 0.86, "learning_rate": 1.0063797712493095e-06, "loss": 0.7588, "step": 12624 }, { "epoch": 0.86, "learning_rate": 1.005414966045013e-06, "loss": 0.8525, "step": 12625 }, { "epoch": 0.86, "learning_rate": 1.0044505990564636e-06, "loss": 0.7031, "step": 12626 }, { "epoch": 0.86, "learning_rate": 1.0034866703306411e-06, "loss": 0.7842, "step": 12627 }, { "epoch": 0.86, "learning_rate": 1.0025231799145095e-06, "loss": 0.7021, "step": 12628 }, { "epoch": 0.86, "learning_rate": 1.0015601278550103e-06, "loss": 0.8301, "step": 12629 }, { "epoch": 0.86, "learning_rate": 1.0005975141990632e-06, "loss": 0.7354, "step": 12630 }, { "epoch": 0.86, "learning_rate": 9.99635338993563e-07, "loss": 0.7773, "step": 12631 }, { "epoch": 0.86, "learning_rate": 9.986736022853927e-07, "loss": 0.7422, "step": 12632 }, { "epoch": 0.86, "learning_rate": 9.977123041214077e-07, "loss": 0.6836, "step": 12633 }, { "epoch": 0.86, "learning_rate": 9.967514445484383e-07, "loss": 0.749, "step": 12634 }, { "epoch": 0.86, "learning_rate": 9.957910236132984e-07, "loss": 0.7012, "step": 12635 }, { "epoch": 0.86, "learning_rate": 9.948310413627815e-07, "loss": 0.7236, "step": 12636 }, { "epoch": 0.86, "learning_rate": 9.93871497843657e-07, "loss": 0.7021, "step": 12637 }, { "epoch": 0.86, "learning_rate": 9.929123931026742e-07, "loss": 0.6621, "step": 12638 }, { "epoch": 0.86, "learning_rate": 9.919537271865598e-07, "loss": 0.6875, "step": 12639 }, { "epoch": 0.86, "learning_rate": 9.909955001420223e-07, "loss": 0.7197, "step": 12640 }, { "epoch": 0.86, "learning_rate": 9.900377120157434e-07, "loss": 0.7021, "step": 12641 }, { "epoch": 0.86, "learning_rate": 9.890803628543876e-07, "loss": 0.7158, "step": 12642 }, { "epoch": 0.86, "learning_rate": 9.881234527045968e-07, "loss": 0.7744, "step": 12643 }, { "epoch": 0.86, "learning_rate": 9.871669816129925e-07, "loss": 0.7051, "step": 12644 }, { "epoch": 0.86, "learning_rate": 9.86210949626173e-07, "loss": 0.7324, "step": 12645 }, { "epoch": 0.86, "learning_rate": 9.852553567907175e-07, "loss": 0.7598, "step": 12646 }, { "epoch": 0.86, "learning_rate": 9.8430020315318e-07, "loss": 0.791, "step": 12647 }, { "epoch": 0.86, "learning_rate": 9.833454887600956e-07, "loss": 0.7744, "step": 12648 }, { "epoch": 0.86, "learning_rate": 9.823912136579827e-07, "loss": 0.8262, "step": 12649 }, { "epoch": 0.86, "learning_rate": 9.814373778933284e-07, "loss": 0.7842, "step": 12650 }, { "epoch": 0.86, "learning_rate": 9.804839815126055e-07, "loss": 0.7734, "step": 12651 }, { "epoch": 0.86, "learning_rate": 9.795310245622624e-07, "loss": 0.7793, "step": 12652 }, { "epoch": 0.86, "learning_rate": 9.78578507088731e-07, "loss": 0.7334, "step": 12653 }, { "epoch": 0.86, "learning_rate": 9.776264291384096e-07, "loss": 0.7598, "step": 12654 }, { "epoch": 0.86, "learning_rate": 9.766747907576912e-07, "loss": 0.707, "step": 12655 }, { "epoch": 0.86, "learning_rate": 9.757235919929386e-07, "loss": 0.7686, "step": 12656 }, { "epoch": 0.86, "learning_rate": 9.747728328904915e-07, "loss": 0.6836, "step": 12657 }, { "epoch": 0.86, "learning_rate": 9.738225134966706e-07, "loss": 0.7686, "step": 12658 }, { "epoch": 0.86, "learning_rate": 9.728726338577788e-07, "loss": 0.7783, "step": 12659 }, { "epoch": 0.86, "learning_rate": 9.719231940200891e-07, "loss": 0.7432, "step": 12660 }, { "epoch": 0.86, "learning_rate": 9.709741940298622e-07, "loss": 0.6924, "step": 12661 }, { "epoch": 0.86, "learning_rate": 9.700256339333348e-07, "loss": 0.8125, "step": 12662 }, { "epoch": 0.86, "learning_rate": 9.690775137767161e-07, "loss": 0.7236, "step": 12663 }, { "epoch": 0.86, "learning_rate": 9.681298336061995e-07, "loss": 0.7529, "step": 12664 }, { "epoch": 0.86, "learning_rate": 9.671825934679578e-07, "loss": 0.7363, "step": 12665 }, { "epoch": 0.86, "learning_rate": 9.662357934081402e-07, "loss": 0.8135, "step": 12666 }, { "epoch": 0.86, "learning_rate": 9.652894334728735e-07, "loss": 0.707, "step": 12667 }, { "epoch": 0.86, "learning_rate": 9.643435137082646e-07, "loss": 0.708, "step": 12668 }, { "epoch": 0.86, "learning_rate": 9.63398034160402e-07, "loss": 0.75, "step": 12669 }, { "epoch": 0.86, "learning_rate": 9.624529948753436e-07, "loss": 0.7812, "step": 12670 }, { "epoch": 0.86, "learning_rate": 9.615083958991355e-07, "loss": 0.7275, "step": 12671 }, { "epoch": 0.86, "learning_rate": 9.605642372777969e-07, "loss": 0.7598, "step": 12672 }, { "epoch": 0.86, "learning_rate": 9.596205190573281e-07, "loss": 0.7949, "step": 12673 }, { "epoch": 0.86, "learning_rate": 9.586772412837064e-07, "loss": 0.7246, "step": 12674 }, { "epoch": 0.86, "learning_rate": 9.57734404002889e-07, "loss": 0.7461, "step": 12675 }, { "epoch": 0.86, "learning_rate": 9.567920072608129e-07, "loss": 0.7109, "step": 12676 }, { "epoch": 0.86, "learning_rate": 9.558500511033863e-07, "loss": 0.8193, "step": 12677 }, { "epoch": 0.86, "learning_rate": 9.549085355765043e-07, "loss": 0.7266, "step": 12678 }, { "epoch": 0.86, "learning_rate": 9.539674607260375e-07, "loss": 0.6885, "step": 12679 }, { "epoch": 0.86, "learning_rate": 9.530268265978348e-07, "loss": 0.7568, "step": 12680 }, { "epoch": 0.86, "learning_rate": 9.520866332377243e-07, "loss": 0.7266, "step": 12681 }, { "epoch": 0.86, "learning_rate": 9.511468806915136e-07, "loss": 0.7773, "step": 12682 }, { "epoch": 0.86, "learning_rate": 9.502075690049828e-07, "loss": 0.7959, "step": 12683 }, { "epoch": 0.86, "learning_rate": 9.492686982238974e-07, "loss": 0.7852, "step": 12684 }, { "epoch": 0.86, "learning_rate": 9.483302683940021e-07, "loss": 0.7451, "step": 12685 }, { "epoch": 0.86, "learning_rate": 9.473922795610135e-07, "loss": 0.7041, "step": 12686 }, { "epoch": 0.86, "learning_rate": 9.464547317706318e-07, "loss": 0.667, "step": 12687 }, { "epoch": 0.86, "learning_rate": 9.455176250685338e-07, "loss": 0.7539, "step": 12688 }, { "epoch": 0.86, "learning_rate": 9.445809595003774e-07, "loss": 0.7803, "step": 12689 }, { "epoch": 0.86, "learning_rate": 9.436447351117916e-07, "loss": 0.8438, "step": 12690 }, { "epoch": 0.86, "learning_rate": 9.427089519483945e-07, "loss": 0.8193, "step": 12691 }, { "epoch": 0.86, "learning_rate": 9.417736100557772e-07, "loss": 0.7891, "step": 12692 }, { "epoch": 0.86, "learning_rate": 9.408387094795057e-07, "loss": 0.7363, "step": 12693 }, { "epoch": 0.87, "learning_rate": 9.399042502651312e-07, "loss": 0.7998, "step": 12694 }, { "epoch": 0.87, "learning_rate": 9.389702324581806e-07, "loss": 0.7334, "step": 12695 }, { "epoch": 0.87, "learning_rate": 9.380366561041553e-07, "loss": 0.7959, "step": 12696 }, { "epoch": 0.87, "learning_rate": 9.371035212485446e-07, "loss": 0.7529, "step": 12697 }, { "epoch": 0.87, "learning_rate": 9.361708279368098e-07, "loss": 0.7178, "step": 12698 }, { "epoch": 0.87, "learning_rate": 9.352385762143879e-07, "loss": 0.6494, "step": 12699 }, { "epoch": 0.87, "learning_rate": 9.343067661267014e-07, "loss": 0.7734, "step": 12700 }, { "epoch": 0.87, "learning_rate": 9.333753977191462e-07, "loss": 0.6943, "step": 12701 }, { "epoch": 0.87, "learning_rate": 9.324444710371006e-07, "loss": 0.6875, "step": 12702 }, { "epoch": 0.87, "learning_rate": 9.315139861259171e-07, "loss": 0.8057, "step": 12703 }, { "epoch": 0.87, "learning_rate": 9.305839430309305e-07, "loss": 0.7021, "step": 12704 }, { "epoch": 0.87, "learning_rate": 9.296543417974535e-07, "loss": 0.7354, "step": 12705 }, { "epoch": 0.87, "learning_rate": 9.287251824707733e-07, "loss": 0.7549, "step": 12706 }, { "epoch": 0.87, "learning_rate": 9.27796465096159e-07, "loss": 0.7119, "step": 12707 }, { "epoch": 0.87, "learning_rate": 9.268681897188592e-07, "loss": 0.7451, "step": 12708 }, { "epoch": 0.87, "learning_rate": 9.259403563840985e-07, "loss": 0.7549, "step": 12709 }, { "epoch": 0.87, "learning_rate": 9.250129651370809e-07, "loss": 0.7793, "step": 12710 }, { "epoch": 0.87, "learning_rate": 9.240860160229914e-07, "loss": 0.7188, "step": 12711 }, { "epoch": 0.87, "learning_rate": 9.23159509086986e-07, "loss": 0.7363, "step": 12712 }, { "epoch": 0.87, "learning_rate": 9.222334443742076e-07, "loss": 0.6953, "step": 12713 }, { "epoch": 0.87, "learning_rate": 9.213078219297722e-07, "loss": 0.7236, "step": 12714 }, { "epoch": 0.87, "learning_rate": 9.203826417987783e-07, "loss": 0.8174, "step": 12715 }, { "epoch": 0.87, "learning_rate": 9.194579040262985e-07, "loss": 0.7871, "step": 12716 }, { "epoch": 0.87, "learning_rate": 9.18533608657386e-07, "loss": 0.8135, "step": 12717 }, { "epoch": 0.87, "learning_rate": 9.176097557370767e-07, "loss": 0.7119, "step": 12718 }, { "epoch": 0.87, "learning_rate": 9.166863453103736e-07, "loss": 0.8271, "step": 12719 }, { "epoch": 0.87, "learning_rate": 9.157633774222685e-07, "loss": 0.6855, "step": 12720 }, { "epoch": 0.87, "learning_rate": 9.14840852117731e-07, "loss": 0.7109, "step": 12721 }, { "epoch": 0.87, "learning_rate": 9.139187694417029e-07, "loss": 0.7578, "step": 12722 }, { "epoch": 0.87, "learning_rate": 9.129971294391093e-07, "loss": 0.7178, "step": 12723 }, { "epoch": 0.87, "learning_rate": 9.120759321548522e-07, "loss": 0.6738, "step": 12724 }, { "epoch": 0.87, "learning_rate": 9.111551776338145e-07, "loss": 0.7832, "step": 12725 }, { "epoch": 0.87, "learning_rate": 9.102348659208504e-07, "loss": 0.7344, "step": 12726 }, { "epoch": 0.87, "learning_rate": 9.093149970608017e-07, "loss": 0.6963, "step": 12727 }, { "epoch": 0.87, "learning_rate": 9.083955710984838e-07, "loss": 0.752, "step": 12728 }, { "epoch": 0.87, "learning_rate": 9.074765880786896e-07, "loss": 0.7061, "step": 12729 }, { "epoch": 0.87, "learning_rate": 9.065580480461922e-07, "loss": 0.751, "step": 12730 }, { "epoch": 0.87, "learning_rate": 9.056399510457459e-07, "loss": 0.7764, "step": 12731 }, { "epoch": 0.87, "learning_rate": 9.047222971220726e-07, "loss": 0.7939, "step": 12732 }, { "epoch": 0.87, "learning_rate": 9.038050863198878e-07, "loss": 0.7344, "step": 12733 }, { "epoch": 0.87, "learning_rate": 9.028883186838777e-07, "loss": 0.7402, "step": 12734 }, { "epoch": 0.87, "learning_rate": 9.019719942587035e-07, "loss": 0.751, "step": 12735 }, { "epoch": 0.87, "learning_rate": 9.010561130890094e-07, "loss": 0.6914, "step": 12736 }, { "epoch": 0.87, "learning_rate": 9.001406752194186e-07, "loss": 0.793, "step": 12737 }, { "epoch": 0.87, "learning_rate": 8.992256806945298e-07, "loss": 0.7363, "step": 12738 }, { "epoch": 0.87, "learning_rate": 8.98311129558922e-07, "loss": 0.7881, "step": 12739 }, { "epoch": 0.87, "learning_rate": 8.973970218571515e-07, "loss": 0.7803, "step": 12740 }, { "epoch": 0.87, "learning_rate": 8.964833576337572e-07, "loss": 0.7646, "step": 12741 }, { "epoch": 0.87, "learning_rate": 8.955701369332471e-07, "loss": 0.7822, "step": 12742 }, { "epoch": 0.87, "learning_rate": 8.946573598001162e-07, "loss": 0.7427, "step": 12743 }, { "epoch": 0.87, "learning_rate": 8.93745026278835e-07, "loss": 0.7959, "step": 12744 }, { "epoch": 0.87, "learning_rate": 8.92833136413852e-07, "loss": 0.6416, "step": 12745 }, { "epoch": 0.87, "learning_rate": 8.919216902495941e-07, "loss": 0.7842, "step": 12746 }, { "epoch": 0.87, "learning_rate": 8.910106878304692e-07, "loss": 0.7168, "step": 12747 }, { "epoch": 0.87, "learning_rate": 8.901001292008571e-07, "loss": 0.7275, "step": 12748 }, { "epoch": 0.87, "learning_rate": 8.891900144051236e-07, "loss": 0.7334, "step": 12749 }, { "epoch": 0.87, "learning_rate": 8.882803434876075e-07, "loss": 0.7617, "step": 12750 }, { "epoch": 0.87, "learning_rate": 8.87371116492628e-07, "loss": 0.8037, "step": 12751 }, { "epoch": 0.87, "learning_rate": 8.864623334644851e-07, "loss": 0.7188, "step": 12752 }, { "epoch": 0.87, "learning_rate": 8.855539944474512e-07, "loss": 0.7295, "step": 12753 }, { "epoch": 0.87, "learning_rate": 8.846460994857853e-07, "loss": 0.8232, "step": 12754 }, { "epoch": 0.87, "learning_rate": 8.837386486237143e-07, "loss": 0.7334, "step": 12755 }, { "epoch": 0.87, "learning_rate": 8.828316419054505e-07, "loss": 0.7236, "step": 12756 }, { "epoch": 0.87, "learning_rate": 8.819250793751876e-07, "loss": 0.7412, "step": 12757 }, { "epoch": 0.87, "learning_rate": 8.81018961077088e-07, "loss": 0.8271, "step": 12758 }, { "epoch": 0.87, "learning_rate": 8.801132870553008e-07, "loss": 0.7578, "step": 12759 }, { "epoch": 0.87, "learning_rate": 8.792080573539496e-07, "loss": 0.8447, "step": 12760 }, { "epoch": 0.87, "learning_rate": 8.78303272017137e-07, "loss": 0.7051, "step": 12761 }, { "epoch": 0.87, "learning_rate": 8.77398931088943e-07, "loss": 0.7246, "step": 12762 }, { "epoch": 0.87, "learning_rate": 8.764950346134315e-07, "loss": 0.7803, "step": 12763 }, { "epoch": 0.87, "learning_rate": 8.755915826346339e-07, "loss": 0.7305, "step": 12764 }, { "epoch": 0.87, "learning_rate": 8.746885751965705e-07, "loss": 0.7842, "step": 12765 }, { "epoch": 0.87, "learning_rate": 8.73786012343234e-07, "loss": 0.7627, "step": 12766 }, { "epoch": 0.87, "learning_rate": 8.72883894118598e-07, "loss": 0.7236, "step": 12767 }, { "epoch": 0.87, "learning_rate": 8.71982220566614e-07, "loss": 0.6855, "step": 12768 }, { "epoch": 0.87, "learning_rate": 8.710809917312102e-07, "loss": 0.7734, "step": 12769 }, { "epoch": 0.87, "learning_rate": 8.701802076562982e-07, "loss": 0.6895, "step": 12770 }, { "epoch": 0.87, "learning_rate": 8.692798683857584e-07, "loss": 0.752, "step": 12771 }, { "epoch": 0.87, "learning_rate": 8.683799739634591e-07, "loss": 0.8057, "step": 12772 }, { "epoch": 0.87, "learning_rate": 8.674805244332418e-07, "loss": 0.7744, "step": 12773 }, { "epoch": 0.87, "learning_rate": 8.665815198389282e-07, "loss": 0.7773, "step": 12774 }, { "epoch": 0.87, "learning_rate": 8.656829602243166e-07, "loss": 0.6982, "step": 12775 }, { "epoch": 0.87, "learning_rate": 8.647848456331864e-07, "loss": 0.7373, "step": 12776 }, { "epoch": 0.87, "learning_rate": 8.638871761092948e-07, "loss": 0.6973, "step": 12777 }, { "epoch": 0.87, "learning_rate": 8.629899516963735e-07, "loss": 0.791, "step": 12778 }, { "epoch": 0.87, "learning_rate": 8.620931724381332e-07, "loss": 0.7588, "step": 12779 }, { "epoch": 0.87, "learning_rate": 8.611968383782721e-07, "loss": 0.6865, "step": 12780 }, { "epoch": 0.87, "learning_rate": 8.603009495604531e-07, "loss": 0.6807, "step": 12781 }, { "epoch": 0.87, "learning_rate": 8.594055060283268e-07, "loss": 0.7139, "step": 12782 }, { "epoch": 0.87, "learning_rate": 8.585105078255196e-07, "loss": 0.7285, "step": 12783 }, { "epoch": 0.87, "learning_rate": 8.576159549956331e-07, "loss": 0.7979, "step": 12784 }, { "epoch": 0.87, "learning_rate": 8.567218475822492e-07, "loss": 0.7686, "step": 12785 }, { "epoch": 0.87, "learning_rate": 8.558281856289352e-07, "loss": 0.8057, "step": 12786 }, { "epoch": 0.87, "learning_rate": 8.549349691792241e-07, "loss": 0.7686, "step": 12787 }, { "epoch": 0.87, "learning_rate": 8.540421982766356e-07, "loss": 0.7109, "step": 12788 }, { "epoch": 0.87, "learning_rate": 8.531498729646648e-07, "loss": 0.7646, "step": 12789 }, { "epoch": 0.87, "learning_rate": 8.522579932867881e-07, "loss": 0.7734, "step": 12790 }, { "epoch": 0.87, "learning_rate": 8.513665592864518e-07, "loss": 0.6465, "step": 12791 }, { "epoch": 0.87, "learning_rate": 8.504755710070933e-07, "loss": 0.7471, "step": 12792 }, { "epoch": 0.87, "learning_rate": 8.495850284921203e-07, "loss": 0.6689, "step": 12793 }, { "epoch": 0.87, "learning_rate": 8.486949317849158e-07, "loss": 0.7354, "step": 12794 }, { "epoch": 0.87, "learning_rate": 8.478052809288484e-07, "loss": 0.7588, "step": 12795 }, { "epoch": 0.87, "learning_rate": 8.469160759672624e-07, "loss": 0.835, "step": 12796 }, { "epoch": 0.87, "learning_rate": 8.460273169434774e-07, "loss": 0.7607, "step": 12797 }, { "epoch": 0.87, "learning_rate": 8.451390039007956e-07, "loss": 0.6436, "step": 12798 }, { "epoch": 0.87, "learning_rate": 8.442511368824968e-07, "loss": 0.8057, "step": 12799 }, { "epoch": 0.87, "learning_rate": 8.433637159318353e-07, "loss": 0.7256, "step": 12800 }, { "epoch": 0.87, "learning_rate": 8.424767410920464e-07, "loss": 0.7607, "step": 12801 }, { "epoch": 0.87, "learning_rate": 8.415902124063435e-07, "loss": 0.7471, "step": 12802 }, { "epoch": 0.87, "learning_rate": 8.407041299179198e-07, "loss": 0.7637, "step": 12803 }, { "epoch": 0.87, "learning_rate": 8.398184936699428e-07, "loss": 0.791, "step": 12804 }, { "epoch": 0.87, "learning_rate": 8.389333037055635e-07, "loss": 0.7461, "step": 12805 }, { "epoch": 0.87, "learning_rate": 8.380485600679078e-07, "loss": 0.7432, "step": 12806 }, { "epoch": 0.87, "learning_rate": 8.371642628000775e-07, "loss": 0.7549, "step": 12807 }, { "epoch": 0.87, "learning_rate": 8.362804119451585e-07, "loss": 0.748, "step": 12808 }, { "epoch": 0.87, "learning_rate": 8.353970075462104e-07, "loss": 0.7041, "step": 12809 }, { "epoch": 0.87, "learning_rate": 8.345140496462734e-07, "loss": 0.7666, "step": 12810 }, { "epoch": 0.87, "learning_rate": 8.336315382883642e-07, "loss": 0.7715, "step": 12811 }, { "epoch": 0.87, "learning_rate": 8.327494735154806e-07, "loss": 0.7129, "step": 12812 }, { "epoch": 0.87, "learning_rate": 8.318678553705961e-07, "loss": 0.7139, "step": 12813 }, { "epoch": 0.87, "learning_rate": 8.309866838966618e-07, "loss": 0.7891, "step": 12814 }, { "epoch": 0.87, "learning_rate": 8.301059591366067e-07, "loss": 0.7109, "step": 12815 }, { "epoch": 0.87, "learning_rate": 8.292256811333465e-07, "loss": 0.7549, "step": 12816 }, { "epoch": 0.87, "learning_rate": 8.283458499297614e-07, "loss": 0.75, "step": 12817 }, { "epoch": 0.87, "learning_rate": 8.274664655687192e-07, "loss": 0.6904, "step": 12818 }, { "epoch": 0.87, "learning_rate": 8.265875280930658e-07, "loss": 0.7324, "step": 12819 }, { "epoch": 0.87, "learning_rate": 8.257090375456178e-07, "loss": 0.8135, "step": 12820 }, { "epoch": 0.87, "learning_rate": 8.248309939691768e-07, "loss": 0.7178, "step": 12821 }, { "epoch": 0.87, "learning_rate": 8.239533974065262e-07, "loss": 0.7236, "step": 12822 }, { "epoch": 0.87, "learning_rate": 8.230762479004173e-07, "loss": 0.8516, "step": 12823 }, { "epoch": 0.87, "learning_rate": 8.221995454935849e-07, "loss": 0.7529, "step": 12824 }, { "epoch": 0.87, "learning_rate": 8.213232902287438e-07, "loss": 0.7646, "step": 12825 }, { "epoch": 0.87, "learning_rate": 8.204474821485864e-07, "loss": 0.751, "step": 12826 }, { "epoch": 0.87, "learning_rate": 8.195721212957763e-07, "loss": 0.7344, "step": 12827 }, { "epoch": 0.87, "learning_rate": 8.186972077129662e-07, "loss": 0.6885, "step": 12828 }, { "epoch": 0.87, "learning_rate": 8.17822741442782e-07, "loss": 0.7324, "step": 12829 }, { "epoch": 0.87, "learning_rate": 8.16948722527825e-07, "loss": 0.7246, "step": 12830 }, { "epoch": 0.87, "learning_rate": 8.160751510106779e-07, "loss": 0.8164, "step": 12831 }, { "epoch": 0.87, "learning_rate": 8.152020269339034e-07, "loss": 0.707, "step": 12832 }, { "epoch": 0.87, "learning_rate": 8.14329350340034e-07, "loss": 0.7676, "step": 12833 }, { "epoch": 0.87, "learning_rate": 8.134571212715936e-07, "loss": 0.7285, "step": 12834 }, { "epoch": 0.87, "learning_rate": 8.125853397710759e-07, "loss": 0.7471, "step": 12835 }, { "epoch": 0.87, "learning_rate": 8.117140058809502e-07, "loss": 0.7295, "step": 12836 }, { "epoch": 0.87, "learning_rate": 8.108431196436706e-07, "loss": 0.748, "step": 12837 }, { "epoch": 0.87, "learning_rate": 8.09972681101665e-07, "loss": 0.7363, "step": 12838 }, { "epoch": 0.87, "learning_rate": 8.091026902973431e-07, "loss": 0.7422, "step": 12839 }, { "epoch": 0.88, "learning_rate": 8.082331472730898e-07, "loss": 0.7461, "step": 12840 }, { "epoch": 0.88, "learning_rate": 8.073640520712689e-07, "loss": 0.7412, "step": 12841 }, { "epoch": 0.88, "learning_rate": 8.064954047342255e-07, "loss": 0.7686, "step": 12842 }, { "epoch": 0.88, "learning_rate": 8.056272053042757e-07, "loss": 0.7129, "step": 12843 }, { "epoch": 0.88, "learning_rate": 8.047594538237203e-07, "loss": 0.7959, "step": 12844 }, { "epoch": 0.88, "learning_rate": 8.038921503348351e-07, "loss": 0.7988, "step": 12845 }, { "epoch": 0.88, "learning_rate": 8.030252948798767e-07, "loss": 0.7285, "step": 12846 }, { "epoch": 0.88, "learning_rate": 8.021588875010766e-07, "loss": 0.7891, "step": 12847 }, { "epoch": 0.88, "learning_rate": 8.012929282406478e-07, "loss": 0.6895, "step": 12848 }, { "epoch": 0.88, "learning_rate": 8.0042741714078e-07, "loss": 0.6914, "step": 12849 }, { "epoch": 0.88, "learning_rate": 7.995623542436382e-07, "loss": 0.7461, "step": 12850 }, { "epoch": 0.88, "learning_rate": 7.986977395913697e-07, "loss": 0.7578, "step": 12851 }, { "epoch": 0.88, "learning_rate": 7.978335732260989e-07, "loss": 0.7129, "step": 12852 }, { "epoch": 0.88, "learning_rate": 7.969698551899286e-07, "loss": 0.7734, "step": 12853 }, { "epoch": 0.88, "learning_rate": 7.961065855249373e-07, "loss": 0.8115, "step": 12854 }, { "epoch": 0.88, "learning_rate": 7.952437642731859e-07, "loss": 0.6748, "step": 12855 }, { "epoch": 0.88, "learning_rate": 7.943813914767073e-07, "loss": 0.7676, "step": 12856 }, { "epoch": 0.88, "learning_rate": 7.93519467177517e-07, "loss": 0.7783, "step": 12857 }, { "epoch": 0.88, "learning_rate": 7.926579914176125e-07, "loss": 0.6895, "step": 12858 }, { "epoch": 0.88, "learning_rate": 7.9179696423896e-07, "loss": 0.7988, "step": 12859 }, { "epoch": 0.88, "learning_rate": 7.909363856835106e-07, "loss": 0.792, "step": 12860 }, { "epoch": 0.88, "learning_rate": 7.900762557931918e-07, "loss": 0.75, "step": 12861 }, { "epoch": 0.88, "learning_rate": 7.892165746099101e-07, "loss": 0.6973, "step": 12862 }, { "epoch": 0.88, "learning_rate": 7.883573421755442e-07, "loss": 0.7354, "step": 12863 }, { "epoch": 0.88, "learning_rate": 7.874985585319606e-07, "loss": 0.7559, "step": 12864 }, { "epoch": 0.88, "learning_rate": 7.866402237210003e-07, "loss": 0.8008, "step": 12865 }, { "epoch": 0.88, "learning_rate": 7.857823377844775e-07, "loss": 0.7568, "step": 12866 }, { "epoch": 0.88, "learning_rate": 7.84924900764189e-07, "loss": 0.7734, "step": 12867 }, { "epoch": 0.88, "learning_rate": 7.840679127019124e-07, "loss": 0.7139, "step": 12868 }, { "epoch": 0.88, "learning_rate": 7.832113736393943e-07, "loss": 0.7461, "step": 12869 }, { "epoch": 0.88, "learning_rate": 7.823552836183701e-07, "loss": 0.6895, "step": 12870 }, { "epoch": 0.88, "learning_rate": 7.814996426805477e-07, "loss": 0.7979, "step": 12871 }, { "epoch": 0.88, "learning_rate": 7.806444508676125e-07, "loss": 0.7275, "step": 12872 }, { "epoch": 0.88, "learning_rate": 7.797897082212303e-07, "loss": 0.8369, "step": 12873 }, { "epoch": 0.88, "learning_rate": 7.78935414783043e-07, "loss": 0.7344, "step": 12874 }, { "epoch": 0.88, "learning_rate": 7.780815705946731e-07, "loss": 0.7852, "step": 12875 }, { "epoch": 0.88, "learning_rate": 7.772281756977195e-07, "loss": 0.8193, "step": 12876 }, { "epoch": 0.88, "learning_rate": 7.76375230133759e-07, "loss": 0.7002, "step": 12877 }, { "epoch": 0.88, "learning_rate": 7.755227339443494e-07, "loss": 0.7598, "step": 12878 }, { "epoch": 0.88, "learning_rate": 7.746706871710208e-07, "loss": 0.7715, "step": 12879 }, { "epoch": 0.88, "learning_rate": 7.738190898552844e-07, "loss": 0.668, "step": 12880 }, { "epoch": 0.88, "learning_rate": 7.72967942038636e-07, "loss": 0.7129, "step": 12881 }, { "epoch": 0.88, "learning_rate": 7.721172437625368e-07, "loss": 0.6924, "step": 12882 }, { "epoch": 0.88, "learning_rate": 7.71266995068437e-07, "loss": 0.7773, "step": 12883 }, { "epoch": 0.88, "learning_rate": 7.704171959977592e-07, "loss": 0.7832, "step": 12884 }, { "epoch": 0.88, "learning_rate": 7.695678465919043e-07, "loss": 0.6963, "step": 12885 }, { "epoch": 0.88, "learning_rate": 7.687189468922529e-07, "loss": 0.7402, "step": 12886 }, { "epoch": 0.88, "learning_rate": 7.678704969401674e-07, "loss": 0.7188, "step": 12887 }, { "epoch": 0.88, "learning_rate": 7.670224967769791e-07, "loss": 0.7715, "step": 12888 }, { "epoch": 0.88, "learning_rate": 7.661749464440038e-07, "loss": 0.7529, "step": 12889 }, { "epoch": 0.88, "learning_rate": 7.653278459825352e-07, "loss": 0.7441, "step": 12890 }, { "epoch": 0.88, "learning_rate": 7.644811954338461e-07, "loss": 0.6562, "step": 12891 }, { "epoch": 0.88, "learning_rate": 7.636349948391786e-07, "loss": 0.7412, "step": 12892 }, { "epoch": 0.88, "learning_rate": 7.627892442397656e-07, "loss": 0.7305, "step": 12893 }, { "epoch": 0.88, "learning_rate": 7.619439436768116e-07, "loss": 0.7773, "step": 12894 }, { "epoch": 0.88, "learning_rate": 7.610990931914964e-07, "loss": 0.7773, "step": 12895 }, { "epoch": 0.88, "learning_rate": 7.602546928249832e-07, "loss": 0.7051, "step": 12896 }, { "epoch": 0.88, "learning_rate": 7.594107426184116e-07, "loss": 0.7295, "step": 12897 }, { "epoch": 0.88, "learning_rate": 7.585672426128965e-07, "loss": 0.7529, "step": 12898 }, { "epoch": 0.88, "learning_rate": 7.577241928495349e-07, "loss": 0.6963, "step": 12899 }, { "epoch": 0.88, "learning_rate": 7.568815933694007e-07, "loss": 0.708, "step": 12900 }, { "epoch": 0.88, "learning_rate": 7.560394442135455e-07, "loss": 0.7705, "step": 12901 }, { "epoch": 0.88, "learning_rate": 7.551977454229964e-07, "loss": 0.8076, "step": 12902 }, { "epoch": 0.88, "learning_rate": 7.543564970387629e-07, "loss": 0.7754, "step": 12903 }, { "epoch": 0.88, "learning_rate": 7.535156991018289e-07, "loss": 0.7031, "step": 12904 }, { "epoch": 0.88, "learning_rate": 7.526753516531593e-07, "loss": 0.8008, "step": 12905 }, { "epoch": 0.88, "learning_rate": 7.518354547336959e-07, "loss": 0.709, "step": 12906 }, { "epoch": 0.88, "learning_rate": 7.509960083843604e-07, "loss": 0.7568, "step": 12907 }, { "epoch": 0.88, "learning_rate": 7.501570126460455e-07, "loss": 0.8037, "step": 12908 }, { "epoch": 0.88, "learning_rate": 7.49318467559631e-07, "loss": 0.7988, "step": 12909 }, { "epoch": 0.88, "learning_rate": 7.484803731659684e-07, "loss": 0.7266, "step": 12910 }, { "epoch": 0.88, "learning_rate": 7.476427295058918e-07, "loss": 0.7041, "step": 12911 }, { "epoch": 0.88, "learning_rate": 7.468055366202099e-07, "loss": 0.7988, "step": 12912 }, { "epoch": 0.88, "learning_rate": 7.459687945497118e-07, "loss": 0.7627, "step": 12913 }, { "epoch": 0.88, "learning_rate": 7.45132503335163e-07, "loss": 0.751, "step": 12914 }, { "epoch": 0.88, "learning_rate": 7.442966630173066e-07, "loss": 0.7529, "step": 12915 }, { "epoch": 0.88, "learning_rate": 7.43461273636863e-07, "loss": 0.7676, "step": 12916 }, { "epoch": 0.88, "learning_rate": 7.426263352345387e-07, "loss": 0.7939, "step": 12917 }, { "epoch": 0.88, "learning_rate": 7.417918478510067e-07, "loss": 0.7764, "step": 12918 }, { "epoch": 0.88, "learning_rate": 7.409578115269234e-07, "loss": 0.7793, "step": 12919 }, { "epoch": 0.88, "learning_rate": 7.401242263029262e-07, "loss": 0.8037, "step": 12920 }, { "epoch": 0.88, "learning_rate": 7.392910922196228e-07, "loss": 0.748, "step": 12921 }, { "epoch": 0.88, "learning_rate": 7.384584093176051e-07, "loss": 0.7979, "step": 12922 }, { "epoch": 0.88, "learning_rate": 7.376261776374438e-07, "loss": 0.8467, "step": 12923 }, { "epoch": 0.88, "learning_rate": 7.367943972196834e-07, "loss": 0.6846, "step": 12924 }, { "epoch": 0.88, "learning_rate": 7.35963068104848e-07, "loss": 0.7344, "step": 12925 }, { "epoch": 0.88, "learning_rate": 7.351321903334397e-07, "loss": 0.7158, "step": 12926 }, { "epoch": 0.88, "learning_rate": 7.343017639459404e-07, "loss": 0.7236, "step": 12927 }, { "epoch": 0.88, "learning_rate": 7.334717889828047e-07, "loss": 0.707, "step": 12928 }, { "epoch": 0.88, "learning_rate": 7.326422654844734e-07, "loss": 0.7041, "step": 12929 }, { "epoch": 0.88, "learning_rate": 7.318131934913597e-07, "loss": 0.7891, "step": 12930 }, { "epoch": 0.88, "learning_rate": 7.309845730438547e-07, "loss": 0.7129, "step": 12931 }, { "epoch": 0.88, "learning_rate": 7.301564041823283e-07, "loss": 0.7354, "step": 12932 }, { "epoch": 0.88, "learning_rate": 7.293286869471306e-07, "loss": 0.7139, "step": 12933 }, { "epoch": 0.88, "learning_rate": 7.285014213785868e-07, "loss": 0.7188, "step": 12934 }, { "epoch": 0.88, "learning_rate": 7.276746075170016e-07, "loss": 0.666, "step": 12935 }, { "epoch": 0.88, "learning_rate": 7.268482454026571e-07, "loss": 0.6982, "step": 12936 }, { "epoch": 0.88, "learning_rate": 7.260223350758167e-07, "loss": 0.7598, "step": 12937 }, { "epoch": 0.88, "learning_rate": 7.251968765767126e-07, "loss": 0.7637, "step": 12938 }, { "epoch": 0.88, "learning_rate": 7.24371869945566e-07, "loss": 0.7773, "step": 12939 }, { "epoch": 0.88, "learning_rate": 7.23547315222568e-07, "loss": 0.6943, "step": 12940 }, { "epoch": 0.88, "learning_rate": 7.227232124478933e-07, "loss": 0.7412, "step": 12941 }, { "epoch": 0.88, "learning_rate": 7.218995616616908e-07, "loss": 0.7236, "step": 12942 }, { "epoch": 0.88, "learning_rate": 7.210763629040918e-07, "loss": 0.7363, "step": 12943 }, { "epoch": 0.88, "learning_rate": 7.202536162151974e-07, "loss": 0.751, "step": 12944 }, { "epoch": 0.88, "learning_rate": 7.194313216350946e-07, "loss": 0.7969, "step": 12945 }, { "epoch": 0.88, "learning_rate": 7.186094792038445e-07, "loss": 0.7305, "step": 12946 }, { "epoch": 0.88, "learning_rate": 7.177880889614885e-07, "loss": 0.7969, "step": 12947 }, { "epoch": 0.88, "learning_rate": 7.169671509480447e-07, "loss": 0.6846, "step": 12948 }, { "epoch": 0.88, "learning_rate": 7.161466652035076e-07, "loss": 0.8066, "step": 12949 }, { "epoch": 0.88, "learning_rate": 7.153266317678542e-07, "loss": 0.6777, "step": 12950 }, { "epoch": 0.88, "learning_rate": 7.145070506810336e-07, "loss": 0.708, "step": 12951 }, { "epoch": 0.88, "learning_rate": 7.13687921982974e-07, "loss": 0.7334, "step": 12952 }, { "epoch": 0.88, "learning_rate": 7.128692457135899e-07, "loss": 0.7578, "step": 12953 }, { "epoch": 0.88, "learning_rate": 7.120510219127619e-07, "loss": 0.6797, "step": 12954 }, { "epoch": 0.88, "learning_rate": 7.112332506203545e-07, "loss": 0.7383, "step": 12955 }, { "epoch": 0.88, "learning_rate": 7.104159318762116e-07, "loss": 0.7148, "step": 12956 }, { "epoch": 0.88, "learning_rate": 7.095990657201501e-07, "loss": 0.7461, "step": 12957 }, { "epoch": 0.88, "learning_rate": 7.087826521919683e-07, "loss": 0.792, "step": 12958 }, { "epoch": 0.88, "learning_rate": 7.079666913314442e-07, "loss": 0.7793, "step": 12959 }, { "epoch": 0.88, "learning_rate": 7.071511831783296e-07, "loss": 0.6572, "step": 12960 }, { "epoch": 0.88, "learning_rate": 7.063361277723558e-07, "loss": 0.7246, "step": 12961 }, { "epoch": 0.88, "learning_rate": 7.055215251532322e-07, "loss": 0.7139, "step": 12962 }, { "epoch": 0.88, "learning_rate": 7.047073753606482e-07, "loss": 0.7031, "step": 12963 }, { "epoch": 0.88, "learning_rate": 7.038936784342654e-07, "loss": 0.7061, "step": 12964 }, { "epoch": 0.88, "learning_rate": 7.030804344137299e-07, "loss": 0.7559, "step": 12965 }, { "epoch": 0.88, "learning_rate": 7.022676433386632e-07, "loss": 0.7412, "step": 12966 }, { "epoch": 0.88, "learning_rate": 7.014553052486628e-07, "loss": 0.8125, "step": 12967 }, { "epoch": 0.88, "learning_rate": 7.006434201833068e-07, "loss": 0.7607, "step": 12968 }, { "epoch": 0.88, "learning_rate": 6.998319881821492e-07, "loss": 0.7988, "step": 12969 }, { "epoch": 0.88, "learning_rate": 6.990210092847239e-07, "loss": 0.7578, "step": 12970 }, { "epoch": 0.88, "learning_rate": 6.982104835305415e-07, "loss": 0.7988, "step": 12971 }, { "epoch": 0.88, "learning_rate": 6.974004109590926e-07, "loss": 0.7627, "step": 12972 }, { "epoch": 0.88, "learning_rate": 6.965907916098402e-07, "loss": 0.7402, "step": 12973 }, { "epoch": 0.88, "learning_rate": 6.957816255222305e-07, "loss": 0.7822, "step": 12974 }, { "epoch": 0.88, "learning_rate": 6.949729127356863e-07, "loss": 0.7588, "step": 12975 }, { "epoch": 0.88, "learning_rate": 6.941646532896085e-07, "loss": 0.7617, "step": 12976 }, { "epoch": 0.88, "learning_rate": 6.933568472233743e-07, "loss": 0.7402, "step": 12977 }, { "epoch": 0.88, "learning_rate": 6.925494945763411e-07, "loss": 0.7588, "step": 12978 }, { "epoch": 0.88, "learning_rate": 6.917425953878432e-07, "loss": 0.7109, "step": 12979 }, { "epoch": 0.88, "learning_rate": 6.909361496971923e-07, "loss": 0.7246, "step": 12980 }, { "epoch": 0.88, "learning_rate": 6.90130157543677e-07, "loss": 0.6582, "step": 12981 }, { "epoch": 0.88, "learning_rate": 6.89324618966567e-07, "loss": 0.7852, "step": 12982 }, { "epoch": 0.88, "learning_rate": 6.885195340051065e-07, "loss": 0.7441, "step": 12983 }, { "epoch": 0.88, "learning_rate": 6.877149026985208e-07, "loss": 0.7227, "step": 12984 }, { "epoch": 0.88, "learning_rate": 6.869107250860118e-07, "loss": 0.7646, "step": 12985 }, { "epoch": 0.88, "learning_rate": 6.861070012067583e-07, "loss": 0.7959, "step": 12986 }, { "epoch": 0.89, "learning_rate": 6.853037310999167e-07, "loss": 0.7715, "step": 12987 }, { "epoch": 0.89, "learning_rate": 6.845009148046211e-07, "loss": 0.7861, "step": 12988 }, { "epoch": 0.89, "learning_rate": 6.836985523599904e-07, "loss": 0.7061, "step": 12989 }, { "epoch": 0.89, "learning_rate": 6.828966438051099e-07, "loss": 0.6777, "step": 12990 }, { "epoch": 0.89, "learning_rate": 6.820951891790506e-07, "loss": 0.7607, "step": 12991 }, { "epoch": 0.89, "learning_rate": 6.812941885208612e-07, "loss": 0.7598, "step": 12992 }, { "epoch": 0.89, "learning_rate": 6.804936418695629e-07, "loss": 0.791, "step": 12993 }, { "epoch": 0.89, "learning_rate": 6.796935492641576e-07, "loss": 0.7285, "step": 12994 }, { "epoch": 0.89, "learning_rate": 6.78893910743631e-07, "loss": 0.7529, "step": 12995 }, { "epoch": 0.89, "learning_rate": 6.780947263469384e-07, "loss": 0.7637, "step": 12996 }, { "epoch": 0.89, "learning_rate": 6.772959961130154e-07, "loss": 0.6826, "step": 12997 }, { "epoch": 0.89, "learning_rate": 6.764977200807765e-07, "loss": 0.6182, "step": 12998 }, { "epoch": 0.89, "learning_rate": 6.756998982891161e-07, "loss": 0.7285, "step": 12999 }, { "epoch": 0.89, "learning_rate": 6.749025307768975e-07, "loss": 0.7588, "step": 13000 }, { "epoch": 0.89, "learning_rate": 6.741056175829763e-07, "loss": 0.7646, "step": 13001 }, { "epoch": 0.89, "learning_rate": 6.733091587461749e-07, "loss": 0.7334, "step": 13002 }, { "epoch": 0.89, "learning_rate": 6.725131543052954e-07, "loss": 0.7812, "step": 13003 }, { "epoch": 0.89, "learning_rate": 6.717176042991202e-07, "loss": 0.7666, "step": 13004 }, { "epoch": 0.89, "learning_rate": 6.709225087664085e-07, "loss": 0.7383, "step": 13005 }, { "epoch": 0.89, "learning_rate": 6.701278677458967e-07, "loss": 0.7529, "step": 13006 }, { "epoch": 0.89, "learning_rate": 6.693336812762996e-07, "loss": 0.749, "step": 13007 }, { "epoch": 0.89, "learning_rate": 6.68539949396313e-07, "loss": 0.7734, "step": 13008 }, { "epoch": 0.89, "learning_rate": 6.677466721446035e-07, "loss": 0.668, "step": 13009 }, { "epoch": 0.89, "learning_rate": 6.669538495598216e-07, "loss": 0.8291, "step": 13010 }, { "epoch": 0.89, "learning_rate": 6.661614816805917e-07, "loss": 0.7881, "step": 13011 }, { "epoch": 0.89, "learning_rate": 6.653695685455197e-07, "loss": 0.7725, "step": 13012 }, { "epoch": 0.89, "learning_rate": 6.645781101931881e-07, "loss": 0.7227, "step": 13013 }, { "epoch": 0.89, "learning_rate": 6.637871066621548e-07, "loss": 0.7568, "step": 13014 }, { "epoch": 0.89, "learning_rate": 6.629965579909591e-07, "loss": 0.6553, "step": 13015 }, { "epoch": 0.89, "learning_rate": 6.622064642181159e-07, "loss": 0.7217, "step": 13016 }, { "epoch": 0.89, "learning_rate": 6.614168253821162e-07, "loss": 0.8027, "step": 13017 }, { "epoch": 0.89, "learning_rate": 6.606276415214363e-07, "loss": 0.7725, "step": 13018 }, { "epoch": 0.89, "learning_rate": 6.598389126745209e-07, "loss": 0.7266, "step": 13019 }, { "epoch": 0.89, "learning_rate": 6.590506388797979e-07, "loss": 0.7109, "step": 13020 }, { "epoch": 0.89, "learning_rate": 6.582628201756724e-07, "loss": 0.7646, "step": 13021 }, { "epoch": 0.89, "learning_rate": 6.574754566005281e-07, "loss": 0.832, "step": 13022 }, { "epoch": 0.89, "learning_rate": 6.56688548192721e-07, "loss": 0.7148, "step": 13023 }, { "epoch": 0.89, "learning_rate": 6.559020949905948e-07, "loss": 0.792, "step": 13024 }, { "epoch": 0.89, "learning_rate": 6.551160970324621e-07, "loss": 0.7295, "step": 13025 }, { "epoch": 0.89, "learning_rate": 6.54330554356617e-07, "loss": 0.7178, "step": 13026 }, { "epoch": 0.89, "learning_rate": 6.535454670013319e-07, "loss": 0.7695, "step": 13027 }, { "epoch": 0.89, "learning_rate": 6.527608350048564e-07, "loss": 0.7402, "step": 13028 }, { "epoch": 0.89, "learning_rate": 6.519766584054155e-07, "loss": 0.7529, "step": 13029 }, { "epoch": 0.89, "learning_rate": 6.511929372412163e-07, "loss": 0.7939, "step": 13030 }, { "epoch": 0.89, "learning_rate": 6.504096715504438e-07, "loss": 0.75, "step": 13031 }, { "epoch": 0.89, "learning_rate": 6.496268613712541e-07, "loss": 0.6738, "step": 13032 }, { "epoch": 0.89, "learning_rate": 6.488445067417881e-07, "loss": 0.7178, "step": 13033 }, { "epoch": 0.89, "learning_rate": 6.480626077001606e-07, "loss": 0.7793, "step": 13034 }, { "epoch": 0.89, "learning_rate": 6.472811642844679e-07, "loss": 0.6768, "step": 13035 }, { "epoch": 0.89, "learning_rate": 6.465001765327805e-07, "loss": 0.7676, "step": 13036 }, { "epoch": 0.89, "learning_rate": 6.457196444831481e-07, "loss": 0.6768, "step": 13037 }, { "epoch": 0.89, "learning_rate": 6.449395681736004e-07, "loss": 0.7842, "step": 13038 }, { "epoch": 0.89, "learning_rate": 6.441599476421389e-07, "loss": 0.6787, "step": 13039 }, { "epoch": 0.89, "learning_rate": 6.433807829267491e-07, "loss": 0.6904, "step": 13040 }, { "epoch": 0.89, "learning_rate": 6.426020740653904e-07, "loss": 0.6982, "step": 13041 }, { "epoch": 0.89, "learning_rate": 6.418238210960026e-07, "loss": 0.7256, "step": 13042 }, { "epoch": 0.89, "learning_rate": 6.410460240565019e-07, "loss": 0.7295, "step": 13043 }, { "epoch": 0.89, "learning_rate": 6.402686829847837e-07, "loss": 0.7451, "step": 13044 }, { "epoch": 0.89, "learning_rate": 6.394917979187176e-07, "loss": 0.7871, "step": 13045 }, { "epoch": 0.89, "learning_rate": 6.387153688961556e-07, "loss": 0.7119, "step": 13046 }, { "epoch": 0.89, "learning_rate": 6.37939395954923e-07, "loss": 0.7754, "step": 13047 }, { "epoch": 0.89, "learning_rate": 6.371638791328272e-07, "loss": 0.7363, "step": 13048 }, { "epoch": 0.89, "learning_rate": 6.363888184676503e-07, "loss": 0.7314, "step": 13049 }, { "epoch": 0.89, "learning_rate": 6.356142139971533e-07, "loss": 0.7637, "step": 13050 }, { "epoch": 0.89, "learning_rate": 6.34840065759077e-07, "loss": 0.7178, "step": 13051 }, { "epoch": 0.89, "learning_rate": 6.340663737911334e-07, "loss": 0.7744, "step": 13052 }, { "epoch": 0.89, "learning_rate": 6.332931381310192e-07, "loss": 0.6846, "step": 13053 }, { "epoch": 0.89, "learning_rate": 6.325203588164097e-07, "loss": 0.7754, "step": 13054 }, { "epoch": 0.89, "learning_rate": 6.317480358849493e-07, "loss": 0.7744, "step": 13055 }, { "epoch": 0.89, "learning_rate": 6.309761693742678e-07, "loss": 0.7588, "step": 13056 }, { "epoch": 0.89, "learning_rate": 6.302047593219695e-07, "loss": 0.748, "step": 13057 }, { "epoch": 0.89, "learning_rate": 6.294338057656413e-07, "loss": 0.7451, "step": 13058 }, { "epoch": 0.89, "learning_rate": 6.286633087428373e-07, "loss": 0.6963, "step": 13059 }, { "epoch": 0.89, "learning_rate": 6.278932682911032e-07, "loss": 0.7031, "step": 13060 }, { "epoch": 0.89, "learning_rate": 6.271236844479511e-07, "loss": 0.7734, "step": 13061 }, { "epoch": 0.89, "learning_rate": 6.263545572508755e-07, "loss": 0.7451, "step": 13062 }, { "epoch": 0.89, "learning_rate": 6.255858867373488e-07, "loss": 0.8027, "step": 13063 }, { "epoch": 0.89, "learning_rate": 6.248176729448219e-07, "loss": 0.7588, "step": 13064 }, { "epoch": 0.89, "learning_rate": 6.240499159107183e-07, "loss": 0.8242, "step": 13065 }, { "epoch": 0.89, "learning_rate": 6.232826156724459e-07, "loss": 0.7607, "step": 13066 }, { "epoch": 0.89, "learning_rate": 6.225157722673891e-07, "loss": 0.7305, "step": 13067 }, { "epoch": 0.89, "learning_rate": 6.21749385732906e-07, "loss": 0.7051, "step": 13068 }, { "epoch": 0.89, "learning_rate": 6.209834561063344e-07, "loss": 0.71, "step": 13069 }, { "epoch": 0.89, "learning_rate": 6.202179834249921e-07, "loss": 0.7568, "step": 13070 }, { "epoch": 0.89, "learning_rate": 6.194529677261718e-07, "loss": 0.8076, "step": 13071 }, { "epoch": 0.89, "learning_rate": 6.186884090471456e-07, "loss": 0.708, "step": 13072 }, { "epoch": 0.89, "learning_rate": 6.179243074251628e-07, "loss": 0.7539, "step": 13073 }, { "epoch": 0.89, "learning_rate": 6.171606628974513e-07, "loss": 0.7402, "step": 13074 }, { "epoch": 0.89, "learning_rate": 6.163974755012136e-07, "loss": 0.7588, "step": 13075 }, { "epoch": 0.89, "learning_rate": 6.156347452736333e-07, "loss": 0.7412, "step": 13076 }, { "epoch": 0.89, "learning_rate": 6.148724722518707e-07, "loss": 0.7471, "step": 13077 }, { "epoch": 0.89, "learning_rate": 6.141106564730636e-07, "loss": 0.7686, "step": 13078 }, { "epoch": 0.89, "learning_rate": 6.133492979743272e-07, "loss": 0.7168, "step": 13079 }, { "epoch": 0.89, "learning_rate": 6.125883967927571e-07, "loss": 0.7871, "step": 13080 }, { "epoch": 0.89, "learning_rate": 6.118279529654203e-07, "loss": 0.7568, "step": 13081 }, { "epoch": 0.89, "learning_rate": 6.110679665293684e-07, "loss": 0.7725, "step": 13082 }, { "epoch": 0.89, "learning_rate": 6.103084375216273e-07, "loss": 0.8311, "step": 13083 }, { "epoch": 0.89, "learning_rate": 6.095493659792018e-07, "loss": 0.7676, "step": 13084 }, { "epoch": 0.89, "learning_rate": 6.087907519390723e-07, "loss": 0.791, "step": 13085 }, { "epoch": 0.89, "learning_rate": 6.080325954381994e-07, "loss": 0.6748, "step": 13086 }, { "epoch": 0.89, "learning_rate": 6.072748965135222e-07, "loss": 0.6943, "step": 13087 }, { "epoch": 0.89, "learning_rate": 6.065176552019525e-07, "loss": 0.7412, "step": 13088 }, { "epoch": 0.89, "learning_rate": 6.057608715403829e-07, "loss": 0.7207, "step": 13089 }, { "epoch": 0.89, "learning_rate": 6.050045455656895e-07, "loss": 0.7363, "step": 13090 }, { "epoch": 0.89, "learning_rate": 6.042486773147139e-07, "loss": 0.8311, "step": 13091 }, { "epoch": 0.89, "learning_rate": 6.034932668242843e-07, "loss": 0.7559, "step": 13092 }, { "epoch": 0.89, "learning_rate": 6.027383141312071e-07, "loss": 0.7939, "step": 13093 }, { "epoch": 0.89, "learning_rate": 6.019838192722583e-07, "loss": 0.7275, "step": 13094 }, { "epoch": 0.89, "learning_rate": 6.012297822841984e-07, "loss": 0.8076, "step": 13095 }, { "epoch": 0.89, "learning_rate": 6.00476203203768e-07, "loss": 0.6689, "step": 13096 }, { "epoch": 0.89, "learning_rate": 5.997230820676781e-07, "loss": 0.833, "step": 13097 }, { "epoch": 0.89, "learning_rate": 5.989704189126199e-07, "loss": 0.71, "step": 13098 }, { "epoch": 0.89, "learning_rate": 5.982182137752657e-07, "loss": 0.7441, "step": 13099 }, { "epoch": 0.89, "learning_rate": 5.974664666922625e-07, "loss": 0.7627, "step": 13100 }, { "epoch": 0.89, "learning_rate": 5.967151777002312e-07, "loss": 0.752, "step": 13101 }, { "epoch": 0.89, "learning_rate": 5.9596434683578e-07, "loss": 0.7314, "step": 13102 }, { "epoch": 0.89, "learning_rate": 5.95213974135489e-07, "loss": 0.6885, "step": 13103 }, { "epoch": 0.89, "learning_rate": 5.944640596359119e-07, "loss": 0.6924, "step": 13104 }, { "epoch": 0.89, "learning_rate": 5.937146033735874e-07, "loss": 0.8057, "step": 13105 }, { "epoch": 0.89, "learning_rate": 5.929656053850297e-07, "loss": 0.7422, "step": 13106 }, { "epoch": 0.89, "learning_rate": 5.922170657067283e-07, "loss": 0.7217, "step": 13107 }, { "epoch": 0.89, "learning_rate": 5.91468984375152e-07, "loss": 0.7646, "step": 13108 }, { "epoch": 0.89, "learning_rate": 5.907213614267493e-07, "loss": 0.7764, "step": 13109 }, { "epoch": 0.89, "learning_rate": 5.899741968979433e-07, "loss": 0.7344, "step": 13110 }, { "epoch": 0.89, "learning_rate": 5.89227490825135e-07, "loss": 0.8105, "step": 13111 }, { "epoch": 0.89, "learning_rate": 5.88481243244704e-07, "loss": 0.7441, "step": 13112 }, { "epoch": 0.89, "learning_rate": 5.877354541930069e-07, "loss": 0.7412, "step": 13113 }, { "epoch": 0.89, "learning_rate": 5.869901237063813e-07, "loss": 0.6904, "step": 13114 }, { "epoch": 0.89, "learning_rate": 5.862452518211359e-07, "loss": 0.7266, "step": 13115 }, { "epoch": 0.89, "learning_rate": 5.85500838573566e-07, "loss": 0.7373, "step": 13116 }, { "epoch": 0.89, "learning_rate": 5.84756883999934e-07, "loss": 0.7822, "step": 13117 }, { "epoch": 0.89, "learning_rate": 5.840133881364873e-07, "loss": 0.7275, "step": 13118 }, { "epoch": 0.89, "learning_rate": 5.832703510194493e-07, "loss": 0.7871, "step": 13119 }, { "epoch": 0.89, "learning_rate": 5.825277726850198e-07, "loss": 0.7412, "step": 13120 }, { "epoch": 0.89, "learning_rate": 5.817856531693789e-07, "loss": 0.71, "step": 13121 }, { "epoch": 0.89, "learning_rate": 5.81043992508682e-07, "loss": 0.7324, "step": 13122 }, { "epoch": 0.89, "learning_rate": 5.803027907390623e-07, "loss": 0.7432, "step": 13123 }, { "epoch": 0.89, "learning_rate": 5.795620478966302e-07, "loss": 0.7715, "step": 13124 }, { "epoch": 0.89, "learning_rate": 5.788217640174764e-07, "loss": 0.7559, "step": 13125 }, { "epoch": 0.89, "learning_rate": 5.78081939137668e-07, "loss": 0.7812, "step": 13126 }, { "epoch": 0.89, "learning_rate": 5.77342573293247e-07, "loss": 0.8213, "step": 13127 }, { "epoch": 0.89, "learning_rate": 5.766036665202356e-07, "loss": 0.7715, "step": 13128 }, { "epoch": 0.89, "learning_rate": 5.758652188546365e-07, "loss": 0.7119, "step": 13129 }, { "epoch": 0.89, "learning_rate": 5.751272303324207e-07, "loss": 0.7129, "step": 13130 }, { "epoch": 0.89, "learning_rate": 5.743897009895482e-07, "loss": 0.7969, "step": 13131 }, { "epoch": 0.89, "learning_rate": 5.736526308619516e-07, "loss": 0.8047, "step": 13132 }, { "epoch": 0.89, "learning_rate": 5.729160199855377e-07, "loss": 0.7451, "step": 13133 }, { "epoch": 0.9, "learning_rate": 5.721798683961955e-07, "loss": 0.7109, "step": 13134 }, { "epoch": 0.9, "learning_rate": 5.714441761297906e-07, "loss": 0.7539, "step": 13135 }, { "epoch": 0.9, "learning_rate": 5.707089432221646e-07, "loss": 0.7275, "step": 13136 }, { "epoch": 0.9, "learning_rate": 5.699741697091398e-07, "loss": 0.7939, "step": 13137 }, { "epoch": 0.9, "learning_rate": 5.692398556265133e-07, "loss": 0.7822, "step": 13138 }, { "epoch": 0.9, "learning_rate": 5.68506001010063e-07, "loss": 0.7266, "step": 13139 }, { "epoch": 0.9, "learning_rate": 5.677726058955391e-07, "loss": 0.7559, "step": 13140 }, { "epoch": 0.9, "learning_rate": 5.670396703186731e-07, "loss": 0.7041, "step": 13141 }, { "epoch": 0.9, "learning_rate": 5.663071943151743e-07, "loss": 0.7695, "step": 13142 }, { "epoch": 0.9, "learning_rate": 5.655751779207297e-07, "loss": 0.6943, "step": 13143 }, { "epoch": 0.9, "learning_rate": 5.648436211710018e-07, "loss": 0.6475, "step": 13144 }, { "epoch": 0.9, "learning_rate": 5.641125241016344e-07, "loss": 0.7988, "step": 13145 }, { "epoch": 0.9, "learning_rate": 5.633818867482432e-07, "loss": 0.7383, "step": 13146 }, { "epoch": 0.9, "learning_rate": 5.626517091464268e-07, "loss": 0.7578, "step": 13147 }, { "epoch": 0.9, "learning_rate": 5.619219913317575e-07, "loss": 0.7627, "step": 13148 }, { "epoch": 0.9, "learning_rate": 5.611927333397893e-07, "loss": 0.7871, "step": 13149 }, { "epoch": 0.9, "learning_rate": 5.604639352060504e-07, "loss": 0.7676, "step": 13150 }, { "epoch": 0.9, "learning_rate": 5.59735596966049e-07, "loss": 0.6533, "step": 13151 }, { "epoch": 0.9, "learning_rate": 5.5900771865527e-07, "loss": 0.7764, "step": 13152 }, { "epoch": 0.9, "learning_rate": 5.58280300309173e-07, "loss": 0.6992, "step": 13153 }, { "epoch": 0.9, "learning_rate": 5.575533419631984e-07, "loss": 0.7461, "step": 13154 }, { "epoch": 0.9, "learning_rate": 5.568268436527669e-07, "loss": 0.7236, "step": 13155 }, { "epoch": 0.9, "learning_rate": 5.561008054132699e-07, "loss": 0.7061, "step": 13156 }, { "epoch": 0.9, "learning_rate": 5.553752272800805e-07, "loss": 0.8096, "step": 13157 }, { "epoch": 0.9, "learning_rate": 5.546501092885504e-07, "loss": 0.7158, "step": 13158 }, { "epoch": 0.9, "learning_rate": 5.539254514740066e-07, "loss": 0.7627, "step": 13159 }, { "epoch": 0.9, "learning_rate": 5.532012538717524e-07, "loss": 0.7568, "step": 13160 }, { "epoch": 0.9, "learning_rate": 5.524775165170737e-07, "loss": 0.8135, "step": 13161 }, { "epoch": 0.9, "learning_rate": 5.517542394452302e-07, "loss": 0.834, "step": 13162 }, { "epoch": 0.9, "learning_rate": 5.510314226914593e-07, "loss": 0.8311, "step": 13163 }, { "epoch": 0.9, "learning_rate": 5.503090662909749e-07, "loss": 0.6914, "step": 13164 }, { "epoch": 0.9, "learning_rate": 5.495871702789746e-07, "loss": 0.6377, "step": 13165 }, { "epoch": 0.9, "learning_rate": 5.488657346906234e-07, "loss": 0.7344, "step": 13166 }, { "epoch": 0.9, "learning_rate": 5.481447595610745e-07, "loss": 0.793, "step": 13167 }, { "epoch": 0.9, "learning_rate": 5.47424244925453e-07, "loss": 0.7686, "step": 13168 }, { "epoch": 0.9, "learning_rate": 5.467041908188608e-07, "loss": 0.7139, "step": 13169 }, { "epoch": 0.9, "learning_rate": 5.459845972763777e-07, "loss": 0.7344, "step": 13170 }, { "epoch": 0.9, "learning_rate": 5.452654643330657e-07, "loss": 0.8291, "step": 13171 }, { "epoch": 0.9, "learning_rate": 5.445467920239577e-07, "loss": 0.7637, "step": 13172 }, { "epoch": 0.9, "learning_rate": 5.438285803840704e-07, "loss": 0.7314, "step": 13173 }, { "epoch": 0.9, "learning_rate": 5.431108294483922e-07, "loss": 0.7109, "step": 13174 }, { "epoch": 0.9, "learning_rate": 5.423935392518953e-07, "loss": 0.7754, "step": 13175 }, { "epoch": 0.9, "learning_rate": 5.416767098295228e-07, "loss": 0.7354, "step": 13176 }, { "epoch": 0.9, "learning_rate": 5.40960341216199e-07, "loss": 0.7266, "step": 13177 }, { "epoch": 0.9, "learning_rate": 5.402444334468259e-07, "loss": 0.7393, "step": 13178 }, { "epoch": 0.9, "learning_rate": 5.395289865562836e-07, "loss": 0.7178, "step": 13179 }, { "epoch": 0.9, "learning_rate": 5.388140005794274e-07, "loss": 0.7051, "step": 13180 }, { "epoch": 0.9, "learning_rate": 5.380994755510926e-07, "loss": 0.7969, "step": 13181 }, { "epoch": 0.9, "learning_rate": 5.373854115060894e-07, "loss": 0.6797, "step": 13182 }, { "epoch": 0.9, "learning_rate": 5.366718084792067e-07, "loss": 0.7725, "step": 13183 }, { "epoch": 0.9, "learning_rate": 5.35958666505213e-07, "loss": 0.75, "step": 13184 }, { "epoch": 0.9, "learning_rate": 5.352459856188508e-07, "loss": 0.7881, "step": 13185 }, { "epoch": 0.9, "learning_rate": 5.345337658548422e-07, "loss": 0.7363, "step": 13186 }, { "epoch": 0.9, "learning_rate": 5.338220072478872e-07, "loss": 0.708, "step": 13187 }, { "epoch": 0.9, "learning_rate": 5.331107098326649e-07, "loss": 0.71, "step": 13188 }, { "epoch": 0.9, "learning_rate": 5.323998736438241e-07, "loss": 0.7158, "step": 13189 }, { "epoch": 0.9, "learning_rate": 5.316894987159993e-07, "loss": 0.7393, "step": 13190 }, { "epoch": 0.9, "learning_rate": 5.309795850838028e-07, "loss": 0.7256, "step": 13191 }, { "epoch": 0.9, "learning_rate": 5.302701327818183e-07, "loss": 0.7607, "step": 13192 }, { "epoch": 0.9, "learning_rate": 5.295611418446111e-07, "loss": 0.6846, "step": 13193 }, { "epoch": 0.9, "learning_rate": 5.288526123067228e-07, "loss": 0.7832, "step": 13194 }, { "epoch": 0.9, "learning_rate": 5.281445442026744e-07, "loss": 0.7002, "step": 13195 }, { "epoch": 0.9, "learning_rate": 5.274369375669597e-07, "loss": 0.7139, "step": 13196 }, { "epoch": 0.9, "learning_rate": 5.267297924340565e-07, "loss": 0.8574, "step": 13197 }, { "epoch": 0.9, "learning_rate": 5.260231088384171e-07, "loss": 0.6846, "step": 13198 }, { "epoch": 0.9, "learning_rate": 5.253168868144687e-07, "loss": 0.7637, "step": 13199 }, { "epoch": 0.9, "learning_rate": 5.246111263966203e-07, "loss": 0.6924, "step": 13200 }, { "epoch": 0.9, "learning_rate": 5.239058276192566e-07, "loss": 0.7705, "step": 13201 }, { "epoch": 0.9, "learning_rate": 5.232009905167356e-07, "loss": 0.8223, "step": 13202 }, { "epoch": 0.9, "learning_rate": 5.224966151234012e-07, "loss": 0.7588, "step": 13203 }, { "epoch": 0.9, "learning_rate": 5.217927014735724e-07, "loss": 0.7549, "step": 13204 }, { "epoch": 0.9, "learning_rate": 5.210892496015385e-07, "loss": 0.7793, "step": 13205 }, { "epoch": 0.9, "learning_rate": 5.203862595415743e-07, "loss": 0.7891, "step": 13206 }, { "epoch": 0.9, "learning_rate": 5.196837313279291e-07, "loss": 0.8232, "step": 13207 }, { "epoch": 0.9, "learning_rate": 5.189816649948309e-07, "loss": 0.6377, "step": 13208 }, { "epoch": 0.9, "learning_rate": 5.182800605764826e-07, "loss": 0.6455, "step": 13209 }, { "epoch": 0.9, "learning_rate": 5.175789181070678e-07, "loss": 0.7471, "step": 13210 }, { "epoch": 0.9, "learning_rate": 5.168782376207471e-07, "loss": 0.8174, "step": 13211 }, { "epoch": 0.9, "learning_rate": 5.161780191516552e-07, "loss": 0.7256, "step": 13212 }, { "epoch": 0.9, "learning_rate": 5.154782627339073e-07, "loss": 0.6816, "step": 13213 }, { "epoch": 0.9, "learning_rate": 5.147789684015958e-07, "loss": 0.7363, "step": 13214 }, { "epoch": 0.9, "learning_rate": 5.140801361887903e-07, "loss": 0.7754, "step": 13215 }, { "epoch": 0.9, "learning_rate": 5.133817661295382e-07, "loss": 0.7764, "step": 13216 }, { "epoch": 0.9, "learning_rate": 5.126838582578653e-07, "loss": 0.6631, "step": 13217 }, { "epoch": 0.9, "learning_rate": 5.119864126077711e-07, "loss": 0.8213, "step": 13218 }, { "epoch": 0.9, "learning_rate": 5.112894292132365e-07, "loss": 0.7793, "step": 13219 }, { "epoch": 0.9, "learning_rate": 5.105929081082173e-07, "loss": 0.7021, "step": 13220 }, { "epoch": 0.9, "learning_rate": 5.098968493266487e-07, "loss": 0.7666, "step": 13221 }, { "epoch": 0.9, "learning_rate": 5.092012529024426e-07, "loss": 0.7617, "step": 13222 }, { "epoch": 0.9, "learning_rate": 5.085061188694895e-07, "loss": 0.7822, "step": 13223 }, { "epoch": 0.9, "learning_rate": 5.078114472616569e-07, "loss": 0.7939, "step": 13224 }, { "epoch": 0.9, "learning_rate": 5.071172381127853e-07, "loss": 0.7305, "step": 13225 }, { "epoch": 0.9, "learning_rate": 5.064234914566978e-07, "loss": 0.7959, "step": 13226 }, { "epoch": 0.9, "learning_rate": 5.057302073271985e-07, "loss": 0.8223, "step": 13227 }, { "epoch": 0.9, "learning_rate": 5.050373857580582e-07, "loss": 0.7617, "step": 13228 }, { "epoch": 0.9, "learning_rate": 5.04345026783034e-07, "loss": 0.7588, "step": 13229 }, { "epoch": 0.9, "learning_rate": 5.036531304358572e-07, "loss": 0.6934, "step": 13230 }, { "epoch": 0.9, "learning_rate": 5.02961696750237e-07, "loss": 0.7793, "step": 13231 }, { "epoch": 0.9, "learning_rate": 5.022707257598581e-07, "loss": 0.6953, "step": 13232 }, { "epoch": 0.9, "learning_rate": 5.015802174983886e-07, "loss": 0.7139, "step": 13233 }, { "epoch": 0.9, "learning_rate": 5.008901719994663e-07, "loss": 0.6523, "step": 13234 }, { "epoch": 0.9, "learning_rate": 5.002005892967122e-07, "loss": 0.8232, "step": 13235 }, { "epoch": 0.9, "learning_rate": 4.995114694237213e-07, "loss": 0.6631, "step": 13236 }, { "epoch": 0.9, "learning_rate": 4.988228124140704e-07, "loss": 0.7305, "step": 13237 }, { "epoch": 0.9, "learning_rate": 4.981346183013047e-07, "loss": 0.6611, "step": 13238 }, { "epoch": 0.9, "learning_rate": 4.974468871189597e-07, "loss": 0.6719, "step": 13239 }, { "epoch": 0.9, "learning_rate": 4.967596189005397e-07, "loss": 0.7402, "step": 13240 }, { "epoch": 0.9, "learning_rate": 4.960728136795267e-07, "loss": 0.707, "step": 13241 }, { "epoch": 0.9, "learning_rate": 4.953864714893819e-07, "loss": 0.75, "step": 13242 }, { "epoch": 0.9, "learning_rate": 4.947005923635462e-07, "loss": 0.7529, "step": 13243 }, { "epoch": 0.9, "learning_rate": 4.940151763354328e-07, "loss": 0.708, "step": 13244 }, { "epoch": 0.9, "learning_rate": 4.933302234384374e-07, "loss": 0.6719, "step": 13245 }, { "epoch": 0.9, "learning_rate": 4.926457337059287e-07, "loss": 0.6963, "step": 13246 }, { "epoch": 0.9, "learning_rate": 4.919617071712579e-07, "loss": 0.6895, "step": 13247 }, { "epoch": 0.9, "learning_rate": 4.912781438677483e-07, "loss": 0.7529, "step": 13248 }, { "epoch": 0.9, "learning_rate": 4.905950438287021e-07, "loss": 0.7773, "step": 13249 }, { "epoch": 0.9, "learning_rate": 4.899124070874051e-07, "loss": 0.6631, "step": 13250 }, { "epoch": 0.9, "learning_rate": 4.892302336771093e-07, "loss": 0.8096, "step": 13251 }, { "epoch": 0.9, "learning_rate": 4.885485236310528e-07, "loss": 0.709, "step": 13252 }, { "epoch": 0.9, "learning_rate": 4.878672769824511e-07, "loss": 0.7441, "step": 13253 }, { "epoch": 0.9, "learning_rate": 4.871864937644888e-07, "loss": 0.7588, "step": 13254 }, { "epoch": 0.9, "learning_rate": 4.865061740103361e-07, "loss": 0.791, "step": 13255 }, { "epoch": 0.9, "learning_rate": 4.858263177531409e-07, "loss": 0.7402, "step": 13256 }, { "epoch": 0.9, "learning_rate": 4.851469250260233e-07, "loss": 0.7109, "step": 13257 }, { "epoch": 0.9, "learning_rate": 4.844679958620824e-07, "loss": 0.7822, "step": 13258 }, { "epoch": 0.9, "learning_rate": 4.837895302943962e-07, "loss": 0.8447, "step": 13259 }, { "epoch": 0.9, "learning_rate": 4.831115283560229e-07, "loss": 0.7578, "step": 13260 }, { "epoch": 0.9, "learning_rate": 4.82433990079988e-07, "loss": 0.6963, "step": 13261 }, { "epoch": 0.9, "learning_rate": 4.817569154993074e-07, "loss": 0.7246, "step": 13262 }, { "epoch": 0.9, "learning_rate": 4.810803046469658e-07, "loss": 0.7549, "step": 13263 }, { "epoch": 0.9, "learning_rate": 4.80404157555927e-07, "loss": 0.7949, "step": 13264 }, { "epoch": 0.9, "learning_rate": 4.797284742591324e-07, "loss": 0.7832, "step": 13265 }, { "epoch": 0.9, "learning_rate": 4.790532547895044e-07, "loss": 0.7783, "step": 13266 }, { "epoch": 0.9, "learning_rate": 4.783784991799356e-07, "loss": 0.749, "step": 13267 }, { "epoch": 0.9, "learning_rate": 4.77704207463302e-07, "loss": 0.7363, "step": 13268 }, { "epoch": 0.9, "learning_rate": 4.770303796724574e-07, "loss": 0.7832, "step": 13269 }, { "epoch": 0.9, "learning_rate": 4.7635701584022644e-07, "loss": 0.7441, "step": 13270 }, { "epoch": 0.9, "learning_rate": 4.7568411599941744e-07, "loss": 0.748, "step": 13271 }, { "epoch": 0.9, "learning_rate": 4.750116801828131e-07, "loss": 0.7949, "step": 13272 }, { "epoch": 0.9, "learning_rate": 4.74339708423176e-07, "loss": 0.749, "step": 13273 }, { "epoch": 0.9, "learning_rate": 4.736682007532434e-07, "loss": 0.7646, "step": 13274 }, { "epoch": 0.9, "learning_rate": 4.7299715720573125e-07, "loss": 0.7705, "step": 13275 }, { "epoch": 0.9, "learning_rate": 4.7232657781333455e-07, "loss": 0.7139, "step": 13276 }, { "epoch": 0.9, "learning_rate": 4.7165646260872166e-07, "loss": 0.7373, "step": 13277 }, { "epoch": 0.9, "learning_rate": 4.7098681162454083e-07, "loss": 0.7383, "step": 13278 }, { "epoch": 0.9, "learning_rate": 4.703176248934183e-07, "loss": 0.709, "step": 13279 }, { "epoch": 0.91, "learning_rate": 4.6964890244795556e-07, "loss": 0.7324, "step": 13280 }, { "epoch": 0.91, "learning_rate": 4.6898064432073343e-07, "loss": 0.7578, "step": 13281 }, { "epoch": 0.91, "learning_rate": 4.683128505443102e-07, "loss": 0.7363, "step": 13282 }, { "epoch": 0.91, "learning_rate": 4.67645521151221e-07, "loss": 0.7207, "step": 13283 }, { "epoch": 0.91, "learning_rate": 4.669786561739753e-07, "loss": 0.7197, "step": 13284 }, { "epoch": 0.91, "learning_rate": 4.663122556450661e-07, "loss": 0.709, "step": 13285 }, { "epoch": 0.91, "learning_rate": 4.656463195969574e-07, "loss": 0.7051, "step": 13286 }, { "epoch": 0.91, "learning_rate": 4.6498084806209543e-07, "loss": 0.7676, "step": 13287 }, { "epoch": 0.91, "learning_rate": 4.643158410729021e-07, "loss": 0.7656, "step": 13288 }, { "epoch": 0.91, "learning_rate": 4.6365129866177694e-07, "loss": 0.7305, "step": 13289 }, { "epoch": 0.91, "learning_rate": 4.6298722086109414e-07, "loss": 0.709, "step": 13290 }, { "epoch": 0.91, "learning_rate": 4.6232360770320673e-07, "loss": 0.6104, "step": 13291 }, { "epoch": 0.91, "learning_rate": 4.616604592204521e-07, "loss": 0.7412, "step": 13292 }, { "epoch": 0.91, "learning_rate": 4.6099777544513227e-07, "loss": 0.8096, "step": 13293 }, { "epoch": 0.91, "learning_rate": 4.6033555640953686e-07, "loss": 0.8242, "step": 13294 }, { "epoch": 0.91, "learning_rate": 4.5967380214592685e-07, "loss": 0.748, "step": 13295 }, { "epoch": 0.91, "learning_rate": 4.5901251268654523e-07, "loss": 0.7861, "step": 13296 }, { "epoch": 0.91, "learning_rate": 4.583516880636063e-07, "loss": 0.7178, "step": 13297 }, { "epoch": 0.91, "learning_rate": 4.576913283093098e-07, "loss": 0.7764, "step": 13298 }, { "epoch": 0.91, "learning_rate": 4.570314334558268e-07, "loss": 0.6689, "step": 13299 }, { "epoch": 0.91, "learning_rate": 4.56372003535307e-07, "loss": 0.8057, "step": 13300 }, { "epoch": 0.91, "learning_rate": 4.557130385798758e-07, "loss": 0.7031, "step": 13301 }, { "epoch": 0.91, "learning_rate": 4.550545386216432e-07, "loss": 0.6855, "step": 13302 }, { "epoch": 0.91, "learning_rate": 4.543965036926845e-07, "loss": 0.7607, "step": 13303 }, { "epoch": 0.91, "learning_rate": 4.5373893382506306e-07, "loss": 0.7188, "step": 13304 }, { "epoch": 0.91, "learning_rate": 4.5308182905081763e-07, "loss": 0.6934, "step": 13305 }, { "epoch": 0.91, "learning_rate": 4.524251894019582e-07, "loss": 0.7871, "step": 13306 }, { "epoch": 0.91, "learning_rate": 4.517690149104781e-07, "loss": 0.8174, "step": 13307 }, { "epoch": 0.91, "learning_rate": 4.511133056083461e-07, "loss": 0.7402, "step": 13308 }, { "epoch": 0.91, "learning_rate": 4.504580615275089e-07, "loss": 0.708, "step": 13309 }, { "epoch": 0.91, "learning_rate": 4.498032826998877e-07, "loss": 0.7598, "step": 13310 }, { "epoch": 0.91, "learning_rate": 4.491489691573858e-07, "loss": 0.7354, "step": 13311 }, { "epoch": 0.91, "learning_rate": 4.484951209318811e-07, "loss": 0.7461, "step": 13312 }, { "epoch": 0.91, "learning_rate": 4.47841738055228e-07, "loss": 0.645, "step": 13313 }, { "epoch": 0.91, "learning_rate": 4.4718882055925893e-07, "loss": 0.8369, "step": 13314 }, { "epoch": 0.91, "learning_rate": 4.4653636847578395e-07, "loss": 0.6582, "step": 13315 }, { "epoch": 0.91, "learning_rate": 4.4588438183659213e-07, "loss": 0.6758, "step": 13316 }, { "epoch": 0.91, "learning_rate": 4.4523286067344685e-07, "loss": 0.7559, "step": 13317 }, { "epoch": 0.91, "learning_rate": 4.445818050180917e-07, "loss": 0.7783, "step": 13318 }, { "epoch": 0.91, "learning_rate": 4.4393121490224456e-07, "loss": 0.7344, "step": 13319 }, { "epoch": 0.91, "learning_rate": 4.4328109035760235e-07, "loss": 0.6943, "step": 13320 }, { "epoch": 0.91, "learning_rate": 4.4263143141583975e-07, "loss": 0.79, "step": 13321 }, { "epoch": 0.91, "learning_rate": 4.4198223810860694e-07, "loss": 0.6602, "step": 13322 }, { "epoch": 0.91, "learning_rate": 4.4133351046753426e-07, "loss": 0.7168, "step": 13323 }, { "epoch": 0.91, "learning_rate": 4.4068524852422634e-07, "loss": 0.7305, "step": 13324 }, { "epoch": 0.91, "learning_rate": 4.4003745231026794e-07, "loss": 0.7139, "step": 13325 }, { "epoch": 0.91, "learning_rate": 4.393901218572172e-07, "loss": 0.7783, "step": 13326 }, { "epoch": 0.91, "learning_rate": 4.3874325719661216e-07, "loss": 0.8037, "step": 13327 }, { "epoch": 0.91, "learning_rate": 4.380968583599732e-07, "loss": 0.7598, "step": 13328 }, { "epoch": 0.91, "learning_rate": 4.374509253787862e-07, "loss": 0.7256, "step": 13329 }, { "epoch": 0.91, "learning_rate": 4.368054582845249e-07, "loss": 0.7988, "step": 13330 }, { "epoch": 0.91, "learning_rate": 4.3616045710863417e-07, "loss": 0.7061, "step": 13331 }, { "epoch": 0.91, "learning_rate": 4.355159218825422e-07, "loss": 0.7285, "step": 13332 }, { "epoch": 0.91, "learning_rate": 4.34871852637645e-07, "loss": 0.7549, "step": 13333 }, { "epoch": 0.91, "learning_rate": 4.3422824940532516e-07, "loss": 0.8027, "step": 13334 }, { "epoch": 0.91, "learning_rate": 4.33585112216941e-07, "loss": 0.791, "step": 13335 }, { "epoch": 0.91, "learning_rate": 4.329424411038219e-07, "loss": 0.748, "step": 13336 }, { "epoch": 0.91, "learning_rate": 4.3230023609728055e-07, "loss": 0.708, "step": 13337 }, { "epoch": 0.91, "learning_rate": 4.316584972286053e-07, "loss": 0.7383, "step": 13338 }, { "epoch": 0.91, "learning_rate": 4.3101722452906005e-07, "loss": 0.7764, "step": 13339 }, { "epoch": 0.91, "learning_rate": 4.3037641802989084e-07, "loss": 0.8271, "step": 13340 }, { "epoch": 0.91, "learning_rate": 4.297360777623161e-07, "loss": 0.8291, "step": 13341 }, { "epoch": 0.91, "learning_rate": 4.2909620375753194e-07, "loss": 0.7324, "step": 13342 }, { "epoch": 0.91, "learning_rate": 4.2845679604671343e-07, "loss": 0.793, "step": 13343 }, { "epoch": 0.91, "learning_rate": 4.278178546610134e-07, "loss": 0.7891, "step": 13344 }, { "epoch": 0.91, "learning_rate": 4.2717937963156154e-07, "loss": 0.7109, "step": 13345 }, { "epoch": 0.91, "learning_rate": 4.265413709894628e-07, "loss": 0.7715, "step": 13346 }, { "epoch": 0.91, "learning_rate": 4.2590382876580125e-07, "loss": 0.749, "step": 13347 }, { "epoch": 0.91, "learning_rate": 4.2526675299163986e-07, "loss": 0.7529, "step": 13348 }, { "epoch": 0.91, "learning_rate": 4.246301436980138e-07, "loss": 0.7061, "step": 13349 }, { "epoch": 0.91, "learning_rate": 4.2399400091594154e-07, "loss": 0.7764, "step": 13350 }, { "epoch": 0.91, "learning_rate": 4.233583246764128e-07, "loss": 0.7803, "step": 13351 }, { "epoch": 0.91, "learning_rate": 4.2272311501040055e-07, "loss": 0.7441, "step": 13352 }, { "epoch": 0.91, "learning_rate": 4.2208837194884997e-07, "loss": 0.7529, "step": 13353 }, { "epoch": 0.91, "learning_rate": 4.214540955226898e-07, "loss": 0.7207, "step": 13354 }, { "epoch": 0.91, "learning_rate": 4.208202857628163e-07, "loss": 0.6787, "step": 13355 }, { "epoch": 0.91, "learning_rate": 4.201869427001115e-07, "loss": 0.7051, "step": 13356 }, { "epoch": 0.91, "learning_rate": 4.195540663654318e-07, "loss": 0.7734, "step": 13357 }, { "epoch": 0.91, "learning_rate": 4.189216567896115e-07, "loss": 0.7607, "step": 13358 }, { "epoch": 0.91, "learning_rate": 4.182897140034603e-07, "loss": 0.7441, "step": 13359 }, { "epoch": 0.91, "learning_rate": 4.1765823803776693e-07, "loss": 0.6943, "step": 13360 }, { "epoch": 0.91, "learning_rate": 4.1702722892329797e-07, "loss": 0.7148, "step": 13361 }, { "epoch": 0.91, "learning_rate": 4.1639668669079316e-07, "loss": 0.7715, "step": 13362 }, { "epoch": 0.91, "learning_rate": 4.157666113709746e-07, "loss": 0.75, "step": 13363 }, { "epoch": 0.91, "learning_rate": 4.151370029945423e-07, "loss": 0.7822, "step": 13364 }, { "epoch": 0.91, "learning_rate": 4.1450786159216496e-07, "loss": 0.7959, "step": 13365 }, { "epoch": 0.91, "learning_rate": 4.1387918719449805e-07, "loss": 0.7461, "step": 13366 }, { "epoch": 0.91, "learning_rate": 4.1325097983216935e-07, "loss": 0.7266, "step": 13367 }, { "epoch": 0.91, "learning_rate": 4.1262323953578544e-07, "loss": 0.7314, "step": 13368 }, { "epoch": 0.91, "learning_rate": 4.1199596633592963e-07, "loss": 0.748, "step": 13369 }, { "epoch": 0.91, "learning_rate": 4.113691602631631e-07, "loss": 0.7178, "step": 13370 }, { "epoch": 0.91, "learning_rate": 4.1074282134802355e-07, "loss": 0.7725, "step": 13371 }, { "epoch": 0.91, "learning_rate": 4.101169496210267e-07, "loss": 0.792, "step": 13372 }, { "epoch": 0.91, "learning_rate": 4.094915451126624e-07, "loss": 0.7422, "step": 13373 }, { "epoch": 0.91, "learning_rate": 4.088666078534043e-07, "loss": 0.6953, "step": 13374 }, { "epoch": 0.91, "learning_rate": 4.082421378736956e-07, "loss": 0.7373, "step": 13375 }, { "epoch": 0.91, "learning_rate": 4.076181352039632e-07, "loss": 0.7422, "step": 13376 }, { "epoch": 0.91, "learning_rate": 4.0699459987460834e-07, "loss": 0.7217, "step": 13377 }, { "epoch": 0.91, "learning_rate": 4.0637153191600774e-07, "loss": 0.6943, "step": 13378 }, { "epoch": 0.91, "learning_rate": 4.057489313585183e-07, "loss": 0.7061, "step": 13379 }, { "epoch": 0.91, "learning_rate": 4.051267982324736e-07, "loss": 0.6689, "step": 13380 }, { "epoch": 0.91, "learning_rate": 4.045051325681826e-07, "loss": 0.7666, "step": 13381 }, { "epoch": 0.91, "learning_rate": 4.0388393439593334e-07, "loss": 0.7744, "step": 13382 }, { "epoch": 0.91, "learning_rate": 4.032632037459916e-07, "loss": 0.7061, "step": 13383 }, { "epoch": 0.91, "learning_rate": 4.026429406485988e-07, "loss": 0.7891, "step": 13384 }, { "epoch": 0.91, "learning_rate": 4.02023145133974e-07, "loss": 0.7705, "step": 13385 }, { "epoch": 0.91, "learning_rate": 4.014038172323109e-07, "loss": 0.8467, "step": 13386 }, { "epoch": 0.91, "learning_rate": 4.007849569737887e-07, "loss": 0.6855, "step": 13387 }, { "epoch": 0.91, "learning_rate": 4.001665643885544e-07, "loss": 0.7354, "step": 13388 }, { "epoch": 0.91, "learning_rate": 3.995486395067372e-07, "loss": 0.7734, "step": 13389 }, { "epoch": 0.91, "learning_rate": 3.98931182358443e-07, "loss": 0.7773, "step": 13390 }, { "epoch": 0.91, "learning_rate": 3.983141929737522e-07, "loss": 0.7422, "step": 13391 }, { "epoch": 0.91, "learning_rate": 3.976976713827241e-07, "loss": 0.7842, "step": 13392 }, { "epoch": 0.91, "learning_rate": 3.970816176153991e-07, "loss": 0.7158, "step": 13393 }, { "epoch": 0.91, "learning_rate": 3.964660317017899e-07, "loss": 0.6729, "step": 13394 }, { "epoch": 0.91, "learning_rate": 3.9585091367188577e-07, "loss": 0.6934, "step": 13395 }, { "epoch": 0.91, "learning_rate": 3.9523626355565725e-07, "loss": 0.7666, "step": 13396 }, { "epoch": 0.91, "learning_rate": 3.946220813830504e-07, "loss": 0.6943, "step": 13397 }, { "epoch": 0.91, "learning_rate": 3.940083671839856e-07, "loss": 0.6992, "step": 13398 }, { "epoch": 0.91, "learning_rate": 3.9339512098836574e-07, "loss": 0.7588, "step": 13399 }, { "epoch": 0.91, "learning_rate": 3.9278234282606795e-07, "loss": 0.7822, "step": 13400 }, { "epoch": 0.91, "learning_rate": 3.9217003272694507e-07, "loss": 0.6953, "step": 13401 }, { "epoch": 0.91, "learning_rate": 3.915581907208299e-07, "loss": 0.8086, "step": 13402 }, { "epoch": 0.91, "learning_rate": 3.9094681683753075e-07, "loss": 0.7324, "step": 13403 }, { "epoch": 0.91, "learning_rate": 3.903359111068339e-07, "loss": 0.8018, "step": 13404 }, { "epoch": 0.91, "learning_rate": 3.897254735585032e-07, "loss": 0.8652, "step": 13405 }, { "epoch": 0.91, "learning_rate": 3.891155042222794e-07, "loss": 0.7227, "step": 13406 }, { "epoch": 0.91, "learning_rate": 3.8850600312787866e-07, "loss": 0.7822, "step": 13407 }, { "epoch": 0.91, "learning_rate": 3.878969703049973e-07, "loss": 0.7275, "step": 13408 }, { "epoch": 0.91, "learning_rate": 3.8728840578330595e-07, "loss": 0.7539, "step": 13409 }, { "epoch": 0.91, "learning_rate": 3.8668030959245537e-07, "loss": 0.7441, "step": 13410 }, { "epoch": 0.91, "learning_rate": 3.860726817620708e-07, "loss": 0.7939, "step": 13411 }, { "epoch": 0.91, "learning_rate": 3.8546552232175624e-07, "loss": 0.6729, "step": 13412 }, { "epoch": 0.91, "learning_rate": 3.848588313010937e-07, "loss": 0.8525, "step": 13413 }, { "epoch": 0.91, "learning_rate": 3.842526087296394e-07, "loss": 0.7158, "step": 13414 }, { "epoch": 0.91, "learning_rate": 3.8364685463692875e-07, "loss": 0.7412, "step": 13415 }, { "epoch": 0.91, "learning_rate": 3.830415690524747e-07, "loss": 0.8672, "step": 13416 }, { "epoch": 0.91, "learning_rate": 3.824367520057659e-07, "loss": 0.7109, "step": 13417 }, { "epoch": 0.91, "learning_rate": 3.8183240352626994e-07, "loss": 0.7373, "step": 13418 }, { "epoch": 0.91, "learning_rate": 3.8122852364342986e-07, "loss": 0.7734, "step": 13419 }, { "epoch": 0.91, "learning_rate": 3.806251123866689e-07, "loss": 0.7021, "step": 13420 }, { "epoch": 0.91, "learning_rate": 3.800221697853812e-07, "loss": 0.7607, "step": 13421 }, { "epoch": 0.91, "learning_rate": 3.7941969586894336e-07, "loss": 0.7031, "step": 13422 }, { "epoch": 0.91, "learning_rate": 3.788176906667118e-07, "loss": 0.7109, "step": 13423 }, { "epoch": 0.91, "learning_rate": 3.7821615420801094e-07, "loss": 0.7266, "step": 13424 }, { "epoch": 0.91, "learning_rate": 3.7761508652215063e-07, "loss": 0.8584, "step": 13425 }, { "epoch": 0.91, "learning_rate": 3.770144876384152e-07, "loss": 0.749, "step": 13426 }, { "epoch": 0.92, "learning_rate": 3.7641435758606347e-07, "loss": 0.6963, "step": 13427 }, { "epoch": 0.92, "learning_rate": 3.758146963943332e-07, "loss": 0.7275, "step": 13428 }, { "epoch": 0.92, "learning_rate": 3.752155040924443e-07, "loss": 0.6992, "step": 13429 }, { "epoch": 0.92, "learning_rate": 3.746167807095857e-07, "loss": 0.708, "step": 13430 }, { "epoch": 0.92, "learning_rate": 3.740185262749274e-07, "loss": 0.7217, "step": 13431 }, { "epoch": 0.92, "learning_rate": 3.7342074081761825e-07, "loss": 0.7432, "step": 13432 }, { "epoch": 0.92, "learning_rate": 3.7282342436678163e-07, "loss": 0.7432, "step": 13433 }, { "epoch": 0.92, "learning_rate": 3.722265769515154e-07, "loss": 0.7061, "step": 13434 }, { "epoch": 0.92, "learning_rate": 3.71630198600903e-07, "loss": 0.7266, "step": 13435 }, { "epoch": 0.92, "learning_rate": 3.710342893439989e-07, "loss": 0.748, "step": 13436 }, { "epoch": 0.92, "learning_rate": 3.704388492098332e-07, "loss": 0.7832, "step": 13437 }, { "epoch": 0.92, "learning_rate": 3.698438782274161e-07, "loss": 0.751, "step": 13438 }, { "epoch": 0.92, "learning_rate": 3.6924937642573656e-07, "loss": 0.7285, "step": 13439 }, { "epoch": 0.92, "learning_rate": 3.686553438337581e-07, "loss": 0.7344, "step": 13440 }, { "epoch": 0.92, "learning_rate": 3.680617804804221e-07, "loss": 0.8438, "step": 13441 }, { "epoch": 0.92, "learning_rate": 3.674686863946464e-07, "loss": 0.751, "step": 13442 }, { "epoch": 0.92, "learning_rate": 3.6687606160532576e-07, "loss": 0.7939, "step": 13443 }, { "epoch": 0.92, "learning_rate": 3.662839061413337e-07, "loss": 0.8086, "step": 13444 }, { "epoch": 0.92, "learning_rate": 3.6569222003151936e-07, "loss": 0.7041, "step": 13445 }, { "epoch": 0.92, "learning_rate": 3.651010033047109e-07, "loss": 0.7158, "step": 13446 }, { "epoch": 0.92, "learning_rate": 3.645102559897118e-07, "loss": 0.751, "step": 13447 }, { "epoch": 0.92, "learning_rate": 3.6391997811530243e-07, "loss": 0.7617, "step": 13448 }, { "epoch": 0.92, "learning_rate": 3.6333016971024426e-07, "loss": 0.7383, "step": 13449 }, { "epoch": 0.92, "learning_rate": 3.627408308032676e-07, "loss": 0.6602, "step": 13450 }, { "epoch": 0.92, "learning_rate": 3.6215196142308837e-07, "loss": 0.7334, "step": 13451 }, { "epoch": 0.92, "learning_rate": 3.615635615983959e-07, "loss": 0.8311, "step": 13452 }, { "epoch": 0.92, "learning_rate": 3.609756313578561e-07, "loss": 0.7393, "step": 13453 }, { "epoch": 0.92, "learning_rate": 3.603881707301138e-07, "loss": 0.7539, "step": 13454 }, { "epoch": 0.92, "learning_rate": 3.598011797437895e-07, "loss": 0.7529, "step": 13455 }, { "epoch": 0.92, "learning_rate": 3.592146584274836e-07, "loss": 0.7383, "step": 13456 }, { "epoch": 0.92, "learning_rate": 3.586286068097666e-07, "loss": 0.7754, "step": 13457 }, { "epoch": 0.92, "learning_rate": 3.580430249191935e-07, "loss": 0.6934, "step": 13458 }, { "epoch": 0.92, "learning_rate": 3.57457912784297e-07, "loss": 0.7363, "step": 13459 }, { "epoch": 0.92, "learning_rate": 3.568732704335787e-07, "loss": 0.748, "step": 13460 }, { "epoch": 0.92, "learning_rate": 3.5628909789552466e-07, "loss": 0.6875, "step": 13461 }, { "epoch": 0.92, "learning_rate": 3.557053951985967e-07, "loss": 0.7324, "step": 13462 }, { "epoch": 0.92, "learning_rate": 3.5512216237122974e-07, "loss": 0.8193, "step": 13463 }, { "epoch": 0.92, "learning_rate": 3.5453939944184e-07, "loss": 0.79, "step": 13464 }, { "epoch": 0.92, "learning_rate": 3.5395710643882364e-07, "loss": 0.7959, "step": 13465 }, { "epoch": 0.92, "learning_rate": 3.533752833905446e-07, "loss": 0.7314, "step": 13466 }, { "epoch": 0.92, "learning_rate": 3.527939303253514e-07, "loss": 0.7158, "step": 13467 }, { "epoch": 0.92, "learning_rate": 3.522130472715668e-07, "loss": 0.7295, "step": 13468 }, { "epoch": 0.92, "learning_rate": 3.5163263425749384e-07, "loss": 0.7617, "step": 13469 }, { "epoch": 0.92, "learning_rate": 3.510526913114065e-07, "loss": 0.6807, "step": 13470 }, { "epoch": 0.92, "learning_rate": 3.5047321846156224e-07, "loss": 0.708, "step": 13471 }, { "epoch": 0.92, "learning_rate": 3.4989421573619287e-07, "loss": 0.667, "step": 13472 }, { "epoch": 0.92, "learning_rate": 3.4931568316350586e-07, "loss": 0.6641, "step": 13473 }, { "epoch": 0.92, "learning_rate": 3.487376207716886e-07, "loss": 0.7227, "step": 13474 }, { "epoch": 0.92, "learning_rate": 3.4816002858890417e-07, "loss": 0.8125, "step": 13475 }, { "epoch": 0.92, "learning_rate": 3.475829066432912e-07, "loss": 0.7607, "step": 13476 }, { "epoch": 0.92, "learning_rate": 3.4700625496296825e-07, "loss": 0.7285, "step": 13477 }, { "epoch": 0.92, "learning_rate": 3.4643007357603176e-07, "loss": 0.7666, "step": 13478 }, { "epoch": 0.92, "learning_rate": 3.4585436251055036e-07, "loss": 0.8018, "step": 13479 }, { "epoch": 0.92, "learning_rate": 3.452791217945728e-07, "loss": 0.7627, "step": 13480 }, { "epoch": 0.92, "learning_rate": 3.4470435145612657e-07, "loss": 0.833, "step": 13481 }, { "epoch": 0.92, "learning_rate": 3.4413005152321265e-07, "loss": 0.7295, "step": 13482 }, { "epoch": 0.92, "learning_rate": 3.43556222023812e-07, "loss": 0.7012, "step": 13483 }, { "epoch": 0.92, "learning_rate": 3.4298286298588115e-07, "loss": 0.7227, "step": 13484 }, { "epoch": 0.92, "learning_rate": 3.424099744373555e-07, "loss": 0.7627, "step": 13485 }, { "epoch": 0.92, "learning_rate": 3.418375564061438e-07, "loss": 0.7324, "step": 13486 }, { "epoch": 0.92, "learning_rate": 3.4126560892013495e-07, "loss": 0.7998, "step": 13487 }, { "epoch": 0.92, "learning_rate": 3.4069413200719546e-07, "loss": 0.751, "step": 13488 }, { "epoch": 0.92, "learning_rate": 3.4012312569516646e-07, "loss": 0.7812, "step": 13489 }, { "epoch": 0.92, "learning_rate": 3.395525900118679e-07, "loss": 0.7725, "step": 13490 }, { "epoch": 0.92, "learning_rate": 3.3898252498509533e-07, "loss": 0.7246, "step": 13491 }, { "epoch": 0.92, "learning_rate": 3.384129306426254e-07, "loss": 0.6807, "step": 13492 }, { "epoch": 0.92, "learning_rate": 3.378438070122025e-07, "loss": 0.7246, "step": 13493 }, { "epoch": 0.92, "learning_rate": 3.372751541215613e-07, "loss": 0.708, "step": 13494 }, { "epoch": 0.92, "learning_rate": 3.3670697199840284e-07, "loss": 0.748, "step": 13495 }, { "epoch": 0.92, "learning_rate": 3.3613926067040837e-07, "loss": 0.7139, "step": 13496 }, { "epoch": 0.92, "learning_rate": 3.355720201652379e-07, "loss": 0.8184, "step": 13497 }, { "epoch": 0.92, "learning_rate": 3.350052505105295e-07, "loss": 0.6992, "step": 13498 }, { "epoch": 0.92, "learning_rate": 3.3443895173389087e-07, "loss": 0.6777, "step": 13499 }, { "epoch": 0.92, "learning_rate": 3.338731238629167e-07, "loss": 0.8428, "step": 13500 }, { "epoch": 0.92, "learning_rate": 3.3330776692517275e-07, "loss": 0.6396, "step": 13501 }, { "epoch": 0.92, "learning_rate": 3.3274288094820253e-07, "loss": 0.6748, "step": 13502 }, { "epoch": 0.92, "learning_rate": 3.321784659595273e-07, "loss": 0.8125, "step": 13503 }, { "epoch": 0.92, "learning_rate": 3.3161452198664624e-07, "loss": 0.7676, "step": 13504 }, { "epoch": 0.92, "learning_rate": 3.31051049057034e-07, "loss": 0.6553, "step": 13505 }, { "epoch": 0.92, "learning_rate": 3.304880471981431e-07, "loss": 0.7686, "step": 13506 }, { "epoch": 0.92, "learning_rate": 3.2992551643740377e-07, "loss": 0.7881, "step": 13507 }, { "epoch": 0.92, "learning_rate": 3.293634568022219e-07, "loss": 0.7861, "step": 13508 }, { "epoch": 0.92, "learning_rate": 3.2880186831998007e-07, "loss": 0.7012, "step": 13509 }, { "epoch": 0.92, "learning_rate": 3.282407510180385e-07, "loss": 0.8174, "step": 13510 }, { "epoch": 0.92, "learning_rate": 3.276801049237377e-07, "loss": 0.7939, "step": 13511 }, { "epoch": 0.92, "learning_rate": 3.27119930064389e-07, "loss": 0.7598, "step": 13512 }, { "epoch": 0.92, "learning_rate": 3.265602264672862e-07, "loss": 0.751, "step": 13513 }, { "epoch": 0.92, "learning_rate": 3.260009941596987e-07, "loss": 0.708, "step": 13514 }, { "epoch": 0.92, "learning_rate": 3.2544223316887003e-07, "loss": 0.7412, "step": 13515 }, { "epoch": 0.92, "learning_rate": 3.24883943522023e-07, "loss": 0.8242, "step": 13516 }, { "epoch": 0.92, "learning_rate": 3.243261252463592e-07, "loss": 0.7793, "step": 13517 }, { "epoch": 0.92, "learning_rate": 3.2376877836905464e-07, "loss": 0.7666, "step": 13518 }, { "epoch": 0.92, "learning_rate": 3.232119029172631e-07, "loss": 0.7061, "step": 13519 }, { "epoch": 0.92, "learning_rate": 3.226554989181163e-07, "loss": 0.7803, "step": 13520 }, { "epoch": 0.92, "learning_rate": 3.220995663987225e-07, "loss": 0.7529, "step": 13521 }, { "epoch": 0.92, "learning_rate": 3.2154410538616456e-07, "loss": 0.7783, "step": 13522 }, { "epoch": 0.92, "learning_rate": 3.2098911590750404e-07, "loss": 0.7061, "step": 13523 }, { "epoch": 0.92, "learning_rate": 3.204345979897849e-07, "loss": 0.7354, "step": 13524 }, { "epoch": 0.92, "learning_rate": 3.1988055166001894e-07, "loss": 0.8057, "step": 13525 }, { "epoch": 0.92, "learning_rate": 3.1932697694520007e-07, "loss": 0.7324, "step": 13526 }, { "epoch": 0.92, "learning_rate": 3.1877387387230117e-07, "loss": 0.7559, "step": 13527 }, { "epoch": 0.92, "learning_rate": 3.18221242468264e-07, "loss": 0.8037, "step": 13528 }, { "epoch": 0.92, "learning_rate": 3.1766908276001595e-07, "loss": 0.7412, "step": 13529 }, { "epoch": 0.92, "learning_rate": 3.171173947744599e-07, "loss": 0.6914, "step": 13530 }, { "epoch": 0.92, "learning_rate": 3.1656617853847106e-07, "loss": 0.751, "step": 13531 }, { "epoch": 0.92, "learning_rate": 3.1601543407890567e-07, "loss": 0.7578, "step": 13532 }, { "epoch": 0.92, "learning_rate": 3.1546516142259567e-07, "loss": 0.7715, "step": 13533 }, { "epoch": 0.92, "learning_rate": 3.149153605963529e-07, "loss": 0.6787, "step": 13534 }, { "epoch": 0.92, "learning_rate": 3.143660316269581e-07, "loss": 0.7627, "step": 13535 }, { "epoch": 0.92, "learning_rate": 3.1381717454118e-07, "loss": 0.7188, "step": 13536 }, { "epoch": 0.92, "learning_rate": 3.132687893657571e-07, "loss": 0.6479, "step": 13537 }, { "epoch": 0.92, "learning_rate": 3.127208761274059e-07, "loss": 0.8115, "step": 13538 }, { "epoch": 0.92, "learning_rate": 3.121734348528205e-07, "loss": 0.7383, "step": 13539 }, { "epoch": 0.92, "learning_rate": 3.116264655686729e-07, "loss": 0.6895, "step": 13540 }, { "epoch": 0.92, "learning_rate": 3.110799683016119e-07, "loss": 0.7031, "step": 13541 }, { "epoch": 0.92, "learning_rate": 3.105339430782628e-07, "loss": 0.7139, "step": 13542 }, { "epoch": 0.92, "learning_rate": 3.099883899252265e-07, "loss": 0.7959, "step": 13543 }, { "epoch": 0.92, "learning_rate": 3.094433088690851e-07, "loss": 0.7285, "step": 13544 }, { "epoch": 0.92, "learning_rate": 3.0889869993639186e-07, "loss": 0.7021, "step": 13545 }, { "epoch": 0.92, "learning_rate": 3.0835456315368107e-07, "loss": 0.7598, "step": 13546 }, { "epoch": 0.92, "learning_rate": 3.0781089854746373e-07, "loss": 0.7314, "step": 13547 }, { "epoch": 0.92, "learning_rate": 3.0726770614422643e-07, "loss": 0.7363, "step": 13548 }, { "epoch": 0.92, "learning_rate": 3.0672498597043465e-07, "loss": 0.8066, "step": 13549 }, { "epoch": 0.92, "learning_rate": 3.061827380525284e-07, "loss": 0.7061, "step": 13550 }, { "epoch": 0.92, "learning_rate": 3.0564096241692653e-07, "loss": 0.7256, "step": 13551 }, { "epoch": 0.92, "learning_rate": 3.050996590900235e-07, "loss": 0.7773, "step": 13552 }, { "epoch": 0.92, "learning_rate": 3.045588280981926e-07, "loss": 0.7021, "step": 13553 }, { "epoch": 0.92, "learning_rate": 3.040184694677828e-07, "loss": 0.7285, "step": 13554 }, { "epoch": 0.92, "learning_rate": 3.0347858322512083e-07, "loss": 0.7705, "step": 13555 }, { "epoch": 0.92, "learning_rate": 3.029391693965089e-07, "loss": 0.8027, "step": 13556 }, { "epoch": 0.92, "learning_rate": 3.0240022800822833e-07, "loss": 0.7676, "step": 13557 }, { "epoch": 0.92, "learning_rate": 3.018617590865358e-07, "loss": 0.7598, "step": 13558 }, { "epoch": 0.92, "learning_rate": 3.0132376265766374e-07, "loss": 0.7529, "step": 13559 }, { "epoch": 0.92, "learning_rate": 3.0078623874782664e-07, "loss": 0.7871, "step": 13560 }, { "epoch": 0.92, "learning_rate": 3.0024918738321027e-07, "loss": 0.7676, "step": 13561 }, { "epoch": 0.92, "learning_rate": 2.9971260858998043e-07, "loss": 0.749, "step": 13562 }, { "epoch": 0.92, "learning_rate": 2.991765023942805e-07, "loss": 0.6768, "step": 13563 }, { "epoch": 0.92, "learning_rate": 2.9864086882222754e-07, "loss": 0.7822, "step": 13564 }, { "epoch": 0.92, "learning_rate": 2.9810570789991724e-07, "loss": 0.6875, "step": 13565 }, { "epoch": 0.92, "learning_rate": 2.975710196534254e-07, "loss": 0.6768, "step": 13566 }, { "epoch": 0.92, "learning_rate": 2.9703680410879897e-07, "loss": 0.7188, "step": 13567 }, { "epoch": 0.92, "learning_rate": 2.965030612920672e-07, "loss": 0.749, "step": 13568 }, { "epoch": 0.92, "learning_rate": 2.9596979122923253e-07, "loss": 0.7471, "step": 13569 }, { "epoch": 0.92, "learning_rate": 2.954369939462776e-07, "loss": 0.7158, "step": 13570 }, { "epoch": 0.92, "learning_rate": 2.9490466946915707e-07, "loss": 0.7969, "step": 13571 }, { "epoch": 0.92, "learning_rate": 2.943728178238081e-07, "loss": 0.7529, "step": 13572 }, { "epoch": 0.92, "learning_rate": 2.9384143903614435e-07, "loss": 0.7158, "step": 13573 }, { "epoch": 0.93, "learning_rate": 2.933105331320496e-07, "loss": 0.7695, "step": 13574 }, { "epoch": 0.93, "learning_rate": 2.927801001373942e-07, "loss": 0.7598, "step": 13575 }, { "epoch": 0.93, "learning_rate": 2.922501400780176e-07, "loss": 0.7725, "step": 13576 }, { "epoch": 0.93, "learning_rate": 2.9172065297974115e-07, "loss": 0.7822, "step": 13577 }, { "epoch": 0.93, "learning_rate": 2.911916388683611e-07, "loss": 0.7773, "step": 13578 }, { "epoch": 0.93, "learning_rate": 2.906630977696512e-07, "loss": 0.7676, "step": 13579 }, { "epoch": 0.93, "learning_rate": 2.9013502970936304e-07, "loss": 0.6816, "step": 13580 }, { "epoch": 0.93, "learning_rate": 2.896074347132205e-07, "loss": 0.7207, "step": 13581 }, { "epoch": 0.93, "learning_rate": 2.890803128069308e-07, "loss": 0.7441, "step": 13582 }, { "epoch": 0.93, "learning_rate": 2.8855366401617455e-07, "loss": 0.7266, "step": 13583 }, { "epoch": 0.93, "learning_rate": 2.880274883666112e-07, "loss": 0.7695, "step": 13584 }, { "epoch": 0.93, "learning_rate": 2.8750178588387355e-07, "loss": 0.7148, "step": 13585 }, { "epoch": 0.93, "learning_rate": 2.869765565935778e-07, "loss": 0.7441, "step": 13586 }, { "epoch": 0.93, "learning_rate": 2.8645180052130795e-07, "loss": 0.8076, "step": 13587 }, { "epoch": 0.93, "learning_rate": 2.859275176926335e-07, "loss": 0.6963, "step": 13588 }, { "epoch": 0.93, "learning_rate": 2.8540370813309625e-07, "loss": 0.8096, "step": 13589 }, { "epoch": 0.93, "learning_rate": 2.8488037186821694e-07, "loss": 0.7432, "step": 13590 }, { "epoch": 0.93, "learning_rate": 2.843575089234918e-07, "loss": 0.6836, "step": 13591 }, { "epoch": 0.93, "learning_rate": 2.83835119324396e-07, "loss": 0.7021, "step": 13592 }, { "epoch": 0.93, "learning_rate": 2.833132030963792e-07, "loss": 0.7549, "step": 13593 }, { "epoch": 0.93, "learning_rate": 2.827917602648689e-07, "loss": 0.748, "step": 13594 }, { "epoch": 0.93, "learning_rate": 2.822707908552691e-07, "loss": 0.748, "step": 13595 }, { "epoch": 0.93, "learning_rate": 2.81750294892964e-07, "loss": 0.7881, "step": 13596 }, { "epoch": 0.93, "learning_rate": 2.8123027240331004e-07, "loss": 0.7256, "step": 13597 }, { "epoch": 0.93, "learning_rate": 2.807107234116435e-07, "loss": 0.6963, "step": 13598 }, { "epoch": 0.93, "learning_rate": 2.8019164794327756e-07, "loss": 0.7461, "step": 13599 }, { "epoch": 0.93, "learning_rate": 2.7967304602349754e-07, "loss": 0.7197, "step": 13600 }, { "epoch": 0.93, "learning_rate": 2.791549176775743e-07, "loss": 0.7754, "step": 13601 }, { "epoch": 0.93, "learning_rate": 2.78637262930751e-07, "loss": 0.748, "step": 13602 }, { "epoch": 0.93, "learning_rate": 2.781200818082441e-07, "loss": 0.7646, "step": 13603 }, { "epoch": 0.93, "learning_rate": 2.7760337433525353e-07, "loss": 0.6787, "step": 13604 }, { "epoch": 0.93, "learning_rate": 2.770871405369524e-07, "loss": 0.749, "step": 13605 }, { "epoch": 0.93, "learning_rate": 2.765713804384917e-07, "loss": 0.7598, "step": 13606 }, { "epoch": 0.93, "learning_rate": 2.760560940649981e-07, "loss": 0.7666, "step": 13607 }, { "epoch": 0.93, "learning_rate": 2.755412814415781e-07, "loss": 0.71, "step": 13608 }, { "epoch": 0.93, "learning_rate": 2.750269425933139e-07, "loss": 0.7744, "step": 13609 }, { "epoch": 0.93, "learning_rate": 2.7451307754526203e-07, "loss": 0.7822, "step": 13610 }, { "epoch": 0.93, "learning_rate": 2.739996863224581e-07, "loss": 0.7676, "step": 13611 }, { "epoch": 0.93, "learning_rate": 2.7348676894991545e-07, "loss": 0.7607, "step": 13612 }, { "epoch": 0.93, "learning_rate": 2.729743254526229e-07, "loss": 0.7314, "step": 13613 }, { "epoch": 0.93, "learning_rate": 2.724623558555473e-07, "loss": 0.7412, "step": 13614 }, { "epoch": 0.93, "learning_rate": 2.719508601836318e-07, "loss": 0.8047, "step": 13615 }, { "epoch": 0.93, "learning_rate": 2.714398384617956e-07, "loss": 0.7549, "step": 13616 }, { "epoch": 0.93, "learning_rate": 2.709292907149352e-07, "loss": 0.8008, "step": 13617 }, { "epoch": 0.93, "learning_rate": 2.704192169679254e-07, "loss": 0.6436, "step": 13618 }, { "epoch": 0.93, "learning_rate": 2.6990961724561727e-07, "loss": 0.7598, "step": 13619 }, { "epoch": 0.93, "learning_rate": 2.6940049157283875e-07, "loss": 0.752, "step": 13620 }, { "epoch": 0.93, "learning_rate": 2.6889183997439226e-07, "loss": 0.8037, "step": 13621 }, { "epoch": 0.93, "learning_rate": 2.683836624750624e-07, "loss": 0.7539, "step": 13622 }, { "epoch": 0.93, "learning_rate": 2.67875959099605e-07, "loss": 0.8145, "step": 13623 }, { "epoch": 0.93, "learning_rate": 2.6736872987275563e-07, "loss": 0.8359, "step": 13624 }, { "epoch": 0.93, "learning_rate": 2.6686197481922915e-07, "loss": 0.7754, "step": 13625 }, { "epoch": 0.93, "learning_rate": 2.663556939637113e-07, "loss": 0.7285, "step": 13626 }, { "epoch": 0.93, "learning_rate": 2.6584988733086904e-07, "loss": 0.7266, "step": 13627 }, { "epoch": 0.93, "learning_rate": 2.6534455494534597e-07, "loss": 0.7842, "step": 13628 }, { "epoch": 0.93, "learning_rate": 2.6483969683176236e-07, "loss": 0.7012, "step": 13629 }, { "epoch": 0.93, "learning_rate": 2.6433531301471194e-07, "loss": 0.7803, "step": 13630 }, { "epoch": 0.93, "learning_rate": 2.638314035187717e-07, "loss": 0.6982, "step": 13631 }, { "epoch": 0.93, "learning_rate": 2.6332796836849083e-07, "loss": 0.7529, "step": 13632 }, { "epoch": 0.93, "learning_rate": 2.6282500758839644e-07, "loss": 0.7383, "step": 13633 }, { "epoch": 0.93, "learning_rate": 2.6232252120299226e-07, "loss": 0.7168, "step": 13634 }, { "epoch": 0.93, "learning_rate": 2.6182050923676095e-07, "loss": 0.7373, "step": 13635 }, { "epoch": 0.93, "learning_rate": 2.6131897171415734e-07, "loss": 0.709, "step": 13636 }, { "epoch": 0.93, "learning_rate": 2.6081790865961967e-07, "loss": 0.6738, "step": 13637 }, { "epoch": 0.93, "learning_rate": 2.603173200975595e-07, "loss": 0.7598, "step": 13638 }, { "epoch": 0.93, "learning_rate": 2.5981720605236404e-07, "loss": 0.7246, "step": 13639 }, { "epoch": 0.93, "learning_rate": 2.5931756654839934e-07, "loss": 0.7432, "step": 13640 }, { "epoch": 0.93, "learning_rate": 2.5881840161000704e-07, "loss": 0.791, "step": 13641 }, { "epoch": 0.93, "learning_rate": 2.5831971126150767e-07, "loss": 0.7295, "step": 13642 }, { "epoch": 0.93, "learning_rate": 2.5782149552719626e-07, "loss": 0.7158, "step": 13643 }, { "epoch": 0.93, "learning_rate": 2.573237544313478e-07, "loss": 0.6777, "step": 13644 }, { "epoch": 0.93, "learning_rate": 2.5682648799821077e-07, "loss": 0.8096, "step": 13645 }, { "epoch": 0.93, "learning_rate": 2.5632969625201123e-07, "loss": 0.748, "step": 13646 }, { "epoch": 0.93, "learning_rate": 2.5583337921695426e-07, "loss": 0.7998, "step": 13647 }, { "epoch": 0.93, "learning_rate": 2.5533753691721954e-07, "loss": 0.8154, "step": 13648 }, { "epoch": 0.93, "learning_rate": 2.548421693769654e-07, "loss": 0.7988, "step": 13649 }, { "epoch": 0.93, "learning_rate": 2.5434727662032475e-07, "loss": 0.7334, "step": 13650 }, { "epoch": 0.93, "learning_rate": 2.538528586714106e-07, "loss": 0.6875, "step": 13651 }, { "epoch": 0.93, "learning_rate": 2.5335891555430923e-07, "loss": 0.7939, "step": 13652 }, { "epoch": 0.93, "learning_rate": 2.528654472930858e-07, "loss": 0.792, "step": 13653 }, { "epoch": 0.93, "learning_rate": 2.5237245391178224e-07, "loss": 0.7217, "step": 13654 }, { "epoch": 0.93, "learning_rate": 2.5187993543441814e-07, "loss": 0.7246, "step": 13655 }, { "epoch": 0.93, "learning_rate": 2.513878918849877e-07, "loss": 0.7725, "step": 13656 }, { "epoch": 0.93, "learning_rate": 2.5089632328746393e-07, "loss": 0.709, "step": 13657 }, { "epoch": 0.93, "learning_rate": 2.504052296657966e-07, "loss": 0.8027, "step": 13658 }, { "epoch": 0.93, "learning_rate": 2.499146110439099e-07, "loss": 0.7051, "step": 13659 }, { "epoch": 0.93, "learning_rate": 2.494244674457069e-07, "loss": 0.7695, "step": 13660 }, { "epoch": 0.93, "learning_rate": 2.4893479889507076e-07, "loss": 0.6992, "step": 13661 }, { "epoch": 0.93, "learning_rate": 2.484456054158546e-07, "loss": 0.7549, "step": 13662 }, { "epoch": 0.93, "learning_rate": 2.479568870318927e-07, "loss": 0.75, "step": 13663 }, { "epoch": 0.93, "learning_rate": 2.47468643766996e-07, "loss": 0.7461, "step": 13664 }, { "epoch": 0.93, "learning_rate": 2.4698087564495323e-07, "loss": 0.667, "step": 13665 }, { "epoch": 0.93, "learning_rate": 2.4649358268952315e-07, "loss": 0.7656, "step": 13666 }, { "epoch": 0.93, "learning_rate": 2.460067649244524e-07, "loss": 0.7168, "step": 13667 }, { "epoch": 0.93, "learning_rate": 2.455204223734553e-07, "loss": 0.7617, "step": 13668 }, { "epoch": 0.93, "learning_rate": 2.4503455506022846e-07, "loss": 0.7744, "step": 13669 }, { "epoch": 0.93, "learning_rate": 2.445491630084418e-07, "loss": 0.7549, "step": 13670 }, { "epoch": 0.93, "learning_rate": 2.440642462417453e-07, "loss": 0.7666, "step": 13671 }, { "epoch": 0.93, "learning_rate": 2.435798047837601e-07, "loss": 0.7158, "step": 13672 }, { "epoch": 0.93, "learning_rate": 2.430958386580928e-07, "loss": 0.6875, "step": 13673 }, { "epoch": 0.93, "learning_rate": 2.426123478883213e-07, "loss": 0.7051, "step": 13674 }, { "epoch": 0.93, "learning_rate": 2.421293324980001e-07, "loss": 0.7559, "step": 13675 }, { "epoch": 0.93, "learning_rate": 2.4164679251066024e-07, "loss": 0.7227, "step": 13676 }, { "epoch": 0.93, "learning_rate": 2.4116472794981417e-07, "loss": 0.7246, "step": 13677 }, { "epoch": 0.93, "learning_rate": 2.4068313883894633e-07, "loss": 0.7109, "step": 13678 }, { "epoch": 0.93, "learning_rate": 2.4020202520152024e-07, "loss": 0.7197, "step": 13679 }, { "epoch": 0.93, "learning_rate": 2.397213870609749e-07, "loss": 0.8711, "step": 13680 }, { "epoch": 0.93, "learning_rate": 2.392412244407294e-07, "loss": 0.7197, "step": 13681 }, { "epoch": 0.93, "learning_rate": 2.3876153736417384e-07, "loss": 0.792, "step": 13682 }, { "epoch": 0.93, "learning_rate": 2.382823258546807e-07, "loss": 0.7295, "step": 13683 }, { "epoch": 0.93, "learning_rate": 2.3780358993559572e-07, "loss": 0.7021, "step": 13684 }, { "epoch": 0.93, "learning_rate": 2.3732532963024468e-07, "loss": 0.6826, "step": 13685 }, { "epoch": 0.93, "learning_rate": 2.3684754496192674e-07, "loss": 0.7529, "step": 13686 }, { "epoch": 0.93, "learning_rate": 2.3637023595392106e-07, "loss": 0.7891, "step": 13687 }, { "epoch": 0.93, "learning_rate": 2.3589340262948123e-07, "loss": 0.7432, "step": 13688 }, { "epoch": 0.93, "learning_rate": 2.3541704501183872e-07, "loss": 0.7217, "step": 13689 }, { "epoch": 0.93, "learning_rate": 2.3494116312420046e-07, "loss": 0.6943, "step": 13690 }, { "epoch": 0.93, "learning_rate": 2.344657569897535e-07, "loss": 0.6895, "step": 13691 }, { "epoch": 0.93, "learning_rate": 2.3399082663165928e-07, "loss": 0.7568, "step": 13692 }, { "epoch": 0.93, "learning_rate": 2.3351637207305488e-07, "loss": 0.7266, "step": 13693 }, { "epoch": 0.93, "learning_rate": 2.3304239333705736e-07, "loss": 0.7842, "step": 13694 }, { "epoch": 0.93, "learning_rate": 2.3256889044675712e-07, "loss": 0.8037, "step": 13695 }, { "epoch": 0.93, "learning_rate": 2.320958634252235e-07, "loss": 0.7236, "step": 13696 }, { "epoch": 0.93, "learning_rate": 2.3162331229550473e-07, "loss": 0.7432, "step": 13697 }, { "epoch": 0.93, "learning_rate": 2.3115123708062127e-07, "loss": 0.6953, "step": 13698 }, { "epoch": 0.93, "learning_rate": 2.3067963780357249e-07, "loss": 0.7705, "step": 13699 }, { "epoch": 0.93, "learning_rate": 2.3020851448733562e-07, "loss": 0.7793, "step": 13700 }, { "epoch": 0.93, "learning_rate": 2.2973786715486445e-07, "loss": 0.792, "step": 13701 }, { "epoch": 0.93, "learning_rate": 2.2926769582908627e-07, "loss": 0.7783, "step": 13702 }, { "epoch": 0.93, "learning_rate": 2.2879800053291158e-07, "loss": 0.7383, "step": 13703 }, { "epoch": 0.93, "learning_rate": 2.2832878128922097e-07, "loss": 0.7275, "step": 13704 }, { "epoch": 0.93, "learning_rate": 2.278600381208751e-07, "loss": 0.7422, "step": 13705 }, { "epoch": 0.93, "learning_rate": 2.273917710507112e-07, "loss": 0.6992, "step": 13706 }, { "epoch": 0.93, "learning_rate": 2.269239801015455e-07, "loss": 0.7852, "step": 13707 }, { "epoch": 0.93, "learning_rate": 2.2645666529616417e-07, "loss": 0.7627, "step": 13708 }, { "epoch": 0.93, "learning_rate": 2.2598982665733905e-07, "loss": 0.6699, "step": 13709 }, { "epoch": 0.93, "learning_rate": 2.2552346420781412e-07, "loss": 0.7676, "step": 13710 }, { "epoch": 0.93, "learning_rate": 2.2505757797030793e-07, "loss": 0.7021, "step": 13711 }, { "epoch": 0.93, "learning_rate": 2.2459216796751894e-07, "loss": 0.7363, "step": 13712 }, { "epoch": 0.93, "learning_rate": 2.2412723422212458e-07, "loss": 0.7256, "step": 13713 }, { "epoch": 0.93, "learning_rate": 2.236627767567734e-07, "loss": 0.7412, "step": 13714 }, { "epoch": 0.93, "learning_rate": 2.2319879559409508e-07, "loss": 0.6826, "step": 13715 }, { "epoch": 0.93, "learning_rate": 2.2273529075669485e-07, "loss": 0.7344, "step": 13716 }, { "epoch": 0.93, "learning_rate": 2.2227226226715582e-07, "loss": 0.7705, "step": 13717 }, { "epoch": 0.93, "learning_rate": 2.218097101480343e-07, "loss": 0.8291, "step": 13718 }, { "epoch": 0.93, "learning_rate": 2.2134763442186569e-07, "loss": 0.7031, "step": 13719 }, { "epoch": 0.93, "learning_rate": 2.2088603511116524e-07, "loss": 0.7227, "step": 13720 }, { "epoch": 0.94, "learning_rate": 2.2042491223841943e-07, "loss": 0.71, "step": 13721 }, { "epoch": 0.94, "learning_rate": 2.1996426582609475e-07, "loss": 0.7051, "step": 13722 }, { "epoch": 0.94, "learning_rate": 2.1950409589663547e-07, "loss": 0.7646, "step": 13723 }, { "epoch": 0.94, "learning_rate": 2.1904440247245805e-07, "loss": 0.7432, "step": 13724 }, { "epoch": 0.94, "learning_rate": 2.185851855759602e-07, "loss": 0.7695, "step": 13725 }, { "epoch": 0.94, "learning_rate": 2.181264452295162e-07, "loss": 0.6982, "step": 13726 }, { "epoch": 0.94, "learning_rate": 2.1766818145547485e-07, "loss": 0.7607, "step": 13727 }, { "epoch": 0.94, "learning_rate": 2.1721039427616164e-07, "loss": 0.6807, "step": 13728 }, { "epoch": 0.94, "learning_rate": 2.1675308371388203e-07, "loss": 0.7363, "step": 13729 }, { "epoch": 0.94, "learning_rate": 2.162962497909149e-07, "loss": 0.7065, "step": 13730 }, { "epoch": 0.94, "learning_rate": 2.1583989252951575e-07, "loss": 0.7383, "step": 13731 }, { "epoch": 0.94, "learning_rate": 2.1538401195192128e-07, "loss": 0.8311, "step": 13732 }, { "epoch": 0.94, "learning_rate": 2.1492860808034143e-07, "loss": 0.6758, "step": 13733 }, { "epoch": 0.94, "learning_rate": 2.1447368093696185e-07, "loss": 0.7539, "step": 13734 }, { "epoch": 0.94, "learning_rate": 2.1401923054394703e-07, "loss": 0.7529, "step": 13735 }, { "epoch": 0.94, "learning_rate": 2.135652569234392e-07, "loss": 0.8008, "step": 13736 }, { "epoch": 0.94, "learning_rate": 2.1311176009755184e-07, "loss": 0.8428, "step": 13737 }, { "epoch": 0.94, "learning_rate": 2.1265874008838506e-07, "loss": 0.6992, "step": 13738 }, { "epoch": 0.94, "learning_rate": 2.122061969180067e-07, "loss": 0.7197, "step": 13739 }, { "epoch": 0.94, "learning_rate": 2.1175413060846471e-07, "loss": 0.7764, "step": 13740 }, { "epoch": 0.94, "learning_rate": 2.1130254118178372e-07, "loss": 0.6982, "step": 13741 }, { "epoch": 0.94, "learning_rate": 2.108514286599661e-07, "loss": 0.7539, "step": 13742 }, { "epoch": 0.94, "learning_rate": 2.1040079306498873e-07, "loss": 0.7344, "step": 13743 }, { "epoch": 0.94, "learning_rate": 2.0995063441880847e-07, "loss": 0.7451, "step": 13744 }, { "epoch": 0.94, "learning_rate": 2.0950095274335448e-07, "loss": 0.7744, "step": 13745 }, { "epoch": 0.94, "learning_rate": 2.090517480605392e-07, "loss": 0.749, "step": 13746 }, { "epoch": 0.94, "learning_rate": 2.086030203922429e-07, "loss": 0.7383, "step": 13747 }, { "epoch": 0.94, "learning_rate": 2.0815476976033032e-07, "loss": 0.6816, "step": 13748 }, { "epoch": 0.94, "learning_rate": 2.077069961866407e-07, "loss": 0.7539, "step": 13749 }, { "epoch": 0.94, "learning_rate": 2.0725969969298766e-07, "loss": 0.7285, "step": 13750 }, { "epoch": 0.94, "learning_rate": 2.0681288030116487e-07, "loss": 0.792, "step": 13751 }, { "epoch": 0.94, "learning_rate": 2.0636653803294048e-07, "loss": 0.6729, "step": 13752 }, { "epoch": 0.94, "learning_rate": 2.059206729100627e-07, "loss": 0.7451, "step": 13753 }, { "epoch": 0.94, "learning_rate": 2.0547528495425072e-07, "loss": 0.7285, "step": 13754 }, { "epoch": 0.94, "learning_rate": 2.0503037418720506e-07, "loss": 0.7354, "step": 13755 }, { "epoch": 0.94, "learning_rate": 2.0458594063060165e-07, "loss": 0.7881, "step": 13756 }, { "epoch": 0.94, "learning_rate": 2.0414198430609433e-07, "loss": 0.7764, "step": 13757 }, { "epoch": 0.94, "learning_rate": 2.0369850523531132e-07, "loss": 0.7373, "step": 13758 }, { "epoch": 0.94, "learning_rate": 2.032555034398598e-07, "loss": 0.7002, "step": 13759 }, { "epoch": 0.94, "learning_rate": 2.0281297894132246e-07, "loss": 0.752, "step": 13760 }, { "epoch": 0.94, "learning_rate": 2.0237093176125767e-07, "loss": 0.7031, "step": 13761 }, { "epoch": 0.94, "learning_rate": 2.0192936192120484e-07, "loss": 0.7988, "step": 13762 }, { "epoch": 0.94, "learning_rate": 2.0148826944267562e-07, "loss": 0.6895, "step": 13763 }, { "epoch": 0.94, "learning_rate": 2.0104765434715955e-07, "loss": 0.7236, "step": 13764 }, { "epoch": 0.94, "learning_rate": 2.0060751665612277e-07, "loss": 0.667, "step": 13765 }, { "epoch": 0.94, "learning_rate": 2.0016785639101254e-07, "loss": 0.8115, "step": 13766 }, { "epoch": 0.94, "learning_rate": 1.9972867357324398e-07, "loss": 0.7832, "step": 13767 }, { "epoch": 0.94, "learning_rate": 1.9928996822421774e-07, "loss": 0.7734, "step": 13768 }, { "epoch": 0.94, "learning_rate": 1.9885174036530675e-07, "loss": 0.7227, "step": 13769 }, { "epoch": 0.94, "learning_rate": 1.9841399001785943e-07, "loss": 0.7412, "step": 13770 }, { "epoch": 0.94, "learning_rate": 1.9797671720320543e-07, "loss": 0.7227, "step": 13771 }, { "epoch": 0.94, "learning_rate": 1.9753992194264882e-07, "loss": 0.7393, "step": 13772 }, { "epoch": 0.94, "learning_rate": 1.97103604257467e-07, "loss": 0.75, "step": 13773 }, { "epoch": 0.94, "learning_rate": 1.9666776416892075e-07, "loss": 0.7939, "step": 13774 }, { "epoch": 0.94, "learning_rate": 1.962324016982431e-07, "loss": 0.792, "step": 13775 }, { "epoch": 0.94, "learning_rate": 1.9579751686664484e-07, "loss": 0.7402, "step": 13776 }, { "epoch": 0.94, "learning_rate": 1.9536310969531235e-07, "loss": 0.7744, "step": 13777 }, { "epoch": 0.94, "learning_rate": 1.9492918020541208e-07, "loss": 0.7686, "step": 13778 }, { "epoch": 0.94, "learning_rate": 1.9449572841808373e-07, "loss": 0.7705, "step": 13779 }, { "epoch": 0.94, "learning_rate": 1.9406275435444487e-07, "loss": 0.6699, "step": 13780 }, { "epoch": 0.94, "learning_rate": 1.9363025803559087e-07, "loss": 0.7197, "step": 13781 }, { "epoch": 0.94, "learning_rate": 1.9319823948259265e-07, "loss": 0.7471, "step": 13782 }, { "epoch": 0.94, "learning_rate": 1.9276669871649777e-07, "loss": 0.7109, "step": 13783 }, { "epoch": 0.94, "learning_rate": 1.9233563575833058e-07, "loss": 0.7354, "step": 13784 }, { "epoch": 0.94, "learning_rate": 1.9190505062909425e-07, "loss": 0.7471, "step": 13785 }, { "epoch": 0.94, "learning_rate": 1.9147494334976425e-07, "loss": 0.665, "step": 13786 }, { "epoch": 0.94, "learning_rate": 1.910453139412971e-07, "loss": 0.7412, "step": 13787 }, { "epoch": 0.94, "learning_rate": 1.9061616242462389e-07, "loss": 0.6055, "step": 13788 }, { "epoch": 0.94, "learning_rate": 1.901874888206534e-07, "loss": 0.7998, "step": 13789 }, { "epoch": 0.94, "learning_rate": 1.8975929315026897e-07, "loss": 0.7246, "step": 13790 }, { "epoch": 0.94, "learning_rate": 1.893315754343339e-07, "loss": 0.8037, "step": 13791 }, { "epoch": 0.94, "learning_rate": 1.8890433569368592e-07, "loss": 0.8242, "step": 13792 }, { "epoch": 0.94, "learning_rate": 1.884775739491407e-07, "loss": 0.7549, "step": 13793 }, { "epoch": 0.94, "learning_rate": 1.8805129022148926e-07, "loss": 0.6543, "step": 13794 }, { "epoch": 0.94, "learning_rate": 1.8762548453150065e-07, "loss": 0.8154, "step": 13795 }, { "epoch": 0.94, "learning_rate": 1.8720015689991932e-07, "loss": 0.7686, "step": 13796 }, { "epoch": 0.94, "learning_rate": 1.8677530734746764e-07, "loss": 0.7637, "step": 13797 }, { "epoch": 0.94, "learning_rate": 1.8635093589484566e-07, "loss": 0.6602, "step": 13798 }, { "epoch": 0.94, "learning_rate": 1.8592704256272686e-07, "loss": 0.7217, "step": 13799 }, { "epoch": 0.94, "learning_rate": 1.8550362737176365e-07, "loss": 0.6973, "step": 13800 }, { "epoch": 0.94, "learning_rate": 1.8508069034258613e-07, "loss": 0.6387, "step": 13801 }, { "epoch": 0.94, "learning_rate": 1.8465823149579787e-07, "loss": 0.6641, "step": 13802 }, { "epoch": 0.94, "learning_rate": 1.8423625085198128e-07, "loss": 0.71, "step": 13803 }, { "epoch": 0.94, "learning_rate": 1.8381474843169656e-07, "loss": 0.7451, "step": 13804 }, { "epoch": 0.94, "learning_rate": 1.8339372425547952e-07, "loss": 0.7793, "step": 13805 }, { "epoch": 0.94, "learning_rate": 1.8297317834384044e-07, "loss": 0.8359, "step": 13806 }, { "epoch": 0.94, "learning_rate": 1.8255311071726955e-07, "loss": 0.7363, "step": 13807 }, { "epoch": 0.94, "learning_rate": 1.8213352139623385e-07, "loss": 0.6719, "step": 13808 }, { "epoch": 0.94, "learning_rate": 1.8171441040117144e-07, "loss": 0.7197, "step": 13809 }, { "epoch": 0.94, "learning_rate": 1.8129577775250483e-07, "loss": 0.7217, "step": 13810 }, { "epoch": 0.94, "learning_rate": 1.808776234706311e-07, "loss": 0.7285, "step": 13811 }, { "epoch": 0.94, "learning_rate": 1.8045994757591944e-07, "loss": 0.7607, "step": 13812 }, { "epoch": 0.94, "learning_rate": 1.800427500887192e-07, "loss": 0.7959, "step": 13813 }, { "epoch": 0.94, "learning_rate": 1.7962603102935848e-07, "loss": 0.7275, "step": 13814 }, { "epoch": 0.94, "learning_rate": 1.792097904181378e-07, "loss": 0.7822, "step": 13815 }, { "epoch": 0.94, "learning_rate": 1.7879402827533865e-07, "loss": 0.7744, "step": 13816 }, { "epoch": 0.94, "learning_rate": 1.7837874462121374e-07, "loss": 0.8428, "step": 13817 }, { "epoch": 0.94, "learning_rate": 1.779639394759991e-07, "loss": 0.75, "step": 13818 }, { "epoch": 0.94, "learning_rate": 1.775496128599019e-07, "loss": 0.6982, "step": 13819 }, { "epoch": 0.94, "learning_rate": 1.7713576479310823e-07, "loss": 0.7158, "step": 13820 }, { "epoch": 0.94, "learning_rate": 1.7672239529578082e-07, "loss": 0.7617, "step": 13821 }, { "epoch": 0.94, "learning_rate": 1.7630950438805917e-07, "loss": 0.8633, "step": 13822 }, { "epoch": 0.94, "learning_rate": 1.7589709209005934e-07, "loss": 0.7402, "step": 13823 }, { "epoch": 0.94, "learning_rate": 1.754851584218753e-07, "loss": 0.7783, "step": 13824 }, { "epoch": 0.94, "learning_rate": 1.7507370340357433e-07, "loss": 0.7188, "step": 13825 }, { "epoch": 0.94, "learning_rate": 1.746627270552037e-07, "loss": 0.7363, "step": 13826 }, { "epoch": 0.94, "learning_rate": 1.742522293967852e-07, "loss": 0.71, "step": 13827 }, { "epoch": 0.94, "learning_rate": 1.738422104483195e-07, "loss": 0.7314, "step": 13828 }, { "epoch": 0.94, "learning_rate": 1.7343267022978173e-07, "loss": 0.7705, "step": 13829 }, { "epoch": 0.94, "learning_rate": 1.730236087611259e-07, "loss": 0.6768, "step": 13830 }, { "epoch": 0.94, "learning_rate": 1.7261502606228054e-07, "loss": 0.7383, "step": 13831 }, { "epoch": 0.94, "learning_rate": 1.7220692215315082e-07, "loss": 0.7314, "step": 13832 }, { "epoch": 0.94, "learning_rate": 1.7179929705362087e-07, "loss": 0.6855, "step": 13833 }, { "epoch": 0.94, "learning_rate": 1.713921507835503e-07, "loss": 0.7217, "step": 13834 }, { "epoch": 0.94, "learning_rate": 1.7098548336277444e-07, "loss": 0.7305, "step": 13835 }, { "epoch": 0.94, "learning_rate": 1.7057929481110736e-07, "loss": 0.8301, "step": 13836 }, { "epoch": 0.94, "learning_rate": 1.701735851483366e-07, "loss": 0.6514, "step": 13837 }, { "epoch": 0.94, "learning_rate": 1.6976835439422968e-07, "loss": 0.8145, "step": 13838 }, { "epoch": 0.94, "learning_rate": 1.6936360256852967e-07, "loss": 0.7471, "step": 13839 }, { "epoch": 0.94, "learning_rate": 1.6895932969095418e-07, "loss": 0.6973, "step": 13840 }, { "epoch": 0.94, "learning_rate": 1.6855553578120297e-07, "loss": 0.7002, "step": 13841 }, { "epoch": 0.94, "learning_rate": 1.6815222085894478e-07, "loss": 0.6885, "step": 13842 }, { "epoch": 0.94, "learning_rate": 1.6774938494383163e-07, "loss": 0.79, "step": 13843 }, { "epoch": 0.94, "learning_rate": 1.6734702805548896e-07, "loss": 0.7129, "step": 13844 }, { "epoch": 0.94, "learning_rate": 1.6694515021351888e-07, "loss": 0.7705, "step": 13845 }, { "epoch": 0.94, "learning_rate": 1.6654375143750235e-07, "loss": 0.7842, "step": 13846 }, { "epoch": 0.94, "learning_rate": 1.6614283174699487e-07, "loss": 0.7549, "step": 13847 }, { "epoch": 0.94, "learning_rate": 1.6574239116152857e-07, "loss": 0.7334, "step": 13848 }, { "epoch": 0.94, "learning_rate": 1.6534242970061342e-07, "loss": 0.7246, "step": 13849 }, { "epoch": 0.94, "learning_rate": 1.6494294738373606e-07, "loss": 0.7666, "step": 13850 }, { "epoch": 0.94, "learning_rate": 1.6454394423035757e-07, "loss": 0.7109, "step": 13851 }, { "epoch": 0.94, "learning_rate": 1.6414542025991908e-07, "loss": 0.7139, "step": 13852 }, { "epoch": 0.94, "learning_rate": 1.6374737549183617e-07, "loss": 0.7578, "step": 13853 }, { "epoch": 0.94, "learning_rate": 1.633498099455022e-07, "loss": 0.6953, "step": 13854 }, { "epoch": 0.94, "learning_rate": 1.6295272364028503e-07, "loss": 0.7686, "step": 13855 }, { "epoch": 0.94, "learning_rate": 1.6255611659553027e-07, "loss": 0.7725, "step": 13856 }, { "epoch": 0.94, "learning_rate": 1.621599888305636e-07, "loss": 0.708, "step": 13857 }, { "epoch": 0.94, "learning_rate": 1.617643403646818e-07, "loss": 0.7402, "step": 13858 }, { "epoch": 0.94, "learning_rate": 1.6136917121716168e-07, "loss": 0.6963, "step": 13859 }, { "epoch": 0.94, "learning_rate": 1.6097448140725558e-07, "loss": 0.7383, "step": 13860 }, { "epoch": 0.94, "learning_rate": 1.605802709541937e-07, "loss": 0.7207, "step": 13861 }, { "epoch": 0.94, "learning_rate": 1.601865398771796e-07, "loss": 0.8066, "step": 13862 }, { "epoch": 0.94, "learning_rate": 1.5979328819539895e-07, "loss": 0.7734, "step": 13863 }, { "epoch": 0.94, "learning_rate": 1.5940051592800766e-07, "loss": 0.7109, "step": 13864 }, { "epoch": 0.94, "learning_rate": 1.5900822309414475e-07, "loss": 0.7539, "step": 13865 }, { "epoch": 0.94, "learning_rate": 1.5861640971292058e-07, "loss": 0.7285, "step": 13866 }, { "epoch": 0.95, "learning_rate": 1.582250758034265e-07, "loss": 0.7725, "step": 13867 }, { "epoch": 0.95, "learning_rate": 1.5783422138472503e-07, "loss": 0.7939, "step": 13868 }, { "epoch": 0.95, "learning_rate": 1.5744384647586098e-07, "loss": 0.8467, "step": 13869 }, { "epoch": 0.95, "learning_rate": 1.5705395109585242e-07, "loss": 0.7588, "step": 13870 }, { "epoch": 0.95, "learning_rate": 1.566645352636964e-07, "loss": 0.7832, "step": 13871 }, { "epoch": 0.95, "learning_rate": 1.562755989983633e-07, "loss": 0.751, "step": 13872 }, { "epoch": 0.95, "learning_rate": 1.5588714231880243e-07, "loss": 0.6948, "step": 13873 }, { "epoch": 0.95, "learning_rate": 1.5549916524394083e-07, "loss": 0.7686, "step": 13874 }, { "epoch": 0.95, "learning_rate": 1.5511166779267895e-07, "loss": 0.7529, "step": 13875 }, { "epoch": 0.95, "learning_rate": 1.5472464998389836e-07, "loss": 0.7764, "step": 13876 }, { "epoch": 0.95, "learning_rate": 1.5433811183645175e-07, "loss": 0.7822, "step": 13877 }, { "epoch": 0.95, "learning_rate": 1.5395205336917185e-07, "loss": 0.7393, "step": 13878 }, { "epoch": 0.95, "learning_rate": 1.5356647460086692e-07, "loss": 0.8018, "step": 13879 }, { "epoch": 0.95, "learning_rate": 1.531813755503242e-07, "loss": 0.708, "step": 13880 }, { "epoch": 0.95, "learning_rate": 1.527967562363042e-07, "loss": 0.6748, "step": 13881 }, { "epoch": 0.95, "learning_rate": 1.5241261667754635e-07, "loss": 0.6699, "step": 13882 }, { "epoch": 0.95, "learning_rate": 1.5202895689276687e-07, "loss": 0.7168, "step": 13883 }, { "epoch": 0.95, "learning_rate": 1.5164577690065518e-07, "loss": 0.6406, "step": 13884 }, { "epoch": 0.95, "learning_rate": 1.5126307671988084e-07, "loss": 0.7637, "step": 13885 }, { "epoch": 0.95, "learning_rate": 1.5088085636908888e-07, "loss": 0.7021, "step": 13886 }, { "epoch": 0.95, "learning_rate": 1.5049911586690113e-07, "loss": 0.8037, "step": 13887 }, { "epoch": 0.95, "learning_rate": 1.5011785523191714e-07, "loss": 0.8018, "step": 13888 }, { "epoch": 0.95, "learning_rate": 1.497370744827098e-07, "loss": 0.7705, "step": 13889 }, { "epoch": 0.95, "learning_rate": 1.4935677363783318e-07, "loss": 0.8105, "step": 13890 }, { "epoch": 0.95, "learning_rate": 1.4897695271581247e-07, "loss": 0.7637, "step": 13891 }, { "epoch": 0.95, "learning_rate": 1.4859761173515507e-07, "loss": 0.833, "step": 13892 }, { "epoch": 0.95, "learning_rate": 1.4821875071434177e-07, "loss": 0.7422, "step": 13893 }, { "epoch": 0.95, "learning_rate": 1.4784036967183003e-07, "loss": 0.7197, "step": 13894 }, { "epoch": 0.95, "learning_rate": 1.4746246862605616e-07, "loss": 0.751, "step": 13895 }, { "epoch": 0.95, "learning_rate": 1.4708504759542997e-07, "loss": 0.7295, "step": 13896 }, { "epoch": 0.95, "learning_rate": 1.467081065983389e-07, "loss": 0.7607, "step": 13897 }, { "epoch": 0.95, "learning_rate": 1.4633164565314827e-07, "loss": 0.7178, "step": 13898 }, { "epoch": 0.95, "learning_rate": 1.4595566477820012e-07, "loss": 0.7891, "step": 13899 }, { "epoch": 0.95, "learning_rate": 1.4558016399181086e-07, "loss": 0.7783, "step": 13900 }, { "epoch": 0.95, "learning_rate": 1.4520514331227587e-07, "loss": 0.7891, "step": 13901 }, { "epoch": 0.95, "learning_rate": 1.448306027578661e-07, "loss": 0.7881, "step": 13902 }, { "epoch": 0.95, "learning_rate": 1.4445654234682806e-07, "loss": 0.7139, "step": 13903 }, { "epoch": 0.95, "learning_rate": 1.4408296209738603e-07, "loss": 0.7588, "step": 13904 }, { "epoch": 0.95, "learning_rate": 1.4370986202774217e-07, "loss": 0.7275, "step": 13905 }, { "epoch": 0.95, "learning_rate": 1.4333724215607414e-07, "loss": 0.7285, "step": 13906 }, { "epoch": 0.95, "learning_rate": 1.429651025005341e-07, "loss": 0.7773, "step": 13907 }, { "epoch": 0.95, "learning_rate": 1.4259344307925415e-07, "loss": 0.6514, "step": 13908 }, { "epoch": 0.95, "learning_rate": 1.42222263910341e-07, "loss": 0.7373, "step": 13909 }, { "epoch": 0.95, "learning_rate": 1.418515650118768e-07, "loss": 0.7773, "step": 13910 }, { "epoch": 0.95, "learning_rate": 1.4148134640192378e-07, "loss": 0.6924, "step": 13911 }, { "epoch": 0.95, "learning_rate": 1.4111160809852087e-07, "loss": 0.7715, "step": 13912 }, { "epoch": 0.95, "learning_rate": 1.4074235011967808e-07, "loss": 0.8252, "step": 13913 }, { "epoch": 0.95, "learning_rate": 1.4037357248338767e-07, "loss": 0.8467, "step": 13914 }, { "epoch": 0.95, "learning_rate": 1.400052752076153e-07, "loss": 0.6797, "step": 13915 }, { "epoch": 0.95, "learning_rate": 1.396374583103055e-07, "loss": 0.7363, "step": 13916 }, { "epoch": 0.95, "learning_rate": 1.3927012180937838e-07, "loss": 0.7383, "step": 13917 }, { "epoch": 0.95, "learning_rate": 1.389032657227296e-07, "loss": 0.7637, "step": 13918 }, { "epoch": 0.95, "learning_rate": 1.3853689006823268e-07, "loss": 0.7017, "step": 13919 }, { "epoch": 0.95, "learning_rate": 1.3817099486373774e-07, "loss": 0.7666, "step": 13920 }, { "epoch": 0.95, "learning_rate": 1.378055801270717e-07, "loss": 0.6689, "step": 13921 }, { "epoch": 0.95, "learning_rate": 1.3744064587603578e-07, "loss": 0.6787, "step": 13922 }, { "epoch": 0.95, "learning_rate": 1.370761921284114e-07, "loss": 0.7256, "step": 13923 }, { "epoch": 0.95, "learning_rate": 1.367122189019532e-07, "loss": 0.8047, "step": 13924 }, { "epoch": 0.95, "learning_rate": 1.3634872621439477e-07, "loss": 0.791, "step": 13925 }, { "epoch": 0.95, "learning_rate": 1.359857140834464e-07, "loss": 0.8037, "step": 13926 }, { "epoch": 0.95, "learning_rate": 1.3562318252679173e-07, "loss": 0.8271, "step": 13927 }, { "epoch": 0.95, "learning_rate": 1.3526113156209552e-07, "loss": 0.7549, "step": 13928 }, { "epoch": 0.95, "learning_rate": 1.3489956120699475e-07, "loss": 0.7764, "step": 13929 }, { "epoch": 0.95, "learning_rate": 1.345384714791076e-07, "loss": 0.752, "step": 13930 }, { "epoch": 0.95, "learning_rate": 1.3417786239602438e-07, "loss": 0.8105, "step": 13931 }, { "epoch": 0.95, "learning_rate": 1.338177339753155e-07, "loss": 0.7285, "step": 13932 }, { "epoch": 0.95, "learning_rate": 1.3345808623452362e-07, "loss": 0.7373, "step": 13933 }, { "epoch": 0.95, "learning_rate": 1.3309891919117358e-07, "loss": 0.7637, "step": 13934 }, { "epoch": 0.95, "learning_rate": 1.327402328627636e-07, "loss": 0.7588, "step": 13935 }, { "epoch": 0.95, "learning_rate": 1.3238202726676751e-07, "loss": 0.6592, "step": 13936 }, { "epoch": 0.95, "learning_rate": 1.3202430242063802e-07, "loss": 0.7725, "step": 13937 }, { "epoch": 0.95, "learning_rate": 1.3166705834180337e-07, "loss": 0.7109, "step": 13938 }, { "epoch": 0.95, "learning_rate": 1.3131029504766857e-07, "loss": 0.6963, "step": 13939 }, { "epoch": 0.95, "learning_rate": 1.3095401255561413e-07, "loss": 0.6836, "step": 13940 }, { "epoch": 0.95, "learning_rate": 1.305982108829995e-07, "loss": 0.8672, "step": 13941 }, { "epoch": 0.95, "learning_rate": 1.3024289004715973e-07, "loss": 0.7041, "step": 13942 }, { "epoch": 0.95, "learning_rate": 1.2988805006540317e-07, "loss": 0.7432, "step": 13943 }, { "epoch": 0.95, "learning_rate": 1.2953369095502045e-07, "loss": 0.7295, "step": 13944 }, { "epoch": 0.95, "learning_rate": 1.291798127332755e-07, "loss": 0.791, "step": 13945 }, { "epoch": 0.95, "learning_rate": 1.2882641541740793e-07, "loss": 0.7617, "step": 13946 }, { "epoch": 0.95, "learning_rate": 1.2847349902463614e-07, "loss": 0.7646, "step": 13947 }, { "epoch": 0.95, "learning_rate": 1.2812106357215414e-07, "loss": 0.7852, "step": 13948 }, { "epoch": 0.95, "learning_rate": 1.2776910907713268e-07, "loss": 0.7568, "step": 13949 }, { "epoch": 0.95, "learning_rate": 1.2741763555671805e-07, "loss": 0.7578, "step": 13950 }, { "epoch": 0.95, "learning_rate": 1.270666430280354e-07, "loss": 0.7627, "step": 13951 }, { "epoch": 0.95, "learning_rate": 1.267161315081844e-07, "loss": 0.7275, "step": 13952 }, { "epoch": 0.95, "learning_rate": 1.263661010142414e-07, "loss": 0.7832, "step": 13953 }, { "epoch": 0.95, "learning_rate": 1.2601655156326166e-07, "loss": 0.7197, "step": 13954 }, { "epoch": 0.95, "learning_rate": 1.2566748317227373e-07, "loss": 0.7559, "step": 13955 }, { "epoch": 0.95, "learning_rate": 1.2531889585828406e-07, "loss": 0.748, "step": 13956 }, { "epoch": 0.95, "learning_rate": 1.2497078963827457e-07, "loss": 0.7295, "step": 13957 }, { "epoch": 0.95, "learning_rate": 1.2462316452920954e-07, "loss": 0.7227, "step": 13958 }, { "epoch": 0.95, "learning_rate": 1.242760205480209e-07, "loss": 0.7705, "step": 13959 }, { "epoch": 0.95, "learning_rate": 1.2392935771162295e-07, "loss": 0.7197, "step": 13960 }, { "epoch": 0.95, "learning_rate": 1.235831760369055e-07, "loss": 0.7764, "step": 13961 }, { "epoch": 0.95, "learning_rate": 1.2323747554073396e-07, "loss": 0.7598, "step": 13962 }, { "epoch": 0.95, "learning_rate": 1.228922562399504e-07, "loss": 0.7314, "step": 13963 }, { "epoch": 0.95, "learning_rate": 1.2254751815137576e-07, "loss": 0.6953, "step": 13964 }, { "epoch": 0.95, "learning_rate": 1.2220326129180337e-07, "loss": 0.7266, "step": 13965 }, { "epoch": 0.95, "learning_rate": 1.2185948567800643e-07, "loss": 0.751, "step": 13966 }, { "epoch": 0.95, "learning_rate": 1.2151619132673266e-07, "loss": 0.7715, "step": 13967 }, { "epoch": 0.95, "learning_rate": 1.2117337825471087e-07, "loss": 0.6797, "step": 13968 }, { "epoch": 0.95, "learning_rate": 1.2083104647863774e-07, "loss": 0.7627, "step": 13969 }, { "epoch": 0.95, "learning_rate": 1.204891960151955e-07, "loss": 0.6699, "step": 13970 }, { "epoch": 0.95, "learning_rate": 1.2014782688103743e-07, "loss": 0.7393, "step": 13971 }, { "epoch": 0.95, "learning_rate": 1.1980693909279585e-07, "loss": 0.6748, "step": 13972 }, { "epoch": 0.95, "learning_rate": 1.1946653266707854e-07, "loss": 0.6465, "step": 13973 }, { "epoch": 0.95, "learning_rate": 1.191266076204689e-07, "loss": 0.7744, "step": 13974 }, { "epoch": 0.95, "learning_rate": 1.1878716396952928e-07, "loss": 0.6992, "step": 13975 }, { "epoch": 0.95, "learning_rate": 1.1844820173079752e-07, "loss": 0.7676, "step": 13976 }, { "epoch": 0.95, "learning_rate": 1.181097209207882e-07, "loss": 0.7793, "step": 13977 }, { "epoch": 0.95, "learning_rate": 1.1777172155599148e-07, "loss": 0.7383, "step": 13978 }, { "epoch": 0.95, "learning_rate": 1.1743420365287306e-07, "loss": 0.7354, "step": 13979 }, { "epoch": 0.95, "learning_rate": 1.1709716722787867e-07, "loss": 0.7432, "step": 13980 }, { "epoch": 0.95, "learning_rate": 1.1676061229742963e-07, "loss": 0.7617, "step": 13981 }, { "epoch": 0.95, "learning_rate": 1.1642453887791949e-07, "loss": 0.7266, "step": 13982 }, { "epoch": 0.95, "learning_rate": 1.1608894698572515e-07, "loss": 0.6943, "step": 13983 }, { "epoch": 0.95, "learning_rate": 1.1575383663719575e-07, "loss": 0.7422, "step": 13984 }, { "epoch": 0.95, "learning_rate": 1.1541920784865713e-07, "loss": 0.8145, "step": 13985 }, { "epoch": 0.95, "learning_rate": 1.1508506063641178e-07, "loss": 0.7441, "step": 13986 }, { "epoch": 0.95, "learning_rate": 1.1475139501674115e-07, "loss": 0.6562, "step": 13987 }, { "epoch": 0.95, "learning_rate": 1.144182110059e-07, "loss": 0.7881, "step": 13988 }, { "epoch": 0.95, "learning_rate": 1.1408550862012201e-07, "loss": 0.6553, "step": 13989 }, { "epoch": 0.95, "learning_rate": 1.1375328787561535e-07, "loss": 0.7812, "step": 13990 }, { "epoch": 0.95, "learning_rate": 1.1342154878856704e-07, "loss": 0.7725, "step": 13991 }, { "epoch": 0.95, "learning_rate": 1.1309029137513861e-07, "loss": 0.6826, "step": 13992 }, { "epoch": 0.95, "learning_rate": 1.1275951565146715e-07, "loss": 0.7334, "step": 13993 }, { "epoch": 0.95, "learning_rate": 1.1242922163367198e-07, "loss": 0.7051, "step": 13994 }, { "epoch": 0.95, "learning_rate": 1.1209940933784247e-07, "loss": 0.7344, "step": 13995 }, { "epoch": 0.95, "learning_rate": 1.1177007878004797e-07, "loss": 0.6533, "step": 13996 }, { "epoch": 0.95, "learning_rate": 1.1144122997633345e-07, "loss": 0.7646, "step": 13997 }, { "epoch": 0.95, "learning_rate": 1.1111286294271828e-07, "loss": 0.7979, "step": 13998 }, { "epoch": 0.95, "learning_rate": 1.1078497769520302e-07, "loss": 0.8047, "step": 13999 }, { "epoch": 0.95, "learning_rate": 1.1045757424976156e-07, "loss": 0.7461, "step": 14000 }, { "epoch": 0.95, "learning_rate": 1.1013065262234446e-07, "loss": 0.7793, "step": 14001 }, { "epoch": 0.95, "learning_rate": 1.098042128288801e-07, "loss": 0.7158, "step": 14002 }, { "epoch": 0.95, "learning_rate": 1.094782548852713e-07, "loss": 0.6504, "step": 14003 }, { "epoch": 0.95, "learning_rate": 1.0915277880740094e-07, "loss": 0.7617, "step": 14004 }, { "epoch": 0.95, "learning_rate": 1.0882778461112298e-07, "loss": 0.7236, "step": 14005 }, { "epoch": 0.95, "learning_rate": 1.0850327231227476e-07, "loss": 0.7061, "step": 14006 }, { "epoch": 0.95, "learning_rate": 1.0817924192666473e-07, "loss": 0.749, "step": 14007 }, { "epoch": 0.95, "learning_rate": 1.0785569347007807e-07, "loss": 0.7461, "step": 14008 }, { "epoch": 0.95, "learning_rate": 1.0753262695828104e-07, "loss": 0.7236, "step": 14009 }, { "epoch": 0.95, "learning_rate": 1.0721004240701106e-07, "loss": 0.7324, "step": 14010 }, { "epoch": 0.95, "learning_rate": 1.0688793983198664e-07, "loss": 0.7393, "step": 14011 }, { "epoch": 0.95, "learning_rate": 1.0656631924889749e-07, "loss": 0.7334, "step": 14012 }, { "epoch": 0.95, "learning_rate": 1.062451806734166e-07, "loss": 0.7256, "step": 14013 }, { "epoch": 0.96, "learning_rate": 1.0592452412118704e-07, "loss": 0.7246, "step": 14014 }, { "epoch": 0.96, "learning_rate": 1.0560434960783294e-07, "loss": 0.7002, "step": 14015 }, { "epoch": 0.96, "learning_rate": 1.0528465714895186e-07, "loss": 0.7178, "step": 14016 }, { "epoch": 0.96, "learning_rate": 1.049654467601191e-07, "loss": 0.6523, "step": 14017 }, { "epoch": 0.96, "learning_rate": 1.0464671845688779e-07, "loss": 0.583, "step": 14018 }, { "epoch": 0.96, "learning_rate": 1.043284722547866e-07, "loss": 0.6865, "step": 14019 }, { "epoch": 0.96, "learning_rate": 1.0401070816931869e-07, "loss": 0.6865, "step": 14020 }, { "epoch": 0.96, "learning_rate": 1.0369342621596723e-07, "loss": 0.7344, "step": 14021 }, { "epoch": 0.96, "learning_rate": 1.0337662641018875e-07, "loss": 0.7529, "step": 14022 }, { "epoch": 0.96, "learning_rate": 1.0306030876741868e-07, "loss": 0.7354, "step": 14023 }, { "epoch": 0.96, "learning_rate": 1.0274447330306691e-07, "loss": 0.7432, "step": 14024 }, { "epoch": 0.96, "learning_rate": 1.0242912003252226e-07, "loss": 0.7441, "step": 14025 }, { "epoch": 0.96, "learning_rate": 1.0211424897114908e-07, "loss": 0.748, "step": 14026 }, { "epoch": 0.96, "learning_rate": 1.0179986013428623e-07, "loss": 0.7959, "step": 14027 }, { "epoch": 0.96, "learning_rate": 1.0148595353725255e-07, "loss": 0.7559, "step": 14028 }, { "epoch": 0.96, "learning_rate": 1.0117252919533804e-07, "loss": 0.7373, "step": 14029 }, { "epoch": 0.96, "learning_rate": 1.0085958712381716e-07, "loss": 0.7637, "step": 14030 }, { "epoch": 0.96, "learning_rate": 1.0054712733793437e-07, "loss": 0.7275, "step": 14031 }, { "epoch": 0.96, "learning_rate": 1.0023514985291193e-07, "loss": 0.6953, "step": 14032 }, { "epoch": 0.96, "learning_rate": 9.992365468395104e-08, "loss": 0.7764, "step": 14033 }, { "epoch": 0.96, "learning_rate": 9.961264184622731e-08, "loss": 0.8115, "step": 14034 }, { "epoch": 0.96, "learning_rate": 9.930211135489087e-08, "loss": 0.7158, "step": 14035 }, { "epoch": 0.96, "learning_rate": 9.899206322507515e-08, "loss": 0.7783, "step": 14036 }, { "epoch": 0.96, "learning_rate": 9.86824974718814e-08, "loss": 0.7197, "step": 14037 }, { "epoch": 0.96, "learning_rate": 9.837341411039425e-08, "loss": 0.7363, "step": 14038 }, { "epoch": 0.96, "step": 14038, "total_flos": 2257997778616320.0, "train_loss": 0.8202478387345954, "train_runtime": 101491.3468, "train_samples_per_second": 9.253, "train_steps_per_second": 0.145 } ], "max_steps": 14674, "num_train_epochs": 1, "total_flos": 2257997778616320.0, "trial_name": null, "trial_params": null }