{ "best_metric": null, "best_model_checkpoint": null, "epoch": 2.9998819780479167, "eval_steps": 500, "global_step": 38127, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.00029999999949079136, "loss": 10.8263, "step": 1 }, { "epoch": 0.0, "learning_rate": 0.0002999999979631655, "loss": 9.6257, "step": 2 }, { "epoch": 0.0, "learning_rate": 0.0002999999954171225, "loss": 10.047, "step": 3 }, { "epoch": 0.0, "learning_rate": 0.00029999999185266224, "loss": 10.146, "step": 4 }, { "epoch": 0.0, "learning_rate": 0.00029999998726978487, "loss": 9.148, "step": 5 }, { "epoch": 0.0, "learning_rate": 0.0002999999816684903, "loss": 8.6304, "step": 6 }, { "epoch": 0.0, "learning_rate": 0.0002999999750487787, "loss": 8.3464, "step": 7 }, { "epoch": 0.0, "learning_rate": 0.00029999996741064997, "loss": 8.1256, "step": 8 }, { "epoch": 0.0, "learning_rate": 0.00029999995875410433, "loss": 7.8647, "step": 9 }, { "epoch": 0.0, "learning_rate": 0.0002999999490791416, "loss": 7.6842, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.0002999999383857622, "loss": 7.5368, "step": 11 }, { "epoch": 0.0, "learning_rate": 0.00029999992667396587, "loss": 7.4578, "step": 12 }, { "epoch": 0.0, "learning_rate": 0.0002999999139437528, "loss": 7.3552, "step": 13 }, { "epoch": 0.0, "learning_rate": 0.0002999999001951231, "loss": 7.3954, "step": 14 }, { "epoch": 0.0, "learning_rate": 0.0002999998854280769, "loss": 7.3702, "step": 15 }, { "epoch": 0.0, "learning_rate": 0.0002999998696426142, "loss": 7.3327, "step": 16 }, { "epoch": 0.0, "learning_rate": 0.0002999998528387352, "loss": 7.3107, "step": 17 }, { "epoch": 0.0, "learning_rate": 0.00029999983501643996, "loss": 7.2468, "step": 18 }, { "epoch": 0.0, "learning_rate": 0.00029999981617572863, "loss": 7.2979, "step": 19 }, { "epoch": 0.0, "learning_rate": 0.0002999997963166013, "loss": 7.2101, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.0002999997754390582, "loss": 7.2101, "step": 21 }, { "epoch": 0.0, "learning_rate": 0.0002999997535430993, "loss": 7.1943, "step": 22 }, { "epoch": 0.0, "learning_rate": 0.0002999997306287249, "loss": 7.1691, "step": 23 }, { "epoch": 0.0, "learning_rate": 0.00029999970669593513, "loss": 7.0904, "step": 24 }, { "epoch": 0.0, "learning_rate": 0.0002999996817447301, "loss": 7.097, "step": 25 }, { "epoch": 0.0, "learning_rate": 0.00029999965577511, "loss": 7.1219, "step": 26 }, { "epoch": 0.0, "learning_rate": 0.00029999962878707505, "loss": 7.0476, "step": 27 }, { "epoch": 0.0, "learning_rate": 0.00029999960078062535, "loss": 7.0578, "step": 28 }, { "epoch": 0.0, "learning_rate": 0.0002999995717557612, "loss": 7.0238, "step": 29 }, { "epoch": 0.0, "learning_rate": 0.00029999954171248266, "loss": 6.9804, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.00029999951065079, "loss": 6.997, "step": 31 }, { "epoch": 0.0, "learning_rate": 0.00029999947857068353, "loss": 6.9591, "step": 32 }, { "epoch": 0.0, "learning_rate": 0.00029999944547216335, "loss": 6.9196, "step": 33 }, { "epoch": 0.0, "learning_rate": 0.0002999994113552296, "loss": 6.8851, "step": 34 }, { "epoch": 0.0, "learning_rate": 0.0002999993762198828, "loss": 6.8979, "step": 35 }, { "epoch": 0.0, "learning_rate": 0.0002999993400661229, "loss": 6.788, "step": 36 }, { "epoch": 0.0, "learning_rate": 0.0002999993028939503, "loss": 6.7845, "step": 37 }, { "epoch": 0.0, "learning_rate": 0.0002999992647033652, "loss": 6.7746, "step": 38 }, { "epoch": 0.0, "learning_rate": 0.0002999992254943678, "loss": 6.7175, "step": 39 }, { "epoch": 0.0, "learning_rate": 0.0002999991852669585, "loss": 6.6889, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.00029999914402113753, "loss": 6.6795, "step": 41 }, { "epoch": 0.0, "learning_rate": 0.00029999910175690516, "loss": 6.6665, "step": 42 }, { "epoch": 0.0, "learning_rate": 0.0002999990584742616, "loss": 6.6377, "step": 43 }, { "epoch": 0.0, "learning_rate": 0.0002999990141732072, "loss": 6.5646, "step": 44 }, { "epoch": 0.0, "learning_rate": 0.00029999896885374235, "loss": 6.4904, "step": 45 }, { "epoch": 0.0, "learning_rate": 0.00029999892251586724, "loss": 6.4492, "step": 46 }, { "epoch": 0.0, "learning_rate": 0.0002999988751595822, "loss": 6.4633, "step": 47 }, { "epoch": 0.0, "learning_rate": 0.0002999988267848876, "loss": 6.4431, "step": 48 }, { "epoch": 0.0, "learning_rate": 0.00029999877739178376, "loss": 6.4306, "step": 49 }, { "epoch": 0.0, "learning_rate": 0.00029999872698027095, "loss": 6.4155, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.0002999986755503496, "loss": 6.3593, "step": 51 }, { "epoch": 0.0, "learning_rate": 0.00029999862310202, "loss": 6.3509, "step": 52 }, { "epoch": 0.0, "learning_rate": 0.0002999985696352825, "loss": 6.2662, "step": 53 }, { "epoch": 0.0, "learning_rate": 0.00029999851515013755, "loss": 6.3003, "step": 54 }, { "epoch": 0.0, "learning_rate": 0.00029999845964658544, "loss": 6.2946, "step": 55 }, { "epoch": 0.0, "learning_rate": 0.0002999984031246265, "loss": 6.2259, "step": 56 }, { "epoch": 0.0, "learning_rate": 0.00029999834558426124, "loss": 6.1623, "step": 57 }, { "epoch": 0.0, "learning_rate": 0.00029999828702549, "loss": 6.1292, "step": 58 }, { "epoch": 0.0, "learning_rate": 0.00029999822744831316, "loss": 6.137, "step": 59 }, { "epoch": 0.0, "learning_rate": 0.00029999816685273106, "loss": 6.0887, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.00029999810523874426, "loss": 6.0979, "step": 61 }, { "epoch": 0.0, "learning_rate": 0.00029999804260635307, "loss": 6.0342, "step": 62 }, { "epoch": 0.0, "learning_rate": 0.000299997978955558, "loss": 5.9838, "step": 63 }, { "epoch": 0.01, "learning_rate": 0.00029999791428635933, "loss": 5.9474, "step": 64 }, { "epoch": 0.01, "learning_rate": 0.0002999978485987577, "loss": 5.9451, "step": 65 }, { "epoch": 0.01, "learning_rate": 0.0002999977818927534, "loss": 5.9931, "step": 66 }, { "epoch": 0.01, "learning_rate": 0.0002999977141683469, "loss": 5.8736, "step": 67 }, { "epoch": 0.01, "learning_rate": 0.0002999976454255388, "loss": 5.8801, "step": 68 }, { "epoch": 0.01, "learning_rate": 0.00029999757566432934, "loss": 5.8562, "step": 69 }, { "epoch": 0.01, "learning_rate": 0.0002999975048847192, "loss": 5.8236, "step": 70 }, { "epoch": 0.01, "learning_rate": 0.00029999743308670873, "loss": 5.8224, "step": 71 }, { "epoch": 0.01, "learning_rate": 0.0002999973602702985, "loss": 5.7981, "step": 72 }, { "epoch": 0.01, "learning_rate": 0.00029999728643548897, "loss": 5.7025, "step": 73 }, { "epoch": 0.01, "learning_rate": 0.00029999721158228065, "loss": 5.6899, "step": 74 }, { "epoch": 0.01, "learning_rate": 0.00029999713571067396, "loss": 5.653, "step": 75 }, { "epoch": 0.01, "learning_rate": 0.0002999970588206696, "loss": 5.6553, "step": 76 }, { "epoch": 0.01, "learning_rate": 0.00029999698091226793, "loss": 5.5973, "step": 77 }, { "epoch": 0.01, "learning_rate": 0.0002999969019854695, "loss": 5.6341, "step": 78 }, { "epoch": 0.01, "learning_rate": 0.00029999682204027495, "loss": 5.6035, "step": 79 }, { "epoch": 0.01, "learning_rate": 0.0002999967410766848, "loss": 5.5762, "step": 80 }, { "epoch": 0.01, "learning_rate": 0.0002999966590946994, "loss": 5.5966, "step": 81 }, { "epoch": 0.01, "learning_rate": 0.00029999657609431957, "loss": 5.6069, "step": 82 }, { "epoch": 0.01, "learning_rate": 0.00029999649207554575, "loss": 5.51, "step": 83 }, { "epoch": 0.01, "learning_rate": 0.0002999964070383785, "loss": 5.5384, "step": 84 }, { "epoch": 0.01, "learning_rate": 0.0002999963209828184, "loss": 5.4613, "step": 85 }, { "epoch": 0.01, "learning_rate": 0.0002999962339088661, "loss": 5.5278, "step": 86 }, { "epoch": 0.01, "learning_rate": 0.0002999961458165221, "loss": 5.4587, "step": 87 }, { "epoch": 0.01, "learning_rate": 0.00029999605670578706, "loss": 5.4138, "step": 88 }, { "epoch": 0.01, "learning_rate": 0.00029999596657666165, "loss": 5.4319, "step": 89 }, { "epoch": 0.01, "learning_rate": 0.00029999587542914633, "loss": 5.3703, "step": 90 }, { "epoch": 0.01, "learning_rate": 0.00029999578326324176, "loss": 5.3929, "step": 91 }, { "epoch": 0.01, "learning_rate": 0.00029999569007894863, "loss": 5.3934, "step": 92 }, { "epoch": 0.01, "learning_rate": 0.00029999559587626755, "loss": 5.3809, "step": 93 }, { "epoch": 0.01, "learning_rate": 0.00029999550065519916, "loss": 5.4258, "step": 94 }, { "epoch": 0.01, "learning_rate": 0.00029999540441574406, "loss": 5.3402, "step": 95 }, { "epoch": 0.01, "learning_rate": 0.000299995307157903, "loss": 5.3044, "step": 96 }, { "epoch": 0.01, "learning_rate": 0.0002999952088816765, "loss": 5.387, "step": 97 }, { "epoch": 0.01, "learning_rate": 0.00029999510958706534, "loss": 5.3063, "step": 98 }, { "epoch": 0.01, "learning_rate": 0.0002999950092740702, "loss": 5.2135, "step": 99 }, { "epoch": 0.01, "learning_rate": 0.0002999949079426916, "loss": 5.219, "step": 100 }, { "epoch": 0.01, "learning_rate": 0.00029999480559293046, "loss": 5.1805, "step": 101 }, { "epoch": 0.01, "learning_rate": 0.0002999947022247873, "loss": 5.1834, "step": 102 }, { "epoch": 0.01, "learning_rate": 0.000299994597838263, "loss": 5.2355, "step": 103 }, { "epoch": 0.01, "learning_rate": 0.000299994492433358, "loss": 5.1719, "step": 104 }, { "epoch": 0.01, "learning_rate": 0.00029999438601007323, "loss": 5.1662, "step": 105 }, { "epoch": 0.01, "learning_rate": 0.00029999427856840943, "loss": 5.1674, "step": 106 }, { "epoch": 0.01, "learning_rate": 0.00029999417010836716, "loss": 5.1132, "step": 107 }, { "epoch": 0.01, "learning_rate": 0.0002999940606299473, "loss": 5.126, "step": 108 }, { "epoch": 0.01, "learning_rate": 0.00029999395013315046, "loss": 5.1225, "step": 109 }, { "epoch": 0.01, "learning_rate": 0.00029999383861797755, "loss": 5.104, "step": 110 }, { "epoch": 0.01, "learning_rate": 0.00029999372608442926, "loss": 5.0844, "step": 111 }, { "epoch": 0.01, "learning_rate": 0.0002999936125325063, "loss": 5.047, "step": 112 }, { "epoch": 0.01, "learning_rate": 0.00029999349796220947, "loss": 5.0473, "step": 113 }, { "epoch": 0.01, "learning_rate": 0.00029999338237353965, "loss": 4.9838, "step": 114 }, { "epoch": 0.01, "learning_rate": 0.00029999326576649743, "loss": 5.0187, "step": 115 }, { "epoch": 0.01, "learning_rate": 0.00029999314814108374, "loss": 4.9802, "step": 116 }, { "epoch": 0.01, "learning_rate": 0.0002999930294972994, "loss": 5.0482, "step": 117 }, { "epoch": 0.01, "learning_rate": 0.00029999290983514506, "loss": 5.0848, "step": 118 }, { "epoch": 0.01, "learning_rate": 0.00029999278915462176, "loss": 4.987, "step": 119 }, { "epoch": 0.01, "learning_rate": 0.00029999266745573013, "loss": 5.0122, "step": 120 }, { "epoch": 0.01, "learning_rate": 0.00029999254473847103, "loss": 5.0057, "step": 121 }, { "epoch": 0.01, "learning_rate": 0.0002999924210028454, "loss": 4.9281, "step": 122 }, { "epoch": 0.01, "learning_rate": 0.0002999922962488539, "loss": 4.9386, "step": 123 }, { "epoch": 0.01, "learning_rate": 0.00029999217047649757, "loss": 4.9355, "step": 124 }, { "epoch": 0.01, "learning_rate": 0.0002999920436857772, "loss": 4.8219, "step": 125 }, { "epoch": 0.01, "learning_rate": 0.00029999191587669355, "loss": 4.8698, "step": 126 }, { "epoch": 0.01, "learning_rate": 0.00029999178704924755, "loss": 4.897, "step": 127 }, { "epoch": 0.01, "learning_rate": 0.00029999165720344016, "loss": 4.8923, "step": 128 }, { "epoch": 0.01, "learning_rate": 0.00029999152633927213, "loss": 4.8457, "step": 129 }, { "epoch": 0.01, "learning_rate": 0.00029999139445674444, "loss": 4.8464, "step": 130 }, { "epoch": 0.01, "learning_rate": 0.00029999126155585797, "loss": 4.8345, "step": 131 }, { "epoch": 0.01, "learning_rate": 0.00029999112763661357, "loss": 4.8542, "step": 132 }, { "epoch": 0.01, "learning_rate": 0.0002999909926990122, "loss": 4.8239, "step": 133 }, { "epoch": 0.01, "learning_rate": 0.00029999085674305473, "loss": 4.8497, "step": 134 }, { "epoch": 0.01, "learning_rate": 0.0002999907197687422, "loss": 4.7598, "step": 135 }, { "epoch": 0.01, "learning_rate": 0.00029999058177607537, "loss": 4.8297, "step": 136 }, { "epoch": 0.01, "learning_rate": 0.0002999904427650553, "loss": 4.7698, "step": 137 }, { "epoch": 0.01, "learning_rate": 0.0002999903027356829, "loss": 4.781, "step": 138 }, { "epoch": 0.01, "learning_rate": 0.0002999901616879591, "loss": 4.7935, "step": 139 }, { "epoch": 0.01, "learning_rate": 0.0002999900196218849, "loss": 4.7196, "step": 140 }, { "epoch": 0.01, "learning_rate": 0.0002999898765374612, "loss": 4.7244, "step": 141 }, { "epoch": 0.01, "learning_rate": 0.000299989732434689, "loss": 4.6923, "step": 142 }, { "epoch": 0.01, "learning_rate": 0.0002999895873135693, "loss": 4.7321, "step": 143 }, { "epoch": 0.01, "learning_rate": 0.00029998944117410307, "loss": 4.6675, "step": 144 }, { "epoch": 0.01, "learning_rate": 0.00029998929401629137, "loss": 4.6667, "step": 145 }, { "epoch": 0.01, "learning_rate": 0.00029998914584013507, "loss": 4.659, "step": 146 }, { "epoch": 0.01, "learning_rate": 0.00029998899664563527, "loss": 4.7102, "step": 147 }, { "epoch": 0.01, "learning_rate": 0.00029998884643279294, "loss": 4.6546, "step": 148 }, { "epoch": 0.01, "learning_rate": 0.0002999886952016091, "loss": 4.6442, "step": 149 }, { "epoch": 0.01, "learning_rate": 0.00029998854295208477, "loss": 4.6421, "step": 150 }, { "epoch": 0.01, "learning_rate": 0.00029998838968422104, "loss": 4.6408, "step": 151 }, { "epoch": 0.01, "learning_rate": 0.0002999882353980189, "loss": 4.6317, "step": 152 }, { "epoch": 0.01, "learning_rate": 0.0002999880800934795, "loss": 4.5644, "step": 153 }, { "epoch": 0.01, "learning_rate": 0.0002999879237706037, "loss": 4.6313, "step": 154 }, { "epoch": 0.01, "learning_rate": 0.00029998776642939265, "loss": 4.623, "step": 155 }, { "epoch": 0.01, "learning_rate": 0.0002999876080698475, "loss": 4.5865, "step": 156 }, { "epoch": 0.01, "learning_rate": 0.00029998744869196925, "loss": 4.4979, "step": 157 }, { "epoch": 0.01, "learning_rate": 0.000299987288295759, "loss": 4.5336, "step": 158 }, { "epoch": 0.01, "learning_rate": 0.0002999871268812178, "loss": 4.5288, "step": 159 }, { "epoch": 0.01, "learning_rate": 0.0002999869644483468, "loss": 4.4542, "step": 160 }, { "epoch": 0.01, "learning_rate": 0.0002999868009971471, "loss": 4.4658, "step": 161 }, { "epoch": 0.01, "learning_rate": 0.00029998663652761975, "loss": 4.4747, "step": 162 }, { "epoch": 0.01, "learning_rate": 0.0002999864710397659, "loss": 4.4708, "step": 163 }, { "epoch": 0.01, "learning_rate": 0.00029998630453358674, "loss": 4.477, "step": 164 }, { "epoch": 0.01, "learning_rate": 0.0002999861370090833, "loss": 4.5103, "step": 165 }, { "epoch": 0.01, "learning_rate": 0.0002999859684662568, "loss": 4.4611, "step": 166 }, { "epoch": 0.01, "learning_rate": 0.00029998579890510825, "loss": 4.4862, "step": 167 }, { "epoch": 0.01, "learning_rate": 0.000299985628325639, "loss": 4.4651, "step": 168 }, { "epoch": 0.01, "learning_rate": 0.0002999854567278501, "loss": 4.4672, "step": 169 }, { "epoch": 0.01, "learning_rate": 0.00029998528411174266, "loss": 4.4404, "step": 170 }, { "epoch": 0.01, "learning_rate": 0.0002999851104773179, "loss": 4.4826, "step": 171 }, { "epoch": 0.01, "learning_rate": 0.00029998493582457706, "loss": 4.4619, "step": 172 }, { "epoch": 0.01, "learning_rate": 0.00029998476015352123, "loss": 4.3926, "step": 173 }, { "epoch": 0.01, "learning_rate": 0.00029998458346415166, "loss": 4.385, "step": 174 }, { "epoch": 0.01, "learning_rate": 0.00029998440575646954, "loss": 4.3887, "step": 175 }, { "epoch": 0.01, "learning_rate": 0.00029998422703047606, "loss": 4.4201, "step": 176 }, { "epoch": 0.01, "learning_rate": 0.00029998404728617253, "loss": 4.3839, "step": 177 }, { "epoch": 0.01, "learning_rate": 0.00029998386652355997, "loss": 4.4229, "step": 178 }, { "epoch": 0.01, "learning_rate": 0.0002999836847426398, "loss": 4.3861, "step": 179 }, { "epoch": 0.01, "learning_rate": 0.00029998350194341313, "loss": 4.332, "step": 180 }, { "epoch": 0.01, "learning_rate": 0.0002999833181258813, "loss": 4.3391, "step": 181 }, { "epoch": 0.01, "learning_rate": 0.0002999831332900455, "loss": 4.3121, "step": 182 }, { "epoch": 0.01, "learning_rate": 0.0002999829474359069, "loss": 4.3118, "step": 183 }, { "epoch": 0.01, "learning_rate": 0.000299982760563467, "loss": 4.3351, "step": 184 }, { "epoch": 0.01, "learning_rate": 0.00029998257267272685, "loss": 4.3679, "step": 185 }, { "epoch": 0.01, "learning_rate": 0.00029998238376368773, "loss": 4.2416, "step": 186 }, { "epoch": 0.01, "learning_rate": 0.00029998219383635107, "loss": 4.3281, "step": 187 }, { "epoch": 0.01, "learning_rate": 0.00029998200289071806, "loss": 4.278, "step": 188 }, { "epoch": 0.01, "learning_rate": 0.00029998181092679, "loss": 4.2585, "step": 189 }, { "epoch": 0.01, "learning_rate": 0.0002999816179445683, "loss": 4.3055, "step": 190 }, { "epoch": 0.02, "learning_rate": 0.0002999814239440541, "loss": 4.1961, "step": 191 }, { "epoch": 0.02, "learning_rate": 0.0002999812289252488, "loss": 4.2319, "step": 192 }, { "epoch": 0.02, "learning_rate": 0.0002999810328881538, "loss": 4.2092, "step": 193 }, { "epoch": 0.02, "learning_rate": 0.0002999808358327702, "loss": 4.3242, "step": 194 }, { "epoch": 0.02, "learning_rate": 0.00029998063775909964, "loss": 4.1855, "step": 195 }, { "epoch": 0.02, "learning_rate": 0.00029998043866714323, "loss": 4.303, "step": 196 }, { "epoch": 0.02, "learning_rate": 0.00029998023855690246, "loss": 4.1591, "step": 197 }, { "epoch": 0.02, "learning_rate": 0.00029998003742837863, "loss": 4.1983, "step": 198 }, { "epoch": 0.02, "learning_rate": 0.0002999798352815731, "loss": 4.3276, "step": 199 }, { "epoch": 0.02, "learning_rate": 0.0002999796321164872, "loss": 4.2653, "step": 200 }, { "epoch": 0.02, "learning_rate": 0.00029997942793312245, "loss": 4.2074, "step": 201 }, { "epoch": 0.02, "learning_rate": 0.0002999792227314801, "loss": 4.2234, "step": 202 }, { "epoch": 0.02, "learning_rate": 0.0002999790165115616, "loss": 4.2097, "step": 203 }, { "epoch": 0.02, "learning_rate": 0.0002999788092733683, "loss": 4.2144, "step": 204 }, { "epoch": 0.02, "learning_rate": 0.0002999786010169017, "loss": 4.1698, "step": 205 }, { "epoch": 0.02, "learning_rate": 0.0002999783917421632, "loss": 4.2162, "step": 206 }, { "epoch": 0.02, "learning_rate": 0.00029997818144915416, "loss": 4.1766, "step": 207 }, { "epoch": 0.02, "learning_rate": 0.000299977970137876, "loss": 4.0721, "step": 208 }, { "epoch": 0.02, "learning_rate": 0.00029997775780833024, "loss": 4.1178, "step": 209 }, { "epoch": 0.02, "learning_rate": 0.0002999775444605182, "loss": 4.1111, "step": 210 }, { "epoch": 0.02, "learning_rate": 0.00029997733009444146, "loss": 4.1418, "step": 211 }, { "epoch": 0.02, "learning_rate": 0.0002999771147101014, "loss": 4.1061, "step": 212 }, { "epoch": 0.02, "learning_rate": 0.0002999768983074995, "loss": 4.1108, "step": 213 }, { "epoch": 0.02, "learning_rate": 0.00029997668088663714, "loss": 4.1349, "step": 214 }, { "epoch": 0.02, "learning_rate": 0.00029997646244751597, "loss": 4.0807, "step": 215 }, { "epoch": 0.02, "learning_rate": 0.00029997624299013737, "loss": 4.1052, "step": 216 }, { "epoch": 0.02, "learning_rate": 0.0002999760225145028, "loss": 4.118, "step": 217 }, { "epoch": 0.02, "learning_rate": 0.0002999758010206139, "loss": 4.1122, "step": 218 }, { "epoch": 0.02, "learning_rate": 0.000299975578508472, "loss": 4.1162, "step": 219 }, { "epoch": 0.02, "learning_rate": 0.0002999753549780787, "loss": 4.1254, "step": 220 }, { "epoch": 0.02, "learning_rate": 0.00029997513042943544, "loss": 4.0779, "step": 221 }, { "epoch": 0.02, "learning_rate": 0.0002999749048625439, "loss": 4.0547, "step": 222 }, { "epoch": 0.02, "learning_rate": 0.0002999746782774055, "loss": 4.081, "step": 223 }, { "epoch": 0.02, "learning_rate": 0.00029997445067402175, "loss": 4.0886, "step": 224 }, { "epoch": 0.02, "learning_rate": 0.0002999742220523943, "loss": 4.0712, "step": 225 }, { "epoch": 0.02, "learning_rate": 0.00029997399241252465, "loss": 4.1302, "step": 226 }, { "epoch": 0.02, "learning_rate": 0.0002999737617544143, "loss": 3.97, "step": 227 }, { "epoch": 0.02, "learning_rate": 0.0002999735300780649, "loss": 4.0399, "step": 228 }, { "epoch": 0.02, "learning_rate": 0.00029997329738347796, "loss": 4.0173, "step": 229 }, { "epoch": 0.02, "learning_rate": 0.00029997306367065516, "loss": 4.026, "step": 230 }, { "epoch": 0.02, "learning_rate": 0.000299972828939598, "loss": 4.0269, "step": 231 }, { "epoch": 0.02, "learning_rate": 0.00029997259319030804, "loss": 4.037, "step": 232 }, { "epoch": 0.02, "learning_rate": 0.0002999723564227869, "loss": 3.9136, "step": 233 }, { "epoch": 0.02, "learning_rate": 0.00029997211863703636, "loss": 3.9446, "step": 234 }, { "epoch": 0.02, "learning_rate": 0.0002999718798330578, "loss": 3.9837, "step": 235 }, { "epoch": 0.02, "learning_rate": 0.00029997164001085297, "loss": 4.0232, "step": 236 }, { "epoch": 0.02, "learning_rate": 0.00029997139917042345, "loss": 3.9559, "step": 237 }, { "epoch": 0.02, "learning_rate": 0.00029997115731177093, "loss": 3.9762, "step": 238 }, { "epoch": 0.02, "learning_rate": 0.000299970914434897, "loss": 3.9527, "step": 239 }, { "epoch": 0.02, "learning_rate": 0.00029997067053980325, "loss": 3.9775, "step": 240 }, { "epoch": 0.02, "learning_rate": 0.0002999704256264915, "loss": 3.9603, "step": 241 }, { "epoch": 0.02, "learning_rate": 0.00029997017969496327, "loss": 3.9555, "step": 242 }, { "epoch": 0.02, "learning_rate": 0.0002999699327452203, "loss": 3.9495, "step": 243 }, { "epoch": 0.02, "learning_rate": 0.0002999696847772642, "loss": 3.9491, "step": 244 }, { "epoch": 0.02, "learning_rate": 0.00029996943579109676, "loss": 3.9303, "step": 245 }, { "epoch": 0.02, "learning_rate": 0.0002999691857867196, "loss": 3.8839, "step": 246 }, { "epoch": 0.02, "learning_rate": 0.0002999689347641344, "loss": 3.9252, "step": 247 }, { "epoch": 0.02, "learning_rate": 0.00029996868272334293, "loss": 3.9429, "step": 248 }, { "epoch": 0.02, "learning_rate": 0.0002999684296643468, "loss": 3.9003, "step": 249 }, { "epoch": 0.02, "learning_rate": 0.00029996817558714786, "loss": 3.9223, "step": 250 }, { "epoch": 0.02, "learning_rate": 0.00029996792049174776, "loss": 3.9366, "step": 251 }, { "epoch": 0.02, "learning_rate": 0.0002999676643781482, "loss": 3.9667, "step": 252 }, { "epoch": 0.02, "learning_rate": 0.000299967407246351, "loss": 3.8674, "step": 253 }, { "epoch": 0.02, "learning_rate": 0.0002999671490963578, "loss": 3.8993, "step": 254 }, { "epoch": 0.02, "learning_rate": 0.0002999668899281705, "loss": 3.8674, "step": 255 }, { "epoch": 0.02, "learning_rate": 0.00029996662974179076, "loss": 3.8797, "step": 256 }, { "epoch": 0.02, "learning_rate": 0.0002999663685372203, "loss": 3.8734, "step": 257 }, { "epoch": 0.02, "learning_rate": 0.00029996610631446096, "loss": 3.8857, "step": 258 }, { "epoch": 0.02, "learning_rate": 0.0002999658430735146, "loss": 3.7975, "step": 259 }, { "epoch": 0.02, "learning_rate": 0.0002999655788143829, "loss": 3.9391, "step": 260 }, { "epoch": 0.02, "learning_rate": 0.00029996531353706764, "loss": 3.8268, "step": 261 }, { "epoch": 0.02, "learning_rate": 0.00029996504724157065, "loss": 3.8626, "step": 262 }, { "epoch": 0.02, "learning_rate": 0.00029996477992789376, "loss": 3.8168, "step": 263 }, { "epoch": 0.02, "learning_rate": 0.0002999645115960388, "loss": 3.8726, "step": 264 }, { "epoch": 0.02, "learning_rate": 0.00029996424224600754, "loss": 3.8246, "step": 265 }, { "epoch": 0.02, "learning_rate": 0.00029996397187780186, "loss": 3.8001, "step": 266 }, { "epoch": 0.02, "learning_rate": 0.00029996370049142353, "loss": 3.7944, "step": 267 }, { "epoch": 0.02, "learning_rate": 0.0002999634280868744, "loss": 3.6991, "step": 268 }, { "epoch": 0.02, "learning_rate": 0.0002999631546641564, "loss": 3.8191, "step": 269 }, { "epoch": 0.02, "learning_rate": 0.0002999628802232713, "loss": 3.7679, "step": 270 }, { "epoch": 0.02, "learning_rate": 0.0002999626047642211, "loss": 3.8535, "step": 271 }, { "epoch": 0.02, "learning_rate": 0.0002999623282870075, "loss": 3.7943, "step": 272 }, { "epoch": 0.02, "learning_rate": 0.00029996205079163243, "loss": 3.7432, "step": 273 }, { "epoch": 0.02, "learning_rate": 0.00029996177227809776, "loss": 3.7871, "step": 274 }, { "epoch": 0.02, "learning_rate": 0.00029996149274640554, "loss": 3.771, "step": 275 }, { "epoch": 0.02, "learning_rate": 0.00029996121219655743, "loss": 3.7222, "step": 276 }, { "epoch": 0.02, "learning_rate": 0.00029996093062855544, "loss": 3.774, "step": 277 }, { "epoch": 0.02, "learning_rate": 0.00029996064804240153, "loss": 3.6882, "step": 278 }, { "epoch": 0.02, "learning_rate": 0.0002999603644380976, "loss": 3.7667, "step": 279 }, { "epoch": 0.02, "learning_rate": 0.0002999600798156455, "loss": 3.8107, "step": 280 }, { "epoch": 0.02, "learning_rate": 0.0002999597941750472, "loss": 3.7369, "step": 281 }, { "epoch": 0.02, "learning_rate": 0.0002999595075163047, "loss": 3.715, "step": 282 }, { "epoch": 0.02, "learning_rate": 0.0002999592198394199, "loss": 3.7312, "step": 283 }, { "epoch": 0.02, "learning_rate": 0.00029995893114439473, "loss": 3.7781, "step": 284 }, { "epoch": 0.02, "learning_rate": 0.00029995864143123117, "loss": 3.747, "step": 285 }, { "epoch": 0.02, "learning_rate": 0.0002999583506999312, "loss": 3.7143, "step": 286 }, { "epoch": 0.02, "learning_rate": 0.00029995805895049674, "loss": 3.7797, "step": 287 }, { "epoch": 0.02, "learning_rate": 0.0002999577661829299, "loss": 3.7805, "step": 288 }, { "epoch": 0.02, "learning_rate": 0.0002999574723972325, "loss": 3.788, "step": 289 }, { "epoch": 0.02, "learning_rate": 0.0002999571775934066, "loss": 3.7218, "step": 290 }, { "epoch": 0.02, "learning_rate": 0.0002999568817714543, "loss": 3.7922, "step": 291 }, { "epoch": 0.02, "learning_rate": 0.00029995658493137746, "loss": 3.691, "step": 292 }, { "epoch": 0.02, "learning_rate": 0.0002999562870731782, "loss": 3.6587, "step": 293 }, { "epoch": 0.02, "learning_rate": 0.0002999559881968585, "loss": 3.7278, "step": 294 }, { "epoch": 0.02, "learning_rate": 0.0002999556883024204, "loss": 3.6881, "step": 295 }, { "epoch": 0.02, "learning_rate": 0.0002999553873898659, "loss": 3.7996, "step": 296 }, { "epoch": 0.02, "learning_rate": 0.0002999550854591971, "loss": 3.6761, "step": 297 }, { "epoch": 0.02, "learning_rate": 0.000299954782510416, "loss": 3.6604, "step": 298 }, { "epoch": 0.02, "learning_rate": 0.0002999544785435247, "loss": 3.622, "step": 299 }, { "epoch": 0.02, "learning_rate": 0.0002999541735585252, "loss": 3.7345, "step": 300 }, { "epoch": 0.02, "learning_rate": 0.00029995386755541964, "loss": 3.678, "step": 301 }, { "epoch": 0.02, "learning_rate": 0.0002999535605342101, "loss": 3.7082, "step": 302 }, { "epoch": 0.02, "learning_rate": 0.00029995325249489857, "loss": 3.7032, "step": 303 }, { "epoch": 0.02, "learning_rate": 0.00029995294343748724, "loss": 3.6546, "step": 304 }, { "epoch": 0.02, "learning_rate": 0.0002999526333619782, "loss": 3.7053, "step": 305 }, { "epoch": 0.02, "learning_rate": 0.00029995232226837353, "loss": 3.6493, "step": 306 }, { "epoch": 0.02, "learning_rate": 0.0002999520101566753, "loss": 3.6268, "step": 307 }, { "epoch": 0.02, "learning_rate": 0.0002999516970268857, "loss": 3.6729, "step": 308 }, { "epoch": 0.02, "learning_rate": 0.00029995138287900684, "loss": 3.6733, "step": 309 }, { "epoch": 0.02, "learning_rate": 0.0002999510677130408, "loss": 3.5923, "step": 310 }, { "epoch": 0.02, "learning_rate": 0.00029995075152898976, "loss": 3.6958, "step": 311 }, { "epoch": 0.02, "learning_rate": 0.00029995043432685595, "loss": 3.6217, "step": 312 }, { "epoch": 0.02, "learning_rate": 0.00029995011610664134, "loss": 3.6087, "step": 313 }, { "epoch": 0.02, "learning_rate": 0.0002999497968683482, "loss": 3.6249, "step": 314 }, { "epoch": 0.02, "learning_rate": 0.0002999494766119787, "loss": 3.6491, "step": 315 }, { "epoch": 0.02, "learning_rate": 0.0002999491553375351, "loss": 3.591, "step": 316 }, { "epoch": 0.02, "learning_rate": 0.0002999488330450194, "loss": 3.6178, "step": 317 }, { "epoch": 0.03, "learning_rate": 0.00029994850973443383, "loss": 3.6651, "step": 318 }, { "epoch": 0.03, "learning_rate": 0.0002999481854057807, "loss": 3.5771, "step": 319 }, { "epoch": 0.03, "learning_rate": 0.0002999478600590621, "loss": 3.6254, "step": 320 }, { "epoch": 0.03, "learning_rate": 0.00029994753369428024, "loss": 3.5805, "step": 321 }, { "epoch": 0.03, "learning_rate": 0.00029994720631143745, "loss": 3.656, "step": 322 }, { "epoch": 0.03, "learning_rate": 0.00029994687791053587, "loss": 3.6891, "step": 323 }, { "epoch": 0.03, "learning_rate": 0.0002999465484915777, "loss": 3.5846, "step": 324 }, { "epoch": 0.03, "learning_rate": 0.0002999462180545653, "loss": 3.6018, "step": 325 }, { "epoch": 0.03, "learning_rate": 0.0002999458865995007, "loss": 3.5023, "step": 326 }, { "epoch": 0.03, "learning_rate": 0.0002999455541263863, "loss": 3.5587, "step": 327 }, { "epoch": 0.03, "learning_rate": 0.0002999452206352244, "loss": 3.6164, "step": 328 }, { "epoch": 0.03, "learning_rate": 0.0002999448861260172, "loss": 3.5607, "step": 329 }, { "epoch": 0.03, "learning_rate": 0.0002999445505987669, "loss": 3.6474, "step": 330 }, { "epoch": 0.03, "learning_rate": 0.00029994421405347586, "loss": 3.5786, "step": 331 }, { "epoch": 0.03, "learning_rate": 0.0002999438764901464, "loss": 3.5564, "step": 332 }, { "epoch": 0.03, "learning_rate": 0.0002999435379087808, "loss": 3.5337, "step": 333 }, { "epoch": 0.03, "learning_rate": 0.00029994319830938123, "loss": 3.5182, "step": 334 }, { "epoch": 0.03, "learning_rate": 0.0002999428576919501, "loss": 3.5075, "step": 335 }, { "epoch": 0.03, "learning_rate": 0.00029994251605648973, "loss": 3.6318, "step": 336 }, { "epoch": 0.03, "learning_rate": 0.00029994217340300244, "loss": 3.6346, "step": 337 }, { "epoch": 0.03, "learning_rate": 0.0002999418297314905, "loss": 3.4845, "step": 338 }, { "epoch": 0.03, "learning_rate": 0.00029994148504195633, "loss": 3.5481, "step": 339 }, { "epoch": 0.03, "learning_rate": 0.0002999411393344022, "loss": 3.4799, "step": 340 }, { "epoch": 0.03, "learning_rate": 0.00029994079260883046, "loss": 3.5433, "step": 341 }, { "epoch": 0.03, "learning_rate": 0.0002999404448652435, "loss": 3.5505, "step": 342 }, { "epoch": 0.03, "learning_rate": 0.0002999400961036437, "loss": 3.5395, "step": 343 }, { "epoch": 0.03, "learning_rate": 0.0002999397463240333, "loss": 3.5285, "step": 344 }, { "epoch": 0.03, "learning_rate": 0.0002999393955264149, "loss": 3.5803, "step": 345 }, { "epoch": 0.03, "learning_rate": 0.0002999390437107906, "loss": 3.5289, "step": 346 }, { "epoch": 0.03, "learning_rate": 0.00029993869087716307, "loss": 3.516, "step": 347 }, { "epoch": 0.03, "learning_rate": 0.00029993833702553446, "loss": 3.4995, "step": 348 }, { "epoch": 0.03, "learning_rate": 0.00029993798215590734, "loss": 3.4694, "step": 349 }, { "epoch": 0.03, "learning_rate": 0.00029993762626828404, "loss": 3.5153, "step": 350 }, { "epoch": 0.03, "learning_rate": 0.000299937269362667, "loss": 3.5131, "step": 351 }, { "epoch": 0.03, "learning_rate": 0.00029993691143905866, "loss": 3.4829, "step": 352 }, { "epoch": 0.03, "learning_rate": 0.00029993655249746146, "loss": 3.4813, "step": 353 }, { "epoch": 0.03, "learning_rate": 0.0002999361925378778, "loss": 3.5926, "step": 354 }, { "epoch": 0.03, "learning_rate": 0.00029993583156031007, "loss": 3.5124, "step": 355 }, { "epoch": 0.03, "learning_rate": 0.0002999354695647608, "loss": 3.4817, "step": 356 }, { "epoch": 0.03, "learning_rate": 0.0002999351065512325, "loss": 3.4733, "step": 357 }, { "epoch": 0.03, "learning_rate": 0.0002999347425197275, "loss": 3.5251, "step": 358 }, { "epoch": 0.03, "learning_rate": 0.0002999343774702484, "loss": 3.5314, "step": 359 }, { "epoch": 0.03, "learning_rate": 0.00029993401140279756, "loss": 3.4583, "step": 360 }, { "epoch": 0.03, "learning_rate": 0.0002999336443173776, "loss": 3.4635, "step": 361 }, { "epoch": 0.03, "learning_rate": 0.00029993327621399086, "loss": 3.456, "step": 362 }, { "epoch": 0.03, "learning_rate": 0.0002999329070926399, "loss": 3.4824, "step": 363 }, { "epoch": 0.03, "learning_rate": 0.00029993253695332733, "loss": 3.4846, "step": 364 }, { "epoch": 0.03, "learning_rate": 0.0002999321657960555, "loss": 3.5, "step": 365 }, { "epoch": 0.03, "learning_rate": 0.00029993179362082707, "loss": 3.4837, "step": 366 }, { "epoch": 0.03, "learning_rate": 0.00029993142042764444, "loss": 3.4955, "step": 367 }, { "epoch": 0.03, "learning_rate": 0.0002999310462165102, "loss": 3.5033, "step": 368 }, { "epoch": 0.03, "learning_rate": 0.0002999306709874269, "loss": 3.4598, "step": 369 }, { "epoch": 0.03, "learning_rate": 0.0002999302947403971, "loss": 3.4585, "step": 370 }, { "epoch": 0.03, "learning_rate": 0.0002999299174754233, "loss": 3.4963, "step": 371 }, { "epoch": 0.03, "learning_rate": 0.0002999295391925082, "loss": 3.5095, "step": 372 }, { "epoch": 0.03, "learning_rate": 0.0002999291598916542, "loss": 3.4137, "step": 373 }, { "epoch": 0.03, "learning_rate": 0.0002999287795728639, "loss": 3.4546, "step": 374 }, { "epoch": 0.03, "learning_rate": 0.00029992839823614, "loss": 3.4099, "step": 375 }, { "epoch": 0.03, "learning_rate": 0.00029992801588148496, "loss": 3.4493, "step": 376 }, { "epoch": 0.03, "learning_rate": 0.0002999276325089015, "loss": 3.4755, "step": 377 }, { "epoch": 0.03, "learning_rate": 0.00029992724811839206, "loss": 3.4423, "step": 378 }, { "epoch": 0.03, "learning_rate": 0.0002999268627099594, "loss": 3.4219, "step": 379 }, { "epoch": 0.03, "learning_rate": 0.00029992647628360603, "loss": 3.4129, "step": 380 }, { "epoch": 0.03, "learning_rate": 0.00029992608883933465, "loss": 3.4411, "step": 381 }, { "epoch": 0.03, "learning_rate": 0.0002999257003771479, "loss": 3.4778, "step": 382 }, { "epoch": 0.03, "learning_rate": 0.0002999253108970484, "loss": 3.4326, "step": 383 }, { "epoch": 0.03, "learning_rate": 0.00029992492039903864, "loss": 3.3993, "step": 384 }, { "epoch": 0.03, "learning_rate": 0.0002999245288831215, "loss": 3.3898, "step": 385 }, { "epoch": 0.03, "learning_rate": 0.00029992413634929955, "loss": 3.4255, "step": 386 }, { "epoch": 0.03, "learning_rate": 0.00029992374279757546, "loss": 3.3929, "step": 387 }, { "epoch": 0.03, "learning_rate": 0.00029992334822795185, "loss": 3.4002, "step": 388 }, { "epoch": 0.03, "learning_rate": 0.0002999229526404315, "loss": 3.3688, "step": 389 }, { "epoch": 0.03, "learning_rate": 0.00029992255603501696, "loss": 3.3356, "step": 390 }, { "epoch": 0.03, "learning_rate": 0.000299922158411711, "loss": 3.3853, "step": 391 }, { "epoch": 0.03, "learning_rate": 0.00029992175977051633, "loss": 3.3704, "step": 392 }, { "epoch": 0.03, "learning_rate": 0.0002999213601114357, "loss": 3.4197, "step": 393 }, { "epoch": 0.03, "learning_rate": 0.0002999209594344717, "loss": 3.3395, "step": 394 }, { "epoch": 0.03, "learning_rate": 0.0002999205577396272, "loss": 3.3234, "step": 395 }, { "epoch": 0.03, "learning_rate": 0.00029992015502690474, "loss": 3.3223, "step": 396 }, { "epoch": 0.03, "learning_rate": 0.00029991975129630723, "loss": 3.3458, "step": 397 }, { "epoch": 0.03, "learning_rate": 0.00029991934654783736, "loss": 3.3912, "step": 398 }, { "epoch": 0.03, "learning_rate": 0.00029991894078149783, "loss": 3.3862, "step": 399 }, { "epoch": 0.03, "learning_rate": 0.0002999185339972914, "loss": 3.365, "step": 400 }, { "epoch": 0.03, "learning_rate": 0.00029991812619522087, "loss": 3.3797, "step": 401 }, { "epoch": 0.03, "learning_rate": 0.000299917717375289, "loss": 3.3347, "step": 402 }, { "epoch": 0.03, "learning_rate": 0.0002999173075374986, "loss": 3.3421, "step": 403 }, { "epoch": 0.03, "learning_rate": 0.0002999168966818523, "loss": 3.4062, "step": 404 }, { "epoch": 0.03, "learning_rate": 0.0002999164848083531, "loss": 3.3438, "step": 405 }, { "epoch": 0.03, "learning_rate": 0.00029991607191700366, "loss": 3.2981, "step": 406 }, { "epoch": 0.03, "learning_rate": 0.00029991565800780687, "loss": 3.3278, "step": 407 }, { "epoch": 0.03, "learning_rate": 0.00029991524308076547, "loss": 3.3876, "step": 408 }, { "epoch": 0.03, "learning_rate": 0.0002999148271358823, "loss": 3.3242, "step": 409 }, { "epoch": 0.03, "learning_rate": 0.0002999144101731601, "loss": 3.314, "step": 410 }, { "epoch": 0.03, "learning_rate": 0.00029991399219260185, "loss": 3.3267, "step": 411 }, { "epoch": 0.03, "learning_rate": 0.00029991357319421037, "loss": 3.2674, "step": 412 }, { "epoch": 0.03, "learning_rate": 0.00029991315317798843, "loss": 3.3884, "step": 413 }, { "epoch": 0.03, "learning_rate": 0.0002999127321439389, "loss": 3.3839, "step": 414 }, { "epoch": 0.03, "learning_rate": 0.0002999123100920646, "loss": 3.3184, "step": 415 }, { "epoch": 0.03, "learning_rate": 0.0002999118870223685, "loss": 3.3089, "step": 416 }, { "epoch": 0.03, "learning_rate": 0.0002999114629348534, "loss": 3.3404, "step": 417 }, { "epoch": 0.03, "learning_rate": 0.0002999110378295222, "loss": 3.3075, "step": 418 }, { "epoch": 0.03, "learning_rate": 0.0002999106117063778, "loss": 3.3059, "step": 419 }, { "epoch": 0.03, "learning_rate": 0.0002999101845654231, "loss": 3.3482, "step": 420 }, { "epoch": 0.03, "learning_rate": 0.0002999097564066609, "loss": 3.3484, "step": 421 }, { "epoch": 0.03, "learning_rate": 0.00029990932723009415, "loss": 3.305, "step": 422 }, { "epoch": 0.03, "learning_rate": 0.00029990889703572585, "loss": 3.3064, "step": 423 }, { "epoch": 0.03, "learning_rate": 0.0002999084658235589, "loss": 3.263, "step": 424 }, { "epoch": 0.03, "learning_rate": 0.00029990803359359616, "loss": 3.3036, "step": 425 }, { "epoch": 0.03, "learning_rate": 0.0002999076003458406, "loss": 3.2776, "step": 426 }, { "epoch": 0.03, "learning_rate": 0.00029990716608029516, "loss": 3.2948, "step": 427 }, { "epoch": 0.03, "learning_rate": 0.0002999067307969628, "loss": 3.2468, "step": 428 }, { "epoch": 0.03, "learning_rate": 0.0002999062944958464, "loss": 3.2286, "step": 429 }, { "epoch": 0.03, "learning_rate": 0.00029990585717694905, "loss": 3.2593, "step": 430 }, { "epoch": 0.03, "learning_rate": 0.00029990541884027366, "loss": 3.2648, "step": 431 }, { "epoch": 0.03, "learning_rate": 0.00029990497948582316, "loss": 3.2489, "step": 432 }, { "epoch": 0.03, "learning_rate": 0.0002999045391136006, "loss": 3.2649, "step": 433 }, { "epoch": 0.03, "learning_rate": 0.00029990409772360897, "loss": 3.2866, "step": 434 }, { "epoch": 0.03, "learning_rate": 0.0002999036553158512, "loss": 3.2414, "step": 435 }, { "epoch": 0.03, "learning_rate": 0.00029990321189033033, "loss": 3.2652, "step": 436 }, { "epoch": 0.03, "learning_rate": 0.0002999027674470494, "loss": 3.2923, "step": 437 }, { "epoch": 0.03, "learning_rate": 0.00029990232198601137, "loss": 3.23, "step": 438 }, { "epoch": 0.03, "learning_rate": 0.00029990187550721934, "loss": 3.2453, "step": 439 }, { "epoch": 0.03, "learning_rate": 0.0002999014280106762, "loss": 3.2658, "step": 440 }, { "epoch": 0.03, "learning_rate": 0.0002999009794963852, "loss": 3.2777, "step": 441 }, { "epoch": 0.03, "learning_rate": 0.00029990052996434923, "loss": 3.3127, "step": 442 }, { "epoch": 0.03, "learning_rate": 0.00029990007941457135, "loss": 3.3072, "step": 443 }, { "epoch": 0.03, "learning_rate": 0.00029989962784705474, "loss": 3.2399, "step": 444 }, { "epoch": 0.04, "learning_rate": 0.0002998991752618023, "loss": 3.2192, "step": 445 }, { "epoch": 0.04, "learning_rate": 0.0002998987216588172, "loss": 3.2204, "step": 446 }, { "epoch": 0.04, "learning_rate": 0.00029989826703810256, "loss": 3.283, "step": 447 }, { "epoch": 0.04, "learning_rate": 0.0002998978113996613, "loss": 3.2228, "step": 448 }, { "epoch": 0.04, "learning_rate": 0.00029989735474349665, "loss": 3.2552, "step": 449 }, { "epoch": 0.04, "learning_rate": 0.00029989689706961175, "loss": 3.2266, "step": 450 }, { "epoch": 0.04, "learning_rate": 0.0002998964383780096, "loss": 3.272, "step": 451 }, { "epoch": 0.04, "learning_rate": 0.00029989597866869334, "loss": 3.2204, "step": 452 }, { "epoch": 0.04, "learning_rate": 0.0002998955179416661, "loss": 3.2473, "step": 453 }, { "epoch": 0.04, "learning_rate": 0.00029989505619693106, "loss": 3.1992, "step": 454 }, { "epoch": 0.04, "learning_rate": 0.0002998945934344912, "loss": 3.2689, "step": 455 }, { "epoch": 0.04, "learning_rate": 0.00029989412965434985, "loss": 3.2824, "step": 456 }, { "epoch": 0.04, "learning_rate": 0.0002998936648565101, "loss": 3.2405, "step": 457 }, { "epoch": 0.04, "learning_rate": 0.0002998931990409751, "loss": 3.2571, "step": 458 }, { "epoch": 0.04, "learning_rate": 0.0002998927322077479, "loss": 3.1744, "step": 459 }, { "epoch": 0.04, "learning_rate": 0.00029989226435683184, "loss": 3.2192, "step": 460 }, { "epoch": 0.04, "learning_rate": 0.00029989179548823, "loss": 3.1929, "step": 461 }, { "epoch": 0.04, "learning_rate": 0.00029989132560194557, "loss": 3.1559, "step": 462 }, { "epoch": 0.04, "learning_rate": 0.0002998908546979818, "loss": 3.2255, "step": 463 }, { "epoch": 0.04, "learning_rate": 0.0002998903827763418, "loss": 3.16, "step": 464 }, { "epoch": 0.04, "learning_rate": 0.0002998899098370288, "loss": 3.1441, "step": 465 }, { "epoch": 0.04, "learning_rate": 0.0002998894358800461, "loss": 3.1374, "step": 466 }, { "epoch": 0.04, "learning_rate": 0.0002998889609053968, "loss": 3.2022, "step": 467 }, { "epoch": 0.04, "learning_rate": 0.0002998884849130842, "loss": 3.2187, "step": 468 }, { "epoch": 0.04, "learning_rate": 0.0002998880079031115, "loss": 3.1887, "step": 469 }, { "epoch": 0.04, "learning_rate": 0.00029988752987548185, "loss": 3.1583, "step": 470 }, { "epoch": 0.04, "learning_rate": 0.0002998870508301987, "loss": 3.1046, "step": 471 }, { "epoch": 0.04, "learning_rate": 0.0002998865707672651, "loss": 3.1383, "step": 472 }, { "epoch": 0.04, "learning_rate": 0.0002998860896866845, "loss": 3.1351, "step": 473 }, { "epoch": 0.04, "learning_rate": 0.00029988560758845996, "loss": 3.1745, "step": 474 }, { "epoch": 0.04, "learning_rate": 0.00029988512447259494, "loss": 3.132, "step": 475 }, { "epoch": 0.04, "learning_rate": 0.0002998846403390926, "loss": 3.1297, "step": 476 }, { "epoch": 0.04, "learning_rate": 0.0002998841551879563, "loss": 3.1711, "step": 477 }, { "epoch": 0.04, "learning_rate": 0.00029988366901918925, "loss": 3.1424, "step": 478 }, { "epoch": 0.04, "learning_rate": 0.00029988318183279484, "loss": 3.1174, "step": 479 }, { "epoch": 0.04, "learning_rate": 0.0002998826936287763, "loss": 3.1397, "step": 480 }, { "epoch": 0.04, "learning_rate": 0.000299882204407137, "loss": 3.1701, "step": 481 }, { "epoch": 0.04, "learning_rate": 0.0002998817141678802, "loss": 3.1798, "step": 482 }, { "epoch": 0.04, "learning_rate": 0.00029988122291100936, "loss": 3.1283, "step": 483 }, { "epoch": 0.04, "learning_rate": 0.00029988073063652766, "loss": 3.1025, "step": 484 }, { "epoch": 0.04, "learning_rate": 0.00029988023734443857, "loss": 3.1207, "step": 485 }, { "epoch": 0.04, "learning_rate": 0.00029987974303474535, "loss": 3.1344, "step": 486 }, { "epoch": 0.04, "learning_rate": 0.00029987924770745136, "loss": 3.105, "step": 487 }, { "epoch": 0.04, "learning_rate": 0.00029987875136256, "loss": 3.1359, "step": 488 }, { "epoch": 0.04, "learning_rate": 0.00029987825400007467, "loss": 3.1229, "step": 489 }, { "epoch": 0.04, "learning_rate": 0.0002998777556199987, "loss": 3.1058, "step": 490 }, { "epoch": 0.04, "learning_rate": 0.00029987725622233544, "loss": 3.0607, "step": 491 }, { "epoch": 0.04, "learning_rate": 0.0002998767558070883, "loss": 3.0856, "step": 492 }, { "epoch": 0.04, "learning_rate": 0.0002998762543742607, "loss": 2.9987, "step": 493 }, { "epoch": 0.04, "learning_rate": 0.0002998757519238561, "loss": 3.0655, "step": 494 }, { "epoch": 0.04, "learning_rate": 0.00029987524845587784, "loss": 3.1465, "step": 495 }, { "epoch": 0.04, "learning_rate": 0.0002998747439703293, "loss": 3.1124, "step": 496 }, { "epoch": 0.04, "learning_rate": 0.000299874238467214, "loss": 3.0728, "step": 497 }, { "epoch": 0.04, "learning_rate": 0.0002998737319465353, "loss": 3.1369, "step": 498 }, { "epoch": 0.04, "learning_rate": 0.00029987322440829667, "loss": 3.1197, "step": 499 }, { "epoch": 0.04, "learning_rate": 0.0002998727158525016, "loss": 3.0726, "step": 500 }, { "epoch": 0.04, "learning_rate": 0.00029987220627915344, "loss": 3.1129, "step": 501 }, { "epoch": 0.04, "learning_rate": 0.00029987169568825576, "loss": 3.0882, "step": 502 }, { "epoch": 0.04, "learning_rate": 0.00029987118407981194, "loss": 3.028, "step": 503 }, { "epoch": 0.04, "learning_rate": 0.00029987067145382547, "loss": 3.0593, "step": 504 }, { "epoch": 0.04, "learning_rate": 0.00029987015781029986, "loss": 3.0912, "step": 505 }, { "epoch": 0.04, "learning_rate": 0.0002998696431492386, "loss": 3.0887, "step": 506 }, { "epoch": 0.04, "learning_rate": 0.0002998691274706452, "loss": 3.091, "step": 507 }, { "epoch": 0.04, "learning_rate": 0.00029986861077452304, "loss": 3.054, "step": 508 }, { "epoch": 0.04, "learning_rate": 0.00029986809306087575, "loss": 3.0896, "step": 509 }, { "epoch": 0.04, "learning_rate": 0.00029986757432970683, "loss": 3.0379, "step": 510 }, { "epoch": 0.04, "learning_rate": 0.00029986705458101976, "loss": 3.0625, "step": 511 }, { "epoch": 0.04, "learning_rate": 0.0002998665338148181, "loss": 3.033, "step": 512 }, { "epoch": 0.04, "learning_rate": 0.0002998660120311054, "loss": 3.0174, "step": 513 }, { "epoch": 0.04, "learning_rate": 0.00029986548922988514, "loss": 3.0736, "step": 514 }, { "epoch": 0.04, "learning_rate": 0.00029986496541116095, "loss": 3.0877, "step": 515 }, { "epoch": 0.04, "learning_rate": 0.00029986444057493634, "loss": 2.9844, "step": 516 }, { "epoch": 0.04, "learning_rate": 0.00029986391472121494, "loss": 3.0893, "step": 517 }, { "epoch": 0.04, "learning_rate": 0.0002998633878500002, "loss": 3.0505, "step": 518 }, { "epoch": 0.04, "learning_rate": 0.0002998628599612957, "loss": 3.0343, "step": 519 }, { "epoch": 0.04, "learning_rate": 0.0002998623310551052, "loss": 3.0546, "step": 520 }, { "epoch": 0.04, "learning_rate": 0.00029986180113143203, "loss": 2.9731, "step": 521 }, { "epoch": 0.04, "learning_rate": 0.0002998612701902801, "loss": 3.0947, "step": 522 }, { "epoch": 0.04, "learning_rate": 0.0002998607382316527, "loss": 3.0458, "step": 523 }, { "epoch": 0.04, "learning_rate": 0.0002998602052555537, "loss": 2.9464, "step": 524 }, { "epoch": 0.04, "learning_rate": 0.0002998596712619865, "loss": 3.0588, "step": 525 }, { "epoch": 0.04, "learning_rate": 0.0002998591362509549, "loss": 3.0908, "step": 526 }, { "epoch": 0.04, "learning_rate": 0.00029985860022246246, "loss": 2.9842, "step": 527 }, { "epoch": 0.04, "learning_rate": 0.0002998580631765128, "loss": 3.1067, "step": 528 }, { "epoch": 0.04, "learning_rate": 0.0002998575251131096, "loss": 3.0265, "step": 529 }, { "epoch": 0.04, "learning_rate": 0.00029985698603225653, "loss": 2.9895, "step": 530 }, { "epoch": 0.04, "learning_rate": 0.00029985644593395717, "loss": 3.0481, "step": 531 }, { "epoch": 0.04, "learning_rate": 0.0002998559048182152, "loss": 3.009, "step": 532 }, { "epoch": 0.04, "learning_rate": 0.0002998553626850345, "loss": 3.0404, "step": 533 }, { "epoch": 0.04, "learning_rate": 0.00029985481953441847, "loss": 3.0198, "step": 534 }, { "epoch": 0.04, "learning_rate": 0.00029985427536637093, "loss": 2.9818, "step": 535 }, { "epoch": 0.04, "learning_rate": 0.0002998537301808955, "loss": 2.9981, "step": 536 }, { "epoch": 0.04, "learning_rate": 0.000299853183977996, "loss": 3.0112, "step": 537 }, { "epoch": 0.04, "learning_rate": 0.0002998526367576761, "loss": 3.058, "step": 538 }, { "epoch": 0.04, "learning_rate": 0.00029985208851993945, "loss": 2.9824, "step": 539 }, { "epoch": 0.04, "learning_rate": 0.00029985153926478985, "loss": 2.9641, "step": 540 }, { "epoch": 0.04, "learning_rate": 0.00029985098899223094, "loss": 3.0193, "step": 541 }, { "epoch": 0.04, "learning_rate": 0.0002998504377022665, "loss": 2.9502, "step": 542 }, { "epoch": 0.04, "learning_rate": 0.00029984988539490034, "loss": 2.9858, "step": 543 }, { "epoch": 0.04, "learning_rate": 0.0002998493320701361, "loss": 3.031, "step": 544 }, { "epoch": 0.04, "learning_rate": 0.0002998487777279777, "loss": 2.9623, "step": 545 }, { "epoch": 0.04, "learning_rate": 0.00029984822236842865, "loss": 3.0078, "step": 546 }, { "epoch": 0.04, "learning_rate": 0.0002998476659914929, "loss": 2.9393, "step": 547 }, { "epoch": 0.04, "learning_rate": 0.0002998471085971743, "loss": 2.9405, "step": 548 }, { "epoch": 0.04, "learning_rate": 0.00029984655018547643, "loss": 2.9701, "step": 549 }, { "epoch": 0.04, "learning_rate": 0.00029984599075640316, "loss": 2.9684, "step": 550 }, { "epoch": 0.04, "learning_rate": 0.0002998454303099583, "loss": 3.0025, "step": 551 }, { "epoch": 0.04, "learning_rate": 0.0002998448688461457, "loss": 3.005, "step": 552 }, { "epoch": 0.04, "learning_rate": 0.00029984430636496916, "loss": 2.9699, "step": 553 }, { "epoch": 0.04, "learning_rate": 0.0002998437428664324, "loss": 2.955, "step": 554 }, { "epoch": 0.04, "learning_rate": 0.00029984317835053936, "loss": 2.8974, "step": 555 }, { "epoch": 0.04, "learning_rate": 0.00029984261281729385, "loss": 2.9148, "step": 556 }, { "epoch": 0.04, "learning_rate": 0.00029984204626669965, "loss": 3.0008, "step": 557 }, { "epoch": 0.04, "learning_rate": 0.0002998414786987606, "loss": 3.0046, "step": 558 }, { "epoch": 0.04, "learning_rate": 0.00029984091011348073, "loss": 2.9123, "step": 559 }, { "epoch": 0.04, "learning_rate": 0.00029984034051086365, "loss": 2.9313, "step": 560 }, { "epoch": 0.04, "learning_rate": 0.00029983976989091343, "loss": 2.9623, "step": 561 }, { "epoch": 0.04, "learning_rate": 0.0002998391982536338, "loss": 2.9309, "step": 562 }, { "epoch": 0.04, "learning_rate": 0.0002998386255990287, "loss": 2.9293, "step": 563 }, { "epoch": 0.04, "learning_rate": 0.0002998380519271021, "loss": 2.8694, "step": 564 }, { "epoch": 0.04, "learning_rate": 0.00029983747723785775, "loss": 2.8473, "step": 565 }, { "epoch": 0.04, "learning_rate": 0.0002998369015312996, "loss": 2.933, "step": 566 }, { "epoch": 0.04, "learning_rate": 0.0002998363248074316, "loss": 2.9198, "step": 567 }, { "epoch": 0.04, "learning_rate": 0.00029983574706625763, "loss": 2.9053, "step": 568 }, { "epoch": 0.04, "learning_rate": 0.00029983516830778164, "loss": 2.9249, "step": 569 }, { "epoch": 0.04, "learning_rate": 0.00029983458853200754, "loss": 2.9805, "step": 570 }, { "epoch": 0.04, "learning_rate": 0.0002998340077389392, "loss": 2.965, "step": 571 }, { "epoch": 0.05, "learning_rate": 0.00029983342592858076, "loss": 2.8676, "step": 572 }, { "epoch": 0.05, "learning_rate": 0.00029983284310093595, "loss": 2.9428, "step": 573 }, { "epoch": 0.05, "learning_rate": 0.00029983225925600884, "loss": 2.9323, "step": 574 }, { "epoch": 0.05, "learning_rate": 0.0002998316743938034, "loss": 2.8882, "step": 575 }, { "epoch": 0.05, "learning_rate": 0.0002998310885143236, "loss": 2.9232, "step": 576 }, { "epoch": 0.05, "learning_rate": 0.00029983050161757333, "loss": 2.9208, "step": 577 }, { "epoch": 0.05, "learning_rate": 0.00029982991370355665, "loss": 2.8978, "step": 578 }, { "epoch": 0.05, "learning_rate": 0.0002998293247722776, "loss": 2.8934, "step": 579 }, { "epoch": 0.05, "learning_rate": 0.00029982873482374, "loss": 2.9157, "step": 580 }, { "epoch": 0.05, "learning_rate": 0.00029982814385794805, "loss": 2.9203, "step": 581 }, { "epoch": 0.05, "learning_rate": 0.0002998275518749057, "loss": 2.8976, "step": 582 }, { "epoch": 0.05, "learning_rate": 0.0002998269588746169, "loss": 2.912, "step": 583 }, { "epoch": 0.05, "learning_rate": 0.0002998263648570858, "loss": 2.8397, "step": 584 }, { "epoch": 0.05, "learning_rate": 0.00029982576982231634, "loss": 2.8763, "step": 585 }, { "epoch": 0.05, "learning_rate": 0.0002998251737703126, "loss": 2.8731, "step": 586 }, { "epoch": 0.05, "learning_rate": 0.0002998245767010785, "loss": 2.8994, "step": 587 }, { "epoch": 0.05, "learning_rate": 0.0002998239786146183, "loss": 2.8959, "step": 588 }, { "epoch": 0.05, "learning_rate": 0.000299823379510936, "loss": 2.9344, "step": 589 }, { "epoch": 0.05, "learning_rate": 0.0002998227793900355, "loss": 2.9004, "step": 590 }, { "epoch": 0.05, "learning_rate": 0.00029982217825192113, "loss": 2.9039, "step": 591 }, { "epoch": 0.05, "learning_rate": 0.0002998215760965968, "loss": 2.8548, "step": 592 }, { "epoch": 0.05, "learning_rate": 0.00029982097292406663, "loss": 2.8582, "step": 593 }, { "epoch": 0.05, "learning_rate": 0.0002998203687343348, "loss": 2.8568, "step": 594 }, { "epoch": 0.05, "learning_rate": 0.0002998197635274053, "loss": 2.8544, "step": 595 }, { "epoch": 0.05, "learning_rate": 0.00029981915730328227, "loss": 2.9275, "step": 596 }, { "epoch": 0.05, "learning_rate": 0.0002998185500619698, "loss": 2.8658, "step": 597 }, { "epoch": 0.05, "learning_rate": 0.00029981794180347214, "loss": 2.9085, "step": 598 }, { "epoch": 0.05, "learning_rate": 0.0002998173325277933, "loss": 2.8681, "step": 599 }, { "epoch": 0.05, "learning_rate": 0.00029981672223493744, "loss": 2.807, "step": 600 }, { "epoch": 0.05, "learning_rate": 0.0002998161109249087, "loss": 2.848, "step": 601 }, { "epoch": 0.05, "learning_rate": 0.0002998154985977113, "loss": 2.8962, "step": 602 }, { "epoch": 0.05, "learning_rate": 0.0002998148852533492, "loss": 2.9375, "step": 603 }, { "epoch": 0.05, "learning_rate": 0.00029981427089182685, "loss": 2.8912, "step": 604 }, { "epoch": 0.05, "learning_rate": 0.0002998136555131482, "loss": 2.8608, "step": 605 }, { "epoch": 0.05, "learning_rate": 0.0002998130391173175, "loss": 2.8124, "step": 606 }, { "epoch": 0.05, "learning_rate": 0.00029981242170433903, "loss": 2.7887, "step": 607 }, { "epoch": 0.05, "learning_rate": 0.0002998118032742168, "loss": 2.8788, "step": 608 }, { "epoch": 0.05, "learning_rate": 0.0002998111838269551, "loss": 2.8294, "step": 609 }, { "epoch": 0.05, "learning_rate": 0.0002998105633625582, "loss": 2.8548, "step": 610 }, { "epoch": 0.05, "learning_rate": 0.0002998099418810302, "loss": 2.841, "step": 611 }, { "epoch": 0.05, "learning_rate": 0.00029980931938237537, "loss": 2.9162, "step": 612 }, { "epoch": 0.05, "learning_rate": 0.00029980869586659795, "loss": 2.8521, "step": 613 }, { "epoch": 0.05, "learning_rate": 0.0002998080713337021, "loss": 2.8271, "step": 614 }, { "epoch": 0.05, "learning_rate": 0.0002998074457836922, "loss": 2.84, "step": 615 }, { "epoch": 0.05, "learning_rate": 0.00029980681921657235, "loss": 2.7782, "step": 616 }, { "epoch": 0.05, "learning_rate": 0.0002998061916323469, "loss": 2.7358, "step": 617 }, { "epoch": 0.05, "learning_rate": 0.00029980556303102, "loss": 2.8618, "step": 618 }, { "epoch": 0.05, "learning_rate": 0.0002998049334125961, "loss": 2.8669, "step": 619 }, { "epoch": 0.05, "learning_rate": 0.0002998043027770794, "loss": 2.8121, "step": 620 }, { "epoch": 0.05, "learning_rate": 0.00029980367112447404, "loss": 2.841, "step": 621 }, { "epoch": 0.05, "learning_rate": 0.00029980303845478446, "loss": 2.8193, "step": 622 }, { "epoch": 0.05, "learning_rate": 0.00029980240476801495, "loss": 2.8047, "step": 623 }, { "epoch": 0.05, "learning_rate": 0.00029980177006416975, "loss": 2.7937, "step": 624 }, { "epoch": 0.05, "learning_rate": 0.0002998011343432532, "loss": 2.8147, "step": 625 }, { "epoch": 0.05, "learning_rate": 0.0002998004976052696, "loss": 2.8271, "step": 626 }, { "epoch": 0.05, "learning_rate": 0.00029979985985022336, "loss": 2.7999, "step": 627 }, { "epoch": 0.05, "learning_rate": 0.00029979922107811866, "loss": 2.8938, "step": 628 }, { "epoch": 0.05, "learning_rate": 0.00029979858128895994, "loss": 2.8051, "step": 629 }, { "epoch": 0.05, "learning_rate": 0.0002997979404827515, "loss": 2.8158, "step": 630 }, { "epoch": 0.05, "learning_rate": 0.00029979729865949777, "loss": 2.7271, "step": 631 }, { "epoch": 0.05, "learning_rate": 0.000299796655819203, "loss": 2.8752, "step": 632 }, { "epoch": 0.05, "learning_rate": 0.0002997960119618716, "loss": 2.7863, "step": 633 }, { "epoch": 0.05, "learning_rate": 0.00029979536708750796, "loss": 2.763, "step": 634 }, { "epoch": 0.05, "learning_rate": 0.0002997947211961164, "loss": 2.784, "step": 635 }, { "epoch": 0.05, "learning_rate": 0.0002997940742877014, "loss": 2.8061, "step": 636 }, { "epoch": 0.05, "learning_rate": 0.0002997934263622673, "loss": 2.7848, "step": 637 }, { "epoch": 0.05, "learning_rate": 0.00029979277741981847, "loss": 2.7763, "step": 638 }, { "epoch": 0.05, "learning_rate": 0.00029979212746035933, "loss": 2.8128, "step": 639 }, { "epoch": 0.05, "learning_rate": 0.0002997914764838943, "loss": 2.822, "step": 640 }, { "epoch": 0.05, "learning_rate": 0.00029979082449042784, "loss": 2.7838, "step": 641 }, { "epoch": 0.05, "learning_rate": 0.00029979017147996437, "loss": 2.7593, "step": 642 }, { "epoch": 0.05, "learning_rate": 0.0002997895174525082, "loss": 2.7969, "step": 643 }, { "epoch": 0.05, "learning_rate": 0.00029978886240806396, "loss": 2.8005, "step": 644 }, { "epoch": 0.05, "learning_rate": 0.000299788206346636, "loss": 2.8598, "step": 645 }, { "epoch": 0.05, "learning_rate": 0.00029978754926822875, "loss": 2.8033, "step": 646 }, { "epoch": 0.05, "learning_rate": 0.0002997868911728467, "loss": 2.8566, "step": 647 }, { "epoch": 0.05, "learning_rate": 0.0002997862320604943, "loss": 2.8095, "step": 648 }, { "epoch": 0.05, "learning_rate": 0.0002997855719311761, "loss": 2.8218, "step": 649 }, { "epoch": 0.05, "learning_rate": 0.00029978491078489644, "loss": 2.8158, "step": 650 }, { "epoch": 0.05, "learning_rate": 0.00029978424862166, "loss": 2.8407, "step": 651 }, { "epoch": 0.05, "learning_rate": 0.0002997835854414711, "loss": 2.8192, "step": 652 }, { "epoch": 0.05, "learning_rate": 0.0002997829212443343, "loss": 2.7773, "step": 653 }, { "epoch": 0.05, "learning_rate": 0.00029978225603025414, "loss": 2.766, "step": 654 }, { "epoch": 0.05, "learning_rate": 0.00029978158979923516, "loss": 2.7477, "step": 655 }, { "epoch": 0.05, "learning_rate": 0.0002997809225512818, "loss": 2.789, "step": 656 }, { "epoch": 0.05, "learning_rate": 0.0002997802542863986, "loss": 2.7875, "step": 657 }, { "epoch": 0.05, "learning_rate": 0.00029977958500459025, "loss": 2.7513, "step": 658 }, { "epoch": 0.05, "learning_rate": 0.000299778914705861, "loss": 2.773, "step": 659 }, { "epoch": 0.05, "learning_rate": 0.0002997782433902157, "loss": 2.7224, "step": 660 }, { "epoch": 0.05, "learning_rate": 0.0002997775710576587, "loss": 2.7683, "step": 661 }, { "epoch": 0.05, "learning_rate": 0.00029977689770819475, "loss": 2.7416, "step": 662 }, { "epoch": 0.05, "learning_rate": 0.0002997762233418283, "loss": 2.7285, "step": 663 }, { "epoch": 0.05, "learning_rate": 0.0002997755479585639, "loss": 2.7482, "step": 664 }, { "epoch": 0.05, "learning_rate": 0.00029977487155840617, "loss": 2.749, "step": 665 }, { "epoch": 0.05, "learning_rate": 0.0002997741941413598, "loss": 2.7525, "step": 666 }, { "epoch": 0.05, "learning_rate": 0.00029977351570742916, "loss": 2.756, "step": 667 }, { "epoch": 0.05, "learning_rate": 0.0002997728362566191, "loss": 2.7868, "step": 668 }, { "epoch": 0.05, "learning_rate": 0.0002997721557889341, "loss": 2.7722, "step": 669 }, { "epoch": 0.05, "learning_rate": 0.00029977147430437887, "loss": 2.7262, "step": 670 }, { "epoch": 0.05, "learning_rate": 0.0002997707918029579, "loss": 2.6959, "step": 671 }, { "epoch": 0.05, "learning_rate": 0.00029977010828467597, "loss": 2.7339, "step": 672 }, { "epoch": 0.05, "learning_rate": 0.0002997694237495376, "loss": 2.7857, "step": 673 }, { "epoch": 0.05, "learning_rate": 0.00029976873819754753, "loss": 2.7681, "step": 674 }, { "epoch": 0.05, "learning_rate": 0.0002997680516287104, "loss": 2.8482, "step": 675 }, { "epoch": 0.05, "learning_rate": 0.0002997673640430308, "loss": 2.7562, "step": 676 }, { "epoch": 0.05, "learning_rate": 0.00029976667544051345, "loss": 2.7379, "step": 677 }, { "epoch": 0.05, "learning_rate": 0.000299765985821163, "loss": 2.7353, "step": 678 }, { "epoch": 0.05, "learning_rate": 0.00029976529518498416, "loss": 2.7259, "step": 679 }, { "epoch": 0.05, "learning_rate": 0.00029976460353198166, "loss": 2.6819, "step": 680 }, { "epoch": 0.05, "learning_rate": 0.0002997639108621601, "loss": 2.7155, "step": 681 }, { "epoch": 0.05, "learning_rate": 0.0002997632171755243, "loss": 2.7437, "step": 682 }, { "epoch": 0.05, "learning_rate": 0.00029976252247207886, "loss": 2.7525, "step": 683 }, { "epoch": 0.05, "learning_rate": 0.0002997618267518285, "loss": 2.7651, "step": 684 }, { "epoch": 0.05, "learning_rate": 0.00029976113001477803, "loss": 2.7274, "step": 685 }, { "epoch": 0.05, "learning_rate": 0.00029976043226093217, "loss": 2.7239, "step": 686 }, { "epoch": 0.05, "learning_rate": 0.00029975973349029555, "loss": 2.7285, "step": 687 }, { "epoch": 0.05, "learning_rate": 0.00029975903370287304, "loss": 2.7144, "step": 688 }, { "epoch": 0.05, "learning_rate": 0.0002997583328986693, "loss": 2.7124, "step": 689 }, { "epoch": 0.05, "learning_rate": 0.00029975763107768907, "loss": 2.7374, "step": 690 }, { "epoch": 0.05, "learning_rate": 0.0002997569282399372, "loss": 2.6965, "step": 691 }, { "epoch": 0.05, "learning_rate": 0.0002997562243854185, "loss": 2.6688, "step": 692 }, { "epoch": 0.05, "learning_rate": 0.0002997555195141376, "loss": 2.6655, "step": 693 }, { "epoch": 0.05, "learning_rate": 0.00029975481362609944, "loss": 2.7675, "step": 694 }, { "epoch": 0.05, "learning_rate": 0.00029975410672130866, "loss": 2.6698, "step": 695 }, { "epoch": 0.05, "learning_rate": 0.00029975339879977016, "loss": 2.6249, "step": 696 }, { "epoch": 0.05, "learning_rate": 0.00029975268986148876, "loss": 2.7753, "step": 697 }, { "epoch": 0.05, "learning_rate": 0.0002997519799064692, "loss": 2.6617, "step": 698 }, { "epoch": 0.05, "learning_rate": 0.00029975126893471636, "loss": 2.7121, "step": 699 }, { "epoch": 0.06, "learning_rate": 0.000299750556946235, "loss": 2.703, "step": 700 }, { "epoch": 0.06, "learning_rate": 0.00029974984394103005, "loss": 2.6435, "step": 701 }, { "epoch": 0.06, "learning_rate": 0.00029974912991910627, "loss": 2.7209, "step": 702 }, { "epoch": 0.06, "learning_rate": 0.00029974841488046854, "loss": 2.6562, "step": 703 }, { "epoch": 0.06, "learning_rate": 0.0002997476988251217, "loss": 2.7547, "step": 704 }, { "epoch": 0.06, "learning_rate": 0.00029974698175307064, "loss": 2.725, "step": 705 }, { "epoch": 0.06, "learning_rate": 0.00029974626366432023, "loss": 2.6492, "step": 706 }, { "epoch": 0.06, "learning_rate": 0.0002997455445588753, "loss": 2.7403, "step": 707 }, { "epoch": 0.06, "learning_rate": 0.00029974482443674073, "loss": 2.6681, "step": 708 }, { "epoch": 0.06, "learning_rate": 0.0002997441032979215, "loss": 2.6877, "step": 709 }, { "epoch": 0.06, "learning_rate": 0.00029974338114242236, "loss": 2.6949, "step": 710 }, { "epoch": 0.06, "learning_rate": 0.00029974265797024836, "loss": 2.715, "step": 711 }, { "epoch": 0.06, "learning_rate": 0.0002997419337814043, "loss": 2.7013, "step": 712 }, { "epoch": 0.06, "learning_rate": 0.00029974120857589523, "loss": 2.6937, "step": 713 }, { "epoch": 0.06, "learning_rate": 0.00029974048235372597, "loss": 2.7083, "step": 714 }, { "epoch": 0.06, "learning_rate": 0.0002997397551149014, "loss": 2.6838, "step": 715 }, { "epoch": 0.06, "learning_rate": 0.00029973902685942656, "loss": 2.6127, "step": 716 }, { "epoch": 0.06, "learning_rate": 0.0002997382975873064, "loss": 2.6922, "step": 717 }, { "epoch": 0.06, "learning_rate": 0.00029973756729854577, "loss": 2.671, "step": 718 }, { "epoch": 0.06, "learning_rate": 0.00029973683599314975, "loss": 2.6742, "step": 719 }, { "epoch": 0.06, "learning_rate": 0.0002997361036711232, "loss": 2.6964, "step": 720 }, { "epoch": 0.06, "learning_rate": 0.0002997353703324711, "loss": 2.7109, "step": 721 }, { "epoch": 0.06, "learning_rate": 0.00029973463597719854, "loss": 2.6909, "step": 722 }, { "epoch": 0.06, "learning_rate": 0.00029973390060531043, "loss": 2.6496, "step": 723 }, { "epoch": 0.06, "learning_rate": 0.0002997331642168117, "loss": 2.6552, "step": 724 }, { "epoch": 0.06, "learning_rate": 0.0002997324268117075, "loss": 2.6508, "step": 725 }, { "epoch": 0.06, "learning_rate": 0.0002997316883900027, "loss": 2.6862, "step": 726 }, { "epoch": 0.06, "learning_rate": 0.0002997309489517024, "loss": 2.6635, "step": 727 }, { "epoch": 0.06, "learning_rate": 0.0002997302084968115, "loss": 2.7271, "step": 728 }, { "epoch": 0.06, "learning_rate": 0.0002997294670253352, "loss": 2.7378, "step": 729 }, { "epoch": 0.06, "learning_rate": 0.00029972872453727845, "loss": 2.6311, "step": 730 }, { "epoch": 0.06, "learning_rate": 0.0002997279810326462, "loss": 2.6636, "step": 731 }, { "epoch": 0.06, "learning_rate": 0.00029972723651144363, "loss": 2.6636, "step": 732 }, { "epoch": 0.06, "learning_rate": 0.0002997264909736758, "loss": 2.6617, "step": 733 }, { "epoch": 0.06, "learning_rate": 0.00029972574441934765, "loss": 2.6394, "step": 734 }, { "epoch": 0.06, "learning_rate": 0.00029972499684846436, "loss": 2.6642, "step": 735 }, { "epoch": 0.06, "learning_rate": 0.00029972424826103095, "loss": 2.6409, "step": 736 }, { "epoch": 0.06, "learning_rate": 0.00029972349865705256, "loss": 2.693, "step": 737 }, { "epoch": 0.06, "learning_rate": 0.0002997227480365342, "loss": 2.663, "step": 738 }, { "epoch": 0.06, "learning_rate": 0.000299721996399481, "loss": 2.6709, "step": 739 }, { "epoch": 0.06, "learning_rate": 0.00029972124374589806, "loss": 2.6218, "step": 740 }, { "epoch": 0.06, "learning_rate": 0.00029972049007579056, "loss": 2.6124, "step": 741 }, { "epoch": 0.06, "learning_rate": 0.0002997197353891635, "loss": 2.6537, "step": 742 }, { "epoch": 0.06, "learning_rate": 0.000299718979686022, "loss": 2.6436, "step": 743 }, { "epoch": 0.06, "learning_rate": 0.00029971822296637136, "loss": 2.7085, "step": 744 }, { "epoch": 0.06, "learning_rate": 0.0002997174652302166, "loss": 2.6817, "step": 745 }, { "epoch": 0.06, "learning_rate": 0.0002997167064775628, "loss": 2.6789, "step": 746 }, { "epoch": 0.06, "learning_rate": 0.0002997159467084152, "loss": 2.63, "step": 747 }, { "epoch": 0.06, "learning_rate": 0.000299715185922779, "loss": 2.6452, "step": 748 }, { "epoch": 0.06, "learning_rate": 0.0002997144241206593, "loss": 2.62, "step": 749 }, { "epoch": 0.06, "learning_rate": 0.00029971366130206124, "loss": 2.5923, "step": 750 }, { "epoch": 0.06, "learning_rate": 0.00029971289746699004, "loss": 2.6451, "step": 751 }, { "epoch": 0.06, "learning_rate": 0.0002997121326154509, "loss": 2.686, "step": 752 }, { "epoch": 0.06, "learning_rate": 0.000299711366747449, "loss": 2.6839, "step": 753 }, { "epoch": 0.06, "learning_rate": 0.00029971059986298954, "loss": 2.6962, "step": 754 }, { "epoch": 0.06, "learning_rate": 0.0002997098319620777, "loss": 2.7167, "step": 755 }, { "epoch": 0.06, "learning_rate": 0.0002997090630447187, "loss": 2.6266, "step": 756 }, { "epoch": 0.06, "learning_rate": 0.00029970829311091785, "loss": 2.6245, "step": 757 }, { "epoch": 0.06, "learning_rate": 0.0002997075221606802, "loss": 2.6621, "step": 758 }, { "epoch": 0.06, "learning_rate": 0.00029970675019401125, "loss": 2.6386, "step": 759 }, { "epoch": 0.06, "learning_rate": 0.00029970597721091596, "loss": 2.5819, "step": 760 }, { "epoch": 0.06, "learning_rate": 0.00029970520321139974, "loss": 2.5905, "step": 761 }, { "epoch": 0.06, "learning_rate": 0.0002997044281954678, "loss": 2.5932, "step": 762 }, { "epoch": 0.06, "learning_rate": 0.0002997036521631254, "loss": 2.6202, "step": 763 }, { "epoch": 0.06, "learning_rate": 0.00029970287511437777, "loss": 2.6357, "step": 764 }, { "epoch": 0.06, "learning_rate": 0.00029970209704923025, "loss": 2.6803, "step": 765 }, { "epoch": 0.06, "learning_rate": 0.00029970131796768813, "loss": 2.6636, "step": 766 }, { "epoch": 0.06, "learning_rate": 0.0002997005378697567, "loss": 2.6329, "step": 767 }, { "epoch": 0.06, "learning_rate": 0.0002996997567554412, "loss": 2.6367, "step": 768 }, { "epoch": 0.06, "learning_rate": 0.00029969897462474695, "loss": 2.6472, "step": 769 }, { "epoch": 0.06, "learning_rate": 0.0002996981914776793, "loss": 2.6662, "step": 770 }, { "epoch": 0.06, "learning_rate": 0.0002996974073142435, "loss": 2.6139, "step": 771 }, { "epoch": 0.06, "learning_rate": 0.00029969662213444494, "loss": 2.6069, "step": 772 }, { "epoch": 0.06, "learning_rate": 0.0002996958359382889, "loss": 2.645, "step": 773 }, { "epoch": 0.06, "learning_rate": 0.0002996950487257808, "loss": 2.6586, "step": 774 }, { "epoch": 0.06, "learning_rate": 0.0002996942604969259, "loss": 2.5542, "step": 775 }, { "epoch": 0.06, "learning_rate": 0.00029969347125172955, "loss": 2.5838, "step": 776 }, { "epoch": 0.06, "learning_rate": 0.0002996926809901972, "loss": 2.5294, "step": 777 }, { "epoch": 0.06, "learning_rate": 0.00029969188971233407, "loss": 2.5473, "step": 778 }, { "epoch": 0.06, "learning_rate": 0.0002996910974181457, "loss": 2.619, "step": 779 }, { "epoch": 0.06, "learning_rate": 0.00029969030410763737, "loss": 2.6307, "step": 780 }, { "epoch": 0.06, "learning_rate": 0.0002996895097808144, "loss": 2.5601, "step": 781 }, { "epoch": 0.06, "learning_rate": 0.00029968871443768235, "loss": 2.6346, "step": 782 }, { "epoch": 0.06, "learning_rate": 0.0002996879180782465, "loss": 2.556, "step": 783 }, { "epoch": 0.06, "learning_rate": 0.0002996871207025123, "loss": 2.6346, "step": 784 }, { "epoch": 0.06, "learning_rate": 0.0002996863223104852, "loss": 2.6499, "step": 785 }, { "epoch": 0.06, "learning_rate": 0.00029968552290217046, "loss": 2.5265, "step": 786 }, { "epoch": 0.06, "learning_rate": 0.0002996847224775737, "loss": 2.6261, "step": 787 }, { "epoch": 0.06, "learning_rate": 0.0002996839210367003, "loss": 2.5314, "step": 788 }, { "epoch": 0.06, "learning_rate": 0.0002996831185795556, "loss": 2.5658, "step": 789 }, { "epoch": 0.06, "learning_rate": 0.0002996823151061452, "loss": 2.5705, "step": 790 }, { "epoch": 0.06, "learning_rate": 0.00029968151061647444, "loss": 2.6045, "step": 791 }, { "epoch": 0.06, "learning_rate": 0.0002996807051105488, "loss": 2.5943, "step": 792 }, { "epoch": 0.06, "learning_rate": 0.00029967989858837386, "loss": 2.6569, "step": 793 }, { "epoch": 0.06, "learning_rate": 0.0002996790910499549, "loss": 2.5255, "step": 794 }, { "epoch": 0.06, "learning_rate": 0.0002996782824952976, "loss": 2.5351, "step": 795 }, { "epoch": 0.06, "learning_rate": 0.00029967747292440736, "loss": 2.6453, "step": 796 }, { "epoch": 0.06, "learning_rate": 0.00029967666233728964, "loss": 2.6611, "step": 797 }, { "epoch": 0.06, "learning_rate": 0.00029967585073395, "loss": 2.6491, "step": 798 }, { "epoch": 0.06, "learning_rate": 0.00029967503811439386, "loss": 2.5658, "step": 799 }, { "epoch": 0.06, "learning_rate": 0.0002996742244786269, "loss": 2.5757, "step": 800 }, { "epoch": 0.06, "learning_rate": 0.0002996734098266545, "loss": 2.5302, "step": 801 }, { "epoch": 0.06, "learning_rate": 0.0002996725941584823, "loss": 2.6165, "step": 802 }, { "epoch": 0.06, "learning_rate": 0.0002996717774741158, "loss": 2.6171, "step": 803 }, { "epoch": 0.06, "learning_rate": 0.0002996709597735604, "loss": 2.5399, "step": 804 }, { "epoch": 0.06, "learning_rate": 0.0002996701410568219, "loss": 2.5831, "step": 805 }, { "epoch": 0.06, "learning_rate": 0.0002996693213239057, "loss": 2.6413, "step": 806 }, { "epoch": 0.06, "learning_rate": 0.0002996685005748174, "loss": 2.5815, "step": 807 }, { "epoch": 0.06, "learning_rate": 0.00029966767880956253, "loss": 2.5611, "step": 808 }, { "epoch": 0.06, "learning_rate": 0.0002996668560281468, "loss": 2.5994, "step": 809 }, { "epoch": 0.06, "learning_rate": 0.0002996660322305756, "loss": 2.5329, "step": 810 }, { "epoch": 0.06, "learning_rate": 0.00029966520741685475, "loss": 2.5664, "step": 811 }, { "epoch": 0.06, "learning_rate": 0.00029966438158698965, "loss": 2.5142, "step": 812 }, { "epoch": 0.06, "learning_rate": 0.00029966355474098604, "loss": 2.6147, "step": 813 }, { "epoch": 0.06, "learning_rate": 0.00029966272687884945, "loss": 2.5826, "step": 814 }, { "epoch": 0.06, "learning_rate": 0.0002996618980005855, "loss": 2.5187, "step": 815 }, { "epoch": 0.06, "learning_rate": 0.0002996610681062, "loss": 2.5356, "step": 816 }, { "epoch": 0.06, "learning_rate": 0.0002996602371956983, "loss": 2.5211, "step": 817 }, { "epoch": 0.06, "learning_rate": 0.0002996594052690862, "loss": 2.6099, "step": 818 }, { "epoch": 0.06, "learning_rate": 0.00029965857232636936, "loss": 2.5885, "step": 819 }, { "epoch": 0.06, "learning_rate": 0.0002996577383675534, "loss": 2.5264, "step": 820 }, { "epoch": 0.06, "learning_rate": 0.00029965690339264393, "loss": 2.5787, "step": 821 }, { "epoch": 0.06, "learning_rate": 0.00029965606740164674, "loss": 2.5851, "step": 822 }, { "epoch": 0.06, "learning_rate": 0.00029965523039456743, "loss": 2.5709, "step": 823 }, { "epoch": 0.06, "learning_rate": 0.0002996543923714117, "loss": 2.6202, "step": 824 }, { "epoch": 0.06, "learning_rate": 0.0002996535533321852, "loss": 2.6058, "step": 825 }, { "epoch": 0.06, "learning_rate": 0.00029965271327689363, "loss": 2.5827, "step": 826 }, { "epoch": 0.07, "learning_rate": 0.0002996518722055428, "loss": 2.5765, "step": 827 }, { "epoch": 0.07, "learning_rate": 0.0002996510301181383, "loss": 2.596, "step": 828 }, { "epoch": 0.07, "learning_rate": 0.0002996501870146859, "loss": 2.5547, "step": 829 }, { "epoch": 0.07, "learning_rate": 0.00029964934289519133, "loss": 2.5631, "step": 830 }, { "epoch": 0.07, "learning_rate": 0.0002996484977596603, "loss": 2.6027, "step": 831 }, { "epoch": 0.07, "learning_rate": 0.0002996476516080985, "loss": 2.5882, "step": 832 }, { "epoch": 0.07, "learning_rate": 0.00029964680444051175, "loss": 2.5488, "step": 833 }, { "epoch": 0.07, "learning_rate": 0.0002996459562569058, "loss": 2.6001, "step": 834 }, { "epoch": 0.07, "learning_rate": 0.0002996451070572864, "loss": 2.5521, "step": 835 }, { "epoch": 0.07, "learning_rate": 0.0002996442568416592, "loss": 2.5387, "step": 836 }, { "epoch": 0.07, "learning_rate": 0.00029964340561003025, "loss": 2.5248, "step": 837 }, { "epoch": 0.07, "learning_rate": 0.0002996425533624051, "loss": 2.5476, "step": 838 }, { "epoch": 0.07, "learning_rate": 0.0002996417000987895, "loss": 2.6041, "step": 839 }, { "epoch": 0.07, "learning_rate": 0.0002996408458191894, "loss": 2.5255, "step": 840 }, { "epoch": 0.07, "learning_rate": 0.00029963999052361054, "loss": 2.504, "step": 841 }, { "epoch": 0.07, "learning_rate": 0.00029963913421205877, "loss": 2.5725, "step": 842 }, { "epoch": 0.07, "learning_rate": 0.0002996382768845398, "loss": 2.5711, "step": 843 }, { "epoch": 0.07, "learning_rate": 0.00029963741854105945, "loss": 2.5388, "step": 844 }, { "epoch": 0.07, "learning_rate": 0.0002996365591816237, "loss": 2.5449, "step": 845 }, { "epoch": 0.07, "learning_rate": 0.0002996356988062382, "loss": 2.5452, "step": 846 }, { "epoch": 0.07, "learning_rate": 0.00029963483741490897, "loss": 2.5475, "step": 847 }, { "epoch": 0.07, "learning_rate": 0.00029963397500764173, "loss": 2.5254, "step": 848 }, { "epoch": 0.07, "learning_rate": 0.00029963311158444237, "loss": 2.5781, "step": 849 }, { "epoch": 0.07, "learning_rate": 0.0002996322471453168, "loss": 2.5725, "step": 850 }, { "epoch": 0.07, "learning_rate": 0.00029963138169027077, "loss": 2.5344, "step": 851 }, { "epoch": 0.07, "learning_rate": 0.0002996305152193103, "loss": 2.5037, "step": 852 }, { "epoch": 0.07, "learning_rate": 0.0002996296477324412, "loss": 2.526, "step": 853 }, { "epoch": 0.07, "learning_rate": 0.0002996287792296693, "loss": 2.5008, "step": 854 }, { "epoch": 0.07, "learning_rate": 0.0002996279097110006, "loss": 2.5345, "step": 855 }, { "epoch": 0.07, "learning_rate": 0.00029962703917644096, "loss": 2.5446, "step": 856 }, { "epoch": 0.07, "learning_rate": 0.0002996261676259963, "loss": 2.5178, "step": 857 }, { "epoch": 0.07, "learning_rate": 0.00029962529505967253, "loss": 2.5473, "step": 858 }, { "epoch": 0.07, "learning_rate": 0.00029962442147747555, "loss": 2.5066, "step": 859 }, { "epoch": 0.07, "learning_rate": 0.0002996235468794114, "loss": 2.5714, "step": 860 }, { "epoch": 0.07, "learning_rate": 0.0002996226712654859, "loss": 2.5312, "step": 861 }, { "epoch": 0.07, "learning_rate": 0.00029962179463570497, "loss": 2.5288, "step": 862 }, { "epoch": 0.07, "learning_rate": 0.0002996209169900747, "loss": 2.5205, "step": 863 }, { "epoch": 0.07, "learning_rate": 0.00029962003832860093, "loss": 2.5438, "step": 864 }, { "epoch": 0.07, "learning_rate": 0.00029961915865128963, "loss": 2.4147, "step": 865 }, { "epoch": 0.07, "learning_rate": 0.0002996182779581469, "loss": 2.4565, "step": 866 }, { "epoch": 0.07, "learning_rate": 0.0002996173962491786, "loss": 2.5225, "step": 867 }, { "epoch": 0.07, "learning_rate": 0.0002996165135243907, "loss": 2.5473, "step": 868 }, { "epoch": 0.07, "learning_rate": 0.0002996156297837893, "loss": 2.5291, "step": 869 }, { "epoch": 0.07, "learning_rate": 0.0002996147450273803, "loss": 2.469, "step": 870 }, { "epoch": 0.07, "learning_rate": 0.00029961385925516973, "loss": 2.4727, "step": 871 }, { "epoch": 0.07, "learning_rate": 0.00029961297246716364, "loss": 2.545, "step": 872 }, { "epoch": 0.07, "learning_rate": 0.000299612084663368, "loss": 2.4788, "step": 873 }, { "epoch": 0.07, "learning_rate": 0.00029961119584378897, "loss": 2.4692, "step": 874 }, { "epoch": 0.07, "learning_rate": 0.00029961030600843237, "loss": 2.5087, "step": 875 }, { "epoch": 0.07, "learning_rate": 0.0002996094151573044, "loss": 2.5419, "step": 876 }, { "epoch": 0.07, "learning_rate": 0.0002996085232904111, "loss": 2.4337, "step": 877 }, { "epoch": 0.07, "learning_rate": 0.0002996076304077584, "loss": 2.5069, "step": 878 }, { "epoch": 0.07, "learning_rate": 0.0002996067365093525, "loss": 2.4574, "step": 879 }, { "epoch": 0.07, "learning_rate": 0.0002996058415951994, "loss": 2.5347, "step": 880 }, { "epoch": 0.07, "learning_rate": 0.00029960494566530526, "loss": 2.5104, "step": 881 }, { "epoch": 0.07, "learning_rate": 0.000299604048719676, "loss": 2.4503, "step": 882 }, { "epoch": 0.07, "learning_rate": 0.00029960315075831784, "loss": 2.4959, "step": 883 }, { "epoch": 0.07, "learning_rate": 0.0002996022517812369, "loss": 2.4698, "step": 884 }, { "epoch": 0.07, "learning_rate": 0.0002996013517884392, "loss": 2.5045, "step": 885 }, { "epoch": 0.07, "learning_rate": 0.0002996004507799308, "loss": 2.4809, "step": 886 }, { "epoch": 0.07, "learning_rate": 0.000299599548755718, "loss": 2.503, "step": 887 }, { "epoch": 0.07, "learning_rate": 0.00029959864571580677, "loss": 2.4994, "step": 888 }, { "epoch": 0.07, "learning_rate": 0.00029959774166020333, "loss": 2.5109, "step": 889 }, { "epoch": 0.07, "learning_rate": 0.0002995968365889137, "loss": 2.5131, "step": 890 }, { "epoch": 0.07, "learning_rate": 0.00029959593050194415, "loss": 2.5158, "step": 891 }, { "epoch": 0.07, "learning_rate": 0.00029959502339930083, "loss": 2.4482, "step": 892 }, { "epoch": 0.07, "learning_rate": 0.0002995941152809898, "loss": 2.4369, "step": 893 }, { "epoch": 0.07, "learning_rate": 0.0002995932061470173, "loss": 2.5019, "step": 894 }, { "epoch": 0.07, "learning_rate": 0.00029959229599738947, "loss": 2.5694, "step": 895 }, { "epoch": 0.07, "learning_rate": 0.0002995913848321125, "loss": 2.4724, "step": 896 }, { "epoch": 0.07, "learning_rate": 0.0002995904726511926, "loss": 2.4821, "step": 897 }, { "epoch": 0.07, "learning_rate": 0.0002995895594546359, "loss": 2.4301, "step": 898 }, { "epoch": 0.07, "learning_rate": 0.00029958864524244866, "loss": 2.4892, "step": 899 }, { "epoch": 0.07, "learning_rate": 0.0002995877300146371, "loss": 2.4758, "step": 900 }, { "epoch": 0.07, "learning_rate": 0.0002995868137712074, "loss": 2.5378, "step": 901 }, { "epoch": 0.07, "learning_rate": 0.00029958589651216577, "loss": 2.5377, "step": 902 }, { "epoch": 0.07, "learning_rate": 0.0002995849782375184, "loss": 2.5067, "step": 903 }, { "epoch": 0.07, "learning_rate": 0.00029958405894727163, "loss": 2.4893, "step": 904 }, { "epoch": 0.07, "learning_rate": 0.00029958313864143164, "loss": 2.4583, "step": 905 }, { "epoch": 0.07, "learning_rate": 0.0002995822173200047, "loss": 2.5087, "step": 906 }, { "epoch": 0.07, "learning_rate": 0.00029958129498299706, "loss": 2.4668, "step": 907 }, { "epoch": 0.07, "learning_rate": 0.00029958037163041495, "loss": 2.4651, "step": 908 }, { "epoch": 0.07, "learning_rate": 0.0002995794472622646, "loss": 2.4443, "step": 909 }, { "epoch": 0.07, "learning_rate": 0.00029957852187855247, "loss": 2.4472, "step": 910 }, { "epoch": 0.07, "learning_rate": 0.0002995775954792846, "loss": 2.4927, "step": 911 }, { "epoch": 0.07, "learning_rate": 0.0002995766680644675, "loss": 2.4594, "step": 912 }, { "epoch": 0.07, "learning_rate": 0.00029957573963410733, "loss": 2.4903, "step": 913 }, { "epoch": 0.07, "learning_rate": 0.00029957481018821045, "loss": 2.4069, "step": 914 }, { "epoch": 0.07, "learning_rate": 0.0002995738797267831, "loss": 2.4509, "step": 915 }, { "epoch": 0.07, "learning_rate": 0.00029957294824983164, "loss": 2.4611, "step": 916 }, { "epoch": 0.07, "learning_rate": 0.00029957201575736244, "loss": 2.4849, "step": 917 }, { "epoch": 0.07, "learning_rate": 0.0002995710822493818, "loss": 2.439, "step": 918 }, { "epoch": 0.07, "learning_rate": 0.00029957014772589606, "loss": 2.4639, "step": 919 }, { "epoch": 0.07, "learning_rate": 0.0002995692121869115, "loss": 2.4206, "step": 920 }, { "epoch": 0.07, "learning_rate": 0.00029956827563243463, "loss": 2.4601, "step": 921 }, { "epoch": 0.07, "learning_rate": 0.0002995673380624716, "loss": 2.4707, "step": 922 }, { "epoch": 0.07, "learning_rate": 0.00029956639947702896, "loss": 2.4538, "step": 923 }, { "epoch": 0.07, "learning_rate": 0.000299565459876113, "loss": 2.4373, "step": 924 }, { "epoch": 0.07, "learning_rate": 0.00029956451925973004, "loss": 2.5479, "step": 925 }, { "epoch": 0.07, "learning_rate": 0.0002995635776278866, "loss": 2.403, "step": 926 }, { "epoch": 0.07, "learning_rate": 0.00029956263498058896, "loss": 2.4772, "step": 927 }, { "epoch": 0.07, "learning_rate": 0.0002995616913178435, "loss": 2.4567, "step": 928 }, { "epoch": 0.07, "learning_rate": 0.0002995607466396568, "loss": 2.419, "step": 929 }, { "epoch": 0.07, "learning_rate": 0.00029955980094603516, "loss": 2.5241, "step": 930 }, { "epoch": 0.07, "learning_rate": 0.000299558854236985, "loss": 2.4799, "step": 931 }, { "epoch": 0.07, "learning_rate": 0.0002995579065125127, "loss": 2.4064, "step": 932 }, { "epoch": 0.07, "learning_rate": 0.00029955695777262475, "loss": 2.4598, "step": 933 }, { "epoch": 0.07, "learning_rate": 0.00029955600801732766, "loss": 2.4473, "step": 934 }, { "epoch": 0.07, "learning_rate": 0.00029955505724662775, "loss": 2.4555, "step": 935 }, { "epoch": 0.07, "learning_rate": 0.0002995541054605316, "loss": 2.489, "step": 936 }, { "epoch": 0.07, "learning_rate": 0.0002995531526590455, "loss": 2.468, "step": 937 }, { "epoch": 0.07, "learning_rate": 0.0002995521988421761, "loss": 2.5146, "step": 938 }, { "epoch": 0.07, "learning_rate": 0.0002995512440099298, "loss": 2.4364, "step": 939 }, { "epoch": 0.07, "learning_rate": 0.000299550288162313, "loss": 2.4377, "step": 940 }, { "epoch": 0.07, "learning_rate": 0.00029954933129933234, "loss": 2.4465, "step": 941 }, { "epoch": 0.07, "learning_rate": 0.0002995483734209942, "loss": 2.3763, "step": 942 }, { "epoch": 0.07, "learning_rate": 0.0002995474145273052, "loss": 2.4142, "step": 943 }, { "epoch": 0.07, "learning_rate": 0.0002995464546182718, "loss": 2.4981, "step": 944 }, { "epoch": 0.07, "learning_rate": 0.0002995454936939004, "loss": 2.4564, "step": 945 }, { "epoch": 0.07, "learning_rate": 0.0002995445317541977, "loss": 2.4549, "step": 946 }, { "epoch": 0.07, "learning_rate": 0.00029954356879917013, "loss": 2.4502, "step": 947 }, { "epoch": 0.07, "learning_rate": 0.00029954260482882426, "loss": 2.5091, "step": 948 }, { "epoch": 0.07, "learning_rate": 0.00029954163984316663, "loss": 2.4336, "step": 949 }, { "epoch": 0.07, "learning_rate": 0.00029954067384220376, "loss": 2.4883, "step": 950 }, { "epoch": 0.07, "learning_rate": 0.00029953970682594226, "loss": 2.3717, "step": 951 }, { "epoch": 0.07, "learning_rate": 0.0002995387387943887, "loss": 2.4009, "step": 952 }, { "epoch": 0.07, "learning_rate": 0.00029953776974754956, "loss": 2.4802, "step": 953 }, { "epoch": 0.08, "learning_rate": 0.0002995367996854315, "loss": 2.446, "step": 954 }, { "epoch": 0.08, "learning_rate": 0.00029953582860804115, "loss": 2.4634, "step": 955 }, { "epoch": 0.08, "learning_rate": 0.000299534856515385, "loss": 2.5318, "step": 956 }, { "epoch": 0.08, "learning_rate": 0.0002995338834074697, "loss": 2.4799, "step": 957 }, { "epoch": 0.08, "learning_rate": 0.00029953290928430186, "loss": 2.4091, "step": 958 }, { "epoch": 0.08, "learning_rate": 0.0002995319341458881, "loss": 2.4339, "step": 959 }, { "epoch": 0.08, "learning_rate": 0.00029953095799223497, "loss": 2.4347, "step": 960 }, { "epoch": 0.08, "learning_rate": 0.00029952998082334923, "loss": 2.5073, "step": 961 }, { "epoch": 0.08, "learning_rate": 0.0002995290026392374, "loss": 2.4782, "step": 962 }, { "epoch": 0.08, "learning_rate": 0.0002995280234399061, "loss": 2.4541, "step": 963 }, { "epoch": 0.08, "learning_rate": 0.00029952704322536215, "loss": 2.4737, "step": 964 }, { "epoch": 0.08, "learning_rate": 0.00029952606199561203, "loss": 2.4332, "step": 965 }, { "epoch": 0.08, "learning_rate": 0.0002995250797506625, "loss": 2.4217, "step": 966 }, { "epoch": 0.08, "learning_rate": 0.00029952409649052007, "loss": 2.4552, "step": 967 }, { "epoch": 0.08, "learning_rate": 0.00029952311221519167, "loss": 2.4707, "step": 968 }, { "epoch": 0.08, "learning_rate": 0.0002995221269246838, "loss": 2.4569, "step": 969 }, { "epoch": 0.08, "learning_rate": 0.0002995211406190032, "loss": 2.4627, "step": 970 }, { "epoch": 0.08, "learning_rate": 0.0002995201532981566, "loss": 2.371, "step": 971 }, { "epoch": 0.08, "learning_rate": 0.00029951916496215065, "loss": 2.4857, "step": 972 }, { "epoch": 0.08, "learning_rate": 0.0002995181756109921, "loss": 2.4537, "step": 973 }, { "epoch": 0.08, "learning_rate": 0.0002995171852446876, "loss": 2.3908, "step": 974 }, { "epoch": 0.08, "learning_rate": 0.000299516193863244, "loss": 2.4091, "step": 975 }, { "epoch": 0.08, "learning_rate": 0.00029951520146666793, "loss": 2.4143, "step": 976 }, { "epoch": 0.08, "learning_rate": 0.0002995142080549661, "loss": 2.3941, "step": 977 }, { "epoch": 0.08, "learning_rate": 0.00029951321362814534, "loss": 2.4339, "step": 978 }, { "epoch": 0.08, "learning_rate": 0.00029951221818621236, "loss": 2.4741, "step": 979 }, { "epoch": 0.08, "learning_rate": 0.00029951122172917395, "loss": 2.4196, "step": 980 }, { "epoch": 0.08, "learning_rate": 0.00029951022425703683, "loss": 2.3997, "step": 981 }, { "epoch": 0.08, "learning_rate": 0.0002995092257698078, "loss": 2.4117, "step": 982 }, { "epoch": 0.08, "learning_rate": 0.0002995082262674936, "loss": 2.4115, "step": 983 }, { "epoch": 0.08, "learning_rate": 0.0002995072257501011, "loss": 2.4152, "step": 984 }, { "epoch": 0.08, "learning_rate": 0.00029950622421763697, "loss": 2.496, "step": 985 }, { "epoch": 0.08, "learning_rate": 0.0002995052216701082, "loss": 2.4278, "step": 986 }, { "epoch": 0.08, "learning_rate": 0.0002995042181075214, "loss": 2.4514, "step": 987 }, { "epoch": 0.08, "learning_rate": 0.00029950321352988345, "loss": 2.4254, "step": 988 }, { "epoch": 0.08, "learning_rate": 0.00029950220793720125, "loss": 2.391, "step": 989 }, { "epoch": 0.08, "learning_rate": 0.0002995012013294815, "loss": 2.4277, "step": 990 }, { "epoch": 0.08, "learning_rate": 0.00029950019370673106, "loss": 2.3824, "step": 991 }, { "epoch": 0.08, "learning_rate": 0.0002994991850689569, "loss": 2.4789, "step": 992 }, { "epoch": 0.08, "learning_rate": 0.00029949817541616574, "loss": 2.4771, "step": 993 }, { "epoch": 0.08, "learning_rate": 0.00029949716474836444, "loss": 2.4451, "step": 994 }, { "epoch": 0.08, "learning_rate": 0.0002994961530655599, "loss": 2.4752, "step": 995 }, { "epoch": 0.08, "learning_rate": 0.000299495140367759, "loss": 2.487, "step": 996 }, { "epoch": 0.08, "learning_rate": 0.00029949412665496855, "loss": 2.4093, "step": 997 }, { "epoch": 0.08, "learning_rate": 0.00029949311192719555, "loss": 2.4467, "step": 998 }, { "epoch": 0.08, "learning_rate": 0.0002994920961844468, "loss": 2.3478, "step": 999 }, { "epoch": 0.08, "learning_rate": 0.0002994910794267292, "loss": 2.4378, "step": 1000 }, { "epoch": 0.08, "learning_rate": 0.0002994900616540496, "loss": 2.475, "step": 1001 }, { "epoch": 0.08, "learning_rate": 0.00029948904286641507, "loss": 2.4273, "step": 1002 }, { "epoch": 0.08, "learning_rate": 0.0002994880230638324, "loss": 2.4318, "step": 1003 }, { "epoch": 0.08, "learning_rate": 0.00029948700224630853, "loss": 2.3908, "step": 1004 }, { "epoch": 0.08, "learning_rate": 0.0002994859804138504, "loss": 2.4367, "step": 1005 }, { "epoch": 0.08, "learning_rate": 0.00029948495756646507, "loss": 2.3635, "step": 1006 }, { "epoch": 0.08, "learning_rate": 0.00029948393370415926, "loss": 2.3885, "step": 1007 }, { "epoch": 0.08, "learning_rate": 0.00029948290882694003, "loss": 2.3733, "step": 1008 }, { "epoch": 0.08, "learning_rate": 0.0002994818829348144, "loss": 2.4475, "step": 1009 }, { "epoch": 0.08, "learning_rate": 0.0002994808560277892, "loss": 2.3787, "step": 1010 }, { "epoch": 0.08, "learning_rate": 0.0002994798281058716, "loss": 2.435, "step": 1011 }, { "epoch": 0.08, "learning_rate": 0.0002994787991690683, "loss": 2.4531, "step": 1012 }, { "epoch": 0.08, "learning_rate": 0.00029947776921738654, "loss": 2.38, "step": 1013 }, { "epoch": 0.08, "learning_rate": 0.0002994767382508332, "loss": 2.4337, "step": 1014 }, { "epoch": 0.08, "learning_rate": 0.0002994757062694153, "loss": 2.4192, "step": 1015 }, { "epoch": 0.08, "learning_rate": 0.0002994746732731398, "loss": 2.3856, "step": 1016 }, { "epoch": 0.08, "learning_rate": 0.0002994736392620138, "loss": 2.4188, "step": 1017 }, { "epoch": 0.08, "learning_rate": 0.0002994726042360443, "loss": 2.4096, "step": 1018 }, { "epoch": 0.08, "learning_rate": 0.00029947156819523825, "loss": 2.4401, "step": 1019 }, { "epoch": 0.08, "learning_rate": 0.0002994705311396027, "loss": 2.4234, "step": 1020 }, { "epoch": 0.08, "learning_rate": 0.00029946949306914483, "loss": 2.398, "step": 1021 }, { "epoch": 0.08, "learning_rate": 0.00029946845398387155, "loss": 2.3451, "step": 1022 }, { "epoch": 0.08, "learning_rate": 0.0002994674138837899, "loss": 2.4133, "step": 1023 }, { "epoch": 0.08, "learning_rate": 0.0002994663727689071, "loss": 2.3542, "step": 1024 }, { "epoch": 0.08, "learning_rate": 0.00029946533063923, "loss": 2.3276, "step": 1025 }, { "epoch": 0.08, "learning_rate": 0.00029946428749476583, "loss": 2.3944, "step": 1026 }, { "epoch": 0.08, "learning_rate": 0.00029946324333552163, "loss": 2.4432, "step": 1027 }, { "epoch": 0.08, "learning_rate": 0.0002994621981615045, "loss": 2.3894, "step": 1028 }, { "epoch": 0.08, "learning_rate": 0.0002994611519727215, "loss": 2.4597, "step": 1029 }, { "epoch": 0.08, "learning_rate": 0.00029946010476917975, "loss": 2.4048, "step": 1030 }, { "epoch": 0.08, "learning_rate": 0.0002994590565508864, "loss": 2.4021, "step": 1031 }, { "epoch": 0.08, "learning_rate": 0.00029945800731784853, "loss": 2.383, "step": 1032 }, { "epoch": 0.08, "learning_rate": 0.0002994569570700733, "loss": 2.3822, "step": 1033 }, { "epoch": 0.08, "learning_rate": 0.00029945590580756774, "loss": 2.3227, "step": 1034 }, { "epoch": 0.08, "learning_rate": 0.00029945485353033907, "loss": 2.4405, "step": 1035 }, { "epoch": 0.08, "learning_rate": 0.00029945380023839446, "loss": 2.3948, "step": 1036 }, { "epoch": 0.08, "learning_rate": 0.000299452745931741, "loss": 2.4439, "step": 1037 }, { "epoch": 0.08, "learning_rate": 0.00029945169061038583, "loss": 2.371, "step": 1038 }, { "epoch": 0.08, "learning_rate": 0.0002994506342743362, "loss": 2.3856, "step": 1039 }, { "epoch": 0.08, "learning_rate": 0.00029944957692359925, "loss": 2.3976, "step": 1040 }, { "epoch": 0.08, "learning_rate": 0.00029944851855818214, "loss": 2.4161, "step": 1041 }, { "epoch": 0.08, "learning_rate": 0.00029944745917809203, "loss": 2.4012, "step": 1042 }, { "epoch": 0.08, "learning_rate": 0.00029944639878333614, "loss": 2.3819, "step": 1043 }, { "epoch": 0.08, "learning_rate": 0.00029944533737392173, "loss": 2.3812, "step": 1044 }, { "epoch": 0.08, "learning_rate": 0.00029944427494985585, "loss": 2.4046, "step": 1045 }, { "epoch": 0.08, "learning_rate": 0.00029944321151114593, "loss": 2.3437, "step": 1046 }, { "epoch": 0.08, "learning_rate": 0.000299442147057799, "loss": 2.3255, "step": 1047 }, { "epoch": 0.08, "learning_rate": 0.0002994410815898224, "loss": 2.3473, "step": 1048 }, { "epoch": 0.08, "learning_rate": 0.0002994400151072233, "loss": 2.3679, "step": 1049 }, { "epoch": 0.08, "learning_rate": 0.000299438947610009, "loss": 2.4013, "step": 1050 }, { "epoch": 0.08, "learning_rate": 0.00029943787909818666, "loss": 2.3646, "step": 1051 }, { "epoch": 0.08, "learning_rate": 0.0002994368095717636, "loss": 2.3633, "step": 1052 }, { "epoch": 0.08, "learning_rate": 0.00029943573903074705, "loss": 2.3307, "step": 1053 }, { "epoch": 0.08, "learning_rate": 0.00029943466747514434, "loss": 2.4129, "step": 1054 }, { "epoch": 0.08, "learning_rate": 0.00029943359490496274, "loss": 2.3662, "step": 1055 }, { "epoch": 0.08, "learning_rate": 0.0002994325213202094, "loss": 2.4338, "step": 1056 }, { "epoch": 0.08, "learning_rate": 0.0002994314467208918, "loss": 2.382, "step": 1057 }, { "epoch": 0.08, "learning_rate": 0.0002994303711070171, "loss": 2.4172, "step": 1058 }, { "epoch": 0.08, "learning_rate": 0.0002994292944785926, "loss": 2.3932, "step": 1059 }, { "epoch": 0.08, "learning_rate": 0.0002994282168356257, "loss": 2.3519, "step": 1060 }, { "epoch": 0.08, "learning_rate": 0.0002994271381781236, "loss": 2.3415, "step": 1061 }, { "epoch": 0.08, "learning_rate": 0.0002994260585060938, "loss": 2.3339, "step": 1062 }, { "epoch": 0.08, "learning_rate": 0.00029942497781954345, "loss": 2.3717, "step": 1063 }, { "epoch": 0.08, "learning_rate": 0.00029942389611848, "loss": 2.3452, "step": 1064 }, { "epoch": 0.08, "learning_rate": 0.0002994228134029107, "loss": 2.387, "step": 1065 }, { "epoch": 0.08, "learning_rate": 0.000299421729672843, "loss": 2.4084, "step": 1066 }, { "epoch": 0.08, "learning_rate": 0.00029942064492828423, "loss": 2.378, "step": 1067 }, { "epoch": 0.08, "learning_rate": 0.00029941955916924166, "loss": 2.3161, "step": 1068 }, { "epoch": 0.08, "learning_rate": 0.0002994184723957228, "loss": 2.3644, "step": 1069 }, { "epoch": 0.08, "learning_rate": 0.00029941738460773494, "loss": 2.3616, "step": 1070 }, { "epoch": 0.08, "learning_rate": 0.00029941629580528553, "loss": 2.4232, "step": 1071 }, { "epoch": 0.08, "learning_rate": 0.00029941520598838193, "loss": 2.4228, "step": 1072 }, { "epoch": 0.08, "learning_rate": 0.0002994141151570315, "loss": 2.3709, "step": 1073 }, { "epoch": 0.08, "learning_rate": 0.0002994130233112417, "loss": 2.3049, "step": 1074 }, { "epoch": 0.08, "learning_rate": 0.0002994119304510199, "loss": 2.3026, "step": 1075 }, { "epoch": 0.08, "learning_rate": 0.00029941083657637356, "loss": 2.4302, "step": 1076 }, { "epoch": 0.08, "learning_rate": 0.00029940974168731014, "loss": 2.3535, "step": 1077 }, { "epoch": 0.08, "learning_rate": 0.00029940864578383697, "loss": 2.3673, "step": 1078 }, { "epoch": 0.08, "learning_rate": 0.0002994075488659616, "loss": 2.4297, "step": 1079 }, { "epoch": 0.08, "learning_rate": 0.0002994064509336913, "loss": 2.3842, "step": 1080 }, { "epoch": 0.09, "learning_rate": 0.00029940535198703374, "loss": 2.4028, "step": 1081 }, { "epoch": 0.09, "learning_rate": 0.0002994042520259963, "loss": 2.351, "step": 1082 }, { "epoch": 0.09, "learning_rate": 0.0002994031510505864, "loss": 2.3518, "step": 1083 }, { "epoch": 0.09, "learning_rate": 0.00029940204906081156, "loss": 2.3705, "step": 1084 }, { "epoch": 0.09, "learning_rate": 0.00029940094605667924, "loss": 2.3662, "step": 1085 }, { "epoch": 0.09, "learning_rate": 0.000299399842038197, "loss": 2.3791, "step": 1086 }, { "epoch": 0.09, "learning_rate": 0.00029939873700537224, "loss": 2.3287, "step": 1087 }, { "epoch": 0.09, "learning_rate": 0.0002993976309582125, "loss": 2.3227, "step": 1088 }, { "epoch": 0.09, "learning_rate": 0.00029939652389672527, "loss": 2.382, "step": 1089 }, { "epoch": 0.09, "learning_rate": 0.0002993954158209181, "loss": 2.3469, "step": 1090 }, { "epoch": 0.09, "learning_rate": 0.0002993943067307985, "loss": 2.3566, "step": 1091 }, { "epoch": 0.09, "learning_rate": 0.00029939319662637405, "loss": 2.4023, "step": 1092 }, { "epoch": 0.09, "learning_rate": 0.00029939208550765217, "loss": 2.3514, "step": 1093 }, { "epoch": 0.09, "learning_rate": 0.00029939097337464046, "loss": 2.4021, "step": 1094 }, { "epoch": 0.09, "learning_rate": 0.0002993898602273465, "loss": 2.3949, "step": 1095 }, { "epoch": 0.09, "learning_rate": 0.0002993887460657779, "loss": 2.4319, "step": 1096 }, { "epoch": 0.09, "learning_rate": 0.0002993876308899421, "loss": 2.304, "step": 1097 }, { "epoch": 0.09, "learning_rate": 0.0002993865146998467, "loss": 2.3651, "step": 1098 }, { "epoch": 0.09, "learning_rate": 0.00029938539749549935, "loss": 2.3467, "step": 1099 }, { "epoch": 0.09, "learning_rate": 0.0002993842792769075, "loss": 2.3879, "step": 1100 }, { "epoch": 0.09, "learning_rate": 0.00029938316004407897, "loss": 2.3875, "step": 1101 }, { "epoch": 0.09, "learning_rate": 0.00029938203979702115, "loss": 2.3303, "step": 1102 }, { "epoch": 0.09, "learning_rate": 0.0002993809185357417, "loss": 2.3821, "step": 1103 }, { "epoch": 0.09, "learning_rate": 0.00029937979626024823, "loss": 2.2558, "step": 1104 }, { "epoch": 0.09, "learning_rate": 0.0002993786729705485, "loss": 2.3245, "step": 1105 }, { "epoch": 0.09, "learning_rate": 0.00029937754866664985, "loss": 2.3711, "step": 1106 }, { "epoch": 0.09, "learning_rate": 0.00029937642334856016, "loss": 2.365, "step": 1107 }, { "epoch": 0.09, "learning_rate": 0.000299375297016287, "loss": 2.3451, "step": 1108 }, { "epoch": 0.09, "learning_rate": 0.00029937416966983795, "loss": 2.3633, "step": 1109 }, { "epoch": 0.09, "learning_rate": 0.00029937304130922077, "loss": 2.2995, "step": 1110 }, { "epoch": 0.09, "learning_rate": 0.00029937191193444304, "loss": 2.3672, "step": 1111 }, { "epoch": 0.09, "learning_rate": 0.00029937078154551247, "loss": 2.3361, "step": 1112 }, { "epoch": 0.09, "learning_rate": 0.0002993696501424367, "loss": 2.3314, "step": 1113 }, { "epoch": 0.09, "learning_rate": 0.0002993685177252235, "loss": 2.3841, "step": 1114 }, { "epoch": 0.09, "learning_rate": 0.00029936738429388044, "loss": 2.4108, "step": 1115 }, { "epoch": 0.09, "learning_rate": 0.00029936624984841525, "loss": 2.3474, "step": 1116 }, { "epoch": 0.09, "learning_rate": 0.0002993651143888357, "loss": 2.3531, "step": 1117 }, { "epoch": 0.09, "learning_rate": 0.00029936397791514944, "loss": 2.4115, "step": 1118 }, { "epoch": 0.09, "learning_rate": 0.0002993628404273642, "loss": 2.3839, "step": 1119 }, { "epoch": 0.09, "learning_rate": 0.0002993617019254877, "loss": 2.3253, "step": 1120 }, { "epoch": 0.09, "learning_rate": 0.0002993605624095276, "loss": 2.4003, "step": 1121 }, { "epoch": 0.09, "learning_rate": 0.00029935942187949175, "loss": 2.3408, "step": 1122 }, { "epoch": 0.09, "learning_rate": 0.0002993582803353879, "loss": 2.3725, "step": 1123 }, { "epoch": 0.09, "learning_rate": 0.0002993571377772237, "loss": 2.2697, "step": 1124 }, { "epoch": 0.09, "learning_rate": 0.00029935599420500696, "loss": 2.3347, "step": 1125 }, { "epoch": 0.09, "learning_rate": 0.0002993548496187454, "loss": 2.3484, "step": 1126 }, { "epoch": 0.09, "learning_rate": 0.0002993537040184469, "loss": 2.297, "step": 1127 }, { "epoch": 0.09, "learning_rate": 0.0002993525574041192, "loss": 2.3223, "step": 1128 }, { "epoch": 0.09, "learning_rate": 0.00029935140977576996, "loss": 2.335, "step": 1129 }, { "epoch": 0.09, "learning_rate": 0.00029935026113340715, "loss": 2.3161, "step": 1130 }, { "epoch": 0.09, "learning_rate": 0.00029934911147703845, "loss": 2.3505, "step": 1131 }, { "epoch": 0.09, "learning_rate": 0.00029934796080667163, "loss": 2.3098, "step": 1132 }, { "epoch": 0.09, "learning_rate": 0.00029934680912231464, "loss": 2.3859, "step": 1133 }, { "epoch": 0.09, "learning_rate": 0.00029934565642397525, "loss": 2.3531, "step": 1134 }, { "epoch": 0.09, "learning_rate": 0.00029934450271166125, "loss": 2.3284, "step": 1135 }, { "epoch": 0.09, "learning_rate": 0.0002993433479853805, "loss": 2.3244, "step": 1136 }, { "epoch": 0.09, "learning_rate": 0.0002993421922451408, "loss": 2.3494, "step": 1137 }, { "epoch": 0.09, "learning_rate": 0.0002993410354909501, "loss": 2.3158, "step": 1138 }, { "epoch": 0.09, "learning_rate": 0.0002993398777228161, "loss": 2.3333, "step": 1139 }, { "epoch": 0.09, "learning_rate": 0.0002993387189407468, "loss": 2.3285, "step": 1140 }, { "epoch": 0.09, "learning_rate": 0.00029933755914475, "loss": 2.2959, "step": 1141 }, { "epoch": 0.09, "learning_rate": 0.0002993363983348335, "loss": 2.3677, "step": 1142 }, { "epoch": 0.09, "learning_rate": 0.0002993352365110054, "loss": 2.3779, "step": 1143 }, { "epoch": 0.09, "learning_rate": 0.0002993340736732734, "loss": 2.3492, "step": 1144 }, { "epoch": 0.09, "learning_rate": 0.0002993329098216454, "loss": 2.3765, "step": 1145 }, { "epoch": 0.09, "learning_rate": 0.00029933174495612935, "loss": 2.2705, "step": 1146 }, { "epoch": 0.09, "learning_rate": 0.00029933057907673323, "loss": 2.2813, "step": 1147 }, { "epoch": 0.09, "learning_rate": 0.00029932941218346486, "loss": 2.3203, "step": 1148 }, { "epoch": 0.09, "learning_rate": 0.0002993282442763322, "loss": 2.3697, "step": 1149 }, { "epoch": 0.09, "learning_rate": 0.0002993270753553431, "loss": 2.345, "step": 1150 }, { "epoch": 0.09, "learning_rate": 0.00029932590542050563, "loss": 2.3425, "step": 1151 }, { "epoch": 0.09, "learning_rate": 0.0002993247344718277, "loss": 2.309, "step": 1152 }, { "epoch": 0.09, "learning_rate": 0.00029932356250931717, "loss": 2.3064, "step": 1153 }, { "epoch": 0.09, "learning_rate": 0.0002993223895329821, "loss": 2.3906, "step": 1154 }, { "epoch": 0.09, "learning_rate": 0.0002993212155428303, "loss": 2.3233, "step": 1155 }, { "epoch": 0.09, "learning_rate": 0.00029932004053886995, "loss": 2.2987, "step": 1156 }, { "epoch": 0.09, "learning_rate": 0.00029931886452110886, "loss": 2.3208, "step": 1157 }, { "epoch": 0.09, "learning_rate": 0.00029931768748955515, "loss": 2.3308, "step": 1158 }, { "epoch": 0.09, "learning_rate": 0.0002993165094442167, "loss": 2.2566, "step": 1159 }, { "epoch": 0.09, "learning_rate": 0.0002993153303851016, "loss": 2.2499, "step": 1160 }, { "epoch": 0.09, "learning_rate": 0.00029931415031221777, "loss": 2.3562, "step": 1161 }, { "epoch": 0.09, "learning_rate": 0.0002993129692255732, "loss": 2.4091, "step": 1162 }, { "epoch": 0.09, "learning_rate": 0.00029931178712517604, "loss": 2.2999, "step": 1163 }, { "epoch": 0.09, "learning_rate": 0.00029931060401103423, "loss": 2.3525, "step": 1164 }, { "epoch": 0.09, "learning_rate": 0.0002993094198831558, "loss": 2.345, "step": 1165 }, { "epoch": 0.09, "learning_rate": 0.0002993082347415488, "loss": 2.3671, "step": 1166 }, { "epoch": 0.09, "learning_rate": 0.00029930704858622127, "loss": 2.3732, "step": 1167 }, { "epoch": 0.09, "learning_rate": 0.00029930586141718133, "loss": 2.2735, "step": 1168 }, { "epoch": 0.09, "learning_rate": 0.00029930467323443697, "loss": 2.3849, "step": 1169 }, { "epoch": 0.09, "learning_rate": 0.0002993034840379962, "loss": 2.3249, "step": 1170 }, { "epoch": 0.09, "learning_rate": 0.00029930229382786724, "loss": 2.2889, "step": 1171 }, { "epoch": 0.09, "learning_rate": 0.0002993011026040581, "loss": 2.3531, "step": 1172 }, { "epoch": 0.09, "learning_rate": 0.0002992999103665768, "loss": 2.3658, "step": 1173 }, { "epoch": 0.09, "learning_rate": 0.0002992987171154316, "loss": 2.2872, "step": 1174 }, { "epoch": 0.09, "learning_rate": 0.00029929752285063043, "loss": 2.227, "step": 1175 }, { "epoch": 0.09, "learning_rate": 0.00029929632757218146, "loss": 2.3207, "step": 1176 }, { "epoch": 0.09, "learning_rate": 0.00029929513128009285, "loss": 2.3177, "step": 1177 }, { "epoch": 0.09, "learning_rate": 0.0002992939339743726, "loss": 2.3545, "step": 1178 }, { "epoch": 0.09, "learning_rate": 0.0002992927356550291, "loss": 2.3748, "step": 1179 }, { "epoch": 0.09, "learning_rate": 0.0002992915363220701, "loss": 2.3329, "step": 1180 }, { "epoch": 0.09, "learning_rate": 0.00029929033597550416, "loss": 2.3714, "step": 1181 }, { "epoch": 0.09, "learning_rate": 0.0002992891346153391, "loss": 2.3309, "step": 1182 }, { "epoch": 0.09, "learning_rate": 0.0002992879322415832, "loss": 2.3011, "step": 1183 }, { "epoch": 0.09, "learning_rate": 0.0002992867288542447, "loss": 2.3083, "step": 1184 }, { "epoch": 0.09, "learning_rate": 0.00029928552445333167, "loss": 2.3324, "step": 1185 }, { "epoch": 0.09, "learning_rate": 0.0002992843190388522, "loss": 2.2712, "step": 1186 }, { "epoch": 0.09, "learning_rate": 0.00029928311261081473, "loss": 2.287, "step": 1187 }, { "epoch": 0.09, "learning_rate": 0.0002992819051692272, "loss": 2.3039, "step": 1188 }, { "epoch": 0.09, "learning_rate": 0.000299280696714098, "loss": 2.31, "step": 1189 }, { "epoch": 0.09, "learning_rate": 0.0002992794872454352, "loss": 2.3548, "step": 1190 }, { "epoch": 0.09, "learning_rate": 0.0002992782767632471, "loss": 2.346, "step": 1191 }, { "epoch": 0.09, "learning_rate": 0.00029927706526754183, "loss": 2.3461, "step": 1192 }, { "epoch": 0.09, "learning_rate": 0.0002992758527583277, "loss": 2.3094, "step": 1193 }, { "epoch": 0.09, "learning_rate": 0.0002992746392356129, "loss": 2.3003, "step": 1194 }, { "epoch": 0.09, "learning_rate": 0.00029927342469940565, "loss": 2.2723, "step": 1195 }, { "epoch": 0.09, "learning_rate": 0.00029927220914971426, "loss": 2.3339, "step": 1196 }, { "epoch": 0.09, "learning_rate": 0.00029927099258654694, "loss": 2.2432, "step": 1197 }, { "epoch": 0.09, "learning_rate": 0.00029926977500991194, "loss": 2.2951, "step": 1198 }, { "epoch": 0.09, "learning_rate": 0.00029926855641981755, "loss": 2.3517, "step": 1199 }, { "epoch": 0.09, "learning_rate": 0.000299267336816272, "loss": 2.3117, "step": 1200 }, { "epoch": 0.09, "learning_rate": 0.0002992661161992836, "loss": 2.38, "step": 1201 }, { "epoch": 0.09, "learning_rate": 0.00029926489456886076, "loss": 2.2939, "step": 1202 }, { "epoch": 0.09, "learning_rate": 0.00029926367192501153, "loss": 2.3006, "step": 1203 }, { "epoch": 0.09, "learning_rate": 0.0002992624482677444, "loss": 2.2403, "step": 1204 }, { "epoch": 0.09, "learning_rate": 0.0002992612235970676, "loss": 2.3654, "step": 1205 }, { "epoch": 0.09, "learning_rate": 0.00029925999791298945, "loss": 2.3106, "step": 1206 }, { "epoch": 0.09, "learning_rate": 0.0002992587712155183, "loss": 2.3772, "step": 1207 }, { "epoch": 0.1, "learning_rate": 0.00029925754350466243, "loss": 2.3017, "step": 1208 }, { "epoch": 0.1, "learning_rate": 0.00029925631478043026, "loss": 2.3505, "step": 1209 }, { "epoch": 0.1, "learning_rate": 0.00029925508504283004, "loss": 2.3589, "step": 1210 }, { "epoch": 0.1, "learning_rate": 0.0002992538542918702, "loss": 2.3399, "step": 1211 }, { "epoch": 0.1, "learning_rate": 0.000299252622527559, "loss": 2.303, "step": 1212 }, { "epoch": 0.1, "learning_rate": 0.0002992513897499049, "loss": 2.3314, "step": 1213 }, { "epoch": 0.1, "learning_rate": 0.0002992501559589162, "loss": 2.2983, "step": 1214 }, { "epoch": 0.1, "learning_rate": 0.00029924892115460133, "loss": 2.3586, "step": 1215 }, { "epoch": 0.1, "learning_rate": 0.0002992476853369686, "loss": 2.3238, "step": 1216 }, { "epoch": 0.1, "learning_rate": 0.0002992464485060265, "loss": 2.2895, "step": 1217 }, { "epoch": 0.1, "learning_rate": 0.00029924521066178333, "loss": 2.3198, "step": 1218 }, { "epoch": 0.1, "learning_rate": 0.00029924397180424757, "loss": 2.3352, "step": 1219 }, { "epoch": 0.1, "learning_rate": 0.0002992427319334276, "loss": 2.3122, "step": 1220 }, { "epoch": 0.1, "learning_rate": 0.0002992414910493318, "loss": 2.2916, "step": 1221 }, { "epoch": 0.1, "learning_rate": 0.0002992402491519687, "loss": 2.3309, "step": 1222 }, { "epoch": 0.1, "learning_rate": 0.0002992390062413466, "loss": 2.3214, "step": 1223 }, { "epoch": 0.1, "learning_rate": 0.00029923776231747406, "loss": 2.2273, "step": 1224 }, { "epoch": 0.1, "learning_rate": 0.00029923651738035945, "loss": 2.2507, "step": 1225 }, { "epoch": 0.1, "learning_rate": 0.00029923527143001124, "loss": 2.2916, "step": 1226 }, { "epoch": 0.1, "learning_rate": 0.0002992340244664379, "loss": 2.3058, "step": 1227 }, { "epoch": 0.1, "learning_rate": 0.00029923277648964783, "loss": 2.3431, "step": 1228 }, { "epoch": 0.1, "learning_rate": 0.0002992315274996496, "loss": 2.2535, "step": 1229 }, { "epoch": 0.1, "learning_rate": 0.0002992302774964517, "loss": 2.2523, "step": 1230 }, { "epoch": 0.1, "learning_rate": 0.00029922902648006253, "loss": 2.2878, "step": 1231 }, { "epoch": 0.1, "learning_rate": 0.00029922777445049066, "loss": 2.2703, "step": 1232 }, { "epoch": 0.1, "learning_rate": 0.0002992265214077445, "loss": 2.3091, "step": 1233 }, { "epoch": 0.1, "learning_rate": 0.0002992252673518326, "loss": 2.243, "step": 1234 }, { "epoch": 0.1, "learning_rate": 0.0002992240122827635, "loss": 2.3052, "step": 1235 }, { "epoch": 0.1, "learning_rate": 0.00029922275620054573, "loss": 2.2856, "step": 1236 }, { "epoch": 0.1, "learning_rate": 0.0002992214991051878, "loss": 2.3244, "step": 1237 }, { "epoch": 0.1, "learning_rate": 0.0002992202409966982, "loss": 2.3054, "step": 1238 }, { "epoch": 0.1, "learning_rate": 0.00029921898187508554, "loss": 2.3059, "step": 1239 }, { "epoch": 0.1, "learning_rate": 0.0002992177217403583, "loss": 2.2835, "step": 1240 }, { "epoch": 0.1, "learning_rate": 0.0002992164605925251, "loss": 2.2558, "step": 1241 }, { "epoch": 0.1, "learning_rate": 0.0002992151984315944, "loss": 2.2837, "step": 1242 }, { "epoch": 0.1, "learning_rate": 0.000299213935257575, "loss": 2.2823, "step": 1243 }, { "epoch": 0.1, "learning_rate": 0.0002992126710704752, "loss": 2.2721, "step": 1244 }, { "epoch": 0.1, "learning_rate": 0.00029921140587030375, "loss": 2.3294, "step": 1245 }, { "epoch": 0.1, "learning_rate": 0.0002992101396570692, "loss": 2.2795, "step": 1246 }, { "epoch": 0.1, "learning_rate": 0.00029920887243078015, "loss": 2.2918, "step": 1247 }, { "epoch": 0.1, "learning_rate": 0.0002992076041914452, "loss": 2.2752, "step": 1248 }, { "epoch": 0.1, "learning_rate": 0.00029920633493907294, "loss": 2.3004, "step": 1249 }, { "epoch": 0.1, "learning_rate": 0.000299205064673672, "loss": 2.2249, "step": 1250 }, { "epoch": 0.1, "learning_rate": 0.00029920379339525103, "loss": 2.3005, "step": 1251 }, { "epoch": 0.1, "learning_rate": 0.00029920252110381866, "loss": 2.2747, "step": 1252 }, { "epoch": 0.1, "learning_rate": 0.00029920124779938347, "loss": 2.2074, "step": 1253 }, { "epoch": 0.1, "learning_rate": 0.0002991999734819541, "loss": 2.2401, "step": 1254 }, { "epoch": 0.1, "learning_rate": 0.00029919869815153927, "loss": 2.2449, "step": 1255 }, { "epoch": 0.1, "learning_rate": 0.00029919742180814767, "loss": 2.362, "step": 1256 }, { "epoch": 0.1, "learning_rate": 0.0002991961444517879, "loss": 2.2386, "step": 1257 }, { "epoch": 0.1, "learning_rate": 0.0002991948660824686, "loss": 2.2823, "step": 1258 }, { "epoch": 0.1, "learning_rate": 0.0002991935867001985, "loss": 2.2594, "step": 1259 }, { "epoch": 0.1, "learning_rate": 0.0002991923063049863, "loss": 2.2936, "step": 1260 }, { "epoch": 0.1, "learning_rate": 0.00029919102489684064, "loss": 2.3273, "step": 1261 }, { "epoch": 0.1, "learning_rate": 0.0002991897424757703, "loss": 2.2155, "step": 1262 }, { "epoch": 0.1, "learning_rate": 0.0002991884590417839, "loss": 2.2727, "step": 1263 }, { "epoch": 0.1, "learning_rate": 0.0002991871745948902, "loss": 2.2812, "step": 1264 }, { "epoch": 0.1, "learning_rate": 0.0002991858891350979, "loss": 2.3013, "step": 1265 }, { "epoch": 0.1, "learning_rate": 0.0002991846026624158, "loss": 2.2453, "step": 1266 }, { "epoch": 0.1, "learning_rate": 0.0002991833151768525, "loss": 2.3341, "step": 1267 }, { "epoch": 0.1, "learning_rate": 0.0002991820266784169, "loss": 2.2844, "step": 1268 }, { "epoch": 0.1, "learning_rate": 0.00029918073716711757, "loss": 2.276, "step": 1269 }, { "epoch": 0.1, "learning_rate": 0.0002991794466429634, "loss": 2.2514, "step": 1270 }, { "epoch": 0.1, "learning_rate": 0.0002991781551059631, "loss": 2.2779, "step": 1271 }, { "epoch": 0.1, "learning_rate": 0.0002991768625561255, "loss": 2.2921, "step": 1272 }, { "epoch": 0.1, "learning_rate": 0.0002991755689934592, "loss": 2.3068, "step": 1273 }, { "epoch": 0.1, "learning_rate": 0.0002991742744179733, "loss": 2.2414, "step": 1274 }, { "epoch": 0.1, "learning_rate": 0.0002991729788296763, "loss": 2.2875, "step": 1275 }, { "epoch": 0.1, "learning_rate": 0.00029917168222857706, "loss": 2.3323, "step": 1276 }, { "epoch": 0.1, "learning_rate": 0.0002991703846146844, "loss": 2.2571, "step": 1277 }, { "epoch": 0.1, "learning_rate": 0.00029916908598800725, "loss": 2.286, "step": 1278 }, { "epoch": 0.1, "learning_rate": 0.00029916778634855423, "loss": 2.3245, "step": 1279 }, { "epoch": 0.1, "learning_rate": 0.00029916648569633435, "loss": 2.2922, "step": 1280 }, { "epoch": 0.1, "learning_rate": 0.00029916518403135623, "loss": 2.3175, "step": 1281 }, { "epoch": 0.1, "learning_rate": 0.0002991638813536289, "loss": 2.2577, "step": 1282 }, { "epoch": 0.1, "learning_rate": 0.0002991625776631611, "loss": 2.2547, "step": 1283 }, { "epoch": 0.1, "learning_rate": 0.00029916127295996175, "loss": 2.2539, "step": 1284 }, { "epoch": 0.1, "learning_rate": 0.0002991599672440397, "loss": 2.2686, "step": 1285 }, { "epoch": 0.1, "learning_rate": 0.0002991586605154037, "loss": 2.2998, "step": 1286 }, { "epoch": 0.1, "learning_rate": 0.00029915735277406276, "loss": 2.2583, "step": 1287 }, { "epoch": 0.1, "learning_rate": 0.0002991560440200257, "loss": 2.2717, "step": 1288 }, { "epoch": 0.1, "learning_rate": 0.00029915473425330143, "loss": 2.3273, "step": 1289 }, { "epoch": 0.1, "learning_rate": 0.00029915342347389877, "loss": 2.3117, "step": 1290 }, { "epoch": 0.1, "learning_rate": 0.0002991521116818267, "loss": 2.2886, "step": 1291 }, { "epoch": 0.1, "learning_rate": 0.0002991507988770941, "loss": 2.2959, "step": 1292 }, { "epoch": 0.1, "learning_rate": 0.0002991494850597099, "loss": 2.2705, "step": 1293 }, { "epoch": 0.1, "learning_rate": 0.000299148170229683, "loss": 2.2778, "step": 1294 }, { "epoch": 0.1, "learning_rate": 0.00029914685438702237, "loss": 2.2373, "step": 1295 }, { "epoch": 0.1, "learning_rate": 0.0002991455375317368, "loss": 2.2591, "step": 1296 }, { "epoch": 0.1, "learning_rate": 0.0002991442196638354, "loss": 2.2761, "step": 1297 }, { "epoch": 0.1, "learning_rate": 0.00029914290078332707, "loss": 2.3094, "step": 1298 }, { "epoch": 0.1, "learning_rate": 0.00029914158089022075, "loss": 2.2261, "step": 1299 }, { "epoch": 0.1, "learning_rate": 0.0002991402599845254, "loss": 2.2192, "step": 1300 }, { "epoch": 0.1, "learning_rate": 0.00029913893806624996, "loss": 2.2404, "step": 1301 }, { "epoch": 0.1, "learning_rate": 0.0002991376151354034, "loss": 2.3354, "step": 1302 }, { "epoch": 0.1, "learning_rate": 0.00029913629119199476, "loss": 2.2274, "step": 1303 }, { "epoch": 0.1, "learning_rate": 0.000299134966236033, "loss": 2.249, "step": 1304 }, { "epoch": 0.1, "learning_rate": 0.00029913364026752713, "loss": 2.2798, "step": 1305 }, { "epoch": 0.1, "learning_rate": 0.0002991323132864862, "loss": 2.2279, "step": 1306 }, { "epoch": 0.1, "learning_rate": 0.0002991309852929191, "loss": 2.31, "step": 1307 }, { "epoch": 0.1, "learning_rate": 0.00029912965628683486, "loss": 2.226, "step": 1308 }, { "epoch": 0.1, "learning_rate": 0.00029912832626824263, "loss": 2.2669, "step": 1309 }, { "epoch": 0.1, "learning_rate": 0.00029912699523715135, "loss": 2.2233, "step": 1310 }, { "epoch": 0.1, "learning_rate": 0.00029912566319357, "loss": 2.2139, "step": 1311 }, { "epoch": 0.1, "learning_rate": 0.0002991243301375078, "loss": 2.1867, "step": 1312 }, { "epoch": 0.1, "learning_rate": 0.0002991229960689736, "loss": 2.3259, "step": 1313 }, { "epoch": 0.1, "learning_rate": 0.00029912166098797655, "loss": 2.2711, "step": 1314 }, { "epoch": 0.1, "learning_rate": 0.0002991203248945258, "loss": 2.2433, "step": 1315 }, { "epoch": 0.1, "learning_rate": 0.00029911898778863026, "loss": 2.2516, "step": 1316 }, { "epoch": 0.1, "learning_rate": 0.00029911764967029906, "loss": 2.3148, "step": 1317 }, { "epoch": 0.1, "learning_rate": 0.0002991163105395414, "loss": 2.2438, "step": 1318 }, { "epoch": 0.1, "learning_rate": 0.00029911497039636624, "loss": 2.3155, "step": 1319 }, { "epoch": 0.1, "learning_rate": 0.0002991136292407827, "loss": 2.3223, "step": 1320 }, { "epoch": 0.1, "learning_rate": 0.0002991122870727999, "loss": 2.2481, "step": 1321 }, { "epoch": 0.1, "learning_rate": 0.000299110943892427, "loss": 2.1777, "step": 1322 }, { "epoch": 0.1, "learning_rate": 0.00029910959969967304, "loss": 2.237, "step": 1323 }, { "epoch": 0.1, "learning_rate": 0.0002991082544945472, "loss": 2.2744, "step": 1324 }, { "epoch": 0.1, "learning_rate": 0.0002991069082770586, "loss": 2.3008, "step": 1325 }, { "epoch": 0.1, "learning_rate": 0.00029910556104721637, "loss": 2.2419, "step": 1326 }, { "epoch": 0.1, "learning_rate": 0.0002991042128050297, "loss": 2.256, "step": 1327 }, { "epoch": 0.1, "learning_rate": 0.00029910286355050767, "loss": 2.2861, "step": 1328 }, { "epoch": 0.1, "learning_rate": 0.00029910151328365947, "loss": 2.2915, "step": 1329 }, { "epoch": 0.1, "learning_rate": 0.00029910016200449424, "loss": 2.2158, "step": 1330 }, { "epoch": 0.1, "learning_rate": 0.00029909880971302127, "loss": 2.2429, "step": 1331 }, { "epoch": 0.1, "learning_rate": 0.0002990974564092496, "loss": 2.3137, "step": 1332 }, { "epoch": 0.1, "learning_rate": 0.0002990961020931885, "loss": 2.2434, "step": 1333 }, { "epoch": 0.1, "learning_rate": 0.0002990947467648472, "loss": 2.283, "step": 1334 }, { "epoch": 0.11, "learning_rate": 0.0002990933904242348, "loss": 2.2016, "step": 1335 }, { "epoch": 0.11, "learning_rate": 0.0002990920330713605, "loss": 2.2708, "step": 1336 }, { "epoch": 0.11, "learning_rate": 0.00029909067470623366, "loss": 2.2704, "step": 1337 }, { "epoch": 0.11, "learning_rate": 0.00029908931532886333, "loss": 2.2657, "step": 1338 }, { "epoch": 0.11, "learning_rate": 0.0002990879549392589, "loss": 2.2082, "step": 1339 }, { "epoch": 0.11, "learning_rate": 0.0002990865935374295, "loss": 2.156, "step": 1340 }, { "epoch": 0.11, "learning_rate": 0.0002990852311233844, "loss": 2.2998, "step": 1341 }, { "epoch": 0.11, "learning_rate": 0.00029908386769713285, "loss": 2.2839, "step": 1342 }, { "epoch": 0.11, "learning_rate": 0.0002990825032586841, "loss": 2.238, "step": 1343 }, { "epoch": 0.11, "learning_rate": 0.0002990811378080475, "loss": 2.3014, "step": 1344 }, { "epoch": 0.11, "learning_rate": 0.00029907977134523215, "loss": 2.2402, "step": 1345 }, { "epoch": 0.11, "learning_rate": 0.00029907840387024745, "loss": 2.1791, "step": 1346 }, { "epoch": 0.11, "learning_rate": 0.0002990770353831027, "loss": 2.2696, "step": 1347 }, { "epoch": 0.11, "learning_rate": 0.0002990756658838071, "loss": 2.2638, "step": 1348 }, { "epoch": 0.11, "learning_rate": 0.00029907429537237, "loss": 2.2995, "step": 1349 }, { "epoch": 0.11, "learning_rate": 0.0002990729238488007, "loss": 2.279, "step": 1350 }, { "epoch": 0.11, "learning_rate": 0.00029907155131310854, "loss": 2.2776, "step": 1351 }, { "epoch": 0.11, "learning_rate": 0.00029907017776530277, "loss": 2.2641, "step": 1352 }, { "epoch": 0.11, "learning_rate": 0.0002990688032053928, "loss": 2.2566, "step": 1353 }, { "epoch": 0.11, "learning_rate": 0.0002990674276333879, "loss": 2.1764, "step": 1354 }, { "epoch": 0.11, "learning_rate": 0.0002990660510492974, "loss": 2.249, "step": 1355 }, { "epoch": 0.11, "learning_rate": 0.0002990646734531307, "loss": 2.2813, "step": 1356 }, { "epoch": 0.11, "learning_rate": 0.0002990632948448971, "loss": 2.2117, "step": 1357 }, { "epoch": 0.11, "learning_rate": 0.00029906191522460605, "loss": 2.2857, "step": 1358 }, { "epoch": 0.11, "learning_rate": 0.0002990605345922668, "loss": 2.2811, "step": 1359 }, { "epoch": 0.11, "learning_rate": 0.0002990591529478888, "loss": 2.156, "step": 1360 }, { "epoch": 0.11, "learning_rate": 0.0002990577702914814, "loss": 2.2633, "step": 1361 }, { "epoch": 0.11, "learning_rate": 0.000299056386623054, "loss": 2.2355, "step": 1362 }, { "epoch": 0.11, "learning_rate": 0.000299055001942616, "loss": 2.2899, "step": 1363 }, { "epoch": 0.11, "learning_rate": 0.0002990536162501768, "loss": 2.1595, "step": 1364 }, { "epoch": 0.11, "learning_rate": 0.00029905222954574576, "loss": 2.2554, "step": 1365 }, { "epoch": 0.11, "learning_rate": 0.0002990508418293324, "loss": 2.2497, "step": 1366 }, { "epoch": 0.11, "learning_rate": 0.00029904945310094605, "loss": 2.2659, "step": 1367 }, { "epoch": 0.11, "learning_rate": 0.0002990480633605961, "loss": 2.1866, "step": 1368 }, { "epoch": 0.11, "learning_rate": 0.0002990466726082921, "loss": 2.1895, "step": 1369 }, { "epoch": 0.11, "learning_rate": 0.00029904528084404345, "loss": 2.2193, "step": 1370 }, { "epoch": 0.11, "learning_rate": 0.0002990438880678596, "loss": 2.2468, "step": 1371 }, { "epoch": 0.11, "learning_rate": 0.00029904249427975, "loss": 2.2725, "step": 1372 }, { "epoch": 0.11, "learning_rate": 0.0002990410994797241, "loss": 2.3099, "step": 1373 }, { "epoch": 0.11, "learning_rate": 0.0002990397036677914, "loss": 2.2717, "step": 1374 }, { "epoch": 0.11, "learning_rate": 0.0002990383068439613, "loss": 2.306, "step": 1375 }, { "epoch": 0.11, "learning_rate": 0.00029903690900824343, "loss": 2.2852, "step": 1376 }, { "epoch": 0.11, "learning_rate": 0.0002990355101606472, "loss": 2.2374, "step": 1377 }, { "epoch": 0.11, "learning_rate": 0.000299034110301182, "loss": 2.2756, "step": 1378 }, { "epoch": 0.11, "learning_rate": 0.0002990327094298575, "loss": 2.2199, "step": 1379 }, { "epoch": 0.11, "learning_rate": 0.00029903130754668317, "loss": 2.2428, "step": 1380 }, { "epoch": 0.11, "learning_rate": 0.00029902990465166844, "loss": 2.2253, "step": 1381 }, { "epoch": 0.11, "learning_rate": 0.0002990285007448229, "loss": 2.2212, "step": 1382 }, { "epoch": 0.11, "learning_rate": 0.0002990270958261561, "loss": 2.1472, "step": 1383 }, { "epoch": 0.11, "learning_rate": 0.00029902568989567755, "loss": 2.1944, "step": 1384 }, { "epoch": 0.11, "learning_rate": 0.0002990242829533968, "loss": 2.2057, "step": 1385 }, { "epoch": 0.11, "learning_rate": 0.0002990228749993235, "loss": 2.2136, "step": 1386 }, { "epoch": 0.11, "learning_rate": 0.000299021466033467, "loss": 2.2321, "step": 1387 }, { "epoch": 0.11, "learning_rate": 0.00029902005605583705, "loss": 2.2625, "step": 1388 }, { "epoch": 0.11, "learning_rate": 0.00029901864506644315, "loss": 2.1827, "step": 1389 }, { "epoch": 0.11, "learning_rate": 0.0002990172330652949, "loss": 2.2403, "step": 1390 }, { "epoch": 0.11, "learning_rate": 0.00029901582005240177, "loss": 2.1749, "step": 1391 }, { "epoch": 0.11, "learning_rate": 0.00029901440602777353, "loss": 2.2954, "step": 1392 }, { "epoch": 0.11, "learning_rate": 0.0002990129909914197, "loss": 2.1392, "step": 1393 }, { "epoch": 0.11, "learning_rate": 0.0002990115749433499, "loss": 2.2645, "step": 1394 }, { "epoch": 0.11, "learning_rate": 0.0002990101578835737, "loss": 2.2146, "step": 1395 }, { "epoch": 0.11, "learning_rate": 0.0002990087398121008, "loss": 2.1732, "step": 1396 }, { "epoch": 0.11, "learning_rate": 0.0002990073207289408, "loss": 2.2542, "step": 1397 }, { "epoch": 0.11, "learning_rate": 0.0002990059006341033, "loss": 2.2259, "step": 1398 }, { "epoch": 0.11, "learning_rate": 0.0002990044795275979, "loss": 2.2574, "step": 1399 }, { "epoch": 0.11, "learning_rate": 0.00029900305740943446, "loss": 2.2283, "step": 1400 }, { "epoch": 0.11, "learning_rate": 0.0002990016342796224, "loss": 2.2289, "step": 1401 }, { "epoch": 0.11, "learning_rate": 0.0002990002101381714, "loss": 2.2219, "step": 1402 }, { "epoch": 0.11, "learning_rate": 0.0002989987849850913, "loss": 2.2482, "step": 1403 }, { "epoch": 0.11, "learning_rate": 0.00029899735882039165, "loss": 2.2349, "step": 1404 }, { "epoch": 0.11, "learning_rate": 0.0002989959316440821, "loss": 2.2729, "step": 1405 }, { "epoch": 0.11, "learning_rate": 0.00029899450345617244, "loss": 2.2761, "step": 1406 }, { "epoch": 0.11, "learning_rate": 0.0002989930742566724, "loss": 2.1782, "step": 1407 }, { "epoch": 0.11, "learning_rate": 0.00029899164404559146, "loss": 2.1507, "step": 1408 }, { "epoch": 0.11, "learning_rate": 0.00029899021282293956, "loss": 2.2426, "step": 1409 }, { "epoch": 0.11, "learning_rate": 0.00029898878058872634, "loss": 2.2458, "step": 1410 }, { "epoch": 0.11, "learning_rate": 0.00029898734734296154, "loss": 2.2228, "step": 1411 }, { "epoch": 0.11, "learning_rate": 0.0002989859130856548, "loss": 2.1809, "step": 1412 }, { "epoch": 0.11, "learning_rate": 0.000298984477816816, "loss": 2.2409, "step": 1413 }, { "epoch": 0.11, "learning_rate": 0.0002989830415364548, "loss": 2.1761, "step": 1414 }, { "epoch": 0.11, "learning_rate": 0.0002989816042445809, "loss": 2.2293, "step": 1415 }, { "epoch": 0.11, "learning_rate": 0.00029898016594120415, "loss": 2.2045, "step": 1416 }, { "epoch": 0.11, "learning_rate": 0.00029897872662633433, "loss": 2.2635, "step": 1417 }, { "epoch": 0.11, "learning_rate": 0.00029897728629998114, "loss": 2.2475, "step": 1418 }, { "epoch": 0.11, "learning_rate": 0.0002989758449621544, "loss": 2.2031, "step": 1419 }, { "epoch": 0.11, "learning_rate": 0.0002989744026128638, "loss": 2.1903, "step": 1420 }, { "epoch": 0.11, "learning_rate": 0.0002989729592521193, "loss": 2.2399, "step": 1421 }, { "epoch": 0.11, "learning_rate": 0.0002989715148799306, "loss": 2.2325, "step": 1422 }, { "epoch": 0.11, "learning_rate": 0.00029897006949630755, "loss": 2.2861, "step": 1423 }, { "epoch": 0.11, "learning_rate": 0.0002989686231012599, "loss": 2.2586, "step": 1424 }, { "epoch": 0.11, "learning_rate": 0.0002989671756947975, "loss": 2.2288, "step": 1425 }, { "epoch": 0.11, "learning_rate": 0.00029896572727693024, "loss": 2.2129, "step": 1426 }, { "epoch": 0.11, "learning_rate": 0.00029896427784766787, "loss": 2.2348, "step": 1427 }, { "epoch": 0.11, "learning_rate": 0.00029896282740702023, "loss": 2.2703, "step": 1428 }, { "epoch": 0.11, "learning_rate": 0.0002989613759549972, "loss": 2.2204, "step": 1429 }, { "epoch": 0.11, "learning_rate": 0.00029895992349160866, "loss": 2.223, "step": 1430 }, { "epoch": 0.11, "learning_rate": 0.00029895847001686445, "loss": 2.1746, "step": 1431 }, { "epoch": 0.11, "learning_rate": 0.0002989570155307744, "loss": 2.1627, "step": 1432 }, { "epoch": 0.11, "learning_rate": 0.0002989555600333484, "loss": 2.2254, "step": 1433 }, { "epoch": 0.11, "learning_rate": 0.00029895410352459643, "loss": 2.2195, "step": 1434 }, { "epoch": 0.11, "learning_rate": 0.00029895264600452825, "loss": 2.2381, "step": 1435 }, { "epoch": 0.11, "learning_rate": 0.00029895118747315375, "loss": 2.1993, "step": 1436 }, { "epoch": 0.11, "learning_rate": 0.00029894972793048294, "loss": 2.2728, "step": 1437 }, { "epoch": 0.11, "learning_rate": 0.00029894826737652565, "loss": 2.2043, "step": 1438 }, { "epoch": 0.11, "learning_rate": 0.00029894680581129185, "loss": 2.1461, "step": 1439 }, { "epoch": 0.11, "learning_rate": 0.0002989453432347914, "loss": 2.2156, "step": 1440 }, { "epoch": 0.11, "learning_rate": 0.00029894387964703433, "loss": 2.1993, "step": 1441 }, { "epoch": 0.11, "learning_rate": 0.00029894241504803046, "loss": 2.1735, "step": 1442 }, { "epoch": 0.11, "learning_rate": 0.00029894094943778976, "loss": 2.1631, "step": 1443 }, { "epoch": 0.11, "learning_rate": 0.00029893948281632226, "loss": 2.2642, "step": 1444 }, { "epoch": 0.11, "learning_rate": 0.0002989380151836378, "loss": 2.2007, "step": 1445 }, { "epoch": 0.11, "learning_rate": 0.0002989365465397465, "loss": 2.206, "step": 1446 }, { "epoch": 0.11, "learning_rate": 0.00029893507688465816, "loss": 2.192, "step": 1447 }, { "epoch": 0.11, "learning_rate": 0.00029893360621838287, "loss": 2.188, "step": 1448 }, { "epoch": 0.11, "learning_rate": 0.00029893213454093055, "loss": 2.2701, "step": 1449 }, { "epoch": 0.11, "learning_rate": 0.0002989306618523112, "loss": 2.2279, "step": 1450 }, { "epoch": 0.11, "learning_rate": 0.00029892918815253497, "loss": 2.1853, "step": 1451 }, { "epoch": 0.11, "learning_rate": 0.00029892771344161166, "loss": 2.2011, "step": 1452 }, { "epoch": 0.11, "learning_rate": 0.0002989262377195513, "loss": 2.2103, "step": 1453 }, { "epoch": 0.11, "learning_rate": 0.0002989247609863641, "loss": 2.2034, "step": 1454 }, { "epoch": 0.11, "learning_rate": 0.00029892328324205984, "loss": 2.2322, "step": 1455 }, { "epoch": 0.11, "learning_rate": 0.00029892180448664875, "loss": 2.2289, "step": 1456 }, { "epoch": 0.11, "learning_rate": 0.00029892032472014074, "loss": 2.1437, "step": 1457 }, { "epoch": 0.11, "learning_rate": 0.0002989188439425459, "loss": 2.1984, "step": 1458 }, { "epoch": 0.11, "learning_rate": 0.0002989173621538743, "loss": 2.2417, "step": 1459 }, { "epoch": 0.11, "learning_rate": 0.000298915879354136, "loss": 2.2136, "step": 1460 }, { "epoch": 0.11, "learning_rate": 0.0002989143955433411, "loss": 2.184, "step": 1461 }, { "epoch": 0.12, "learning_rate": 0.0002989129107214996, "loss": 2.2474, "step": 1462 }, { "epoch": 0.12, "learning_rate": 0.0002989114248886216, "loss": 2.2761, "step": 1463 }, { "epoch": 0.12, "learning_rate": 0.0002989099380447172, "loss": 2.2075, "step": 1464 }, { "epoch": 0.12, "learning_rate": 0.00029890845018979654, "loss": 2.1724, "step": 1465 }, { "epoch": 0.12, "learning_rate": 0.0002989069613238696, "loss": 2.2103, "step": 1466 }, { "epoch": 0.12, "learning_rate": 0.0002989054714469466, "loss": 2.2627, "step": 1467 }, { "epoch": 0.12, "learning_rate": 0.0002989039805590376, "loss": 2.1205, "step": 1468 }, { "epoch": 0.12, "learning_rate": 0.0002989024886601528, "loss": 2.2104, "step": 1469 }, { "epoch": 0.12, "learning_rate": 0.00029890099575030226, "loss": 2.2042, "step": 1470 }, { "epoch": 0.12, "learning_rate": 0.00029889950182949613, "loss": 2.166, "step": 1471 }, { "epoch": 0.12, "learning_rate": 0.0002988980068977445, "loss": 2.2088, "step": 1472 }, { "epoch": 0.12, "learning_rate": 0.0002988965109550576, "loss": 2.1938, "step": 1473 }, { "epoch": 0.12, "learning_rate": 0.0002988950140014456, "loss": 2.169, "step": 1474 }, { "epoch": 0.12, "learning_rate": 0.0002988935160369186, "loss": 2.2156, "step": 1475 }, { "epoch": 0.12, "learning_rate": 0.00029889201706148676, "loss": 2.2353, "step": 1476 }, { "epoch": 0.12, "learning_rate": 0.0002988905170751603, "loss": 2.1904, "step": 1477 }, { "epoch": 0.12, "learning_rate": 0.0002988890160779494, "loss": 2.243, "step": 1478 }, { "epoch": 0.12, "learning_rate": 0.00029888751406986427, "loss": 2.1584, "step": 1479 }, { "epoch": 0.12, "learning_rate": 0.00029888601105091506, "loss": 2.2631, "step": 1480 }, { "epoch": 0.12, "learning_rate": 0.000298884507021112, "loss": 2.2254, "step": 1481 }, { "epoch": 0.12, "learning_rate": 0.00029888300198046533, "loss": 2.2107, "step": 1482 }, { "epoch": 0.12, "learning_rate": 0.0002988814959289852, "loss": 2.1813, "step": 1483 }, { "epoch": 0.12, "learning_rate": 0.00029887998886668184, "loss": 2.2832, "step": 1484 }, { "epoch": 0.12, "learning_rate": 0.0002988784807935656, "loss": 2.1508, "step": 1485 }, { "epoch": 0.12, "learning_rate": 0.00029887697170964656, "loss": 2.2261, "step": 1486 }, { "epoch": 0.12, "learning_rate": 0.00029887546161493507, "loss": 2.1346, "step": 1487 }, { "epoch": 0.12, "learning_rate": 0.00029887395050944135, "loss": 2.2042, "step": 1488 }, { "epoch": 0.12, "learning_rate": 0.0002988724383931756, "loss": 2.2109, "step": 1489 }, { "epoch": 0.12, "learning_rate": 0.0002988709252661482, "loss": 2.1533, "step": 1490 }, { "epoch": 0.12, "learning_rate": 0.0002988694111283694, "loss": 2.1824, "step": 1491 }, { "epoch": 0.12, "learning_rate": 0.0002988678959798494, "loss": 2.2079, "step": 1492 }, { "epoch": 0.12, "learning_rate": 0.0002988663798205986, "loss": 2.2151, "step": 1493 }, { "epoch": 0.12, "learning_rate": 0.0002988648626506272, "loss": 2.1928, "step": 1494 }, { "epoch": 0.12, "learning_rate": 0.00029886334446994553, "loss": 2.2146, "step": 1495 }, { "epoch": 0.12, "learning_rate": 0.0002988618252785639, "loss": 2.1861, "step": 1496 }, { "epoch": 0.12, "learning_rate": 0.00029886030507649263, "loss": 2.2149, "step": 1497 }, { "epoch": 0.12, "learning_rate": 0.000298858783863742, "loss": 2.1886, "step": 1498 }, { "epoch": 0.12, "learning_rate": 0.00029885726164032245, "loss": 2.1713, "step": 1499 }, { "epoch": 0.12, "learning_rate": 0.0002988557384062442, "loss": 2.1847, "step": 1500 }, { "epoch": 0.12, "learning_rate": 0.0002988542141615176, "loss": 2.2112, "step": 1501 }, { "epoch": 0.12, "learning_rate": 0.00029885268890615305, "loss": 2.1595, "step": 1502 }, { "epoch": 0.12, "learning_rate": 0.00029885116264016093, "loss": 2.1959, "step": 1503 }, { "epoch": 0.12, "learning_rate": 0.00029884963536355155, "loss": 2.1425, "step": 1504 }, { "epoch": 0.12, "learning_rate": 0.0002988481070763352, "loss": 2.1818, "step": 1505 }, { "epoch": 0.12, "learning_rate": 0.0002988465777785224, "loss": 2.1529, "step": 1506 }, { "epoch": 0.12, "learning_rate": 0.0002988450474701235, "loss": 2.2113, "step": 1507 }, { "epoch": 0.12, "learning_rate": 0.00029884351615114887, "loss": 2.203, "step": 1508 }, { "epoch": 0.12, "learning_rate": 0.00029884198382160886, "loss": 2.1563, "step": 1509 }, { "epoch": 0.12, "learning_rate": 0.00029884045048151394, "loss": 2.1907, "step": 1510 }, { "epoch": 0.12, "learning_rate": 0.0002988389161308745, "loss": 2.1973, "step": 1511 }, { "epoch": 0.12, "learning_rate": 0.00029883738076970096, "loss": 2.2092, "step": 1512 }, { "epoch": 0.12, "learning_rate": 0.00029883584439800373, "loss": 2.1936, "step": 1513 }, { "epoch": 0.12, "learning_rate": 0.00029883430701579326, "loss": 2.212, "step": 1514 }, { "epoch": 0.12, "learning_rate": 0.00029883276862307997, "loss": 2.168, "step": 1515 }, { "epoch": 0.12, "learning_rate": 0.0002988312292198743, "loss": 2.183, "step": 1516 }, { "epoch": 0.12, "learning_rate": 0.0002988296888061868, "loss": 2.2227, "step": 1517 }, { "epoch": 0.12, "learning_rate": 0.00029882814738202776, "loss": 2.2064, "step": 1518 }, { "epoch": 0.12, "learning_rate": 0.00029882660494740773, "loss": 2.2372, "step": 1519 }, { "epoch": 0.12, "learning_rate": 0.00029882506150233725, "loss": 2.1928, "step": 1520 }, { "epoch": 0.12, "learning_rate": 0.00029882351704682667, "loss": 2.1667, "step": 1521 }, { "epoch": 0.12, "learning_rate": 0.0002988219715808865, "loss": 2.1858, "step": 1522 }, { "epoch": 0.12, "learning_rate": 0.00029882042510452736, "loss": 2.2124, "step": 1523 }, { "epoch": 0.12, "learning_rate": 0.00029881887761775956, "loss": 2.194, "step": 1524 }, { "epoch": 0.12, "learning_rate": 0.0002988173291205938, "loss": 2.1799, "step": 1525 }, { "epoch": 0.12, "learning_rate": 0.0002988157796130405, "loss": 2.1445, "step": 1526 }, { "epoch": 0.12, "learning_rate": 0.00029881422909511007, "loss": 2.212, "step": 1527 }, { "epoch": 0.12, "learning_rate": 0.00029881267756681323, "loss": 2.1268, "step": 1528 }, { "epoch": 0.12, "learning_rate": 0.0002988111250281604, "loss": 2.2192, "step": 1529 }, { "epoch": 0.12, "learning_rate": 0.0002988095714791622, "loss": 2.2349, "step": 1530 }, { "epoch": 0.12, "learning_rate": 0.0002988080169198291, "loss": 2.2881, "step": 1531 }, { "epoch": 0.12, "learning_rate": 0.0002988064613501717, "loss": 2.1888, "step": 1532 }, { "epoch": 0.12, "learning_rate": 0.0002988049047702005, "loss": 2.1631, "step": 1533 }, { "epoch": 0.12, "learning_rate": 0.0002988033471799262, "loss": 2.1618, "step": 1534 }, { "epoch": 0.12, "learning_rate": 0.0002988017885793592, "loss": 2.1457, "step": 1535 }, { "epoch": 0.12, "learning_rate": 0.00029880022896851017, "loss": 2.2007, "step": 1536 }, { "epoch": 0.12, "learning_rate": 0.00029879866834738977, "loss": 2.1804, "step": 1537 }, { "epoch": 0.12, "learning_rate": 0.00029879710671600854, "loss": 2.2279, "step": 1538 }, { "epoch": 0.12, "learning_rate": 0.00029879554407437694, "loss": 2.2549, "step": 1539 }, { "epoch": 0.12, "learning_rate": 0.0002987939804225058, "loss": 2.1679, "step": 1540 }, { "epoch": 0.12, "learning_rate": 0.00029879241576040563, "loss": 2.2338, "step": 1541 }, { "epoch": 0.12, "learning_rate": 0.0002987908500880871, "loss": 2.1545, "step": 1542 }, { "epoch": 0.12, "learning_rate": 0.0002987892834055608, "loss": 2.1905, "step": 1543 }, { "epoch": 0.12, "learning_rate": 0.0002987877157128373, "loss": 2.2264, "step": 1544 }, { "epoch": 0.12, "learning_rate": 0.0002987861470099274, "loss": 2.1504, "step": 1545 }, { "epoch": 0.12, "learning_rate": 0.00029878457729684164, "loss": 2.1733, "step": 1546 }, { "epoch": 0.12, "learning_rate": 0.0002987830065735907, "loss": 2.1416, "step": 1547 }, { "epoch": 0.12, "learning_rate": 0.00029878143484018526, "loss": 2.1406, "step": 1548 }, { "epoch": 0.12, "learning_rate": 0.000298779862096636, "loss": 2.1978, "step": 1549 }, { "epoch": 0.12, "learning_rate": 0.00029877828834295355, "loss": 2.2242, "step": 1550 }, { "epoch": 0.12, "learning_rate": 0.00029877671357914857, "loss": 2.179, "step": 1551 }, { "epoch": 0.12, "learning_rate": 0.0002987751378052319, "loss": 2.23, "step": 1552 }, { "epoch": 0.12, "learning_rate": 0.00029877356102121414, "loss": 2.1981, "step": 1553 }, { "epoch": 0.12, "learning_rate": 0.00029877198322710594, "loss": 2.2069, "step": 1554 }, { "epoch": 0.12, "learning_rate": 0.00029877040442291813, "loss": 2.1688, "step": 1555 }, { "epoch": 0.12, "learning_rate": 0.00029876882460866134, "loss": 2.163, "step": 1556 }, { "epoch": 0.12, "learning_rate": 0.00029876724378434636, "loss": 2.1265, "step": 1557 }, { "epoch": 0.12, "learning_rate": 0.00029876566194998386, "loss": 2.1042, "step": 1558 }, { "epoch": 0.12, "learning_rate": 0.00029876407910558463, "loss": 2.2501, "step": 1559 }, { "epoch": 0.12, "learning_rate": 0.00029876249525115936, "loss": 2.191, "step": 1560 }, { "epoch": 0.12, "learning_rate": 0.00029876091038671883, "loss": 2.2461, "step": 1561 }, { "epoch": 0.12, "learning_rate": 0.0002987593245122739, "loss": 2.1558, "step": 1562 }, { "epoch": 0.12, "learning_rate": 0.0002987577376278352, "loss": 2.1951, "step": 1563 }, { "epoch": 0.12, "learning_rate": 0.00029875614973341356, "loss": 2.1827, "step": 1564 }, { "epoch": 0.12, "learning_rate": 0.0002987545608290197, "loss": 2.1871, "step": 1565 }, { "epoch": 0.12, "learning_rate": 0.00029875297091466453, "loss": 2.1709, "step": 1566 }, { "epoch": 0.12, "learning_rate": 0.00029875137999035877, "loss": 2.166, "step": 1567 }, { "epoch": 0.12, "learning_rate": 0.0002987497880561132, "loss": 2.2106, "step": 1568 }, { "epoch": 0.12, "learning_rate": 0.00029874819511193864, "loss": 2.1877, "step": 1569 }, { "epoch": 0.12, "learning_rate": 0.000298746601157846, "loss": 2.1716, "step": 1570 }, { "epoch": 0.12, "learning_rate": 0.0002987450061938459, "loss": 2.2267, "step": 1571 }, { "epoch": 0.12, "learning_rate": 0.0002987434102199494, "loss": 2.2037, "step": 1572 }, { "epoch": 0.12, "learning_rate": 0.0002987418132361672, "loss": 2.105, "step": 1573 }, { "epoch": 0.12, "learning_rate": 0.00029874021524251015, "loss": 2.1917, "step": 1574 }, { "epoch": 0.12, "learning_rate": 0.00029873861623898914, "loss": 2.1727, "step": 1575 }, { "epoch": 0.12, "learning_rate": 0.000298737016225615, "loss": 2.1393, "step": 1576 }, { "epoch": 0.12, "learning_rate": 0.0002987354152023986, "loss": 2.1622, "step": 1577 }, { "epoch": 0.12, "learning_rate": 0.0002987338131693508, "loss": 2.1551, "step": 1578 }, { "epoch": 0.12, "learning_rate": 0.0002987322101264825, "loss": 2.1921, "step": 1579 }, { "epoch": 0.12, "learning_rate": 0.00029873060607380457, "loss": 2.1609, "step": 1580 }, { "epoch": 0.12, "learning_rate": 0.0002987290010113279, "loss": 2.1404, "step": 1581 }, { "epoch": 0.12, "learning_rate": 0.0002987273949390634, "loss": 2.1939, "step": 1582 }, { "epoch": 0.12, "learning_rate": 0.00029872578785702193, "loss": 2.1734, "step": 1583 }, { "epoch": 0.12, "learning_rate": 0.0002987241797652145, "loss": 2.1535, "step": 1584 }, { "epoch": 0.12, "learning_rate": 0.0002987225706636519, "loss": 2.1899, "step": 1585 }, { "epoch": 0.12, "learning_rate": 0.0002987209605523451, "loss": 2.1826, "step": 1586 }, { "epoch": 0.12, "learning_rate": 0.00029871934943130504, "loss": 2.2027, "step": 1587 }, { "epoch": 0.12, "learning_rate": 0.00029871773730054277, "loss": 2.2024, "step": 1588 }, { "epoch": 0.13, "learning_rate": 0.00029871612416006903, "loss": 2.1965, "step": 1589 }, { "epoch": 0.13, "learning_rate": 0.00029871451000989494, "loss": 2.1987, "step": 1590 }, { "epoch": 0.13, "learning_rate": 0.00029871289485003134, "loss": 2.1309, "step": 1591 }, { "epoch": 0.13, "learning_rate": 0.0002987112786804893, "loss": 2.136, "step": 1592 }, { "epoch": 0.13, "learning_rate": 0.0002987096615012797, "loss": 2.1502, "step": 1593 }, { "epoch": 0.13, "learning_rate": 0.0002987080433124136, "loss": 2.1717, "step": 1594 }, { "epoch": 0.13, "learning_rate": 0.00029870642411390197, "loss": 2.1368, "step": 1595 }, { "epoch": 0.13, "learning_rate": 0.0002987048039057557, "loss": 2.1807, "step": 1596 }, { "epoch": 0.13, "learning_rate": 0.00029870318268798593, "loss": 2.0779, "step": 1597 }, { "epoch": 0.13, "learning_rate": 0.00029870156046060367, "loss": 2.1779, "step": 1598 }, { "epoch": 0.13, "learning_rate": 0.00029869993722361977, "loss": 2.1772, "step": 1599 }, { "epoch": 0.13, "learning_rate": 0.0002986983129770454, "loss": 2.1448, "step": 1600 }, { "epoch": 0.13, "learning_rate": 0.0002986966877208915, "loss": 2.217, "step": 1601 }, { "epoch": 0.13, "learning_rate": 0.0002986950614551692, "loss": 2.1402, "step": 1602 }, { "epoch": 0.13, "learning_rate": 0.0002986934341798895, "loss": 2.1366, "step": 1603 }, { "epoch": 0.13, "learning_rate": 0.00029869180589506343, "loss": 2.1701, "step": 1604 }, { "epoch": 0.13, "learning_rate": 0.000298690176600702, "loss": 2.1613, "step": 1605 }, { "epoch": 0.13, "learning_rate": 0.0002986885462968164, "loss": 2.1917, "step": 1606 }, { "epoch": 0.13, "learning_rate": 0.0002986869149834176, "loss": 2.104, "step": 1607 }, { "epoch": 0.13, "learning_rate": 0.00029868528266051666, "loss": 2.1767, "step": 1608 }, { "epoch": 0.13, "learning_rate": 0.00029868364932812474, "loss": 2.1956, "step": 1609 }, { "epoch": 0.13, "learning_rate": 0.00029868201498625284, "loss": 2.1908, "step": 1610 }, { "epoch": 0.13, "learning_rate": 0.00029868037963491216, "loss": 2.0974, "step": 1611 }, { "epoch": 0.13, "learning_rate": 0.0002986787432741138, "loss": 2.1681, "step": 1612 }, { "epoch": 0.13, "learning_rate": 0.0002986771059038687, "loss": 2.1826, "step": 1613 }, { "epoch": 0.13, "learning_rate": 0.00029867546752418813, "loss": 2.2034, "step": 1614 }, { "epoch": 0.13, "learning_rate": 0.00029867382813508325, "loss": 2.1469, "step": 1615 }, { "epoch": 0.13, "learning_rate": 0.00029867218773656505, "loss": 2.1692, "step": 1616 }, { "epoch": 0.13, "learning_rate": 0.00029867054632864477, "loss": 2.1702, "step": 1617 }, { "epoch": 0.13, "learning_rate": 0.00029866890391133357, "loss": 2.1748, "step": 1618 }, { "epoch": 0.13, "learning_rate": 0.0002986672604846425, "loss": 2.0923, "step": 1619 }, { "epoch": 0.13, "learning_rate": 0.0002986656160485828, "loss": 2.0945, "step": 1620 }, { "epoch": 0.13, "learning_rate": 0.0002986639706031655, "loss": 2.1307, "step": 1621 }, { "epoch": 0.13, "learning_rate": 0.00029866232414840196, "loss": 2.1507, "step": 1622 }, { "epoch": 0.13, "learning_rate": 0.00029866067668430333, "loss": 2.1876, "step": 1623 }, { "epoch": 0.13, "learning_rate": 0.0002986590282108807, "loss": 2.2496, "step": 1624 }, { "epoch": 0.13, "learning_rate": 0.0002986573787281453, "loss": 2.1585, "step": 1625 }, { "epoch": 0.13, "learning_rate": 0.00029865572823610834, "loss": 2.1524, "step": 1626 }, { "epoch": 0.13, "learning_rate": 0.000298654076734781, "loss": 2.1303, "step": 1627 }, { "epoch": 0.13, "learning_rate": 0.0002986524242241745, "loss": 2.1074, "step": 1628 }, { "epoch": 0.13, "learning_rate": 0.00029865077070430015, "loss": 2.197, "step": 1629 }, { "epoch": 0.13, "learning_rate": 0.00029864911617516905, "loss": 2.1973, "step": 1630 }, { "epoch": 0.13, "learning_rate": 0.00029864746063679247, "loss": 2.1203, "step": 1631 }, { "epoch": 0.13, "learning_rate": 0.0002986458040891817, "loss": 2.1545, "step": 1632 }, { "epoch": 0.13, "learning_rate": 0.0002986441465323479, "loss": 2.1817, "step": 1633 }, { "epoch": 0.13, "learning_rate": 0.00029864248796630246, "loss": 2.1906, "step": 1634 }, { "epoch": 0.13, "learning_rate": 0.00029864082839105646, "loss": 2.1046, "step": 1635 }, { "epoch": 0.13, "learning_rate": 0.0002986391678066213, "loss": 2.1656, "step": 1636 }, { "epoch": 0.13, "learning_rate": 0.00029863750621300823, "loss": 2.2246, "step": 1637 }, { "epoch": 0.13, "learning_rate": 0.0002986358436102285, "loss": 2.1789, "step": 1638 }, { "epoch": 0.13, "learning_rate": 0.0002986341799982934, "loss": 2.1392, "step": 1639 }, { "epoch": 0.13, "learning_rate": 0.0002986325153772142, "loss": 2.1503, "step": 1640 }, { "epoch": 0.13, "learning_rate": 0.00029863084974700234, "loss": 2.231, "step": 1641 }, { "epoch": 0.13, "learning_rate": 0.000298629183107669, "loss": 2.1608, "step": 1642 }, { "epoch": 0.13, "learning_rate": 0.0002986275154592255, "loss": 2.1695, "step": 1643 }, { "epoch": 0.13, "learning_rate": 0.00029862584680168325, "loss": 2.1409, "step": 1644 }, { "epoch": 0.13, "learning_rate": 0.00029862417713505347, "loss": 2.11, "step": 1645 }, { "epoch": 0.13, "learning_rate": 0.0002986225064593475, "loss": 2.1576, "step": 1646 }, { "epoch": 0.13, "learning_rate": 0.0002986208347745768, "loss": 2.1858, "step": 1647 }, { "epoch": 0.13, "learning_rate": 0.00029861916208075265, "loss": 2.1326, "step": 1648 }, { "epoch": 0.13, "learning_rate": 0.00029861748837788635, "loss": 2.1728, "step": 1649 }, { "epoch": 0.13, "learning_rate": 0.0002986158136659894, "loss": 2.1791, "step": 1650 }, { "epoch": 0.13, "learning_rate": 0.000298614137945073, "loss": 2.1387, "step": 1651 }, { "epoch": 0.13, "learning_rate": 0.00029861246121514867, "loss": 2.1347, "step": 1652 }, { "epoch": 0.13, "learning_rate": 0.00029861078347622773, "loss": 2.212, "step": 1653 }, { "epoch": 0.13, "learning_rate": 0.0002986091047283216, "loss": 2.136, "step": 1654 }, { "epoch": 0.13, "learning_rate": 0.0002986074249714416, "loss": 2.1591, "step": 1655 }, { "epoch": 0.13, "learning_rate": 0.00029860574420559924, "loss": 2.1468, "step": 1656 }, { "epoch": 0.13, "learning_rate": 0.00029860406243080586, "loss": 2.1566, "step": 1657 }, { "epoch": 0.13, "learning_rate": 0.0002986023796470729, "loss": 2.1466, "step": 1658 }, { "epoch": 0.13, "learning_rate": 0.00029860069585441185, "loss": 2.1327, "step": 1659 }, { "epoch": 0.13, "learning_rate": 0.000298599011052834, "loss": 2.1703, "step": 1660 }, { "epoch": 0.13, "learning_rate": 0.0002985973252423509, "loss": 2.1211, "step": 1661 }, { "epoch": 0.13, "learning_rate": 0.00029859563842297396, "loss": 2.0964, "step": 1662 }, { "epoch": 0.13, "learning_rate": 0.00029859395059471464, "loss": 2.1919, "step": 1663 }, { "epoch": 0.13, "learning_rate": 0.0002985922617575844, "loss": 2.1765, "step": 1664 }, { "epoch": 0.13, "learning_rate": 0.0002985905719115947, "loss": 2.0886, "step": 1665 }, { "epoch": 0.13, "learning_rate": 0.000298588881056757, "loss": 2.1489, "step": 1666 }, { "epoch": 0.13, "learning_rate": 0.0002985871891930828, "loss": 2.1171, "step": 1667 }, { "epoch": 0.13, "learning_rate": 0.0002985854963205836, "loss": 2.1176, "step": 1668 }, { "epoch": 0.13, "learning_rate": 0.0002985838024392709, "loss": 2.194, "step": 1669 }, { "epoch": 0.13, "learning_rate": 0.00029858210754915614, "loss": 2.1693, "step": 1670 }, { "epoch": 0.13, "learning_rate": 0.00029858041165025084, "loss": 2.1486, "step": 1671 }, { "epoch": 0.13, "learning_rate": 0.0002985787147425666, "loss": 2.1522, "step": 1672 }, { "epoch": 0.13, "learning_rate": 0.0002985770168261148, "loss": 2.0775, "step": 1673 }, { "epoch": 0.13, "learning_rate": 0.0002985753179009071, "loss": 2.129, "step": 1674 }, { "epoch": 0.13, "learning_rate": 0.000298573617966955, "loss": 2.1159, "step": 1675 }, { "epoch": 0.13, "learning_rate": 0.00029857191702426997, "loss": 2.1265, "step": 1676 }, { "epoch": 0.13, "learning_rate": 0.00029857021507286366, "loss": 2.1547, "step": 1677 }, { "epoch": 0.13, "learning_rate": 0.0002985685121127476, "loss": 2.1417, "step": 1678 }, { "epoch": 0.13, "learning_rate": 0.0002985668081439333, "loss": 2.1155, "step": 1679 }, { "epoch": 0.13, "learning_rate": 0.0002985651031664323, "loss": 2.1564, "step": 1680 }, { "epoch": 0.13, "learning_rate": 0.0002985633971802563, "loss": 2.1448, "step": 1681 }, { "epoch": 0.13, "learning_rate": 0.00029856169018541677, "loss": 2.1477, "step": 1682 }, { "epoch": 0.13, "learning_rate": 0.00029855998218192536, "loss": 2.1409, "step": 1683 }, { "epoch": 0.13, "learning_rate": 0.0002985582731697937, "loss": 2.2081, "step": 1684 }, { "epoch": 0.13, "learning_rate": 0.0002985565631490333, "loss": 2.1486, "step": 1685 }, { "epoch": 0.13, "learning_rate": 0.00029855485211965584, "loss": 2.1437, "step": 1686 }, { "epoch": 0.13, "learning_rate": 0.0002985531400816729, "loss": 2.1065, "step": 1687 }, { "epoch": 0.13, "learning_rate": 0.0002985514270350962, "loss": 2.1489, "step": 1688 }, { "epoch": 0.13, "learning_rate": 0.00029854971297993714, "loss": 2.1137, "step": 1689 }, { "epoch": 0.13, "learning_rate": 0.0002985479979162076, "loss": 2.0653, "step": 1690 }, { "epoch": 0.13, "learning_rate": 0.0002985462818439191, "loss": 2.1414, "step": 1691 }, { "epoch": 0.13, "learning_rate": 0.00029854456476308334, "loss": 2.1617, "step": 1692 }, { "epoch": 0.13, "learning_rate": 0.00029854284667371194, "loss": 2.0816, "step": 1693 }, { "epoch": 0.13, "learning_rate": 0.0002985411275758166, "loss": 2.1953, "step": 1694 }, { "epoch": 0.13, "learning_rate": 0.0002985394074694089, "loss": 2.1632, "step": 1695 }, { "epoch": 0.13, "learning_rate": 0.0002985376863545007, "loss": 2.1247, "step": 1696 }, { "epoch": 0.13, "learning_rate": 0.00029853596423110355, "loss": 2.1243, "step": 1697 }, { "epoch": 0.13, "learning_rate": 0.00029853424109922916, "loss": 2.1436, "step": 1698 }, { "epoch": 0.13, "learning_rate": 0.0002985325169588892, "loss": 2.0919, "step": 1699 }, { "epoch": 0.13, "learning_rate": 0.0002985307918100955, "loss": 2.114, "step": 1700 }, { "epoch": 0.13, "learning_rate": 0.00029852906565285963, "loss": 2.1471, "step": 1701 }, { "epoch": 0.13, "learning_rate": 0.0002985273384871934, "loss": 2.1755, "step": 1702 }, { "epoch": 0.13, "learning_rate": 0.0002985256103131085, "loss": 2.0671, "step": 1703 }, { "epoch": 0.13, "learning_rate": 0.0002985238811306167, "loss": 2.1626, "step": 1704 }, { "epoch": 0.13, "learning_rate": 0.00029852215093972964, "loss": 2.109, "step": 1705 }, { "epoch": 0.13, "learning_rate": 0.00029852041974045917, "loss": 2.1473, "step": 1706 }, { "epoch": 0.13, "learning_rate": 0.000298518687532817, "loss": 2.1695, "step": 1707 }, { "epoch": 0.13, "learning_rate": 0.0002985169543168149, "loss": 2.0578, "step": 1708 }, { "epoch": 0.13, "learning_rate": 0.00029851522009246466, "loss": 2.1915, "step": 1709 }, { "epoch": 0.13, "learning_rate": 0.000298513484859778, "loss": 2.1502, "step": 1710 }, { "epoch": 0.13, "learning_rate": 0.0002985117486187668, "loss": 2.1214, "step": 1711 }, { "epoch": 0.13, "learning_rate": 0.0002985100113694427, "loss": 2.1327, "step": 1712 }, { "epoch": 0.13, "learning_rate": 0.0002985082731118176, "loss": 2.1127, "step": 1713 }, { "epoch": 0.13, "learning_rate": 0.00029850653384590333, "loss": 2.1345, "step": 1714 }, { "epoch": 0.13, "learning_rate": 0.0002985047935717116, "loss": 2.1206, "step": 1715 }, { "epoch": 0.14, "learning_rate": 0.0002985030522892543, "loss": 2.1727, "step": 1716 }, { "epoch": 0.14, "learning_rate": 0.0002985013099985432, "loss": 2.1201, "step": 1717 }, { "epoch": 0.14, "learning_rate": 0.00029849956669959017, "loss": 2.1598, "step": 1718 }, { "epoch": 0.14, "learning_rate": 0.00029849782239240705, "loss": 2.1567, "step": 1719 }, { "epoch": 0.14, "learning_rate": 0.0002984960770770056, "loss": 2.0893, "step": 1720 }, { "epoch": 0.14, "learning_rate": 0.0002984943307533978, "loss": 2.1736, "step": 1721 }, { "epoch": 0.14, "learning_rate": 0.0002984925834215954, "loss": 2.1083, "step": 1722 }, { "epoch": 0.14, "learning_rate": 0.00029849083508161036, "loss": 2.2107, "step": 1723 }, { "epoch": 0.14, "learning_rate": 0.00029848908573345444, "loss": 2.1482, "step": 1724 }, { "epoch": 0.14, "learning_rate": 0.0002984873353771396, "loss": 2.0993, "step": 1725 }, { "epoch": 0.14, "learning_rate": 0.00029848558401267765, "loss": 2.1198, "step": 1726 }, { "epoch": 0.14, "learning_rate": 0.0002984838316400806, "loss": 2.1393, "step": 1727 }, { "epoch": 0.14, "learning_rate": 0.00029848207825936023, "loss": 2.1333, "step": 1728 }, { "epoch": 0.14, "learning_rate": 0.00029848032387052843, "loss": 2.1517, "step": 1729 }, { "epoch": 0.14, "learning_rate": 0.00029847856847359727, "loss": 2.076, "step": 1730 }, { "epoch": 0.14, "learning_rate": 0.0002984768120685785, "loss": 2.1096, "step": 1731 }, { "epoch": 0.14, "learning_rate": 0.0002984750546554841, "loss": 2.0964, "step": 1732 }, { "epoch": 0.14, "learning_rate": 0.0002984732962343261, "loss": 2.1119, "step": 1733 }, { "epoch": 0.14, "learning_rate": 0.0002984715368051163, "loss": 2.1913, "step": 1734 }, { "epoch": 0.14, "learning_rate": 0.0002984697763678667, "loss": 2.0996, "step": 1735 }, { "epoch": 0.14, "learning_rate": 0.00029846801492258924, "loss": 2.1228, "step": 1736 }, { "epoch": 0.14, "learning_rate": 0.0002984662524692959, "loss": 2.1225, "step": 1737 }, { "epoch": 0.14, "learning_rate": 0.0002984644890079986, "loss": 2.0825, "step": 1738 }, { "epoch": 0.14, "learning_rate": 0.0002984627245387094, "loss": 2.1463, "step": 1739 }, { "epoch": 0.14, "learning_rate": 0.0002984609590614402, "loss": 2.1498, "step": 1740 }, { "epoch": 0.14, "learning_rate": 0.00029845919257620303, "loss": 2.1505, "step": 1741 }, { "epoch": 0.14, "learning_rate": 0.00029845742508300994, "loss": 2.1349, "step": 1742 }, { "epoch": 0.14, "learning_rate": 0.00029845565658187273, "loss": 2.0794, "step": 1743 }, { "epoch": 0.14, "learning_rate": 0.0002984538870728036, "loss": 2.1205, "step": 1744 }, { "epoch": 0.14, "learning_rate": 0.0002984521165558145, "loss": 2.144, "step": 1745 }, { "epoch": 0.14, "learning_rate": 0.00029845034503091743, "loss": 2.1375, "step": 1746 }, { "epoch": 0.14, "learning_rate": 0.00029844857249812447, "loss": 2.2027, "step": 1747 }, { "epoch": 0.14, "learning_rate": 0.0002984467989574476, "loss": 2.2231, "step": 1748 }, { "epoch": 0.14, "learning_rate": 0.00029844502440889894, "loss": 2.165, "step": 1749 }, { "epoch": 0.14, "learning_rate": 0.0002984432488524904, "loss": 2.0761, "step": 1750 }, { "epoch": 0.14, "learning_rate": 0.00029844147228823417, "loss": 2.1433, "step": 1751 }, { "epoch": 0.14, "learning_rate": 0.0002984396947161422, "loss": 2.1032, "step": 1752 }, { "epoch": 0.14, "learning_rate": 0.0002984379161362267, "loss": 2.1027, "step": 1753 }, { "epoch": 0.14, "learning_rate": 0.0002984361365484996, "loss": 2.0934, "step": 1754 }, { "epoch": 0.14, "learning_rate": 0.0002984343559529731, "loss": 2.1541, "step": 1755 }, { "epoch": 0.14, "learning_rate": 0.0002984325743496592, "loss": 2.1226, "step": 1756 }, { "epoch": 0.14, "learning_rate": 0.0002984307917385701, "loss": 2.0648, "step": 1757 }, { "epoch": 0.14, "learning_rate": 0.00029842900811971775, "loss": 2.1117, "step": 1758 }, { "epoch": 0.14, "learning_rate": 0.00029842722349311435, "loss": 2.106, "step": 1759 }, { "epoch": 0.14, "learning_rate": 0.00029842543785877203, "loss": 2.0773, "step": 1760 }, { "epoch": 0.14, "learning_rate": 0.00029842365121670293, "loss": 2.167, "step": 1761 }, { "epoch": 0.14, "learning_rate": 0.0002984218635669191, "loss": 2.1321, "step": 1762 }, { "epoch": 0.14, "learning_rate": 0.00029842007490943275, "loss": 2.1468, "step": 1763 }, { "epoch": 0.14, "learning_rate": 0.00029841828524425595, "loss": 2.105, "step": 1764 }, { "epoch": 0.14, "learning_rate": 0.00029841649457140095, "loss": 2.1599, "step": 1765 }, { "epoch": 0.14, "learning_rate": 0.0002984147028908798, "loss": 2.09, "step": 1766 }, { "epoch": 0.14, "learning_rate": 0.0002984129102027048, "loss": 2.1181, "step": 1767 }, { "epoch": 0.14, "learning_rate": 0.00029841111650688796, "loss": 2.1486, "step": 1768 }, { "epoch": 0.14, "learning_rate": 0.00029840932180344156, "loss": 2.1206, "step": 1769 }, { "epoch": 0.14, "learning_rate": 0.00029840752609237777, "loss": 2.1056, "step": 1770 }, { "epoch": 0.14, "learning_rate": 0.0002984057293737088, "loss": 2.1371, "step": 1771 }, { "epoch": 0.14, "learning_rate": 0.00029840393164744683, "loss": 2.1292, "step": 1772 }, { "epoch": 0.14, "learning_rate": 0.000298402132913604, "loss": 2.1206, "step": 1773 }, { "epoch": 0.14, "learning_rate": 0.0002984003331721927, "loss": 2.1644, "step": 1774 }, { "epoch": 0.14, "learning_rate": 0.00029839853242322493, "loss": 2.1951, "step": 1775 }, { "epoch": 0.14, "learning_rate": 0.000298396730666713, "loss": 2.1413, "step": 1776 }, { "epoch": 0.14, "learning_rate": 0.0002983949279026692, "loss": 2.0627, "step": 1777 }, { "epoch": 0.14, "learning_rate": 0.00029839312413110577, "loss": 2.1125, "step": 1778 }, { "epoch": 0.14, "learning_rate": 0.00029839131935203484, "loss": 2.1571, "step": 1779 }, { "epoch": 0.14, "learning_rate": 0.0002983895135654688, "loss": 2.102, "step": 1780 }, { "epoch": 0.14, "learning_rate": 0.0002983877067714198, "loss": 2.1605, "step": 1781 }, { "epoch": 0.14, "learning_rate": 0.0002983858989699002, "loss": 2.1056, "step": 1782 }, { "epoch": 0.14, "learning_rate": 0.00029838409016092225, "loss": 2.1043, "step": 1783 }, { "epoch": 0.14, "learning_rate": 0.0002983822803444982, "loss": 2.1526, "step": 1784 }, { "epoch": 0.14, "learning_rate": 0.0002983804695206403, "loss": 2.1203, "step": 1785 }, { "epoch": 0.14, "learning_rate": 0.00029837865768936095, "loss": 2.1357, "step": 1786 }, { "epoch": 0.14, "learning_rate": 0.0002983768448506723, "loss": 2.074, "step": 1787 }, { "epoch": 0.14, "learning_rate": 0.0002983750310045869, "loss": 2.1207, "step": 1788 }, { "epoch": 0.14, "learning_rate": 0.00029837321615111686, "loss": 2.1483, "step": 1789 }, { "epoch": 0.14, "learning_rate": 0.0002983714002902746, "loss": 2.0702, "step": 1790 }, { "epoch": 0.14, "learning_rate": 0.0002983695834220723, "loss": 2.1475, "step": 1791 }, { "epoch": 0.14, "learning_rate": 0.00029836776554652245, "loss": 2.0906, "step": 1792 }, { "epoch": 0.14, "learning_rate": 0.0002983659466636374, "loss": 2.0866, "step": 1793 }, { "epoch": 0.14, "learning_rate": 0.0002983641267734294, "loss": 2.1692, "step": 1794 }, { "epoch": 0.14, "learning_rate": 0.00029836230587591085, "loss": 2.1635, "step": 1795 }, { "epoch": 0.14, "learning_rate": 0.00029836048397109417, "loss": 2.1463, "step": 1796 }, { "epoch": 0.14, "learning_rate": 0.0002983586610589916, "loss": 2.1025, "step": 1797 }, { "epoch": 0.14, "learning_rate": 0.0002983568371396156, "loss": 2.083, "step": 1798 }, { "epoch": 0.14, "learning_rate": 0.0002983550122129786, "loss": 2.1, "step": 1799 }, { "epoch": 0.14, "learning_rate": 0.0002983531862790929, "loss": 2.1389, "step": 1800 }, { "epoch": 0.14, "learning_rate": 0.000298351359337971, "loss": 2.1027, "step": 1801 }, { "epoch": 0.14, "learning_rate": 0.00029834953138962517, "loss": 2.1155, "step": 1802 }, { "epoch": 0.14, "learning_rate": 0.0002983477024340679, "loss": 2.1127, "step": 1803 }, { "epoch": 0.14, "learning_rate": 0.0002983458724713116, "loss": 2.1712, "step": 1804 }, { "epoch": 0.14, "learning_rate": 0.00029834404150136867, "loss": 2.1102, "step": 1805 }, { "epoch": 0.14, "learning_rate": 0.00029834220952425157, "loss": 2.1189, "step": 1806 }, { "epoch": 0.14, "learning_rate": 0.0002983403765399728, "loss": 2.1613, "step": 1807 }, { "epoch": 0.14, "learning_rate": 0.00029833854254854465, "loss": 2.0533, "step": 1808 }, { "epoch": 0.14, "learning_rate": 0.00029833670754997966, "loss": 2.0744, "step": 1809 }, { "epoch": 0.14, "learning_rate": 0.0002983348715442903, "loss": 2.086, "step": 1810 }, { "epoch": 0.14, "learning_rate": 0.000298333034531489, "loss": 2.1715, "step": 1811 }, { "epoch": 0.14, "learning_rate": 0.0002983311965115883, "loss": 2.0703, "step": 1812 }, { "epoch": 0.14, "learning_rate": 0.00029832935748460063, "loss": 2.1604, "step": 1813 }, { "epoch": 0.14, "learning_rate": 0.0002983275174505384, "loss": 2.1146, "step": 1814 }, { "epoch": 0.14, "learning_rate": 0.00029832567640941427, "loss": 2.1245, "step": 1815 }, { "epoch": 0.14, "learning_rate": 0.0002983238343612406, "loss": 2.1382, "step": 1816 }, { "epoch": 0.14, "learning_rate": 0.00029832199130603, "loss": 2.0584, "step": 1817 }, { "epoch": 0.14, "learning_rate": 0.0002983201472437948, "loss": 2.1155, "step": 1818 }, { "epoch": 0.14, "learning_rate": 0.0002983183021745478, "loss": 2.1389, "step": 1819 }, { "epoch": 0.14, "learning_rate": 0.00029831645609830135, "loss": 2.0812, "step": 1820 }, { "epoch": 0.14, "learning_rate": 0.0002983146090150679, "loss": 2.0847, "step": 1821 }, { "epoch": 0.14, "learning_rate": 0.00029831276092486024, "loss": 2.0771, "step": 1822 }, { "epoch": 0.14, "learning_rate": 0.0002983109118276907, "loss": 2.0103, "step": 1823 }, { "epoch": 0.14, "learning_rate": 0.00029830906172357197, "loss": 2.136, "step": 1824 }, { "epoch": 0.14, "learning_rate": 0.00029830721061251646, "loss": 2.0985, "step": 1825 }, { "epoch": 0.14, "learning_rate": 0.0002983053584945369, "loss": 2.0993, "step": 1826 }, { "epoch": 0.14, "learning_rate": 0.0002983035053696458, "loss": 2.1484, "step": 1827 }, { "epoch": 0.14, "learning_rate": 0.0002983016512378557, "loss": 2.0569, "step": 1828 }, { "epoch": 0.14, "learning_rate": 0.0002982997960991793, "loss": 2.1837, "step": 1829 }, { "epoch": 0.14, "learning_rate": 0.0002982979399536291, "loss": 2.0861, "step": 1830 }, { "epoch": 0.14, "learning_rate": 0.00029829608280121763, "loss": 2.1901, "step": 1831 }, { "epoch": 0.14, "learning_rate": 0.0002982942246419577, "loss": 2.1696, "step": 1832 }, { "epoch": 0.14, "learning_rate": 0.0002982923654758618, "loss": 2.0924, "step": 1833 }, { "epoch": 0.14, "learning_rate": 0.0002982905053029425, "loss": 2.1322, "step": 1834 }, { "epoch": 0.14, "learning_rate": 0.00029828864412321257, "loss": 2.1428, "step": 1835 }, { "epoch": 0.14, "learning_rate": 0.0002982867819366846, "loss": 2.1243, "step": 1836 }, { "epoch": 0.14, "learning_rate": 0.00029828491874337115, "loss": 2.0579, "step": 1837 }, { "epoch": 0.14, "learning_rate": 0.000298283054543285, "loss": 2.0992, "step": 1838 }, { "epoch": 0.14, "learning_rate": 0.0002982811893364387, "loss": 2.0864, "step": 1839 }, { "epoch": 0.14, "learning_rate": 0.000298279323122845, "loss": 2.1639, "step": 1840 }, { "epoch": 0.14, "learning_rate": 0.0002982774559025164, "loss": 2.042, "step": 1841 }, { "epoch": 0.14, "learning_rate": 0.0002982755876754658, "loss": 2.0863, "step": 1842 }, { "epoch": 0.15, "learning_rate": 0.00029827371844170575, "loss": 2.1037, "step": 1843 }, { "epoch": 0.15, "learning_rate": 0.000298271848201249, "loss": 2.1247, "step": 1844 }, { "epoch": 0.15, "learning_rate": 0.00029826997695410826, "loss": 2.1401, "step": 1845 }, { "epoch": 0.15, "learning_rate": 0.00029826810470029615, "loss": 2.099, "step": 1846 }, { "epoch": 0.15, "learning_rate": 0.00029826623143982547, "loss": 2.0617, "step": 1847 }, { "epoch": 0.15, "learning_rate": 0.0002982643571727088, "loss": 2.1113, "step": 1848 }, { "epoch": 0.15, "learning_rate": 0.00029826248189895904, "loss": 2.0926, "step": 1849 }, { "epoch": 0.15, "learning_rate": 0.00029826060561858887, "loss": 2.039, "step": 1850 }, { "epoch": 0.15, "learning_rate": 0.0002982587283316109, "loss": 2.0609, "step": 1851 }, { "epoch": 0.15, "learning_rate": 0.0002982568500380381, "loss": 2.0624, "step": 1852 }, { "epoch": 0.15, "learning_rate": 0.00029825497073788306, "loss": 2.0925, "step": 1853 }, { "epoch": 0.15, "learning_rate": 0.00029825309043115855, "loss": 2.1533, "step": 1854 }, { "epoch": 0.15, "learning_rate": 0.0002982512091178774, "loss": 2.1004, "step": 1855 }, { "epoch": 0.15, "learning_rate": 0.0002982493267980523, "loss": 2.1255, "step": 1856 }, { "epoch": 0.15, "learning_rate": 0.0002982474434716962, "loss": 2.0605, "step": 1857 }, { "epoch": 0.15, "learning_rate": 0.00029824555913882166, "loss": 2.1017, "step": 1858 }, { "epoch": 0.15, "learning_rate": 0.00029824367379944165, "loss": 2.0656, "step": 1859 }, { "epoch": 0.15, "learning_rate": 0.00029824178745356886, "loss": 2.133, "step": 1860 }, { "epoch": 0.15, "learning_rate": 0.0002982399001012161, "loss": 2.1528, "step": 1861 }, { "epoch": 0.15, "learning_rate": 0.0002982380117423963, "loss": 2.0659, "step": 1862 }, { "epoch": 0.15, "learning_rate": 0.00029823612237712217, "loss": 2.1178, "step": 1863 }, { "epoch": 0.15, "learning_rate": 0.0002982342320054066, "loss": 2.0502, "step": 1864 }, { "epoch": 0.15, "learning_rate": 0.0002982323406272624, "loss": 2.1164, "step": 1865 }, { "epoch": 0.15, "learning_rate": 0.00029823044824270236, "loss": 2.197, "step": 1866 }, { "epoch": 0.15, "learning_rate": 0.0002982285548517394, "loss": 2.1077, "step": 1867 }, { "epoch": 0.15, "learning_rate": 0.00029822666045438634, "loss": 2.1033, "step": 1868 }, { "epoch": 0.15, "learning_rate": 0.0002982247650506561, "loss": 2.1061, "step": 1869 }, { "epoch": 0.15, "learning_rate": 0.00029822286864056145, "loss": 2.1054, "step": 1870 }, { "epoch": 0.15, "learning_rate": 0.0002982209712241154, "loss": 2.0998, "step": 1871 }, { "epoch": 0.15, "learning_rate": 0.0002982190728013307, "loss": 2.0731, "step": 1872 }, { "epoch": 0.15, "learning_rate": 0.0002982171733722202, "loss": 2.097, "step": 1873 }, { "epoch": 0.15, "learning_rate": 0.000298215272936797, "loss": 2.0627, "step": 1874 }, { "epoch": 0.15, "learning_rate": 0.0002982133714950738, "loss": 2.0485, "step": 1875 }, { "epoch": 0.15, "learning_rate": 0.0002982114690470637, "loss": 2.0982, "step": 1876 }, { "epoch": 0.15, "learning_rate": 0.00029820956559277944, "loss": 2.1116, "step": 1877 }, { "epoch": 0.15, "learning_rate": 0.00029820766113223407, "loss": 2.0901, "step": 1878 }, { "epoch": 0.15, "learning_rate": 0.00029820575566544044, "loss": 2.1517, "step": 1879 }, { "epoch": 0.15, "learning_rate": 0.0002982038491924115, "loss": 2.0426, "step": 1880 }, { "epoch": 0.15, "learning_rate": 0.00029820194171316025, "loss": 2.1224, "step": 1881 }, { "epoch": 0.15, "learning_rate": 0.00029820003322769955, "loss": 2.1719, "step": 1882 }, { "epoch": 0.15, "learning_rate": 0.00029819812373604247, "loss": 2.1116, "step": 1883 }, { "epoch": 0.15, "learning_rate": 0.00029819621323820187, "loss": 2.1149, "step": 1884 }, { "epoch": 0.15, "learning_rate": 0.00029819430173419075, "loss": 2.0367, "step": 1885 }, { "epoch": 0.15, "learning_rate": 0.0002981923892240222, "loss": 2.1769, "step": 1886 }, { "epoch": 0.15, "learning_rate": 0.000298190475707709, "loss": 2.118, "step": 1887 }, { "epoch": 0.15, "learning_rate": 0.0002981885611852643, "loss": 2.0837, "step": 1888 }, { "epoch": 0.15, "learning_rate": 0.000298186645656701, "loss": 2.1307, "step": 1889 }, { "epoch": 0.15, "learning_rate": 0.0002981847291220322, "loss": 2.1015, "step": 1890 }, { "epoch": 0.15, "learning_rate": 0.00029818281158127086, "loss": 2.1098, "step": 1891 }, { "epoch": 0.15, "learning_rate": 0.00029818089303442993, "loss": 2.0871, "step": 1892 }, { "epoch": 0.15, "learning_rate": 0.00029817897348152257, "loss": 2.1796, "step": 1893 }, { "epoch": 0.15, "learning_rate": 0.00029817705292256173, "loss": 2.113, "step": 1894 }, { "epoch": 0.15, "learning_rate": 0.0002981751313575605, "loss": 2.0994, "step": 1895 }, { "epoch": 0.15, "learning_rate": 0.00029817320878653195, "loss": 2.0587, "step": 1896 }, { "epoch": 0.15, "learning_rate": 0.00029817128520948896, "loss": 2.1509, "step": 1897 }, { "epoch": 0.15, "learning_rate": 0.0002981693606264448, "loss": 2.1152, "step": 1898 }, { "epoch": 0.15, "learning_rate": 0.0002981674350374124, "loss": 2.0958, "step": 1899 }, { "epoch": 0.15, "learning_rate": 0.0002981655084424049, "loss": 2.1211, "step": 1900 }, { "epoch": 0.15, "learning_rate": 0.0002981635808414354, "loss": 2.1006, "step": 1901 }, { "epoch": 0.15, "learning_rate": 0.0002981616522345169, "loss": 2.1289, "step": 1902 }, { "epoch": 0.15, "learning_rate": 0.00029815972262166253, "loss": 2.116, "step": 1903 }, { "epoch": 0.15, "learning_rate": 0.00029815779200288543, "loss": 2.1032, "step": 1904 }, { "epoch": 0.15, "learning_rate": 0.0002981558603781987, "loss": 2.1299, "step": 1905 }, { "epoch": 0.15, "learning_rate": 0.0002981539277476154, "loss": 2.0542, "step": 1906 }, { "epoch": 0.15, "learning_rate": 0.00029815199411114873, "loss": 2.0813, "step": 1907 }, { "epoch": 0.15, "learning_rate": 0.0002981500594688117, "loss": 2.0603, "step": 1908 }, { "epoch": 0.15, "learning_rate": 0.00029814812382061764, "loss": 2.1037, "step": 1909 }, { "epoch": 0.15, "learning_rate": 0.0002981461871665795, "loss": 2.1415, "step": 1910 }, { "epoch": 0.15, "learning_rate": 0.0002981442495067105, "loss": 2.0485, "step": 1911 }, { "epoch": 0.15, "learning_rate": 0.0002981423108410238, "loss": 2.1192, "step": 1912 }, { "epoch": 0.15, "learning_rate": 0.00029814037116953257, "loss": 2.0676, "step": 1913 }, { "epoch": 0.15, "learning_rate": 0.00029813843049225, "loss": 2.1396, "step": 1914 }, { "epoch": 0.15, "learning_rate": 0.0002981364888091892, "loss": 2.0359, "step": 1915 }, { "epoch": 0.15, "learning_rate": 0.0002981345461203634, "loss": 2.0844, "step": 1916 }, { "epoch": 0.15, "learning_rate": 0.0002981326024257858, "loss": 2.0771, "step": 1917 }, { "epoch": 0.15, "learning_rate": 0.00029813065772546954, "loss": 1.9899, "step": 1918 }, { "epoch": 0.15, "learning_rate": 0.0002981287120194279, "loss": 2.1394, "step": 1919 }, { "epoch": 0.15, "learning_rate": 0.00029812676530767396, "loss": 2.1107, "step": 1920 }, { "epoch": 0.15, "learning_rate": 0.00029812481759022115, "loss": 2.1022, "step": 1921 }, { "epoch": 0.15, "learning_rate": 0.00029812286886708245, "loss": 2.0473, "step": 1922 }, { "epoch": 0.15, "learning_rate": 0.0002981209191382713, "loss": 2.0597, "step": 1923 }, { "epoch": 0.15, "learning_rate": 0.00029811896840380083, "loss": 2.0929, "step": 1924 }, { "epoch": 0.15, "learning_rate": 0.00029811701666368435, "loss": 2.0362, "step": 1925 }, { "epoch": 0.15, "learning_rate": 0.00029811506391793497, "loss": 2.0858, "step": 1926 }, { "epoch": 0.15, "learning_rate": 0.00029811311016656605, "loss": 2.0956, "step": 1927 }, { "epoch": 0.15, "learning_rate": 0.0002981111554095909, "loss": 2.1622, "step": 1928 }, { "epoch": 0.15, "learning_rate": 0.0002981091996470227, "loss": 2.0585, "step": 1929 }, { "epoch": 0.15, "learning_rate": 0.0002981072428788748, "loss": 2.0899, "step": 1930 }, { "epoch": 0.15, "learning_rate": 0.00029810528510516046, "loss": 2.1545, "step": 1931 }, { "epoch": 0.15, "learning_rate": 0.00029810332632589293, "loss": 2.122, "step": 1932 }, { "epoch": 0.15, "learning_rate": 0.00029810136654108557, "loss": 2.1382, "step": 1933 }, { "epoch": 0.15, "learning_rate": 0.00029809940575075165, "loss": 2.1048, "step": 1934 }, { "epoch": 0.15, "learning_rate": 0.0002980974439549045, "loss": 2.0918, "step": 1935 }, { "epoch": 0.15, "learning_rate": 0.00029809548115355744, "loss": 2.0786, "step": 1936 }, { "epoch": 0.15, "learning_rate": 0.0002980935173467237, "loss": 2.0457, "step": 1937 }, { "epoch": 0.15, "learning_rate": 0.0002980915525344168, "loss": 2.0637, "step": 1938 }, { "epoch": 0.15, "learning_rate": 0.00029808958671664995, "loss": 2.0678, "step": 1939 }, { "epoch": 0.15, "learning_rate": 0.0002980876198934366, "loss": 2.0648, "step": 1940 }, { "epoch": 0.15, "learning_rate": 0.00029808565206478993, "loss": 2.1495, "step": 1941 }, { "epoch": 0.15, "learning_rate": 0.00029808368323072345, "loss": 2.0806, "step": 1942 }, { "epoch": 0.15, "learning_rate": 0.0002980817133912505, "loss": 2.0858, "step": 1943 }, { "epoch": 0.15, "learning_rate": 0.0002980797425463844, "loss": 2.0444, "step": 1944 }, { "epoch": 0.15, "learning_rate": 0.0002980777706961385, "loss": 2.0482, "step": 1945 }, { "epoch": 0.15, "learning_rate": 0.0002980757978405264, "loss": 2.0571, "step": 1946 }, { "epoch": 0.15, "learning_rate": 0.0002980738239795613, "loss": 2.0845, "step": 1947 }, { "epoch": 0.15, "learning_rate": 0.00029807184911325655, "loss": 2.0928, "step": 1948 }, { "epoch": 0.15, "learning_rate": 0.00029806987324162575, "loss": 2.0836, "step": 1949 }, { "epoch": 0.15, "learning_rate": 0.0002980678963646822, "loss": 2.1321, "step": 1950 }, { "epoch": 0.15, "learning_rate": 0.0002980659184824394, "loss": 2.1398, "step": 1951 }, { "epoch": 0.15, "learning_rate": 0.0002980639395949106, "loss": 2.1146, "step": 1952 }, { "epoch": 0.15, "learning_rate": 0.00029806195970210947, "loss": 2.1719, "step": 1953 }, { "epoch": 0.15, "learning_rate": 0.0002980599788040493, "loss": 2.0902, "step": 1954 }, { "epoch": 0.15, "learning_rate": 0.0002980579969007436, "loss": 2.0675, "step": 1955 }, { "epoch": 0.15, "learning_rate": 0.00029805601399220577, "loss": 2.118, "step": 1956 }, { "epoch": 0.15, "learning_rate": 0.0002980540300784493, "loss": 2.0734, "step": 1957 }, { "epoch": 0.15, "learning_rate": 0.0002980520451594877, "loss": 2.0605, "step": 1958 }, { "epoch": 0.15, "learning_rate": 0.0002980500592353344, "loss": 2.0097, "step": 1959 }, { "epoch": 0.15, "learning_rate": 0.0002980480723060029, "loss": 2.0526, "step": 1960 }, { "epoch": 0.15, "learning_rate": 0.0002980460843715067, "loss": 2.0645, "step": 1961 }, { "epoch": 0.15, "learning_rate": 0.0002980440954318593, "loss": 2.0868, "step": 1962 }, { "epoch": 0.15, "learning_rate": 0.00029804210548707414, "loss": 2.0909, "step": 1963 }, { "epoch": 0.15, "learning_rate": 0.00029804011453716487, "loss": 2.129, "step": 1964 }, { "epoch": 0.15, "learning_rate": 0.00029803812258214483, "loss": 2.0605, "step": 1965 }, { "epoch": 0.15, "learning_rate": 0.0002980361296220277, "loss": 2.0563, "step": 1966 }, { "epoch": 0.15, "learning_rate": 0.00029803413565682684, "loss": 2.0395, "step": 1967 }, { "epoch": 0.15, "learning_rate": 0.000298032140686556, "loss": 2.0976, "step": 1968 }, { "epoch": 0.15, "learning_rate": 0.00029803014471122853, "loss": 2.1083, "step": 1969 }, { "epoch": 0.16, "learning_rate": 0.00029802814773085813, "loss": 2.0368, "step": 1970 }, { "epoch": 0.16, "learning_rate": 0.0002980261497454583, "loss": 2.0448, "step": 1971 }, { "epoch": 0.16, "learning_rate": 0.00029802415075504254, "loss": 2.0911, "step": 1972 }, { "epoch": 0.16, "learning_rate": 0.0002980221507596245, "loss": 2.1286, "step": 1973 }, { "epoch": 0.16, "learning_rate": 0.00029802014975921775, "loss": 2.079, "step": 1974 }, { "epoch": 0.16, "learning_rate": 0.0002980181477538359, "loss": 2.1284, "step": 1975 }, { "epoch": 0.16, "learning_rate": 0.0002980161447434925, "loss": 2.0862, "step": 1976 }, { "epoch": 0.16, "learning_rate": 0.0002980141407282011, "loss": 2.0963, "step": 1977 }, { "epoch": 0.16, "learning_rate": 0.0002980121357079754, "loss": 2.1027, "step": 1978 }, { "epoch": 0.16, "learning_rate": 0.000298010129682829, "loss": 2.0803, "step": 1979 }, { "epoch": 0.16, "learning_rate": 0.0002980081226527755, "loss": 2.1294, "step": 1980 }, { "epoch": 0.16, "learning_rate": 0.00029800611461782854, "loss": 2.0762, "step": 1981 }, { "epoch": 0.16, "learning_rate": 0.0002980041055780017, "loss": 2.1366, "step": 1982 }, { "epoch": 0.16, "learning_rate": 0.00029800209553330865, "loss": 2.0884, "step": 1983 }, { "epoch": 0.16, "learning_rate": 0.00029800008448376306, "loss": 2.1108, "step": 1984 }, { "epoch": 0.16, "learning_rate": 0.00029799807242937863, "loss": 2.0597, "step": 1985 }, { "epoch": 0.16, "learning_rate": 0.0002979960593701689, "loss": 2.0843, "step": 1986 }, { "epoch": 0.16, "learning_rate": 0.00029799404530614755, "loss": 2.0863, "step": 1987 }, { "epoch": 0.16, "learning_rate": 0.0002979920302373284, "loss": 2.0951, "step": 1988 }, { "epoch": 0.16, "learning_rate": 0.000297990014163725, "loss": 2.0718, "step": 1989 }, { "epoch": 0.16, "learning_rate": 0.000297987997085351, "loss": 2.0991, "step": 1990 }, { "epoch": 0.16, "learning_rate": 0.00029798597900222023, "loss": 2.1001, "step": 1991 }, { "epoch": 0.16, "learning_rate": 0.00029798395991434634, "loss": 2.0343, "step": 1992 }, { "epoch": 0.16, "learning_rate": 0.000297981939821743, "loss": 2.0072, "step": 1993 }, { "epoch": 0.16, "learning_rate": 0.000297979918724424, "loss": 2.1331, "step": 1994 }, { "epoch": 0.16, "learning_rate": 0.00029797789662240295, "loss": 2.0478, "step": 1995 }, { "epoch": 0.16, "learning_rate": 0.00029797587351569366, "loss": 2.096, "step": 1996 }, { "epoch": 0.16, "learning_rate": 0.00029797384940430984, "loss": 2.0997, "step": 1997 }, { "epoch": 0.16, "learning_rate": 0.00029797182428826526, "loss": 2.0899, "step": 1998 }, { "epoch": 0.16, "learning_rate": 0.0002979697981675737, "loss": 2.0784, "step": 1999 }, { "epoch": 0.16, "learning_rate": 0.00029796777104224877, "loss": 2.062, "step": 2000 }, { "epoch": 0.16, "learning_rate": 0.0002979657429123044, "loss": 2.1609, "step": 2001 }, { "epoch": 0.16, "learning_rate": 0.00029796371377775423, "loss": 2.0302, "step": 2002 }, { "epoch": 0.16, "learning_rate": 0.0002979616836386121, "loss": 2.0556, "step": 2003 }, { "epoch": 0.16, "learning_rate": 0.00029795965249489187, "loss": 2.1351, "step": 2004 }, { "epoch": 0.16, "learning_rate": 0.0002979576203466072, "loss": 2.0698, "step": 2005 }, { "epoch": 0.16, "learning_rate": 0.00029795558719377193, "loss": 2.0186, "step": 2006 }, { "epoch": 0.16, "learning_rate": 0.0002979535530363999, "loss": 2.1455, "step": 2007 }, { "epoch": 0.16, "learning_rate": 0.0002979515178745049, "loss": 2.097, "step": 2008 }, { "epoch": 0.16, "learning_rate": 0.00029794948170810064, "loss": 2.0649, "step": 2009 }, { "epoch": 0.16, "learning_rate": 0.00029794744453720117, "loss": 2.0702, "step": 2010 }, { "epoch": 0.16, "learning_rate": 0.00029794540636182015, "loss": 2.0724, "step": 2011 }, { "epoch": 0.16, "learning_rate": 0.00029794336718197146, "loss": 2.0918, "step": 2012 }, { "epoch": 0.16, "learning_rate": 0.00029794132699766893, "loss": 2.1205, "step": 2013 }, { "epoch": 0.16, "learning_rate": 0.00029793928580892643, "loss": 2.0488, "step": 2014 }, { "epoch": 0.16, "learning_rate": 0.00029793724361575785, "loss": 2.0626, "step": 2015 }, { "epoch": 0.16, "learning_rate": 0.00029793520041817705, "loss": 2.0544, "step": 2016 }, { "epoch": 0.16, "learning_rate": 0.0002979331562161978, "loss": 2.0483, "step": 2017 }, { "epoch": 0.16, "learning_rate": 0.0002979311110098341, "loss": 2.0416, "step": 2018 }, { "epoch": 0.16, "learning_rate": 0.0002979290647990998, "loss": 2.0207, "step": 2019 }, { "epoch": 0.16, "learning_rate": 0.00029792701758400876, "loss": 2.0848, "step": 2020 }, { "epoch": 0.16, "learning_rate": 0.0002979249693645749, "loss": 2.0843, "step": 2021 }, { "epoch": 0.16, "learning_rate": 0.0002979229201408122, "loss": 2.0351, "step": 2022 }, { "epoch": 0.16, "learning_rate": 0.00029792086991273437, "loss": 2.0054, "step": 2023 }, { "epoch": 0.16, "learning_rate": 0.00029791881868035554, "loss": 2.0135, "step": 2024 }, { "epoch": 0.16, "learning_rate": 0.00029791676644368956, "loss": 2.026, "step": 2025 }, { "epoch": 0.16, "learning_rate": 0.00029791471320275036, "loss": 2.0051, "step": 2026 }, { "epoch": 0.16, "learning_rate": 0.0002979126589575519, "loss": 2.0053, "step": 2027 }, { "epoch": 0.16, "learning_rate": 0.0002979106037081081, "loss": 1.9975, "step": 2028 }, { "epoch": 0.16, "learning_rate": 0.0002979085474544329, "loss": 2.04, "step": 2029 }, { "epoch": 0.16, "learning_rate": 0.0002979064901965403, "loss": 2.1558, "step": 2030 }, { "epoch": 0.16, "learning_rate": 0.00029790443193444425, "loss": 2.0497, "step": 2031 }, { "epoch": 0.16, "learning_rate": 0.00029790237266815876, "loss": 2.0991, "step": 2032 }, { "epoch": 0.16, "learning_rate": 0.00029790031239769775, "loss": 2.0086, "step": 2033 }, { "epoch": 0.16, "learning_rate": 0.00029789825112307524, "loss": 2.076, "step": 2034 }, { "epoch": 0.16, "learning_rate": 0.00029789618884430523, "loss": 2.0976, "step": 2035 }, { "epoch": 0.16, "learning_rate": 0.0002978941255614017, "loss": 2.0804, "step": 2036 }, { "epoch": 0.16, "learning_rate": 0.00029789206127437865, "loss": 2.098, "step": 2037 }, { "epoch": 0.16, "learning_rate": 0.00029788999598325016, "loss": 2.023, "step": 2038 }, { "epoch": 0.16, "learning_rate": 0.0002978879296880302, "loss": 2.0611, "step": 2039 }, { "epoch": 0.16, "learning_rate": 0.0002978858623887328, "loss": 2.0857, "step": 2040 }, { "epoch": 0.16, "learning_rate": 0.00029788379408537204, "loss": 2.0188, "step": 2041 }, { "epoch": 0.16, "learning_rate": 0.0002978817247779619, "loss": 2.0464, "step": 2042 }, { "epoch": 0.16, "learning_rate": 0.00029787965446651643, "loss": 2.0408, "step": 2043 }, { "epoch": 0.16, "learning_rate": 0.00029787758315104974, "loss": 2.0794, "step": 2044 }, { "epoch": 0.16, "learning_rate": 0.00029787551083157584, "loss": 2.1005, "step": 2045 }, { "epoch": 0.16, "learning_rate": 0.0002978734375081089, "loss": 2.1179, "step": 2046 }, { "epoch": 0.16, "learning_rate": 0.00029787136318066285, "loss": 2.0216, "step": 2047 }, { "epoch": 0.16, "learning_rate": 0.00029786928784925184, "loss": 2.0963, "step": 2048 }, { "epoch": 0.16, "learning_rate": 0.00029786721151389, "loss": 2.0275, "step": 2049 }, { "epoch": 0.16, "learning_rate": 0.00029786513417459144, "loss": 2.072, "step": 2050 }, { "epoch": 0.16, "learning_rate": 0.0002978630558313701, "loss": 2.0075, "step": 2051 }, { "epoch": 0.16, "learning_rate": 0.00029786097648424025, "loss": 2.0537, "step": 2052 }, { "epoch": 0.16, "learning_rate": 0.00029785889613321605, "loss": 2.0671, "step": 2053 }, { "epoch": 0.16, "learning_rate": 0.0002978568147783115, "loss": 2.0466, "step": 2054 }, { "epoch": 0.16, "learning_rate": 0.0002978547324195407, "loss": 2.0278, "step": 2055 }, { "epoch": 0.16, "learning_rate": 0.0002978526490569179, "loss": 2.0642, "step": 2056 }, { "epoch": 0.16, "learning_rate": 0.0002978505646904572, "loss": 2.11, "step": 2057 }, { "epoch": 0.16, "learning_rate": 0.0002978484793201728, "loss": 2.0614, "step": 2058 }, { "epoch": 0.16, "learning_rate": 0.00029784639294607877, "loss": 2.0719, "step": 2059 }, { "epoch": 0.16, "learning_rate": 0.00029784430556818937, "loss": 2.1282, "step": 2060 }, { "epoch": 0.16, "learning_rate": 0.00029784221718651865, "loss": 2.0671, "step": 2061 }, { "epoch": 0.16, "learning_rate": 0.0002978401278010809, "loss": 2.0684, "step": 2062 }, { "epoch": 0.16, "learning_rate": 0.0002978380374118903, "loss": 2.075, "step": 2063 }, { "epoch": 0.16, "learning_rate": 0.00029783594601896096, "loss": 2.0885, "step": 2064 }, { "epoch": 0.16, "learning_rate": 0.0002978338536223071, "loss": 2.0645, "step": 2065 }, { "epoch": 0.16, "learning_rate": 0.0002978317602219431, "loss": 2.0678, "step": 2066 }, { "epoch": 0.16, "learning_rate": 0.0002978296658178829, "loss": 1.9937, "step": 2067 }, { "epoch": 0.16, "learning_rate": 0.0002978275704101409, "loss": 2.0585, "step": 2068 }, { "epoch": 0.16, "learning_rate": 0.00029782547399873126, "loss": 2.0658, "step": 2069 }, { "epoch": 0.16, "learning_rate": 0.00029782337658366823, "loss": 2.0577, "step": 2070 }, { "epoch": 0.16, "learning_rate": 0.00029782127816496603, "loss": 2.0205, "step": 2071 }, { "epoch": 0.16, "learning_rate": 0.0002978191787426389, "loss": 2.0324, "step": 2072 }, { "epoch": 0.16, "learning_rate": 0.0002978170783167012, "loss": 2.0606, "step": 2073 }, { "epoch": 0.16, "learning_rate": 0.00029781497688716706, "loss": 2.0331, "step": 2074 }, { "epoch": 0.16, "learning_rate": 0.0002978128744540508, "loss": 2.103, "step": 2075 }, { "epoch": 0.16, "learning_rate": 0.0002978107710173667, "loss": 2.0845, "step": 2076 }, { "epoch": 0.16, "learning_rate": 0.00029780866657712904, "loss": 2.0656, "step": 2077 }, { "epoch": 0.16, "learning_rate": 0.00029780656113335204, "loss": 2.0141, "step": 2078 }, { "epoch": 0.16, "learning_rate": 0.00029780445468605013, "loss": 2.0724, "step": 2079 }, { "epoch": 0.16, "learning_rate": 0.00029780234723523753, "loss": 2.0112, "step": 2080 }, { "epoch": 0.16, "learning_rate": 0.0002978002387809285, "loss": 2.0819, "step": 2081 }, { "epoch": 0.16, "learning_rate": 0.0002977981293231375, "loss": 2.0999, "step": 2082 }, { "epoch": 0.16, "learning_rate": 0.0002977960188618787, "loss": 2.0487, "step": 2083 }, { "epoch": 0.16, "learning_rate": 0.0002977939073971665, "loss": 2.0621, "step": 2084 }, { "epoch": 0.16, "learning_rate": 0.00029779179492901524, "loss": 2.04, "step": 2085 }, { "epoch": 0.16, "learning_rate": 0.00029778968145743927, "loss": 2.1299, "step": 2086 }, { "epoch": 0.16, "learning_rate": 0.0002977875669824529, "loss": 2.0178, "step": 2087 }, { "epoch": 0.16, "learning_rate": 0.0002977854515040705, "loss": 2.1118, "step": 2088 }, { "epoch": 0.16, "learning_rate": 0.0002977833350223065, "loss": 2.0414, "step": 2089 }, { "epoch": 0.16, "learning_rate": 0.0002977812175371751, "loss": 2.121, "step": 2090 }, { "epoch": 0.16, "learning_rate": 0.0002977790990486909, "loss": 2.0813, "step": 2091 }, { "epoch": 0.16, "learning_rate": 0.00029777697955686805, "loss": 2.0198, "step": 2092 }, { "epoch": 0.16, "learning_rate": 0.0002977748590617211, "loss": 2.089, "step": 2093 }, { "epoch": 0.16, "learning_rate": 0.00029777273756326445, "loss": 2.0841, "step": 2094 }, { "epoch": 0.16, "learning_rate": 0.0002977706150615124, "loss": 2.1186, "step": 2095 }, { "epoch": 0.16, "learning_rate": 0.00029776849155647945, "loss": 2.0711, "step": 2096 }, { "epoch": 0.16, "learning_rate": 0.00029776636704818, "loss": 2.082, "step": 2097 }, { "epoch": 0.17, "learning_rate": 0.0002977642415366285, "loss": 2.032, "step": 2098 }, { "epoch": 0.17, "learning_rate": 0.00029776211502183925, "loss": 1.9796, "step": 2099 }, { "epoch": 0.17, "learning_rate": 0.00029775998750382685, "loss": 2.0689, "step": 2100 }, { "epoch": 0.17, "learning_rate": 0.00029775785898260564, "loss": 2.0642, "step": 2101 }, { "epoch": 0.17, "learning_rate": 0.0002977557294581901, "loss": 2.0572, "step": 2102 }, { "epoch": 0.17, "learning_rate": 0.00029775359893059473, "loss": 2.0389, "step": 2103 }, { "epoch": 0.17, "learning_rate": 0.0002977514673998339, "loss": 2.0647, "step": 2104 }, { "epoch": 0.17, "learning_rate": 0.0002977493348659222, "loss": 2.0641, "step": 2105 }, { "epoch": 0.17, "learning_rate": 0.0002977472013288741, "loss": 2.0664, "step": 2106 }, { "epoch": 0.17, "learning_rate": 0.00029774506678870394, "loss": 2.0554, "step": 2107 }, { "epoch": 0.17, "learning_rate": 0.00029774293124542635, "loss": 2.0276, "step": 2108 }, { "epoch": 0.17, "learning_rate": 0.0002977407946990558, "loss": 2.1035, "step": 2109 }, { "epoch": 0.17, "learning_rate": 0.00029773865714960673, "loss": 2.0557, "step": 2110 }, { "epoch": 0.17, "learning_rate": 0.0002977365185970937, "loss": 2.0137, "step": 2111 }, { "epoch": 0.17, "learning_rate": 0.00029773437904153136, "loss": 2.0536, "step": 2112 }, { "epoch": 0.17, "learning_rate": 0.000297732238482934, "loss": 2.074, "step": 2113 }, { "epoch": 0.17, "learning_rate": 0.0002977300969213163, "loss": 2.0864, "step": 2114 }, { "epoch": 0.17, "learning_rate": 0.00029772795435669276, "loss": 2.0714, "step": 2115 }, { "epoch": 0.17, "learning_rate": 0.00029772581078907795, "loss": 2.0288, "step": 2116 }, { "epoch": 0.17, "learning_rate": 0.00029772366621848637, "loss": 2.0503, "step": 2117 }, { "epoch": 0.17, "learning_rate": 0.0002977215206449327, "loss": 2.0838, "step": 2118 }, { "epoch": 0.17, "learning_rate": 0.00029771937406843134, "loss": 2.0481, "step": 2119 }, { "epoch": 0.17, "learning_rate": 0.00029771722648899696, "loss": 2.0937, "step": 2120 }, { "epoch": 0.17, "learning_rate": 0.0002977150779066441, "loss": 2.1101, "step": 2121 }, { "epoch": 0.17, "learning_rate": 0.0002977129283213875, "loss": 2.0104, "step": 2122 }, { "epoch": 0.17, "learning_rate": 0.0002977107777332415, "loss": 2.0527, "step": 2123 }, { "epoch": 0.17, "learning_rate": 0.0002977086261422209, "loss": 2.0377, "step": 2124 }, { "epoch": 0.17, "learning_rate": 0.0002977064735483402, "loss": 2.1298, "step": 2125 }, { "epoch": 0.17, "learning_rate": 0.0002977043199516141, "loss": 1.9907, "step": 2126 }, { "epoch": 0.17, "learning_rate": 0.00029770216535205714, "loss": 2.0703, "step": 2127 }, { "epoch": 0.17, "learning_rate": 0.000297700009749684, "loss": 2.0826, "step": 2128 }, { "epoch": 0.17, "learning_rate": 0.00029769785314450934, "loss": 2.1026, "step": 2129 }, { "epoch": 0.17, "learning_rate": 0.00029769569553654774, "loss": 1.9585, "step": 2130 }, { "epoch": 0.17, "learning_rate": 0.00029769353692581384, "loss": 2.0692, "step": 2131 }, { "epoch": 0.17, "learning_rate": 0.00029769137731232233, "loss": 2.0531, "step": 2132 }, { "epoch": 0.17, "learning_rate": 0.0002976892166960879, "loss": 2.0007, "step": 2133 }, { "epoch": 0.17, "learning_rate": 0.0002976870550771252, "loss": 2.0547, "step": 2134 }, { "epoch": 0.17, "learning_rate": 0.0002976848924554489, "loss": 2.0598, "step": 2135 }, { "epoch": 0.17, "learning_rate": 0.0002976827288310736, "loss": 2.048, "step": 2136 }, { "epoch": 0.17, "learning_rate": 0.0002976805642040141, "loss": 2.0446, "step": 2137 }, { "epoch": 0.17, "learning_rate": 0.0002976783985742851, "loss": 2.0287, "step": 2138 }, { "epoch": 0.17, "learning_rate": 0.0002976762319419013, "loss": 1.9962, "step": 2139 }, { "epoch": 0.17, "learning_rate": 0.00029767406430687737, "loss": 2.0513, "step": 2140 }, { "epoch": 0.17, "learning_rate": 0.00029767189566922797, "loss": 2.0286, "step": 2141 }, { "epoch": 0.17, "learning_rate": 0.00029766972602896793, "loss": 2.0442, "step": 2142 }, { "epoch": 0.17, "learning_rate": 0.00029766755538611193, "loss": 1.9561, "step": 2143 }, { "epoch": 0.17, "learning_rate": 0.0002976653837406748, "loss": 2.0029, "step": 2144 }, { "epoch": 0.17, "learning_rate": 0.00029766321109267105, "loss": 1.9993, "step": 2145 }, { "epoch": 0.17, "learning_rate": 0.0002976610374421157, "loss": 2.0265, "step": 2146 }, { "epoch": 0.17, "learning_rate": 0.00029765886278902335, "loss": 1.993, "step": 2147 }, { "epoch": 0.17, "learning_rate": 0.0002976566871334088, "loss": 2.005, "step": 2148 }, { "epoch": 0.17, "learning_rate": 0.00029765451047528683, "loss": 2.0068, "step": 2149 }, { "epoch": 0.17, "learning_rate": 0.0002976523328146723, "loss": 2.0281, "step": 2150 }, { "epoch": 0.17, "learning_rate": 0.0002976501541515798, "loss": 2.0225, "step": 2151 }, { "epoch": 0.17, "learning_rate": 0.00029764797448602427, "loss": 2.0236, "step": 2152 }, { "epoch": 0.17, "learning_rate": 0.00029764579381802046, "loss": 2.0292, "step": 2153 }, { "epoch": 0.17, "learning_rate": 0.0002976436121475832, "loss": 2.0494, "step": 2154 }, { "epoch": 0.17, "learning_rate": 0.0002976414294747273, "loss": 1.9895, "step": 2155 }, { "epoch": 0.17, "learning_rate": 0.00029763924579946757, "loss": 2.0417, "step": 2156 }, { "epoch": 0.17, "learning_rate": 0.0002976370611218188, "loss": 2.0193, "step": 2157 }, { "epoch": 0.17, "learning_rate": 0.0002976348754417959, "loss": 1.9845, "step": 2158 }, { "epoch": 0.17, "learning_rate": 0.0002976326887594137, "loss": 2.0772, "step": 2159 }, { "epoch": 0.17, "learning_rate": 0.0002976305010746869, "loss": 1.9947, "step": 2160 }, { "epoch": 0.17, "learning_rate": 0.00029762831238763055, "loss": 2.0011, "step": 2161 }, { "epoch": 0.17, "learning_rate": 0.00029762612269825943, "loss": 2.0307, "step": 2162 }, { "epoch": 0.17, "learning_rate": 0.00029762393200658834, "loss": 2.0028, "step": 2163 }, { "epoch": 0.17, "learning_rate": 0.0002976217403126323, "loss": 2.0346, "step": 2164 }, { "epoch": 0.17, "learning_rate": 0.00029761954761640605, "loss": 2.0064, "step": 2165 }, { "epoch": 0.17, "learning_rate": 0.0002976173539179246, "loss": 2.0099, "step": 2166 }, { "epoch": 0.17, "learning_rate": 0.00029761515921720267, "loss": 1.9836, "step": 2167 }, { "epoch": 0.17, "learning_rate": 0.00029761296351425536, "loss": 2.0739, "step": 2168 }, { "epoch": 0.17, "learning_rate": 0.00029761076680909747, "loss": 2.0707, "step": 2169 }, { "epoch": 0.17, "learning_rate": 0.0002976085691017439, "loss": 2.0542, "step": 2170 }, { "epoch": 0.17, "learning_rate": 0.00029760637039220964, "loss": 1.9908, "step": 2171 }, { "epoch": 0.17, "learning_rate": 0.0002976041706805096, "loss": 2.0917, "step": 2172 }, { "epoch": 0.17, "learning_rate": 0.00029760196996665863, "loss": 1.9794, "step": 2173 }, { "epoch": 0.17, "learning_rate": 0.0002975997682506718, "loss": 2.0231, "step": 2174 }, { "epoch": 0.17, "learning_rate": 0.00029759756553256395, "loss": 2.0645, "step": 2175 }, { "epoch": 0.17, "learning_rate": 0.0002975953618123501, "loss": 2.0146, "step": 2176 }, { "epoch": 0.17, "learning_rate": 0.00029759315709004515, "loss": 2.0661, "step": 2177 }, { "epoch": 0.17, "learning_rate": 0.0002975909513656642, "loss": 2.1059, "step": 2178 }, { "epoch": 0.17, "learning_rate": 0.000297588744639222, "loss": 2.0158, "step": 2179 }, { "epoch": 0.17, "learning_rate": 0.00029758653691073383, "loss": 2.0777, "step": 2180 }, { "epoch": 0.17, "learning_rate": 0.0002975843281802144, "loss": 2.0022, "step": 2181 }, { "epoch": 0.17, "learning_rate": 0.00029758211844767887, "loss": 2.065, "step": 2182 }, { "epoch": 0.17, "learning_rate": 0.00029757990771314225, "loss": 2.0385, "step": 2183 }, { "epoch": 0.17, "learning_rate": 0.0002975776959766194, "loss": 2.1027, "step": 2184 }, { "epoch": 0.17, "learning_rate": 0.0002975754832381255, "loss": 2.0524, "step": 2185 }, { "epoch": 0.17, "learning_rate": 0.0002975732694976755, "loss": 2.0303, "step": 2186 }, { "epoch": 0.17, "learning_rate": 0.0002975710547552844, "loss": 2.0443, "step": 2187 }, { "epoch": 0.17, "learning_rate": 0.0002975688390109673, "loss": 2.0221, "step": 2188 }, { "epoch": 0.17, "learning_rate": 0.0002975666222647393, "loss": 2.0339, "step": 2189 }, { "epoch": 0.17, "learning_rate": 0.00029756440451661524, "loss": 2.0506, "step": 2190 }, { "epoch": 0.17, "learning_rate": 0.00029756218576661034, "loss": 2.0456, "step": 2191 }, { "epoch": 0.17, "learning_rate": 0.00029755996601473964, "loss": 2.0234, "step": 2192 }, { "epoch": 0.17, "learning_rate": 0.0002975577452610182, "loss": 2.0346, "step": 2193 }, { "epoch": 0.17, "learning_rate": 0.0002975555235054611, "loss": 1.9801, "step": 2194 }, { "epoch": 0.17, "learning_rate": 0.0002975533007480835, "loss": 2.0117, "step": 2195 }, { "epoch": 0.17, "learning_rate": 0.0002975510769889003, "loss": 2.0455, "step": 2196 }, { "epoch": 0.17, "learning_rate": 0.00029754885222792676, "loss": 2.0469, "step": 2197 }, { "epoch": 0.17, "learning_rate": 0.00029754662646517795, "loss": 2.0352, "step": 2198 }, { "epoch": 0.17, "learning_rate": 0.00029754439970066895, "loss": 2.0883, "step": 2199 }, { "epoch": 0.17, "learning_rate": 0.00029754217193441487, "loss": 2.0761, "step": 2200 }, { "epoch": 0.17, "learning_rate": 0.00029753994316643095, "loss": 2.0705, "step": 2201 }, { "epoch": 0.17, "learning_rate": 0.00029753771339673216, "loss": 2.0135, "step": 2202 }, { "epoch": 0.17, "learning_rate": 0.0002975354826253337, "loss": 2.0529, "step": 2203 }, { "epoch": 0.17, "learning_rate": 0.00029753325085225075, "loss": 2.0421, "step": 2204 }, { "epoch": 0.17, "learning_rate": 0.0002975310180774985, "loss": 2.016, "step": 2205 }, { "epoch": 0.17, "learning_rate": 0.000297528784301092, "loss": 2.0118, "step": 2206 }, { "epoch": 0.17, "learning_rate": 0.0002975265495230465, "loss": 2.0527, "step": 2207 }, { "epoch": 0.17, "learning_rate": 0.0002975243137433771, "loss": 2.0918, "step": 2208 }, { "epoch": 0.17, "learning_rate": 0.000297522076962099, "loss": 2.0351, "step": 2209 }, { "epoch": 0.17, "learning_rate": 0.00029751983917922746, "loss": 2.0207, "step": 2210 }, { "epoch": 0.17, "learning_rate": 0.00029751760039477764, "loss": 1.9672, "step": 2211 }, { "epoch": 0.17, "learning_rate": 0.0002975153606087647, "loss": 2.0564, "step": 2212 }, { "epoch": 0.17, "learning_rate": 0.0002975131198212038, "loss": 2.0539, "step": 2213 }, { "epoch": 0.17, "learning_rate": 0.00029751087803211025, "loss": 2.0942, "step": 2214 }, { "epoch": 0.17, "learning_rate": 0.0002975086352414993, "loss": 2.0008, "step": 2215 }, { "epoch": 0.17, "learning_rate": 0.00029750639144938604, "loss": 2.0416, "step": 2216 }, { "epoch": 0.17, "learning_rate": 0.00029750414665578585, "loss": 2.0801, "step": 2217 }, { "epoch": 0.17, "learning_rate": 0.00029750190086071386, "loss": 2.1112, "step": 2218 }, { "epoch": 0.17, "learning_rate": 0.0002974996540641854, "loss": 2.0678, "step": 2219 }, { "epoch": 0.17, "learning_rate": 0.0002974974062662157, "loss": 2.0654, "step": 2220 }, { "epoch": 0.17, "learning_rate": 0.0002974951574668199, "loss": 1.9966, "step": 2221 }, { "epoch": 0.17, "learning_rate": 0.0002974929076660135, "loss": 2.0512, "step": 2222 }, { "epoch": 0.17, "learning_rate": 0.0002974906568638116, "loss": 1.9626, "step": 2223 }, { "epoch": 0.17, "learning_rate": 0.00029748840506022955, "loss": 2.0349, "step": 2224 }, { "epoch": 0.18, "learning_rate": 0.00029748615225528256, "loss": 2.0563, "step": 2225 }, { "epoch": 0.18, "learning_rate": 0.000297483898448986, "loss": 2.0378, "step": 2226 }, { "epoch": 0.18, "learning_rate": 0.0002974816436413552, "loss": 2.0308, "step": 2227 }, { "epoch": 0.18, "learning_rate": 0.0002974793878324054, "loss": 2.0502, "step": 2228 }, { "epoch": 0.18, "learning_rate": 0.000297477131022152, "loss": 2.0889, "step": 2229 }, { "epoch": 0.18, "learning_rate": 0.00029747487321061026, "loss": 2.0482, "step": 2230 }, { "epoch": 0.18, "learning_rate": 0.00029747261439779546, "loss": 2.0146, "step": 2231 }, { "epoch": 0.18, "learning_rate": 0.000297470354583723, "loss": 1.9986, "step": 2232 }, { "epoch": 0.18, "learning_rate": 0.0002974680937684082, "loss": 2.0331, "step": 2233 }, { "epoch": 0.18, "learning_rate": 0.0002974658319518664, "loss": 2.0258, "step": 2234 }, { "epoch": 0.18, "learning_rate": 0.00029746356913411303, "loss": 2.0237, "step": 2235 }, { "epoch": 0.18, "learning_rate": 0.0002974613053151634, "loss": 1.9972, "step": 2236 }, { "epoch": 0.18, "learning_rate": 0.0002974590404950329, "loss": 2.0583, "step": 2237 }, { "epoch": 0.18, "learning_rate": 0.00029745677467373687, "loss": 2.0153, "step": 2238 }, { "epoch": 0.18, "learning_rate": 0.0002974545078512907, "loss": 2.003, "step": 2239 }, { "epoch": 0.18, "learning_rate": 0.00029745224002770976, "loss": 2.0097, "step": 2240 }, { "epoch": 0.18, "learning_rate": 0.00029744997120300954, "loss": 2.0615, "step": 2241 }, { "epoch": 0.18, "learning_rate": 0.0002974477013772054, "loss": 2.0004, "step": 2242 }, { "epoch": 0.18, "learning_rate": 0.0002974454305503127, "loss": 2.0837, "step": 2243 }, { "epoch": 0.18, "learning_rate": 0.0002974431587223469, "loss": 2.016, "step": 2244 }, { "epoch": 0.18, "learning_rate": 0.0002974408858933234, "loss": 2.0561, "step": 2245 }, { "epoch": 0.18, "learning_rate": 0.00029743861206325763, "loss": 1.9982, "step": 2246 }, { "epoch": 0.18, "learning_rate": 0.0002974363372321651, "loss": 1.9744, "step": 2247 }, { "epoch": 0.18, "learning_rate": 0.0002974340614000612, "loss": 1.9857, "step": 2248 }, { "epoch": 0.18, "learning_rate": 0.0002974317845669614, "loss": 2.0216, "step": 2249 }, { "epoch": 0.18, "learning_rate": 0.00029742950673288107, "loss": 1.9925, "step": 2250 }, { "epoch": 0.18, "learning_rate": 0.00029742722789783576, "loss": 1.9485, "step": 2251 }, { "epoch": 0.18, "learning_rate": 0.00029742494806184096, "loss": 2.0601, "step": 2252 }, { "epoch": 0.18, "learning_rate": 0.00029742266722491213, "loss": 2.0974, "step": 2253 }, { "epoch": 0.18, "learning_rate": 0.00029742038538706477, "loss": 2.0268, "step": 2254 }, { "epoch": 0.18, "learning_rate": 0.00029741810254831427, "loss": 2.009, "step": 2255 }, { "epoch": 0.18, "learning_rate": 0.0002974158187086763, "loss": 2.0584, "step": 2256 }, { "epoch": 0.18, "learning_rate": 0.00029741353386816615, "loss": 1.9799, "step": 2257 }, { "epoch": 0.18, "learning_rate": 0.00029741124802679954, "loss": 2.0101, "step": 2258 }, { "epoch": 0.18, "learning_rate": 0.0002974089611845919, "loss": 1.9844, "step": 2259 }, { "epoch": 0.18, "learning_rate": 0.00029740667334155873, "loss": 1.9978, "step": 2260 }, { "epoch": 0.18, "learning_rate": 0.0002974043844977156, "loss": 2.0596, "step": 2261 }, { "epoch": 0.18, "learning_rate": 0.00029740209465307807, "loss": 1.9981, "step": 2262 }, { "epoch": 0.18, "learning_rate": 0.0002973998038076616, "loss": 2.0235, "step": 2263 }, { "epoch": 0.18, "learning_rate": 0.00029739751196148186, "loss": 2.0412, "step": 2264 }, { "epoch": 0.18, "learning_rate": 0.00029739521911455435, "loss": 2.0586, "step": 2265 }, { "epoch": 0.18, "learning_rate": 0.0002973929252668946, "loss": 2.0472, "step": 2266 }, { "epoch": 0.18, "learning_rate": 0.0002973906304185183, "loss": 1.9671, "step": 2267 }, { "epoch": 0.18, "learning_rate": 0.00029738833456944094, "loss": 2.0461, "step": 2268 }, { "epoch": 0.18, "learning_rate": 0.0002973860377196781, "loss": 2.0701, "step": 2269 }, { "epoch": 0.18, "learning_rate": 0.0002973837398692454, "loss": 2.0441, "step": 2270 }, { "epoch": 0.18, "learning_rate": 0.0002973814410181584, "loss": 2.0637, "step": 2271 }, { "epoch": 0.18, "learning_rate": 0.0002973791411664328, "loss": 1.9487, "step": 2272 }, { "epoch": 0.18, "learning_rate": 0.0002973768403140842, "loss": 2.0448, "step": 2273 }, { "epoch": 0.18, "learning_rate": 0.00029737453846112805, "loss": 1.9852, "step": 2274 }, { "epoch": 0.18, "learning_rate": 0.00029737223560758017, "loss": 1.99, "step": 2275 }, { "epoch": 0.18, "learning_rate": 0.0002973699317534562, "loss": 1.9973, "step": 2276 }, { "epoch": 0.18, "learning_rate": 0.00029736762689877165, "loss": 1.9632, "step": 2277 }, { "epoch": 0.18, "learning_rate": 0.0002973653210435423, "loss": 2.0139, "step": 2278 }, { "epoch": 0.18, "learning_rate": 0.0002973630141877837, "loss": 2.0155, "step": 2279 }, { "epoch": 0.18, "learning_rate": 0.00029736070633151155, "loss": 2.0101, "step": 2280 }, { "epoch": 0.18, "learning_rate": 0.00029735839747474155, "loss": 1.9569, "step": 2281 }, { "epoch": 0.18, "learning_rate": 0.0002973560876174893, "loss": 2.0218, "step": 2282 }, { "epoch": 0.18, "learning_rate": 0.0002973537767597706, "loss": 2.0646, "step": 2283 }, { "epoch": 0.18, "learning_rate": 0.000297351464901601, "loss": 2.0021, "step": 2284 }, { "epoch": 0.18, "learning_rate": 0.00029734915204299633, "loss": 2.0048, "step": 2285 }, { "epoch": 0.18, "learning_rate": 0.0002973468381839722, "loss": 2.0572, "step": 2286 }, { "epoch": 0.18, "learning_rate": 0.0002973445233245444, "loss": 1.9633, "step": 2287 }, { "epoch": 0.18, "learning_rate": 0.00029734220746472853, "loss": 2.0672, "step": 2288 }, { "epoch": 0.18, "learning_rate": 0.00029733989060454045, "loss": 2.0408, "step": 2289 }, { "epoch": 0.18, "learning_rate": 0.00029733757274399573, "loss": 2.0763, "step": 2290 }, { "epoch": 0.18, "learning_rate": 0.0002973352538831103, "loss": 2.014, "step": 2291 }, { "epoch": 0.18, "learning_rate": 0.0002973329340218998, "loss": 1.9616, "step": 2292 }, { "epoch": 0.18, "learning_rate": 0.0002973306131603799, "loss": 1.992, "step": 2293 }, { "epoch": 0.18, "learning_rate": 0.00029732829129856646, "loss": 1.9646, "step": 2294 }, { "epoch": 0.18, "learning_rate": 0.00029732596843647525, "loss": 2.0177, "step": 2295 }, { "epoch": 0.18, "learning_rate": 0.00029732364457412205, "loss": 2.0241, "step": 2296 }, { "epoch": 0.18, "learning_rate": 0.0002973213197115225, "loss": 2.0753, "step": 2297 }, { "epoch": 0.18, "learning_rate": 0.00029731899384869255, "loss": 2.0899, "step": 2298 }, { "epoch": 0.18, "learning_rate": 0.00029731666698564797, "loss": 2.0446, "step": 2299 }, { "epoch": 0.18, "learning_rate": 0.00029731433912240444, "loss": 1.9972, "step": 2300 }, { "epoch": 0.18, "learning_rate": 0.0002973120102589779, "loss": 2.0201, "step": 2301 }, { "epoch": 0.18, "learning_rate": 0.00029730968039538407, "loss": 1.9923, "step": 2302 }, { "epoch": 0.18, "learning_rate": 0.00029730734953163884, "loss": 1.9962, "step": 2303 }, { "epoch": 0.18, "learning_rate": 0.000297305017667758, "loss": 2.023, "step": 2304 }, { "epoch": 0.18, "learning_rate": 0.0002973026848037573, "loss": 2.0546, "step": 2305 }, { "epoch": 0.18, "learning_rate": 0.00029730035093965273, "loss": 2.0335, "step": 2306 }, { "epoch": 0.18, "learning_rate": 0.00029729801607546, "loss": 2.0116, "step": 2307 }, { "epoch": 0.18, "learning_rate": 0.0002972956802111951, "loss": 2.0399, "step": 2308 }, { "epoch": 0.18, "learning_rate": 0.0002972933433468738, "loss": 2.0488, "step": 2309 }, { "epoch": 0.18, "learning_rate": 0.00029729100548251194, "loss": 2.022, "step": 2310 }, { "epoch": 0.18, "learning_rate": 0.0002972886666181255, "loss": 2.0583, "step": 2311 }, { "epoch": 0.18, "learning_rate": 0.00029728632675373026, "loss": 2.0473, "step": 2312 }, { "epoch": 0.18, "learning_rate": 0.00029728398588934214, "loss": 2.0611, "step": 2313 }, { "epoch": 0.18, "learning_rate": 0.00029728164402497705, "loss": 1.9656, "step": 2314 }, { "epoch": 0.18, "learning_rate": 0.00029727930116065084, "loss": 1.9663, "step": 2315 }, { "epoch": 0.18, "learning_rate": 0.00029727695729637945, "loss": 1.9858, "step": 2316 }, { "epoch": 0.18, "learning_rate": 0.0002972746124321788, "loss": 1.9981, "step": 2317 }, { "epoch": 0.18, "learning_rate": 0.00029727226656806483, "loss": 2.0173, "step": 2318 }, { "epoch": 0.18, "learning_rate": 0.00029726991970405344, "loss": 2.0221, "step": 2319 }, { "epoch": 0.18, "learning_rate": 0.00029726757184016055, "loss": 2.0794, "step": 2320 }, { "epoch": 0.18, "learning_rate": 0.0002972652229764021, "loss": 1.9978, "step": 2321 }, { "epoch": 0.18, "learning_rate": 0.0002972628731127941, "loss": 2.0507, "step": 2322 }, { "epoch": 0.18, "learning_rate": 0.0002972605222493524, "loss": 1.9727, "step": 2323 }, { "epoch": 0.18, "learning_rate": 0.00029725817038609304, "loss": 1.9691, "step": 2324 }, { "epoch": 0.18, "learning_rate": 0.000297255817523032, "loss": 2.006, "step": 2325 }, { "epoch": 0.18, "learning_rate": 0.0002972534636601852, "loss": 2.0526, "step": 2326 }, { "epoch": 0.18, "learning_rate": 0.0002972511087975686, "loss": 1.9908, "step": 2327 }, { "epoch": 0.18, "learning_rate": 0.0002972487529351983, "loss": 2.0024, "step": 2328 }, { "epoch": 0.18, "learning_rate": 0.00029724639607309016, "loss": 2.0674, "step": 2329 }, { "epoch": 0.18, "learning_rate": 0.00029724403821126033, "loss": 1.968, "step": 2330 }, { "epoch": 0.18, "learning_rate": 0.0002972416793497247, "loss": 2.0535, "step": 2331 }, { "epoch": 0.18, "learning_rate": 0.0002972393194884993, "loss": 2.0276, "step": 2332 }, { "epoch": 0.18, "learning_rate": 0.0002972369586276002, "loss": 2.0136, "step": 2333 }, { "epoch": 0.18, "learning_rate": 0.0002972345967670434, "loss": 2.0052, "step": 2334 }, { "epoch": 0.18, "learning_rate": 0.00029723223390684493, "loss": 2.0048, "step": 2335 }, { "epoch": 0.18, "learning_rate": 0.00029722987004702085, "loss": 2.0477, "step": 2336 }, { "epoch": 0.18, "learning_rate": 0.00029722750518758714, "loss": 2.0199, "step": 2337 }, { "epoch": 0.18, "learning_rate": 0.00029722513932856, "loss": 1.9927, "step": 2338 }, { "epoch": 0.18, "learning_rate": 0.0002972227724699554, "loss": 2.0408, "step": 2339 }, { "epoch": 0.18, "learning_rate": 0.00029722040461178934, "loss": 2.0293, "step": 2340 }, { "epoch": 0.18, "learning_rate": 0.00029721803575407806, "loss": 2.0718, "step": 2341 }, { "epoch": 0.18, "learning_rate": 0.00029721566589683754, "loss": 2.0359, "step": 2342 }, { "epoch": 0.18, "learning_rate": 0.0002972132950400839, "loss": 1.9944, "step": 2343 }, { "epoch": 0.18, "learning_rate": 0.0002972109231838332, "loss": 1.9929, "step": 2344 }, { "epoch": 0.18, "learning_rate": 0.00029720855032810153, "loss": 1.986, "step": 2345 }, { "epoch": 0.18, "learning_rate": 0.00029720617647290514, "loss": 1.9758, "step": 2346 }, { "epoch": 0.18, "learning_rate": 0.00029720380161825995, "loss": 1.9972, "step": 2347 }, { "epoch": 0.18, "learning_rate": 0.00029720142576418224, "loss": 2.0297, "step": 2348 }, { "epoch": 0.18, "learning_rate": 0.00029719904891068805, "loss": 2.0381, "step": 2349 }, { "epoch": 0.18, "learning_rate": 0.0002971966710577936, "loss": 2.02, "step": 2350 }, { "epoch": 0.18, "learning_rate": 0.0002971942922055149, "loss": 2.0395, "step": 2351 }, { "epoch": 0.19, "learning_rate": 0.00029719191235386827, "loss": 1.9586, "step": 2352 }, { "epoch": 0.19, "learning_rate": 0.0002971895315028697, "loss": 1.9831, "step": 2353 }, { "epoch": 0.19, "learning_rate": 0.0002971871496525355, "loss": 2.0259, "step": 2354 }, { "epoch": 0.19, "learning_rate": 0.00029718476680288175, "loss": 2.096, "step": 2355 }, { "epoch": 0.19, "learning_rate": 0.00029718238295392465, "loss": 1.9924, "step": 2356 }, { "epoch": 0.19, "learning_rate": 0.00029717999810568047, "loss": 2.0112, "step": 2357 }, { "epoch": 0.19, "learning_rate": 0.0002971776122581652, "loss": 2.0257, "step": 2358 }, { "epoch": 0.19, "learning_rate": 0.0002971752254113953, "loss": 1.9993, "step": 2359 }, { "epoch": 0.19, "learning_rate": 0.00029717283756538674, "loss": 2.0093, "step": 2360 }, { "epoch": 0.19, "learning_rate": 0.00029717044872015584, "loss": 2.003, "step": 2361 }, { "epoch": 0.19, "learning_rate": 0.00029716805887571875, "loss": 1.9982, "step": 2362 }, { "epoch": 0.19, "learning_rate": 0.0002971656680320919, "loss": 1.9967, "step": 2363 }, { "epoch": 0.19, "learning_rate": 0.0002971632761892913, "loss": 2.0754, "step": 2364 }, { "epoch": 0.19, "learning_rate": 0.00029716088334733325, "loss": 2.0053, "step": 2365 }, { "epoch": 0.19, "learning_rate": 0.000297158489506234, "loss": 1.9816, "step": 2366 }, { "epoch": 0.19, "learning_rate": 0.00029715609466600987, "loss": 2.0577, "step": 2367 }, { "epoch": 0.19, "learning_rate": 0.00029715369882667706, "loss": 1.9694, "step": 2368 }, { "epoch": 0.19, "learning_rate": 0.0002971513019882518, "loss": 2.0338, "step": 2369 }, { "epoch": 0.19, "learning_rate": 0.0002971489041507504, "loss": 2.0154, "step": 2370 }, { "epoch": 0.19, "learning_rate": 0.0002971465053141892, "loss": 1.9841, "step": 2371 }, { "epoch": 0.19, "learning_rate": 0.00029714410547858436, "loss": 1.9484, "step": 2372 }, { "epoch": 0.19, "learning_rate": 0.0002971417046439523, "loss": 2.0448, "step": 2373 }, { "epoch": 0.19, "learning_rate": 0.00029713930281030925, "loss": 2.0485, "step": 2374 }, { "epoch": 0.19, "learning_rate": 0.0002971368999776715, "loss": 2.0419, "step": 2375 }, { "epoch": 0.19, "learning_rate": 0.0002971344961460554, "loss": 2.0089, "step": 2376 }, { "epoch": 0.19, "learning_rate": 0.00029713209131547734, "loss": 2.0564, "step": 2377 }, { "epoch": 0.19, "learning_rate": 0.00029712968548595357, "loss": 1.9625, "step": 2378 }, { "epoch": 0.19, "learning_rate": 0.00029712727865750034, "loss": 2.0046, "step": 2379 }, { "epoch": 0.19, "learning_rate": 0.00029712487083013414, "loss": 2.027, "step": 2380 }, { "epoch": 0.19, "learning_rate": 0.00029712246200387123, "loss": 1.9644, "step": 2381 }, { "epoch": 0.19, "learning_rate": 0.000297120052178728, "loss": 2.0078, "step": 2382 }, { "epoch": 0.19, "learning_rate": 0.0002971176413547208, "loss": 2.0496, "step": 2383 }, { "epoch": 0.19, "learning_rate": 0.00029711522953186604, "loss": 2.0311, "step": 2384 }, { "epoch": 0.19, "learning_rate": 0.00029711281671018, "loss": 2.0109, "step": 2385 }, { "epoch": 0.19, "learning_rate": 0.00029711040288967914, "loss": 1.9503, "step": 2386 }, { "epoch": 0.19, "learning_rate": 0.00029710798807037987, "loss": 2.0139, "step": 2387 }, { "epoch": 0.19, "learning_rate": 0.0002971055722522985, "loss": 2.0064, "step": 2388 }, { "epoch": 0.19, "learning_rate": 0.0002971031554354514, "loss": 2.0027, "step": 2389 }, { "epoch": 0.19, "learning_rate": 0.0002971007376198552, "loss": 2.0233, "step": 2390 }, { "epoch": 0.19, "learning_rate": 0.00029709831880552607, "loss": 2.0745, "step": 2391 }, { "epoch": 0.19, "learning_rate": 0.00029709589899248054, "loss": 2.0128, "step": 2392 }, { "epoch": 0.19, "learning_rate": 0.00029709347818073504, "loss": 2.0563, "step": 2393 }, { "epoch": 0.19, "learning_rate": 0.000297091056370306, "loss": 1.9942, "step": 2394 }, { "epoch": 0.19, "learning_rate": 0.00029708863356120994, "loss": 2.0181, "step": 2395 }, { "epoch": 0.19, "learning_rate": 0.0002970862097534631, "loss": 2.036, "step": 2396 }, { "epoch": 0.19, "learning_rate": 0.0002970837849470821, "loss": 2.0131, "step": 2397 }, { "epoch": 0.19, "learning_rate": 0.00029708135914208335, "loss": 2.0232, "step": 2398 }, { "epoch": 0.19, "learning_rate": 0.0002970789323384834, "loss": 1.9136, "step": 2399 }, { "epoch": 0.19, "learning_rate": 0.00029707650453629866, "loss": 2.0167, "step": 2400 }, { "epoch": 0.19, "learning_rate": 0.0002970740757355456, "loss": 2.0475, "step": 2401 }, { "epoch": 0.19, "learning_rate": 0.00029707164593624074, "loss": 2.0281, "step": 2402 }, { "epoch": 0.19, "learning_rate": 0.00029706921513840054, "loss": 2.055, "step": 2403 }, { "epoch": 0.19, "learning_rate": 0.0002970667833420415, "loss": 2.0329, "step": 2404 }, { "epoch": 0.19, "learning_rate": 0.0002970643505471802, "loss": 2.0095, "step": 2405 }, { "epoch": 0.19, "learning_rate": 0.0002970619167538331, "loss": 1.9488, "step": 2406 }, { "epoch": 0.19, "learning_rate": 0.0002970594819620168, "loss": 2.058, "step": 2407 }, { "epoch": 0.19, "learning_rate": 0.0002970570461717477, "loss": 1.9563, "step": 2408 }, { "epoch": 0.19, "learning_rate": 0.00029705460938304245, "loss": 1.9938, "step": 2409 }, { "epoch": 0.19, "learning_rate": 0.0002970521715959175, "loss": 1.9573, "step": 2410 }, { "epoch": 0.19, "learning_rate": 0.0002970497328103895, "loss": 2.0006, "step": 2411 }, { "epoch": 0.19, "learning_rate": 0.000297047293026475, "loss": 1.9403, "step": 2412 }, { "epoch": 0.19, "learning_rate": 0.0002970448522441904, "loss": 2.0205, "step": 2413 }, { "epoch": 0.19, "learning_rate": 0.00029704241046355254, "loss": 1.9802, "step": 2414 }, { "epoch": 0.19, "learning_rate": 0.0002970399676845778, "loss": 1.9518, "step": 2415 }, { "epoch": 0.19, "learning_rate": 0.0002970375239072828, "loss": 1.9705, "step": 2416 }, { "epoch": 0.19, "learning_rate": 0.0002970350791316842, "loss": 2.0769, "step": 2417 }, { "epoch": 0.19, "learning_rate": 0.0002970326333577985, "loss": 1.9603, "step": 2418 }, { "epoch": 0.19, "learning_rate": 0.0002970301865856424, "loss": 2.0071, "step": 2419 }, { "epoch": 0.19, "learning_rate": 0.00029702773881523246, "loss": 1.9773, "step": 2420 }, { "epoch": 0.19, "learning_rate": 0.0002970252900465853, "loss": 1.9815, "step": 2421 }, { "epoch": 0.19, "learning_rate": 0.0002970228402797176, "loss": 1.964, "step": 2422 }, { "epoch": 0.19, "learning_rate": 0.00029702038951464585, "loss": 1.9941, "step": 2423 }, { "epoch": 0.19, "learning_rate": 0.0002970179377513869, "loss": 2.0307, "step": 2424 }, { "epoch": 0.19, "learning_rate": 0.0002970154849899572, "loss": 1.9634, "step": 2425 }, { "epoch": 0.19, "learning_rate": 0.00029701303123037354, "loss": 1.9698, "step": 2426 }, { "epoch": 0.19, "learning_rate": 0.0002970105764726525, "loss": 2.0627, "step": 2427 }, { "epoch": 0.19, "learning_rate": 0.00029700812071681076, "loss": 1.9517, "step": 2428 }, { "epoch": 0.19, "learning_rate": 0.00029700566396286503, "loss": 1.9837, "step": 2429 }, { "epoch": 0.19, "learning_rate": 0.000297003206210832, "loss": 1.9546, "step": 2430 }, { "epoch": 0.19, "learning_rate": 0.0002970007474607283, "loss": 2.0251, "step": 2431 }, { "epoch": 0.19, "learning_rate": 0.0002969982877125706, "loss": 2.0164, "step": 2432 }, { "epoch": 0.19, "learning_rate": 0.0002969958269663757, "loss": 2.0477, "step": 2433 }, { "epoch": 0.19, "learning_rate": 0.0002969933652221602, "loss": 1.9873, "step": 2434 }, { "epoch": 0.19, "learning_rate": 0.0002969909024799409, "loss": 2.0496, "step": 2435 }, { "epoch": 0.19, "learning_rate": 0.0002969884387397345, "loss": 1.966, "step": 2436 }, { "epoch": 0.19, "learning_rate": 0.00029698597400155773, "loss": 1.9939, "step": 2437 }, { "epoch": 0.19, "learning_rate": 0.00029698350826542726, "loss": 1.9706, "step": 2438 }, { "epoch": 0.19, "learning_rate": 0.00029698104153135993, "loss": 2.0138, "step": 2439 }, { "epoch": 0.19, "learning_rate": 0.00029697857379937237, "loss": 2.0823, "step": 2440 }, { "epoch": 0.19, "learning_rate": 0.00029697610506948145, "loss": 2.032, "step": 2441 }, { "epoch": 0.19, "learning_rate": 0.0002969736353417039, "loss": 1.9983, "step": 2442 }, { "epoch": 0.19, "learning_rate": 0.00029697116461605645, "loss": 1.9871, "step": 2443 }, { "epoch": 0.19, "learning_rate": 0.00029696869289255593, "loss": 2.0175, "step": 2444 }, { "epoch": 0.19, "learning_rate": 0.00029696622017121905, "loss": 2.0184, "step": 2445 }, { "epoch": 0.19, "learning_rate": 0.0002969637464520627, "loss": 1.9509, "step": 2446 }, { "epoch": 0.19, "learning_rate": 0.00029696127173510354, "loss": 1.9664, "step": 2447 }, { "epoch": 0.19, "learning_rate": 0.00029695879602035846, "loss": 2.0135, "step": 2448 }, { "epoch": 0.19, "learning_rate": 0.00029695631930784424, "loss": 1.9805, "step": 2449 }, { "epoch": 0.19, "learning_rate": 0.00029695384159757773, "loss": 1.9801, "step": 2450 }, { "epoch": 0.19, "learning_rate": 0.00029695136288957575, "loss": 2.001, "step": 2451 }, { "epoch": 0.19, "learning_rate": 0.0002969488831838551, "loss": 1.9125, "step": 2452 }, { "epoch": 0.19, "learning_rate": 0.0002969464024804326, "loss": 1.9304, "step": 2453 }, { "epoch": 0.19, "learning_rate": 0.00029694392077932516, "loss": 2.0199, "step": 2454 }, { "epoch": 0.19, "learning_rate": 0.00029694143808054954, "loss": 1.9943, "step": 2455 }, { "epoch": 0.19, "learning_rate": 0.0002969389543841227, "loss": 2.0079, "step": 2456 }, { "epoch": 0.19, "learning_rate": 0.0002969364696900614, "loss": 1.9573, "step": 2457 }, { "epoch": 0.19, "learning_rate": 0.0002969339839983826, "loss": 1.9591, "step": 2458 }, { "epoch": 0.19, "learning_rate": 0.0002969314973091031, "loss": 1.9963, "step": 2459 }, { "epoch": 0.19, "learning_rate": 0.00029692900962223983, "loss": 1.9902, "step": 2460 }, { "epoch": 0.19, "learning_rate": 0.00029692652093780964, "loss": 1.9797, "step": 2461 }, { "epoch": 0.19, "learning_rate": 0.00029692403125582947, "loss": 2.0361, "step": 2462 }, { "epoch": 0.19, "learning_rate": 0.00029692154057631625, "loss": 2.0035, "step": 2463 }, { "epoch": 0.19, "learning_rate": 0.0002969190488992868, "loss": 1.976, "step": 2464 }, { "epoch": 0.19, "learning_rate": 0.0002969165562247581, "loss": 1.9639, "step": 2465 }, { "epoch": 0.19, "learning_rate": 0.00029691406255274706, "loss": 2.0134, "step": 2466 }, { "epoch": 0.19, "learning_rate": 0.0002969115678832706, "loss": 2.0125, "step": 2467 }, { "epoch": 0.19, "learning_rate": 0.0002969090722163457, "loss": 2.0011, "step": 2468 }, { "epoch": 0.19, "learning_rate": 0.0002969065755519892, "loss": 1.9907, "step": 2469 }, { "epoch": 0.19, "learning_rate": 0.00029690407789021816, "loss": 1.9621, "step": 2470 }, { "epoch": 0.19, "learning_rate": 0.00029690157923104954, "loss": 1.9823, "step": 2471 }, { "epoch": 0.19, "learning_rate": 0.0002968990795745002, "loss": 2.0053, "step": 2472 }, { "epoch": 0.19, "learning_rate": 0.0002968965789205872, "loss": 1.9784, "step": 2473 }, { "epoch": 0.19, "learning_rate": 0.00029689407726932746, "loss": 1.9604, "step": 2474 }, { "epoch": 0.19, "learning_rate": 0.00029689157462073806, "loss": 1.9723, "step": 2475 }, { "epoch": 0.19, "learning_rate": 0.0002968890709748359, "loss": 2.0323, "step": 2476 }, { "epoch": 0.19, "learning_rate": 0.000296886566331638, "loss": 1.9825, "step": 2477 }, { "epoch": 0.19, "learning_rate": 0.0002968840606911614, "loss": 1.9766, "step": 2478 }, { "epoch": 0.2, "learning_rate": 0.0002968815540534231, "loss": 2.0157, "step": 2479 }, { "epoch": 0.2, "learning_rate": 0.00029687904641844006, "loss": 2.0257, "step": 2480 }, { "epoch": 0.2, "learning_rate": 0.00029687653778622935, "loss": 1.9628, "step": 2481 }, { "epoch": 0.2, "learning_rate": 0.00029687402815680797, "loss": 1.9822, "step": 2482 }, { "epoch": 0.2, "learning_rate": 0.0002968715175301931, "loss": 1.9808, "step": 2483 }, { "epoch": 0.2, "learning_rate": 0.00029686900590640157, "loss": 2.0006, "step": 2484 }, { "epoch": 0.2, "learning_rate": 0.0002968664932854506, "loss": 1.9586, "step": 2485 }, { "epoch": 0.2, "learning_rate": 0.0002968639796673572, "loss": 2.0379, "step": 2486 }, { "epoch": 0.2, "learning_rate": 0.00029686146505213834, "loss": 2.0451, "step": 2487 }, { "epoch": 0.2, "learning_rate": 0.0002968589494398112, "loss": 1.9686, "step": 2488 }, { "epoch": 0.2, "learning_rate": 0.0002968564328303929, "loss": 1.993, "step": 2489 }, { "epoch": 0.2, "learning_rate": 0.00029685391522390044, "loss": 1.9356, "step": 2490 }, { "epoch": 0.2, "learning_rate": 0.0002968513966203509, "loss": 1.9931, "step": 2491 }, { "epoch": 0.2, "learning_rate": 0.00029684887701976145, "loss": 2.018, "step": 2492 }, { "epoch": 0.2, "learning_rate": 0.00029684635642214914, "loss": 2.0143, "step": 2493 }, { "epoch": 0.2, "learning_rate": 0.00029684383482753114, "loss": 1.9808, "step": 2494 }, { "epoch": 0.2, "learning_rate": 0.0002968413122359245, "loss": 2.0329, "step": 2495 }, { "epoch": 0.2, "learning_rate": 0.00029683878864734644, "loss": 1.9966, "step": 2496 }, { "epoch": 0.2, "learning_rate": 0.000296836264061814, "loss": 2.0304, "step": 2497 }, { "epoch": 0.2, "learning_rate": 0.00029683373847934433, "loss": 2.0164, "step": 2498 }, { "epoch": 0.2, "learning_rate": 0.0002968312118999547, "loss": 2.0047, "step": 2499 }, { "epoch": 0.2, "learning_rate": 0.00029682868432366204, "loss": 1.9647, "step": 2500 }, { "epoch": 0.2, "learning_rate": 0.0002968261557504837, "loss": 1.9896, "step": 2501 }, { "epoch": 0.2, "learning_rate": 0.0002968236261804368, "loss": 1.974, "step": 2502 }, { "epoch": 0.2, "learning_rate": 0.00029682109561353847, "loss": 1.9904, "step": 2503 }, { "epoch": 0.2, "learning_rate": 0.00029681856404980596, "loss": 1.9792, "step": 2504 }, { "epoch": 0.2, "learning_rate": 0.00029681603148925645, "loss": 1.9467, "step": 2505 }, { "epoch": 0.2, "learning_rate": 0.00029681349793190707, "loss": 2.0217, "step": 2506 }, { "epoch": 0.2, "learning_rate": 0.000296810963377775, "loss": 1.9819, "step": 2507 }, { "epoch": 0.2, "learning_rate": 0.00029680842782687757, "loss": 2.0507, "step": 2508 }, { "epoch": 0.2, "learning_rate": 0.0002968058912792319, "loss": 2.0176, "step": 2509 }, { "epoch": 0.2, "learning_rate": 0.00029680335373485526, "loss": 1.9551, "step": 2510 }, { "epoch": 0.2, "learning_rate": 0.00029680081519376487, "loss": 1.9957, "step": 2511 }, { "epoch": 0.2, "learning_rate": 0.00029679827565597794, "loss": 1.9503, "step": 2512 }, { "epoch": 0.2, "learning_rate": 0.00029679573512151177, "loss": 1.9952, "step": 2513 }, { "epoch": 0.2, "learning_rate": 0.0002967931935903835, "loss": 2.0082, "step": 2514 }, { "epoch": 0.2, "learning_rate": 0.00029679065106261046, "loss": 1.9837, "step": 2515 }, { "epoch": 0.2, "learning_rate": 0.00029678810753821, "loss": 1.9005, "step": 2516 }, { "epoch": 0.2, "learning_rate": 0.0002967855630171992, "loss": 1.9805, "step": 2517 }, { "epoch": 0.2, "learning_rate": 0.0002967830174995955, "loss": 1.9415, "step": 2518 }, { "epoch": 0.2, "learning_rate": 0.000296780470985416, "loss": 1.9818, "step": 2519 }, { "epoch": 0.2, "learning_rate": 0.00029677792347467815, "loss": 1.9898, "step": 2520 }, { "epoch": 0.2, "learning_rate": 0.00029677537496739924, "loss": 2.0611, "step": 2521 }, { "epoch": 0.2, "learning_rate": 0.0002967728254635965, "loss": 2.0332, "step": 2522 }, { "epoch": 0.2, "learning_rate": 0.0002967702749632873, "loss": 2.0409, "step": 2523 }, { "epoch": 0.2, "learning_rate": 0.0002967677234664889, "loss": 2.0123, "step": 2524 }, { "epoch": 0.2, "learning_rate": 0.0002967651709732187, "loss": 1.9757, "step": 2525 }, { "epoch": 0.2, "learning_rate": 0.00029676261748349386, "loss": 2.0135, "step": 2526 }, { "epoch": 0.2, "learning_rate": 0.00029676006299733193, "loss": 1.9917, "step": 2527 }, { "epoch": 0.2, "learning_rate": 0.00029675750751475015, "loss": 1.9844, "step": 2528 }, { "epoch": 0.2, "learning_rate": 0.0002967549510357659, "loss": 1.9988, "step": 2529 }, { "epoch": 0.2, "learning_rate": 0.00029675239356039647, "loss": 1.9922, "step": 2530 }, { "epoch": 0.2, "learning_rate": 0.0002967498350886593, "loss": 1.9973, "step": 2531 }, { "epoch": 0.2, "learning_rate": 0.00029674727562057176, "loss": 1.9918, "step": 2532 }, { "epoch": 0.2, "learning_rate": 0.0002967447151561512, "loss": 2.0375, "step": 2533 }, { "epoch": 0.2, "learning_rate": 0.0002967421536954149, "loss": 1.9893, "step": 2534 }, { "epoch": 0.2, "learning_rate": 0.0002967395912383805, "loss": 2.0233, "step": 2535 }, { "epoch": 0.2, "learning_rate": 0.00029673702778506514, "loss": 1.9874, "step": 2536 }, { "epoch": 0.2, "learning_rate": 0.0002967344633354864, "loss": 2.0068, "step": 2537 }, { "epoch": 0.2, "learning_rate": 0.0002967318978896616, "loss": 1.9428, "step": 2538 }, { "epoch": 0.2, "learning_rate": 0.0002967293314476082, "loss": 1.9384, "step": 2539 }, { "epoch": 0.2, "learning_rate": 0.0002967267640093436, "loss": 2.0032, "step": 2540 }, { "epoch": 0.2, "learning_rate": 0.0002967241955748853, "loss": 1.9615, "step": 2541 }, { "epoch": 0.2, "learning_rate": 0.0002967216261442506, "loss": 1.9926, "step": 2542 }, { "epoch": 0.2, "learning_rate": 0.0002967190557174571, "loss": 2.0212, "step": 2543 }, { "epoch": 0.2, "learning_rate": 0.0002967164842945221, "loss": 2.0617, "step": 2544 }, { "epoch": 0.2, "learning_rate": 0.0002967139118754632, "loss": 1.9932, "step": 2545 }, { "epoch": 0.2, "learning_rate": 0.0002967113384602978, "loss": 2.0165, "step": 2546 }, { "epoch": 0.2, "learning_rate": 0.00029670876404904335, "loss": 1.9844, "step": 2547 }, { "epoch": 0.2, "learning_rate": 0.0002967061886417173, "loss": 1.9715, "step": 2548 }, { "epoch": 0.2, "learning_rate": 0.0002967036122383372, "loss": 1.9296, "step": 2549 }, { "epoch": 0.2, "learning_rate": 0.0002967010348389206, "loss": 1.968, "step": 2550 }, { "epoch": 0.2, "learning_rate": 0.0002966984564434849, "loss": 1.9358, "step": 2551 }, { "epoch": 0.2, "learning_rate": 0.0002966958770520477, "loss": 1.9753, "step": 2552 }, { "epoch": 0.2, "learning_rate": 0.00029669329666462635, "loss": 1.9877, "step": 2553 }, { "epoch": 0.2, "learning_rate": 0.0002966907152812385, "loss": 1.9404, "step": 2554 }, { "epoch": 0.2, "learning_rate": 0.0002966881329019017, "loss": 1.9798, "step": 2555 }, { "epoch": 0.2, "learning_rate": 0.00029668554952663333, "loss": 1.9264, "step": 2556 }, { "epoch": 0.2, "learning_rate": 0.0002966829651554511, "loss": 1.9994, "step": 2557 }, { "epoch": 0.2, "learning_rate": 0.0002966803797883724, "loss": 1.9565, "step": 2558 }, { "epoch": 0.2, "learning_rate": 0.00029667779342541496, "loss": 1.9393, "step": 2559 }, { "epoch": 0.2, "learning_rate": 0.0002966752060665962, "loss": 1.9525, "step": 2560 }, { "epoch": 0.2, "learning_rate": 0.00029667261771193374, "loss": 2.011, "step": 2561 }, { "epoch": 0.2, "learning_rate": 0.00029667002836144515, "loss": 1.9882, "step": 2562 }, { "epoch": 0.2, "learning_rate": 0.000296667438015148, "loss": 1.9444, "step": 2563 }, { "epoch": 0.2, "learning_rate": 0.00029666484667305987, "loss": 1.9326, "step": 2564 }, { "epoch": 0.2, "learning_rate": 0.0002966622543351984, "loss": 2.0187, "step": 2565 }, { "epoch": 0.2, "learning_rate": 0.0002966596610015811, "loss": 1.9994, "step": 2566 }, { "epoch": 0.2, "learning_rate": 0.0002966570666722257, "loss": 2.0058, "step": 2567 }, { "epoch": 0.2, "learning_rate": 0.00029665447134714977, "loss": 1.9339, "step": 2568 }, { "epoch": 0.2, "learning_rate": 0.00029665187502637085, "loss": 2.0132, "step": 2569 }, { "epoch": 0.2, "learning_rate": 0.0002966492777099066, "loss": 1.9707, "step": 2570 }, { "epoch": 0.2, "learning_rate": 0.00029664667939777477, "loss": 2.0033, "step": 2571 }, { "epoch": 0.2, "learning_rate": 0.0002966440800899929, "loss": 1.9503, "step": 2572 }, { "epoch": 0.2, "learning_rate": 0.00029664147978657857, "loss": 1.9888, "step": 2573 }, { "epoch": 0.2, "learning_rate": 0.0002966388784875496, "loss": 1.9797, "step": 2574 }, { "epoch": 0.2, "learning_rate": 0.00029663627619292354, "loss": 1.9514, "step": 2575 }, { "epoch": 0.2, "learning_rate": 0.00029663367290271806, "loss": 1.9843, "step": 2576 }, { "epoch": 0.2, "learning_rate": 0.0002966310686169509, "loss": 1.997, "step": 2577 }, { "epoch": 0.2, "learning_rate": 0.00029662846333563966, "loss": 1.9394, "step": 2578 }, { "epoch": 0.2, "learning_rate": 0.0002966258570588021, "loss": 2.0232, "step": 2579 }, { "epoch": 0.2, "learning_rate": 0.0002966232497864559, "loss": 1.9546, "step": 2580 }, { "epoch": 0.2, "learning_rate": 0.00029662064151861865, "loss": 1.9382, "step": 2581 }, { "epoch": 0.2, "learning_rate": 0.00029661803225530825, "loss": 1.9501, "step": 2582 }, { "epoch": 0.2, "learning_rate": 0.0002966154219965423, "loss": 1.9376, "step": 2583 }, { "epoch": 0.2, "learning_rate": 0.0002966128107423386, "loss": 1.9918, "step": 2584 }, { "epoch": 0.2, "learning_rate": 0.0002966101984927147, "loss": 2.003, "step": 2585 }, { "epoch": 0.2, "learning_rate": 0.00029660758524768853, "loss": 2.0151, "step": 2586 }, { "epoch": 0.2, "learning_rate": 0.00029660497100727774, "loss": 2.0116, "step": 2587 }, { "epoch": 0.2, "learning_rate": 0.0002966023557715002, "loss": 2.0253, "step": 2588 }, { "epoch": 0.2, "learning_rate": 0.0002965997395403734, "loss": 1.9861, "step": 2589 }, { "epoch": 0.2, "learning_rate": 0.0002965971223139154, "loss": 1.9946, "step": 2590 }, { "epoch": 0.2, "learning_rate": 0.00029659450409214375, "loss": 1.9661, "step": 2591 }, { "epoch": 0.2, "learning_rate": 0.0002965918848750764, "loss": 2.0268, "step": 2592 }, { "epoch": 0.2, "learning_rate": 0.00029658926466273096, "loss": 2.0264, "step": 2593 }, { "epoch": 0.2, "learning_rate": 0.0002965866434551254, "loss": 1.9889, "step": 2594 }, { "epoch": 0.2, "learning_rate": 0.0002965840212522773, "loss": 1.9583, "step": 2595 }, { "epoch": 0.2, "learning_rate": 0.0002965813980542047, "loss": 1.9626, "step": 2596 }, { "epoch": 0.2, "learning_rate": 0.0002965787738609253, "loss": 1.9797, "step": 2597 }, { "epoch": 0.2, "learning_rate": 0.00029657614867245683, "loss": 2.0048, "step": 2598 }, { "epoch": 0.2, "learning_rate": 0.00029657352248881725, "loss": 1.9786, "step": 2599 }, { "epoch": 0.2, "learning_rate": 0.0002965708953100243, "loss": 1.9793, "step": 2600 }, { "epoch": 0.2, "learning_rate": 0.00029656826713609594, "loss": 1.9795, "step": 2601 }, { "epoch": 0.2, "learning_rate": 0.00029656563796704984, "loss": 1.9338, "step": 2602 }, { "epoch": 0.2, "learning_rate": 0.00029656300780290395, "loss": 1.9694, "step": 2603 }, { "epoch": 0.2, "learning_rate": 0.0002965603766436762, "loss": 1.9332, "step": 2604 }, { "epoch": 0.2, "learning_rate": 0.0002965577444893843, "loss": 1.984, "step": 2605 }, { "epoch": 0.21, "learning_rate": 0.0002965551113400462, "loss": 1.9802, "step": 2606 }, { "epoch": 0.21, "learning_rate": 0.00029655247719567973, "loss": 2.0248, "step": 2607 }, { "epoch": 0.21, "learning_rate": 0.0002965498420563029, "loss": 2.0189, "step": 2608 }, { "epoch": 0.21, "learning_rate": 0.00029654720592193345, "loss": 2.0246, "step": 2609 }, { "epoch": 0.21, "learning_rate": 0.0002965445687925894, "loss": 1.9814, "step": 2610 }, { "epoch": 0.21, "learning_rate": 0.0002965419306682885, "loss": 1.9878, "step": 2611 }, { "epoch": 0.21, "learning_rate": 0.00029653929154904886, "loss": 1.9755, "step": 2612 }, { "epoch": 0.21, "learning_rate": 0.0002965366514348883, "loss": 1.9527, "step": 2613 }, { "epoch": 0.21, "learning_rate": 0.00029653401032582466, "loss": 2.0234, "step": 2614 }, { "epoch": 0.21, "learning_rate": 0.000296531368221876, "loss": 2.0304, "step": 2615 }, { "epoch": 0.21, "learning_rate": 0.00029652872512306023, "loss": 2.0101, "step": 2616 }, { "epoch": 0.21, "learning_rate": 0.00029652608102939524, "loss": 1.9836, "step": 2617 }, { "epoch": 0.21, "learning_rate": 0.0002965234359408991, "loss": 2.0368, "step": 2618 }, { "epoch": 0.21, "learning_rate": 0.0002965207898575896, "loss": 1.9628, "step": 2619 }, { "epoch": 0.21, "learning_rate": 0.0002965181427794848, "loss": 1.9667, "step": 2620 }, { "epoch": 0.21, "learning_rate": 0.0002965154947066027, "loss": 1.9526, "step": 2621 }, { "epoch": 0.21, "learning_rate": 0.0002965128456389612, "loss": 1.9686, "step": 2622 }, { "epoch": 0.21, "learning_rate": 0.0002965101955765784, "loss": 2.0197, "step": 2623 }, { "epoch": 0.21, "learning_rate": 0.0002965075445194722, "loss": 1.9785, "step": 2624 }, { "epoch": 0.21, "learning_rate": 0.00029650489246766054, "loss": 1.949, "step": 2625 }, { "epoch": 0.21, "learning_rate": 0.0002965022394211616, "loss": 1.9698, "step": 2626 }, { "epoch": 0.21, "learning_rate": 0.0002964995853799933, "loss": 1.8866, "step": 2627 }, { "epoch": 0.21, "learning_rate": 0.00029649693034417365, "loss": 1.9842, "step": 2628 }, { "epoch": 0.21, "learning_rate": 0.0002964942743137207, "loss": 2.0231, "step": 2629 }, { "epoch": 0.21, "learning_rate": 0.0002964916172886524, "loss": 1.9974, "step": 2630 }, { "epoch": 0.21, "learning_rate": 0.0002964889592689869, "loss": 1.9512, "step": 2631 }, { "epoch": 0.21, "learning_rate": 0.0002964863002547422, "loss": 1.9448, "step": 2632 }, { "epoch": 0.21, "learning_rate": 0.0002964836402459364, "loss": 1.938, "step": 2633 }, { "epoch": 0.21, "learning_rate": 0.00029648097924258747, "loss": 1.9669, "step": 2634 }, { "epoch": 0.21, "learning_rate": 0.0002964783172447135, "loss": 1.9492, "step": 2635 }, { "epoch": 0.21, "learning_rate": 0.00029647565425233263, "loss": 1.9923, "step": 2636 }, { "epoch": 0.21, "learning_rate": 0.00029647299026546294, "loss": 2.0172, "step": 2637 }, { "epoch": 0.21, "learning_rate": 0.0002964703252841224, "loss": 1.9175, "step": 2638 }, { "epoch": 0.21, "learning_rate": 0.00029646765930832925, "loss": 1.9414, "step": 2639 }, { "epoch": 0.21, "learning_rate": 0.0002964649923381015, "loss": 1.9646, "step": 2640 }, { "epoch": 0.21, "learning_rate": 0.0002964623243734573, "loss": 2.0132, "step": 2641 }, { "epoch": 0.21, "learning_rate": 0.0002964596554144147, "loss": 2.0194, "step": 2642 }, { "epoch": 0.21, "learning_rate": 0.0002964569854609918, "loss": 2.0072, "step": 2643 }, { "epoch": 0.21, "learning_rate": 0.00029645431451320685, "loss": 1.942, "step": 2644 }, { "epoch": 0.21, "learning_rate": 0.000296451642571078, "loss": 2.0061, "step": 2645 }, { "epoch": 0.21, "learning_rate": 0.00029644896963462324, "loss": 1.9367, "step": 2646 }, { "epoch": 0.21, "learning_rate": 0.0002964462957038608, "loss": 1.9102, "step": 2647 }, { "epoch": 0.21, "learning_rate": 0.0002964436207788088, "loss": 1.99, "step": 2648 }, { "epoch": 0.21, "learning_rate": 0.0002964409448594855, "loss": 1.9505, "step": 2649 }, { "epoch": 0.21, "learning_rate": 0.00029643826794590895, "loss": 1.9581, "step": 2650 }, { "epoch": 0.21, "learning_rate": 0.0002964355900380974, "loss": 1.9588, "step": 2651 }, { "epoch": 0.21, "learning_rate": 0.00029643291113606895, "loss": 1.9704, "step": 2652 }, { "epoch": 0.21, "learning_rate": 0.0002964302312398419, "loss": 1.9731, "step": 2653 }, { "epoch": 0.21, "learning_rate": 0.00029642755034943436, "loss": 1.9352, "step": 2654 }, { "epoch": 0.21, "learning_rate": 0.0002964248684648646, "loss": 1.935, "step": 2655 }, { "epoch": 0.21, "learning_rate": 0.0002964221855861507, "loss": 2.0527, "step": 2656 }, { "epoch": 0.21, "learning_rate": 0.000296419501713311, "loss": 1.9329, "step": 2657 }, { "epoch": 0.21, "learning_rate": 0.00029641681684636375, "loss": 1.9278, "step": 2658 }, { "epoch": 0.21, "learning_rate": 0.000296414130985327, "loss": 1.9898, "step": 2659 }, { "epoch": 0.21, "learning_rate": 0.00029641144413021915, "loss": 1.9389, "step": 2660 }, { "epoch": 0.21, "learning_rate": 0.00029640875628105846, "loss": 1.9554, "step": 2661 }, { "epoch": 0.21, "learning_rate": 0.00029640606743786305, "loss": 2.0226, "step": 2662 }, { "epoch": 0.21, "learning_rate": 0.0002964033776006512, "loss": 2.0315, "step": 2663 }, { "epoch": 0.21, "learning_rate": 0.0002964006867694413, "loss": 1.9145, "step": 2664 }, { "epoch": 0.21, "learning_rate": 0.0002963979949442514, "loss": 1.9504, "step": 2665 }, { "epoch": 0.21, "learning_rate": 0.00029639530212510003, "loss": 2.0197, "step": 2666 }, { "epoch": 0.21, "learning_rate": 0.00029639260831200524, "loss": 1.949, "step": 2667 }, { "epoch": 0.21, "learning_rate": 0.0002963899135049855, "loss": 1.9843, "step": 2668 }, { "epoch": 0.21, "learning_rate": 0.000296387217704059, "loss": 1.9527, "step": 2669 }, { "epoch": 0.21, "learning_rate": 0.0002963845209092441, "loss": 1.9631, "step": 2670 }, { "epoch": 0.21, "learning_rate": 0.00029638182312055904, "loss": 1.9532, "step": 2671 }, { "epoch": 0.21, "learning_rate": 0.00029637912433802224, "loss": 1.9832, "step": 2672 }, { "epoch": 0.21, "learning_rate": 0.0002963764245616519, "loss": 1.9801, "step": 2673 }, { "epoch": 0.21, "learning_rate": 0.00029637372379146643, "loss": 1.9372, "step": 2674 }, { "epoch": 0.21, "learning_rate": 0.0002963710220274842, "loss": 1.9731, "step": 2675 }, { "epoch": 0.21, "learning_rate": 0.0002963683192697235, "loss": 1.968, "step": 2676 }, { "epoch": 0.21, "learning_rate": 0.00029636561551820264, "loss": 1.9807, "step": 2677 }, { "epoch": 0.21, "learning_rate": 0.00029636291077294, "loss": 1.9166, "step": 2678 }, { "epoch": 0.21, "learning_rate": 0.000296360205033954, "loss": 1.9566, "step": 2679 }, { "epoch": 0.21, "learning_rate": 0.000296357498301263, "loss": 1.9442, "step": 2680 }, { "epoch": 0.21, "learning_rate": 0.00029635479057488537, "loss": 1.9712, "step": 2681 }, { "epoch": 0.21, "learning_rate": 0.0002963520818548394, "loss": 1.9838, "step": 2682 }, { "epoch": 0.21, "learning_rate": 0.0002963493721411436, "loss": 1.9764, "step": 2683 }, { "epoch": 0.21, "learning_rate": 0.0002963466614338163, "loss": 1.9933, "step": 2684 }, { "epoch": 0.21, "learning_rate": 0.000296343949732876, "loss": 1.9906, "step": 2685 }, { "epoch": 0.21, "learning_rate": 0.000296341237038341, "loss": 1.9669, "step": 2686 }, { "epoch": 0.21, "learning_rate": 0.00029633852335022974, "loss": 1.9623, "step": 2687 }, { "epoch": 0.21, "learning_rate": 0.00029633580866856066, "loss": 2.0132, "step": 2688 }, { "epoch": 0.21, "learning_rate": 0.0002963330929933522, "loss": 1.9704, "step": 2689 }, { "epoch": 0.21, "learning_rate": 0.00029633037632462286, "loss": 1.9751, "step": 2690 }, { "epoch": 0.21, "learning_rate": 0.00029632765866239094, "loss": 1.971, "step": 2691 }, { "epoch": 0.21, "learning_rate": 0.000296324940006675, "loss": 1.9517, "step": 2692 }, { "epoch": 0.21, "learning_rate": 0.00029632222035749344, "loss": 1.9593, "step": 2693 }, { "epoch": 0.21, "learning_rate": 0.0002963194997148648, "loss": 2.0173, "step": 2694 }, { "epoch": 0.21, "learning_rate": 0.0002963167780788074, "loss": 1.9219, "step": 2695 }, { "epoch": 0.21, "learning_rate": 0.00029631405544933994, "loss": 1.9363, "step": 2696 }, { "epoch": 0.21, "learning_rate": 0.0002963113318264807, "loss": 1.9497, "step": 2697 }, { "epoch": 0.21, "learning_rate": 0.0002963086072102483, "loss": 1.9955, "step": 2698 }, { "epoch": 0.21, "learning_rate": 0.0002963058816006612, "loss": 2.0124, "step": 2699 }, { "epoch": 0.21, "learning_rate": 0.0002963031549977379, "loss": 1.94, "step": 2700 }, { "epoch": 0.21, "learning_rate": 0.0002963004274014969, "loss": 1.9805, "step": 2701 }, { "epoch": 0.21, "learning_rate": 0.0002962976988119567, "loss": 1.9751, "step": 2702 }, { "epoch": 0.21, "learning_rate": 0.00029629496922913587, "loss": 1.9809, "step": 2703 }, { "epoch": 0.21, "learning_rate": 0.00029629223865305297, "loss": 1.9919, "step": 2704 }, { "epoch": 0.21, "learning_rate": 0.0002962895070837265, "loss": 1.9917, "step": 2705 }, { "epoch": 0.21, "learning_rate": 0.000296286774521175, "loss": 1.9391, "step": 2706 }, { "epoch": 0.21, "learning_rate": 0.00029628404096541705, "loss": 1.9787, "step": 2707 }, { "epoch": 0.21, "learning_rate": 0.00029628130641647115, "loss": 1.9462, "step": 2708 }, { "epoch": 0.21, "learning_rate": 0.0002962785708743559, "loss": 1.9614, "step": 2709 }, { "epoch": 0.21, "learning_rate": 0.00029627583433908993, "loss": 1.9167, "step": 2710 }, { "epoch": 0.21, "learning_rate": 0.0002962730968106917, "loss": 1.9551, "step": 2711 }, { "epoch": 0.21, "learning_rate": 0.0002962703582891799, "loss": 1.8963, "step": 2712 }, { "epoch": 0.21, "learning_rate": 0.0002962676187745731, "loss": 1.9746, "step": 2713 }, { "epoch": 0.21, "learning_rate": 0.00029626487826688985, "loss": 2.0041, "step": 2714 }, { "epoch": 0.21, "learning_rate": 0.0002962621367661488, "loss": 1.9681, "step": 2715 }, { "epoch": 0.21, "learning_rate": 0.00029625939427236855, "loss": 1.9925, "step": 2716 }, { "epoch": 0.21, "learning_rate": 0.00029625665078556775, "loss": 1.9294, "step": 2717 }, { "epoch": 0.21, "learning_rate": 0.000296253906305765, "loss": 1.9873, "step": 2718 }, { "epoch": 0.21, "learning_rate": 0.0002962511608329789, "loss": 2.0144, "step": 2719 }, { "epoch": 0.21, "learning_rate": 0.0002962484143672282, "loss": 1.9049, "step": 2720 }, { "epoch": 0.21, "learning_rate": 0.0002962456669085314, "loss": 1.9677, "step": 2721 }, { "epoch": 0.21, "learning_rate": 0.0002962429184569072, "loss": 1.9734, "step": 2722 }, { "epoch": 0.21, "learning_rate": 0.0002962401690123744, "loss": 1.9243, "step": 2723 }, { "epoch": 0.21, "learning_rate": 0.0002962374185749515, "loss": 2.0186, "step": 2724 }, { "epoch": 0.21, "learning_rate": 0.0002962346671446572, "loss": 1.9463, "step": 2725 }, { "epoch": 0.21, "learning_rate": 0.0002962319147215102, "loss": 1.9705, "step": 2726 }, { "epoch": 0.21, "learning_rate": 0.0002962291613055293, "loss": 1.9483, "step": 2727 }, { "epoch": 0.21, "learning_rate": 0.00029622640689673296, "loss": 2.0342, "step": 2728 }, { "epoch": 0.21, "learning_rate": 0.00029622365149514004, "loss": 1.9203, "step": 2729 }, { "epoch": 0.21, "learning_rate": 0.00029622089510076925, "loss": 1.9681, "step": 2730 }, { "epoch": 0.21, "learning_rate": 0.00029621813771363927, "loss": 1.9432, "step": 2731 }, { "epoch": 0.21, "learning_rate": 0.00029621537933376883, "loss": 1.9112, "step": 2732 }, { "epoch": 0.22, "learning_rate": 0.00029621261996117665, "loss": 1.9484, "step": 2733 }, { "epoch": 0.22, "learning_rate": 0.0002962098595958815, "loss": 1.9799, "step": 2734 }, { "epoch": 0.22, "learning_rate": 0.00029620709823790207, "loss": 1.973, "step": 2735 }, { "epoch": 0.22, "learning_rate": 0.0002962043358872571, "loss": 1.9898, "step": 2736 }, { "epoch": 0.22, "learning_rate": 0.00029620157254396537, "loss": 1.9215, "step": 2737 }, { "epoch": 0.22, "learning_rate": 0.0002961988082080457, "loss": 1.9124, "step": 2738 }, { "epoch": 0.22, "learning_rate": 0.0002961960428795167, "loss": 1.9627, "step": 2739 }, { "epoch": 0.22, "learning_rate": 0.0002961932765583973, "loss": 1.9286, "step": 2740 }, { "epoch": 0.22, "learning_rate": 0.00029619050924470624, "loss": 1.9117, "step": 2741 }, { "epoch": 0.22, "learning_rate": 0.0002961877409384623, "loss": 1.8861, "step": 2742 }, { "epoch": 0.22, "learning_rate": 0.00029618497163968425, "loss": 1.9358, "step": 2743 }, { "epoch": 0.22, "learning_rate": 0.0002961822013483909, "loss": 1.9603, "step": 2744 }, { "epoch": 0.22, "learning_rate": 0.0002961794300646011, "loss": 1.968, "step": 2745 }, { "epoch": 0.22, "learning_rate": 0.0002961766577883336, "loss": 1.9344, "step": 2746 }, { "epoch": 0.22, "learning_rate": 0.00029617388451960735, "loss": 1.943, "step": 2747 }, { "epoch": 0.22, "learning_rate": 0.00029617111025844107, "loss": 1.9665, "step": 2748 }, { "epoch": 0.22, "learning_rate": 0.0002961683350048536, "loss": 1.9504, "step": 2749 }, { "epoch": 0.22, "learning_rate": 0.00029616555875886376, "loss": 1.9273, "step": 2750 }, { "epoch": 0.22, "learning_rate": 0.00029616278152049045, "loss": 1.9235, "step": 2751 }, { "epoch": 0.22, "learning_rate": 0.0002961600032897525, "loss": 1.9095, "step": 2752 }, { "epoch": 0.22, "learning_rate": 0.0002961572240666688, "loss": 2.0046, "step": 2753 }, { "epoch": 0.22, "learning_rate": 0.0002961544438512582, "loss": 1.9449, "step": 2754 }, { "epoch": 0.22, "learning_rate": 0.00029615166264353957, "loss": 1.9432, "step": 2755 }, { "epoch": 0.22, "learning_rate": 0.00029614888044353187, "loss": 1.9617, "step": 2756 }, { "epoch": 0.22, "learning_rate": 0.0002961460972512539, "loss": 1.9593, "step": 2757 }, { "epoch": 0.22, "learning_rate": 0.0002961433130667245, "loss": 1.8817, "step": 2758 }, { "epoch": 0.22, "learning_rate": 0.0002961405278899627, "loss": 1.9769, "step": 2759 }, { "epoch": 0.22, "learning_rate": 0.0002961377417209874, "loss": 1.9047, "step": 2760 }, { "epoch": 0.22, "learning_rate": 0.00029613495455981746, "loss": 1.96, "step": 2761 }, { "epoch": 0.22, "learning_rate": 0.00029613216640647183, "loss": 1.9076, "step": 2762 }, { "epoch": 0.22, "learning_rate": 0.0002961293772609694, "loss": 1.9779, "step": 2763 }, { "epoch": 0.22, "learning_rate": 0.00029612658712332914, "loss": 1.9608, "step": 2764 }, { "epoch": 0.22, "learning_rate": 0.00029612379599357, "loss": 1.9472, "step": 2765 }, { "epoch": 0.22, "learning_rate": 0.00029612100387171094, "loss": 1.9202, "step": 2766 }, { "epoch": 0.22, "learning_rate": 0.0002961182107577709, "loss": 1.9697, "step": 2767 }, { "epoch": 0.22, "learning_rate": 0.00029611541665176887, "loss": 1.958, "step": 2768 }, { "epoch": 0.22, "learning_rate": 0.0002961126215537237, "loss": 1.9135, "step": 2769 }, { "epoch": 0.22, "learning_rate": 0.00029610982546365454, "loss": 1.9459, "step": 2770 }, { "epoch": 0.22, "learning_rate": 0.0002961070283815803, "loss": 1.9444, "step": 2771 }, { "epoch": 0.22, "learning_rate": 0.0002961042303075199, "loss": 1.9797, "step": 2772 }, { "epoch": 0.22, "learning_rate": 0.00029610143124149244, "loss": 2.0228, "step": 2773 }, { "epoch": 0.22, "learning_rate": 0.0002960986311835169, "loss": 1.9803, "step": 2774 }, { "epoch": 0.22, "learning_rate": 0.0002960958301336123, "loss": 1.9815, "step": 2775 }, { "epoch": 0.22, "learning_rate": 0.0002960930280917976, "loss": 1.9171, "step": 2776 }, { "epoch": 0.22, "learning_rate": 0.00029609022505809184, "loss": 1.947, "step": 2777 }, { "epoch": 0.22, "learning_rate": 0.0002960874210325141, "loss": 1.9437, "step": 2778 }, { "epoch": 0.22, "learning_rate": 0.00029608461601508335, "loss": 2.0045, "step": 2779 }, { "epoch": 0.22, "learning_rate": 0.0002960818100058188, "loss": 1.8615, "step": 2780 }, { "epoch": 0.22, "learning_rate": 0.00029607900300473923, "loss": 1.9953, "step": 2781 }, { "epoch": 0.22, "learning_rate": 0.0002960761950118639, "loss": 1.9401, "step": 2782 }, { "epoch": 0.22, "learning_rate": 0.0002960733860272118, "loss": 1.8921, "step": 2783 }, { "epoch": 0.22, "learning_rate": 0.00029607057605080206, "loss": 1.9349, "step": 2784 }, { "epoch": 0.22, "learning_rate": 0.0002960677650826537, "loss": 1.9544, "step": 2785 }, { "epoch": 0.22, "learning_rate": 0.0002960649531227858, "loss": 2.0052, "step": 2786 }, { "epoch": 0.22, "learning_rate": 0.0002960621401712175, "loss": 1.9634, "step": 2787 }, { "epoch": 0.22, "learning_rate": 0.00029605932622796786, "loss": 1.9421, "step": 2788 }, { "epoch": 0.22, "learning_rate": 0.00029605651129305596, "loss": 1.9888, "step": 2789 }, { "epoch": 0.22, "learning_rate": 0.000296053695366501, "loss": 1.9276, "step": 2790 }, { "epoch": 0.22, "learning_rate": 0.000296050878448322, "loss": 1.9866, "step": 2791 }, { "epoch": 0.22, "learning_rate": 0.0002960480605385382, "loss": 1.982, "step": 2792 }, { "epoch": 0.22, "learning_rate": 0.0002960452416371686, "loss": 1.9358, "step": 2793 }, { "epoch": 0.22, "learning_rate": 0.00029604242174423247, "loss": 1.9882, "step": 2794 }, { "epoch": 0.22, "learning_rate": 0.00029603960085974884, "loss": 1.9659, "step": 2795 }, { "epoch": 0.22, "learning_rate": 0.0002960367789837369, "loss": 1.886, "step": 2796 }, { "epoch": 0.22, "learning_rate": 0.00029603395611621584, "loss": 1.8837, "step": 2797 }, { "epoch": 0.22, "learning_rate": 0.00029603113225720485, "loss": 1.9824, "step": 2798 }, { "epoch": 0.22, "learning_rate": 0.000296028307406723, "loss": 1.9849, "step": 2799 }, { "epoch": 0.22, "learning_rate": 0.00029602548156478956, "loss": 1.9455, "step": 2800 }, { "epoch": 0.22, "learning_rate": 0.00029602265473142365, "loss": 1.8753, "step": 2801 }, { "epoch": 0.22, "learning_rate": 0.0002960198269066445, "loss": 1.959, "step": 2802 }, { "epoch": 0.22, "learning_rate": 0.00029601699809047135, "loss": 1.9752, "step": 2803 }, { "epoch": 0.22, "learning_rate": 0.00029601416828292334, "loss": 1.9652, "step": 2804 }, { "epoch": 0.22, "learning_rate": 0.0002960113374840197, "loss": 1.9862, "step": 2805 }, { "epoch": 0.22, "learning_rate": 0.00029600850569377966, "loss": 1.9705, "step": 2806 }, { "epoch": 0.22, "learning_rate": 0.0002960056729122224, "loss": 1.9454, "step": 2807 }, { "epoch": 0.22, "learning_rate": 0.0002960028391393672, "loss": 1.8944, "step": 2808 }, { "epoch": 0.22, "learning_rate": 0.00029600000437523334, "loss": 1.9891, "step": 2809 }, { "epoch": 0.22, "learning_rate": 0.00029599716861984003, "loss": 1.9916, "step": 2810 }, { "epoch": 0.22, "learning_rate": 0.0002959943318732065, "loss": 1.99, "step": 2811 }, { "epoch": 0.22, "learning_rate": 0.000295991494135352, "loss": 1.9606, "step": 2812 }, { "epoch": 0.22, "learning_rate": 0.0002959886554062958, "loss": 1.9074, "step": 2813 }, { "epoch": 0.22, "learning_rate": 0.00029598581568605724, "loss": 2.0124, "step": 2814 }, { "epoch": 0.22, "learning_rate": 0.0002959829749746555, "loss": 1.9879, "step": 2815 }, { "epoch": 0.22, "learning_rate": 0.00029598013327211, "loss": 1.9039, "step": 2816 }, { "epoch": 0.22, "learning_rate": 0.0002959772905784399, "loss": 1.9466, "step": 2817 }, { "epoch": 0.22, "learning_rate": 0.0002959744468936645, "loss": 1.9618, "step": 2818 }, { "epoch": 0.22, "learning_rate": 0.00029597160221780326, "loss": 1.9725, "step": 2819 }, { "epoch": 0.22, "learning_rate": 0.00029596875655087536, "loss": 1.9678, "step": 2820 }, { "epoch": 0.22, "learning_rate": 0.00029596590989290015, "loss": 1.9794, "step": 2821 }, { "epoch": 0.22, "learning_rate": 0.00029596306224389694, "loss": 1.9197, "step": 2822 }, { "epoch": 0.22, "learning_rate": 0.00029596021360388513, "loss": 1.9384, "step": 2823 }, { "epoch": 0.22, "learning_rate": 0.00029595736397288396, "loss": 1.9644, "step": 2824 }, { "epoch": 0.22, "learning_rate": 0.0002959545133509129, "loss": 1.9516, "step": 2825 }, { "epoch": 0.22, "learning_rate": 0.0002959516617379912, "loss": 1.9611, "step": 2826 }, { "epoch": 0.22, "learning_rate": 0.00029594880913413825, "loss": 1.9323, "step": 2827 }, { "epoch": 0.22, "learning_rate": 0.00029594595553937347, "loss": 1.8608, "step": 2828 }, { "epoch": 0.22, "learning_rate": 0.00029594310095371615, "loss": 1.9878, "step": 2829 }, { "epoch": 0.22, "learning_rate": 0.0002959402453771857, "loss": 1.9338, "step": 2830 }, { "epoch": 0.22, "learning_rate": 0.0002959373888098016, "loss": 1.9217, "step": 2831 }, { "epoch": 0.22, "learning_rate": 0.0002959345312515831, "loss": 1.9671, "step": 2832 }, { "epoch": 0.22, "learning_rate": 0.0002959316727025497, "loss": 1.9832, "step": 2833 }, { "epoch": 0.22, "learning_rate": 0.00029592881316272074, "loss": 1.9989, "step": 2834 }, { "epoch": 0.22, "learning_rate": 0.0002959259526321157, "loss": 1.9054, "step": 2835 }, { "epoch": 0.22, "learning_rate": 0.00029592309111075394, "loss": 2.0174, "step": 2836 }, { "epoch": 0.22, "learning_rate": 0.00029592022859865495, "loss": 1.9607, "step": 2837 }, { "epoch": 0.22, "learning_rate": 0.0002959173650958381, "loss": 1.9148, "step": 2838 }, { "epoch": 0.22, "learning_rate": 0.0002959145006023229, "loss": 1.9194, "step": 2839 }, { "epoch": 0.22, "learning_rate": 0.0002959116351181287, "loss": 1.9897, "step": 2840 }, { "epoch": 0.22, "learning_rate": 0.0002959087686432751, "loss": 1.94, "step": 2841 }, { "epoch": 0.22, "learning_rate": 0.00029590590117778144, "loss": 1.9287, "step": 2842 }, { "epoch": 0.22, "learning_rate": 0.0002959030327216672, "loss": 1.9862, "step": 2843 }, { "epoch": 0.22, "learning_rate": 0.0002959001632749519, "loss": 1.944, "step": 2844 }, { "epoch": 0.22, "learning_rate": 0.00029589729283765505, "loss": 1.9163, "step": 2845 }, { "epoch": 0.22, "learning_rate": 0.00029589442140979605, "loss": 1.9758, "step": 2846 }, { "epoch": 0.22, "learning_rate": 0.0002958915489913945, "loss": 1.9402, "step": 2847 }, { "epoch": 0.22, "learning_rate": 0.0002958886755824698, "loss": 1.9588, "step": 2848 }, { "epoch": 0.22, "learning_rate": 0.0002958858011830415, "loss": 1.9638, "step": 2849 }, { "epoch": 0.22, "learning_rate": 0.0002958829257931291, "loss": 1.9488, "step": 2850 }, { "epoch": 0.22, "learning_rate": 0.0002958800494127521, "loss": 1.8947, "step": 2851 }, { "epoch": 0.22, "learning_rate": 0.0002958771720419302, "loss": 1.8807, "step": 2852 }, { "epoch": 0.22, "learning_rate": 0.0002958742936806827, "loss": 1.9654, "step": 2853 }, { "epoch": 0.22, "learning_rate": 0.00029587141432902927, "loss": 1.9761, "step": 2854 }, { "epoch": 0.22, "learning_rate": 0.00029586853398698947, "loss": 1.9502, "step": 2855 }, { "epoch": 0.22, "learning_rate": 0.00029586565265458275, "loss": 1.9149, "step": 2856 }, { "epoch": 0.22, "learning_rate": 0.00029586277033182874, "loss": 1.9327, "step": 2857 }, { "epoch": 0.22, "learning_rate": 0.00029585988701874707, "loss": 1.9157, "step": 2858 }, { "epoch": 0.22, "learning_rate": 0.00029585700271535725, "loss": 2.0089, "step": 2859 }, { "epoch": 0.23, "learning_rate": 0.0002958541174216789, "loss": 1.9701, "step": 2860 }, { "epoch": 0.23, "learning_rate": 0.00029585123113773154, "loss": 1.9006, "step": 2861 }, { "epoch": 0.23, "learning_rate": 0.0002958483438635348, "loss": 1.8724, "step": 2862 }, { "epoch": 0.23, "learning_rate": 0.0002958454555991083, "loss": 1.9195, "step": 2863 }, { "epoch": 0.23, "learning_rate": 0.00029584256634447164, "loss": 1.9212, "step": 2864 }, { "epoch": 0.23, "learning_rate": 0.0002958396760996444, "loss": 1.9867, "step": 2865 }, { "epoch": 0.23, "learning_rate": 0.00029583678486464637, "loss": 1.95, "step": 2866 }, { "epoch": 0.23, "learning_rate": 0.0002958338926394969, "loss": 1.9435, "step": 2867 }, { "epoch": 0.23, "learning_rate": 0.0002958309994242159, "loss": 1.9624, "step": 2868 }, { "epoch": 0.23, "learning_rate": 0.0002958281052188228, "loss": 1.9409, "step": 2869 }, { "epoch": 0.23, "learning_rate": 0.00029582521002333737, "loss": 1.8945, "step": 2870 }, { "epoch": 0.23, "learning_rate": 0.0002958223138377792, "loss": 1.8976, "step": 2871 }, { "epoch": 0.23, "learning_rate": 0.00029581941666216805, "loss": 1.9708, "step": 2872 }, { "epoch": 0.23, "learning_rate": 0.0002958165184965235, "loss": 1.9649, "step": 2873 }, { "epoch": 0.23, "learning_rate": 0.0002958136193408653, "loss": 1.9935, "step": 2874 }, { "epoch": 0.23, "learning_rate": 0.000295810719195213, "loss": 1.965, "step": 2875 }, { "epoch": 0.23, "learning_rate": 0.00029580781805958647, "loss": 1.9769, "step": 2876 }, { "epoch": 0.23, "learning_rate": 0.0002958049159340053, "loss": 1.9395, "step": 2877 }, { "epoch": 0.23, "learning_rate": 0.0002958020128184892, "loss": 1.9522, "step": 2878 }, { "epoch": 0.23, "learning_rate": 0.0002957991087130579, "loss": 1.9256, "step": 2879 }, { "epoch": 0.23, "learning_rate": 0.0002957962036177311, "loss": 1.9144, "step": 2880 }, { "epoch": 0.23, "learning_rate": 0.00029579329753252854, "loss": 1.8503, "step": 2881 }, { "epoch": 0.23, "learning_rate": 0.00029579039045746994, "loss": 1.8861, "step": 2882 }, { "epoch": 0.23, "learning_rate": 0.00029578748239257504, "loss": 1.9715, "step": 2883 }, { "epoch": 0.23, "learning_rate": 0.00029578457333786357, "loss": 1.9416, "step": 2884 }, { "epoch": 0.23, "learning_rate": 0.00029578166329335536, "loss": 1.9692, "step": 2885 }, { "epoch": 0.23, "learning_rate": 0.00029577875225907004, "loss": 1.9936, "step": 2886 }, { "epoch": 0.23, "learning_rate": 0.0002957758402350275, "loss": 1.9477, "step": 2887 }, { "epoch": 0.23, "learning_rate": 0.00029577292722124735, "loss": 1.949, "step": 2888 }, { "epoch": 0.23, "learning_rate": 0.0002957700132177496, "loss": 1.9662, "step": 2889 }, { "epoch": 0.23, "learning_rate": 0.0002957670982245538, "loss": 1.9964, "step": 2890 }, { "epoch": 0.23, "learning_rate": 0.00029576418224167987, "loss": 1.9044, "step": 2891 }, { "epoch": 0.23, "learning_rate": 0.00029576126526914765, "loss": 1.9292, "step": 2892 }, { "epoch": 0.23, "learning_rate": 0.0002957583473069768, "loss": 1.9478, "step": 2893 }, { "epoch": 0.23, "learning_rate": 0.0002957554283551872, "loss": 1.9905, "step": 2894 }, { "epoch": 0.23, "learning_rate": 0.00029575250841379873, "loss": 1.9148, "step": 2895 }, { "epoch": 0.23, "learning_rate": 0.00029574958748283114, "loss": 1.9386, "step": 2896 }, { "epoch": 0.23, "learning_rate": 0.00029574666556230427, "loss": 1.9857, "step": 2897 }, { "epoch": 0.23, "learning_rate": 0.000295743742652238, "loss": 1.9475, "step": 2898 }, { "epoch": 0.23, "learning_rate": 0.0002957408187526521, "loss": 1.9442, "step": 2899 }, { "epoch": 0.23, "learning_rate": 0.00029573789386356646, "loss": 1.9901, "step": 2900 }, { "epoch": 0.23, "learning_rate": 0.000295734967985001, "loss": 1.9528, "step": 2901 }, { "epoch": 0.23, "learning_rate": 0.0002957320411169755, "loss": 1.9867, "step": 2902 }, { "epoch": 0.23, "learning_rate": 0.0002957291132595099, "loss": 1.9629, "step": 2903 }, { "epoch": 0.23, "learning_rate": 0.000295726184412624, "loss": 1.9558, "step": 2904 }, { "epoch": 0.23, "learning_rate": 0.0002957232545763377, "loss": 1.9334, "step": 2905 }, { "epoch": 0.23, "learning_rate": 0.000295720323750671, "loss": 1.9457, "step": 2906 }, { "epoch": 0.23, "learning_rate": 0.00029571739193564364, "loss": 1.9164, "step": 2907 }, { "epoch": 0.23, "learning_rate": 0.0002957144591312756, "loss": 1.9589, "step": 2908 }, { "epoch": 0.23, "learning_rate": 0.00029571152533758684, "loss": 1.9847, "step": 2909 }, { "epoch": 0.23, "learning_rate": 0.00029570859055459724, "loss": 1.9456, "step": 2910 }, { "epoch": 0.23, "learning_rate": 0.0002957056547823267, "loss": 1.9631, "step": 2911 }, { "epoch": 0.23, "learning_rate": 0.0002957027180207952, "loss": 1.9366, "step": 2912 }, { "epoch": 0.23, "learning_rate": 0.00029569978027002255, "loss": 1.9959, "step": 2913 }, { "epoch": 0.23, "learning_rate": 0.0002956968415300289, "loss": 1.9089, "step": 2914 }, { "epoch": 0.23, "learning_rate": 0.00029569390180083407, "loss": 1.9168, "step": 2915 }, { "epoch": 0.23, "learning_rate": 0.000295690961082458, "loss": 1.9529, "step": 2916 }, { "epoch": 0.23, "learning_rate": 0.0002956880193749208, "loss": 1.9486, "step": 2917 }, { "epoch": 0.23, "learning_rate": 0.0002956850766782423, "loss": 1.9338, "step": 2918 }, { "epoch": 0.23, "learning_rate": 0.00029568213299244244, "loss": 1.9291, "step": 2919 }, { "epoch": 0.23, "learning_rate": 0.0002956791883175414, "loss": 1.9028, "step": 2920 }, { "epoch": 0.23, "learning_rate": 0.00029567624265355906, "loss": 1.9651, "step": 2921 }, { "epoch": 0.23, "learning_rate": 0.00029567329600051537, "loss": 1.9442, "step": 2922 }, { "epoch": 0.23, "learning_rate": 0.0002956703483584304, "loss": 1.9134, "step": 2923 }, { "epoch": 0.23, "learning_rate": 0.00029566739972732416, "loss": 1.8906, "step": 2924 }, { "epoch": 0.23, "learning_rate": 0.0002956644501072167, "loss": 1.9333, "step": 2925 }, { "epoch": 0.23, "learning_rate": 0.00029566149949812793, "loss": 1.9416, "step": 2926 }, { "epoch": 0.23, "learning_rate": 0.00029565854790007803, "loss": 1.9291, "step": 2927 }, { "epoch": 0.23, "learning_rate": 0.00029565559531308694, "loss": 1.9494, "step": 2928 }, { "epoch": 0.23, "learning_rate": 0.0002956526417371747, "loss": 1.9343, "step": 2929 }, { "epoch": 0.23, "learning_rate": 0.0002956496871723615, "loss": 1.9191, "step": 2930 }, { "epoch": 0.23, "learning_rate": 0.00029564673161866723, "loss": 1.9258, "step": 2931 }, { "epoch": 0.23, "learning_rate": 0.000295643775076112, "loss": 1.9419, "step": 2932 }, { "epoch": 0.23, "learning_rate": 0.00029564081754471596, "loss": 1.9564, "step": 2933 }, { "epoch": 0.23, "learning_rate": 0.00029563785902449917, "loss": 1.9338, "step": 2934 }, { "epoch": 0.23, "learning_rate": 0.00029563489951548165, "loss": 1.8527, "step": 2935 }, { "epoch": 0.23, "learning_rate": 0.0002956319390176835, "loss": 1.9541, "step": 2936 }, { "epoch": 0.23, "learning_rate": 0.0002956289775311249, "loss": 1.9187, "step": 2937 }, { "epoch": 0.23, "learning_rate": 0.0002956260150558259, "loss": 1.885, "step": 2938 }, { "epoch": 0.23, "learning_rate": 0.0002956230515918066, "loss": 1.8933, "step": 2939 }, { "epoch": 0.23, "learning_rate": 0.00029562008713908714, "loss": 1.9181, "step": 2940 }, { "epoch": 0.23, "learning_rate": 0.00029561712169768765, "loss": 1.9164, "step": 2941 }, { "epoch": 0.23, "learning_rate": 0.00029561415526762827, "loss": 1.9301, "step": 2942 }, { "epoch": 0.23, "learning_rate": 0.00029561118784892916, "loss": 1.9397, "step": 2943 }, { "epoch": 0.23, "learning_rate": 0.0002956082194416104, "loss": 1.9171, "step": 2944 }, { "epoch": 0.23, "learning_rate": 0.00029560525004569216, "loss": 1.9119, "step": 2945 }, { "epoch": 0.23, "learning_rate": 0.00029560227966119465, "loss": 1.9443, "step": 2946 }, { "epoch": 0.23, "learning_rate": 0.0002955993082881381, "loss": 1.9676, "step": 2947 }, { "epoch": 0.23, "learning_rate": 0.00029559633592654246, "loss": 1.9644, "step": 2948 }, { "epoch": 0.23, "learning_rate": 0.0002955933625764281, "loss": 1.9491, "step": 2949 }, { "epoch": 0.23, "learning_rate": 0.00029559038823781514, "loss": 1.9598, "step": 2950 }, { "epoch": 0.23, "learning_rate": 0.0002955874129107238, "loss": 1.8858, "step": 2951 }, { "epoch": 0.23, "learning_rate": 0.0002955844365951743, "loss": 1.9092, "step": 2952 }, { "epoch": 0.23, "learning_rate": 0.00029558145929118674, "loss": 2.0315, "step": 2953 }, { "epoch": 0.23, "learning_rate": 0.00029557848099878145, "loss": 1.9144, "step": 2954 }, { "epoch": 0.23, "learning_rate": 0.00029557550171797865, "loss": 1.9649, "step": 2955 }, { "epoch": 0.23, "learning_rate": 0.0002955725214487985, "loss": 1.9522, "step": 2956 }, { "epoch": 0.23, "learning_rate": 0.0002955695401912612, "loss": 1.9428, "step": 2957 }, { "epoch": 0.23, "learning_rate": 0.00029556655794538714, "loss": 1.9235, "step": 2958 }, { "epoch": 0.23, "learning_rate": 0.00029556357471119643, "loss": 1.9562, "step": 2959 }, { "epoch": 0.23, "learning_rate": 0.0002955605904887094, "loss": 1.8647, "step": 2960 }, { "epoch": 0.23, "learning_rate": 0.0002955576052779463, "loss": 1.8978, "step": 2961 }, { "epoch": 0.23, "learning_rate": 0.00029555461907892735, "loss": 1.9983, "step": 2962 }, { "epoch": 0.23, "learning_rate": 0.0002955516318916729, "loss": 1.9125, "step": 2963 }, { "epoch": 0.23, "learning_rate": 0.0002955486437162032, "loss": 1.9381, "step": 2964 }, { "epoch": 0.23, "learning_rate": 0.00029554565455253845, "loss": 1.9002, "step": 2965 }, { "epoch": 0.23, "learning_rate": 0.0002955426644006991, "loss": 1.9093, "step": 2966 }, { "epoch": 0.23, "learning_rate": 0.00029553967326070537, "loss": 1.9211, "step": 2967 }, { "epoch": 0.23, "learning_rate": 0.00029553668113257753, "loss": 2.0067, "step": 2968 }, { "epoch": 0.23, "learning_rate": 0.00029553368801633597, "loss": 1.9362, "step": 2969 }, { "epoch": 0.23, "learning_rate": 0.000295530693912001, "loss": 1.9031, "step": 2970 }, { "epoch": 0.23, "learning_rate": 0.00029552769881959287, "loss": 1.8829, "step": 2971 }, { "epoch": 0.23, "learning_rate": 0.000295524702739132, "loss": 1.9544, "step": 2972 }, { "epoch": 0.23, "learning_rate": 0.0002955217056706387, "loss": 1.8732, "step": 2973 }, { "epoch": 0.23, "learning_rate": 0.00029551870761413334, "loss": 1.9583, "step": 2974 }, { "epoch": 0.23, "learning_rate": 0.0002955157085696363, "loss": 1.9336, "step": 2975 }, { "epoch": 0.23, "learning_rate": 0.0002955127085371678, "loss": 1.9872, "step": 2976 }, { "epoch": 0.23, "learning_rate": 0.0002955097075167484, "loss": 1.9413, "step": 2977 }, { "epoch": 0.23, "learning_rate": 0.00029550670550839835, "loss": 1.8951, "step": 2978 }, { "epoch": 0.23, "learning_rate": 0.0002955037025121381, "loss": 1.9037, "step": 2979 }, { "epoch": 0.23, "learning_rate": 0.000295500698527988, "loss": 1.904, "step": 2980 }, { "epoch": 0.23, "learning_rate": 0.0002954976935559684, "loss": 1.9517, "step": 2981 }, { "epoch": 0.23, "learning_rate": 0.0002954946875960998, "loss": 1.9412, "step": 2982 }, { "epoch": 0.23, "learning_rate": 0.00029549168064840254, "loss": 1.9772, "step": 2983 }, { "epoch": 0.23, "learning_rate": 0.000295488672712897, "loss": 1.9484, "step": 2984 }, { "epoch": 0.23, "learning_rate": 0.00029548566378960375, "loss": 1.9457, "step": 2985 }, { "epoch": 0.23, "learning_rate": 0.00029548265387854307, "loss": 1.9658, "step": 2986 }, { "epoch": 0.24, "learning_rate": 0.0002954796429797355, "loss": 1.9219, "step": 2987 }, { "epoch": 0.24, "learning_rate": 0.00029547663109320143, "loss": 1.9363, "step": 2988 }, { "epoch": 0.24, "learning_rate": 0.00029547361821896125, "loss": 1.9417, "step": 2989 }, { "epoch": 0.24, "learning_rate": 0.00029547060435703554, "loss": 1.935, "step": 2990 }, { "epoch": 0.24, "learning_rate": 0.0002954675895074447, "loss": 1.9089, "step": 2991 }, { "epoch": 0.24, "learning_rate": 0.0002954645736702092, "loss": 1.9596, "step": 2992 }, { "epoch": 0.24, "learning_rate": 0.0002954615568453495, "loss": 1.9096, "step": 2993 }, { "epoch": 0.24, "learning_rate": 0.0002954585390328861, "loss": 1.8888, "step": 2994 }, { "epoch": 0.24, "learning_rate": 0.0002954555202328395, "loss": 1.9725, "step": 2995 }, { "epoch": 0.24, "learning_rate": 0.00029545250044523026, "loss": 1.8987, "step": 2996 }, { "epoch": 0.24, "learning_rate": 0.0002954494796700787, "loss": 1.9273, "step": 2997 }, { "epoch": 0.24, "learning_rate": 0.0002954464579074055, "loss": 1.9277, "step": 2998 }, { "epoch": 0.24, "learning_rate": 0.00029544343515723116, "loss": 1.9546, "step": 2999 }, { "epoch": 0.24, "learning_rate": 0.0002954404114195761, "loss": 1.9802, "step": 3000 }, { "epoch": 0.24, "learning_rate": 0.00029543738669446086, "loss": 1.9789, "step": 3001 }, { "epoch": 0.24, "learning_rate": 0.00029543436098190606, "loss": 1.9029, "step": 3002 }, { "epoch": 0.24, "learning_rate": 0.00029543133428193224, "loss": 1.9344, "step": 3003 }, { "epoch": 0.24, "learning_rate": 0.0002954283065945599, "loss": 1.911, "step": 3004 }, { "epoch": 0.24, "learning_rate": 0.0002954252779198096, "loss": 1.9353, "step": 3005 }, { "epoch": 0.24, "learning_rate": 0.0002954222482577019, "loss": 1.9148, "step": 3006 }, { "epoch": 0.24, "learning_rate": 0.00029541921760825737, "loss": 1.9345, "step": 3007 }, { "epoch": 0.24, "learning_rate": 0.00029541618597149667, "loss": 1.908, "step": 3008 }, { "epoch": 0.24, "learning_rate": 0.00029541315334744023, "loss": 1.9111, "step": 3009 }, { "epoch": 0.24, "learning_rate": 0.0002954101197361088, "loss": 1.881, "step": 3010 }, { "epoch": 0.24, "learning_rate": 0.00029540708513752287, "loss": 1.9059, "step": 3011 }, { "epoch": 0.24, "learning_rate": 0.0002954040495517031, "loss": 1.9593, "step": 3012 }, { "epoch": 0.24, "learning_rate": 0.00029540101297867005, "loss": 1.9005, "step": 3013 }, { "epoch": 0.24, "learning_rate": 0.00029539797541844434, "loss": 1.868, "step": 3014 }, { "epoch": 0.24, "learning_rate": 0.00029539493687104665, "loss": 1.8858, "step": 3015 }, { "epoch": 0.24, "learning_rate": 0.0002953918973364976, "loss": 1.9514, "step": 3016 }, { "epoch": 0.24, "learning_rate": 0.0002953888568148177, "loss": 1.9132, "step": 3017 }, { "epoch": 0.24, "learning_rate": 0.0002953858153060278, "loss": 1.9216, "step": 3018 }, { "epoch": 0.24, "learning_rate": 0.00029538277281014835, "loss": 1.8929, "step": 3019 }, { "epoch": 0.24, "learning_rate": 0.00029537972932720016, "loss": 1.9299, "step": 3020 }, { "epoch": 0.24, "learning_rate": 0.00029537668485720385, "loss": 1.9799, "step": 3021 }, { "epoch": 0.24, "learning_rate": 0.00029537363940018, "loss": 1.9453, "step": 3022 }, { "epoch": 0.24, "learning_rate": 0.00029537059295614944, "loss": 1.9296, "step": 3023 }, { "epoch": 0.24, "learning_rate": 0.0002953675455251328, "loss": 1.9567, "step": 3024 }, { "epoch": 0.24, "learning_rate": 0.0002953644971071507, "loss": 1.9136, "step": 3025 }, { "epoch": 0.24, "learning_rate": 0.0002953614477022239, "loss": 1.8654, "step": 3026 }, { "epoch": 0.24, "learning_rate": 0.000295358397310373, "loss": 1.8893, "step": 3027 }, { "epoch": 0.24, "learning_rate": 0.0002953553459316189, "loss": 1.9104, "step": 3028 }, { "epoch": 0.24, "learning_rate": 0.00029535229356598215, "loss": 1.9047, "step": 3029 }, { "epoch": 0.24, "learning_rate": 0.0002953492402134836, "loss": 1.949, "step": 3030 }, { "epoch": 0.24, "learning_rate": 0.00029534618587414386, "loss": 1.8882, "step": 3031 }, { "epoch": 0.24, "learning_rate": 0.00029534313054798377, "loss": 1.9409, "step": 3032 }, { "epoch": 0.24, "learning_rate": 0.000295340074235024, "loss": 1.9173, "step": 3033 }, { "epoch": 0.24, "learning_rate": 0.0002953370169352854, "loss": 1.9195, "step": 3034 }, { "epoch": 0.24, "learning_rate": 0.00029533395864878855, "loss": 1.9158, "step": 3035 }, { "epoch": 0.24, "learning_rate": 0.0002953308993755544, "loss": 1.9091, "step": 3036 }, { "epoch": 0.24, "learning_rate": 0.0002953278391156036, "loss": 1.9596, "step": 3037 }, { "epoch": 0.24, "learning_rate": 0.00029532477786895704, "loss": 1.9425, "step": 3038 }, { "epoch": 0.24, "learning_rate": 0.00029532171563563536, "loss": 1.9926, "step": 3039 }, { "epoch": 0.24, "learning_rate": 0.00029531865241565945, "loss": 1.9387, "step": 3040 }, { "epoch": 0.24, "learning_rate": 0.0002953155882090501, "loss": 1.9674, "step": 3041 }, { "epoch": 0.24, "learning_rate": 0.00029531252301582807, "loss": 1.9419, "step": 3042 }, { "epoch": 0.24, "learning_rate": 0.0002953094568360142, "loss": 1.9422, "step": 3043 }, { "epoch": 0.24, "learning_rate": 0.0002953063896696293, "loss": 1.9456, "step": 3044 }, { "epoch": 0.24, "learning_rate": 0.00029530332151669425, "loss": 1.9313, "step": 3045 }, { "epoch": 0.24, "learning_rate": 0.0002953002523772298, "loss": 1.9425, "step": 3046 }, { "epoch": 0.24, "learning_rate": 0.0002952971822512568, "loss": 1.9205, "step": 3047 }, { "epoch": 0.24, "learning_rate": 0.0002952941111387962, "loss": 1.9096, "step": 3048 }, { "epoch": 0.24, "learning_rate": 0.00029529103903986866, "loss": 1.897, "step": 3049 }, { "epoch": 0.24, "learning_rate": 0.0002952879659544952, "loss": 1.9927, "step": 3050 }, { "epoch": 0.24, "learning_rate": 0.00029528489188269664, "loss": 1.9141, "step": 3051 }, { "epoch": 0.24, "learning_rate": 0.0002952818168244938, "loss": 1.9193, "step": 3052 }, { "epoch": 0.24, "learning_rate": 0.0002952787407799076, "loss": 1.8981, "step": 3053 }, { "epoch": 0.24, "learning_rate": 0.0002952756637489589, "loss": 1.847, "step": 3054 }, { "epoch": 0.24, "learning_rate": 0.0002952725857316687, "loss": 1.909, "step": 3055 }, { "epoch": 0.24, "learning_rate": 0.0002952695067280577, "loss": 1.9687, "step": 3056 }, { "epoch": 0.24, "learning_rate": 0.00029526642673814696, "loss": 1.988, "step": 3057 }, { "epoch": 0.24, "learning_rate": 0.0002952633457619574, "loss": 1.9348, "step": 3058 }, { "epoch": 0.24, "learning_rate": 0.0002952602637995098, "loss": 1.8429, "step": 3059 }, { "epoch": 0.24, "learning_rate": 0.00029525718085082525, "loss": 1.954, "step": 3060 }, { "epoch": 0.24, "learning_rate": 0.00029525409691592456, "loss": 1.8587, "step": 3061 }, { "epoch": 0.24, "learning_rate": 0.0002952510119948287, "loss": 1.8805, "step": 3062 }, { "epoch": 0.24, "learning_rate": 0.00029524792608755864, "loss": 1.9018, "step": 3063 }, { "epoch": 0.24, "learning_rate": 0.0002952448391941353, "loss": 1.915, "step": 3064 }, { "epoch": 0.24, "learning_rate": 0.00029524175131457963, "loss": 1.9796, "step": 3065 }, { "epoch": 0.24, "learning_rate": 0.0002952386624489127, "loss": 1.9062, "step": 3066 }, { "epoch": 0.24, "learning_rate": 0.0002952355725971554, "loss": 1.9412, "step": 3067 }, { "epoch": 0.24, "learning_rate": 0.0002952324817593286, "loss": 1.8909, "step": 3068 }, { "epoch": 0.24, "learning_rate": 0.0002952293899354535, "loss": 1.8896, "step": 3069 }, { "epoch": 0.24, "learning_rate": 0.000295226297125551, "loss": 1.88, "step": 3070 }, { "epoch": 0.24, "learning_rate": 0.00029522320332964197, "loss": 1.9219, "step": 3071 }, { "epoch": 0.24, "learning_rate": 0.0002952201085477476, "loss": 1.9041, "step": 3072 }, { "epoch": 0.24, "learning_rate": 0.0002952170127798888, "loss": 1.9414, "step": 3073 }, { "epoch": 0.24, "learning_rate": 0.0002952139160260867, "loss": 1.8893, "step": 3074 }, { "epoch": 0.24, "learning_rate": 0.0002952108182863622, "loss": 1.9013, "step": 3075 }, { "epoch": 0.24, "learning_rate": 0.0002952077195607363, "loss": 1.8746, "step": 3076 }, { "epoch": 0.24, "learning_rate": 0.00029520461984923024, "loss": 1.9317, "step": 3077 }, { "epoch": 0.24, "learning_rate": 0.00029520151915186487, "loss": 1.9695, "step": 3078 }, { "epoch": 0.24, "learning_rate": 0.00029519841746866135, "loss": 1.9118, "step": 3079 }, { "epoch": 0.24, "learning_rate": 0.00029519531479964067, "loss": 1.9195, "step": 3080 }, { "epoch": 0.24, "learning_rate": 0.00029519221114482396, "loss": 1.9328, "step": 3081 }, { "epoch": 0.24, "learning_rate": 0.00029518910650423225, "loss": 1.9297, "step": 3082 }, { "epoch": 0.24, "learning_rate": 0.00029518600087788665, "loss": 1.8584, "step": 3083 }, { "epoch": 0.24, "learning_rate": 0.00029518289426580817, "loss": 1.8918, "step": 3084 }, { "epoch": 0.24, "learning_rate": 0.000295179786668018, "loss": 1.8839, "step": 3085 }, { "epoch": 0.24, "learning_rate": 0.00029517667808453716, "loss": 1.9493, "step": 3086 }, { "epoch": 0.24, "learning_rate": 0.0002951735685153868, "loss": 1.9459, "step": 3087 }, { "epoch": 0.24, "learning_rate": 0.00029517045796058805, "loss": 1.9873, "step": 3088 }, { "epoch": 0.24, "learning_rate": 0.00029516734642016197, "loss": 1.9028, "step": 3089 }, { "epoch": 0.24, "learning_rate": 0.00029516423389412975, "loss": 1.9675, "step": 3090 }, { "epoch": 0.24, "learning_rate": 0.00029516112038251245, "loss": 1.9186, "step": 3091 }, { "epoch": 0.24, "learning_rate": 0.0002951580058853313, "loss": 1.9536, "step": 3092 }, { "epoch": 0.24, "learning_rate": 0.0002951548904026074, "loss": 1.8689, "step": 3093 }, { "epoch": 0.24, "learning_rate": 0.00029515177393436186, "loss": 1.8927, "step": 3094 }, { "epoch": 0.24, "learning_rate": 0.0002951486564806158, "loss": 1.9158, "step": 3095 }, { "epoch": 0.24, "learning_rate": 0.0002951455380413906, "loss": 1.9138, "step": 3096 }, { "epoch": 0.24, "learning_rate": 0.00029514241861670724, "loss": 1.9913, "step": 3097 }, { "epoch": 0.24, "learning_rate": 0.0002951392982065869, "loss": 1.9204, "step": 3098 }, { "epoch": 0.24, "learning_rate": 0.0002951361768110509, "loss": 1.9286, "step": 3099 }, { "epoch": 0.24, "learning_rate": 0.00029513305443012034, "loss": 1.8494, "step": 3100 }, { "epoch": 0.24, "learning_rate": 0.0002951299310638164, "loss": 1.9179, "step": 3101 }, { "epoch": 0.24, "learning_rate": 0.00029512680671216034, "loss": 1.9152, "step": 3102 }, { "epoch": 0.24, "learning_rate": 0.00029512368137517335, "loss": 1.8952, "step": 3103 }, { "epoch": 0.24, "learning_rate": 0.00029512055505287666, "loss": 1.9642, "step": 3104 }, { "epoch": 0.24, "learning_rate": 0.00029511742774529146, "loss": 1.9724, "step": 3105 }, { "epoch": 0.24, "learning_rate": 0.000295114299452439, "loss": 1.9691, "step": 3106 }, { "epoch": 0.24, "learning_rate": 0.0002951111701743405, "loss": 1.9031, "step": 3107 }, { "epoch": 0.24, "learning_rate": 0.00029510803991101734, "loss": 1.8781, "step": 3108 }, { "epoch": 0.24, "learning_rate": 0.0002951049086624906, "loss": 1.847, "step": 3109 }, { "epoch": 0.24, "learning_rate": 0.0002951017764287816, "loss": 1.9193, "step": 3110 }, { "epoch": 0.24, "learning_rate": 0.00029509864320991164, "loss": 1.9394, "step": 3111 }, { "epoch": 0.24, "learning_rate": 0.00029509550900590193, "loss": 1.8647, "step": 3112 }, { "epoch": 0.24, "learning_rate": 0.0002950923738167738, "loss": 1.9041, "step": 3113 }, { "epoch": 0.25, "learning_rate": 0.0002950892376425485, "loss": 1.9499, "step": 3114 }, { "epoch": 0.25, "learning_rate": 0.00029508610048324733, "loss": 1.908, "step": 3115 }, { "epoch": 0.25, "learning_rate": 0.0002950829623388917, "loss": 1.944, "step": 3116 }, { "epoch": 0.25, "learning_rate": 0.00029507982320950275, "loss": 1.9607, "step": 3117 }, { "epoch": 0.25, "learning_rate": 0.0002950766830951018, "loss": 1.952, "step": 3118 }, { "epoch": 0.25, "learning_rate": 0.00029507354199571033, "loss": 1.8981, "step": 3119 }, { "epoch": 0.25, "learning_rate": 0.00029507039991134957, "loss": 1.9014, "step": 3120 }, { "epoch": 0.25, "learning_rate": 0.0002950672568420408, "loss": 1.8965, "step": 3121 }, { "epoch": 0.25, "learning_rate": 0.00029506411278780545, "loss": 1.9028, "step": 3122 }, { "epoch": 0.25, "learning_rate": 0.00029506096774866477, "loss": 1.9238, "step": 3123 }, { "epoch": 0.25, "learning_rate": 0.00029505782172464025, "loss": 1.8958, "step": 3124 }, { "epoch": 0.25, "learning_rate": 0.0002950546747157531, "loss": 1.9214, "step": 3125 }, { "epoch": 0.25, "learning_rate": 0.0002950515267220248, "loss": 1.9544, "step": 3126 }, { "epoch": 0.25, "learning_rate": 0.00029504837774347665, "loss": 1.9088, "step": 3127 }, { "epoch": 0.25, "learning_rate": 0.00029504522778013006, "loss": 1.8887, "step": 3128 }, { "epoch": 0.25, "learning_rate": 0.00029504207683200644, "loss": 1.8931, "step": 3129 }, { "epoch": 0.25, "learning_rate": 0.00029503892489912714, "loss": 1.9432, "step": 3130 }, { "epoch": 0.25, "learning_rate": 0.00029503577198151357, "loss": 1.8974, "step": 3131 }, { "epoch": 0.25, "learning_rate": 0.00029503261807918715, "loss": 1.8648, "step": 3132 }, { "epoch": 0.25, "learning_rate": 0.0002950294631921693, "loss": 1.8926, "step": 3133 }, { "epoch": 0.25, "learning_rate": 0.00029502630732048144, "loss": 1.8848, "step": 3134 }, { "epoch": 0.25, "learning_rate": 0.00029502315046414494, "loss": 1.8976, "step": 3135 }, { "epoch": 0.25, "learning_rate": 0.0002950199926231814, "loss": 1.9414, "step": 3136 }, { "epoch": 0.25, "learning_rate": 0.000295016833797612, "loss": 1.9216, "step": 3137 }, { "epoch": 0.25, "learning_rate": 0.0002950136739874584, "loss": 1.921, "step": 3138 }, { "epoch": 0.25, "learning_rate": 0.00029501051319274195, "loss": 1.9192, "step": 3139 }, { "epoch": 0.25, "learning_rate": 0.0002950073514134841, "loss": 1.8751, "step": 3140 }, { "epoch": 0.25, "learning_rate": 0.0002950041886497064, "loss": 1.908, "step": 3141 }, { "epoch": 0.25, "learning_rate": 0.00029500102490143034, "loss": 1.8686, "step": 3142 }, { "epoch": 0.25, "learning_rate": 0.00029499786016867725, "loss": 1.9418, "step": 3143 }, { "epoch": 0.25, "learning_rate": 0.0002949946944514687, "loss": 1.9682, "step": 3144 }, { "epoch": 0.25, "learning_rate": 0.00029499152774982624, "loss": 1.8931, "step": 3145 }, { "epoch": 0.25, "learning_rate": 0.0002949883600637713, "loss": 1.9508, "step": 3146 }, { "epoch": 0.25, "learning_rate": 0.0002949851913933254, "loss": 1.9572, "step": 3147 }, { "epoch": 0.25, "learning_rate": 0.0002949820217385101, "loss": 1.9157, "step": 3148 }, { "epoch": 0.25, "learning_rate": 0.00029497885109934686, "loss": 1.9099, "step": 3149 }, { "epoch": 0.25, "learning_rate": 0.0002949756794758572, "loss": 1.855, "step": 3150 }, { "epoch": 0.25, "learning_rate": 0.0002949725068680627, "loss": 1.9448, "step": 3151 }, { "epoch": 0.25, "learning_rate": 0.00029496933327598484, "loss": 1.9213, "step": 3152 }, { "epoch": 0.25, "learning_rate": 0.00029496615869964524, "loss": 1.927, "step": 3153 }, { "epoch": 0.25, "learning_rate": 0.00029496298313906545, "loss": 1.8928, "step": 3154 }, { "epoch": 0.25, "learning_rate": 0.000294959806594267, "loss": 1.888, "step": 3155 }, { "epoch": 0.25, "learning_rate": 0.0002949566290652714, "loss": 1.9317, "step": 3156 }, { "epoch": 0.25, "learning_rate": 0.00029495345055210033, "loss": 1.8719, "step": 3157 }, { "epoch": 0.25, "learning_rate": 0.00029495027105477535, "loss": 1.904, "step": 3158 }, { "epoch": 0.25, "learning_rate": 0.00029494709057331794, "loss": 1.8777, "step": 3159 }, { "epoch": 0.25, "learning_rate": 0.00029494390910774984, "loss": 1.8914, "step": 3160 }, { "epoch": 0.25, "learning_rate": 0.0002949407266580926, "loss": 1.9697, "step": 3161 }, { "epoch": 0.25, "learning_rate": 0.0002949375432243677, "loss": 1.8965, "step": 3162 }, { "epoch": 0.25, "learning_rate": 0.00029493435880659696, "loss": 1.9026, "step": 3163 }, { "epoch": 0.25, "learning_rate": 0.00029493117340480187, "loss": 1.8232, "step": 3164 }, { "epoch": 0.25, "learning_rate": 0.00029492798701900413, "loss": 1.9288, "step": 3165 }, { "epoch": 0.25, "learning_rate": 0.00029492479964922526, "loss": 1.9273, "step": 3166 }, { "epoch": 0.25, "learning_rate": 0.000294921611295487, "loss": 1.9318, "step": 3167 }, { "epoch": 0.25, "learning_rate": 0.00029491842195781106, "loss": 1.9087, "step": 3168 }, { "epoch": 0.25, "learning_rate": 0.0002949152316362189, "loss": 1.8782, "step": 3169 }, { "epoch": 0.25, "learning_rate": 0.0002949120403307324, "loss": 1.9071, "step": 3170 }, { "epoch": 0.25, "learning_rate": 0.000294908848041373, "loss": 1.8867, "step": 3171 }, { "epoch": 0.25, "learning_rate": 0.0002949056547681625, "loss": 1.9326, "step": 3172 }, { "epoch": 0.25, "learning_rate": 0.00029490246051112266, "loss": 1.9377, "step": 3173 }, { "epoch": 0.25, "learning_rate": 0.00029489926527027504, "loss": 1.9129, "step": 3174 }, { "epoch": 0.25, "learning_rate": 0.00029489606904564133, "loss": 1.9018, "step": 3175 }, { "epoch": 0.25, "learning_rate": 0.0002948928718372433, "loss": 1.9011, "step": 3176 }, { "epoch": 0.25, "learning_rate": 0.00029488967364510265, "loss": 1.9105, "step": 3177 }, { "epoch": 0.25, "learning_rate": 0.00029488647446924103, "loss": 1.9082, "step": 3178 }, { "epoch": 0.25, "learning_rate": 0.0002948832743096802, "loss": 1.9626, "step": 3179 }, { "epoch": 0.25, "learning_rate": 0.0002948800731664419, "loss": 1.9482, "step": 3180 }, { "epoch": 0.25, "learning_rate": 0.0002948768710395479, "loss": 1.9301, "step": 3181 }, { "epoch": 0.25, "learning_rate": 0.00029487366792901984, "loss": 1.9821, "step": 3182 }, { "epoch": 0.25, "learning_rate": 0.0002948704638348796, "loss": 1.9031, "step": 3183 }, { "epoch": 0.25, "learning_rate": 0.00029486725875714877, "loss": 1.8373, "step": 3184 }, { "epoch": 0.25, "learning_rate": 0.0002948640526958492, "loss": 1.8805, "step": 3185 }, { "epoch": 0.25, "learning_rate": 0.0002948608456510027, "loss": 1.8826, "step": 3186 }, { "epoch": 0.25, "learning_rate": 0.000294857637622631, "loss": 1.9156, "step": 3187 }, { "epoch": 0.25, "learning_rate": 0.0002948544286107559, "loss": 1.9861, "step": 3188 }, { "epoch": 0.25, "learning_rate": 0.00029485121861539906, "loss": 1.8897, "step": 3189 }, { "epoch": 0.25, "learning_rate": 0.0002948480076365825, "loss": 1.934, "step": 3190 }, { "epoch": 0.25, "learning_rate": 0.0002948447956743278, "loss": 1.9889, "step": 3191 }, { "epoch": 0.25, "learning_rate": 0.00029484158272865695, "loss": 1.8649, "step": 3192 }, { "epoch": 0.25, "learning_rate": 0.0002948383687995917, "loss": 1.8908, "step": 3193 }, { "epoch": 0.25, "learning_rate": 0.00029483515388715374, "loss": 1.9103, "step": 3194 }, { "epoch": 0.25, "learning_rate": 0.0002948319379913651, "loss": 1.9455, "step": 3195 }, { "epoch": 0.25, "learning_rate": 0.0002948287211122475, "loss": 1.9045, "step": 3196 }, { "epoch": 0.25, "learning_rate": 0.0002948255032498228, "loss": 1.9232, "step": 3197 }, { "epoch": 0.25, "learning_rate": 0.00029482228440411287, "loss": 1.9125, "step": 3198 }, { "epoch": 0.25, "learning_rate": 0.0002948190645751396, "loss": 1.9784, "step": 3199 }, { "epoch": 0.25, "learning_rate": 0.0002948158437629247, "loss": 1.8743, "step": 3200 }, { "epoch": 0.25, "learning_rate": 0.0002948126219674902, "loss": 1.8962, "step": 3201 }, { "epoch": 0.25, "learning_rate": 0.0002948093991888579, "loss": 1.902, "step": 3202 }, { "epoch": 0.25, "learning_rate": 0.0002948061754270497, "loss": 1.944, "step": 3203 }, { "epoch": 0.25, "learning_rate": 0.0002948029506820874, "loss": 1.9382, "step": 3204 }, { "epoch": 0.25, "learning_rate": 0.0002947997249539931, "loss": 1.9346, "step": 3205 }, { "epoch": 0.25, "learning_rate": 0.0002947964982427885, "loss": 1.9171, "step": 3206 }, { "epoch": 0.25, "learning_rate": 0.00029479327054849556, "loss": 1.9261, "step": 3207 }, { "epoch": 0.25, "learning_rate": 0.0002947900418711363, "loss": 1.9266, "step": 3208 }, { "epoch": 0.25, "learning_rate": 0.00029478681221073243, "loss": 1.9622, "step": 3209 }, { "epoch": 0.25, "learning_rate": 0.00029478358156730615, "loss": 1.9768, "step": 3210 }, { "epoch": 0.25, "learning_rate": 0.00029478034994087914, "loss": 1.8953, "step": 3211 }, { "epoch": 0.25, "learning_rate": 0.00029477711733147356, "loss": 1.9088, "step": 3212 }, { "epoch": 0.25, "learning_rate": 0.00029477388373911115, "loss": 1.9035, "step": 3213 }, { "epoch": 0.25, "learning_rate": 0.000294770649163814, "loss": 1.9174, "step": 3214 }, { "epoch": 0.25, "learning_rate": 0.000294767413605604, "loss": 1.8209, "step": 3215 }, { "epoch": 0.25, "learning_rate": 0.0002947641770645032, "loss": 1.9644, "step": 3216 }, { "epoch": 0.25, "learning_rate": 0.0002947609395405335, "loss": 1.8753, "step": 3217 }, { "epoch": 0.25, "learning_rate": 0.0002947577010337169, "loss": 1.8886, "step": 3218 }, { "epoch": 0.25, "learning_rate": 0.0002947544615440754, "loss": 1.8764, "step": 3219 }, { "epoch": 0.25, "learning_rate": 0.00029475122107163105, "loss": 1.9021, "step": 3220 }, { "epoch": 0.25, "learning_rate": 0.00029474797961640567, "loss": 1.9067, "step": 3221 }, { "epoch": 0.25, "learning_rate": 0.0002947447371784215, "loss": 1.9475, "step": 3222 }, { "epoch": 0.25, "learning_rate": 0.00029474149375770036, "loss": 1.9191, "step": 3223 }, { "epoch": 0.25, "learning_rate": 0.00029473824935426435, "loss": 1.9519, "step": 3224 }, { "epoch": 0.25, "learning_rate": 0.0002947350039681355, "loss": 1.9099, "step": 3225 }, { "epoch": 0.25, "learning_rate": 0.0002947317575993359, "loss": 1.8684, "step": 3226 }, { "epoch": 0.25, "learning_rate": 0.0002947285102478876, "loss": 1.9149, "step": 3227 }, { "epoch": 0.25, "learning_rate": 0.00029472526191381244, "loss": 1.9164, "step": 3228 }, { "epoch": 0.25, "learning_rate": 0.0002947220125971327, "loss": 1.8882, "step": 3229 }, { "epoch": 0.25, "learning_rate": 0.0002947187622978703, "loss": 1.8581, "step": 3230 }, { "epoch": 0.25, "learning_rate": 0.0002947155110160474, "loss": 1.9002, "step": 3231 }, { "epoch": 0.25, "learning_rate": 0.00029471225875168607, "loss": 1.9286, "step": 3232 }, { "epoch": 0.25, "learning_rate": 0.0002947090055048083, "loss": 1.8482, "step": 3233 }, { "epoch": 0.25, "learning_rate": 0.00029470575127543626, "loss": 1.8948, "step": 3234 }, { "epoch": 0.25, "learning_rate": 0.00029470249606359204, "loss": 1.8938, "step": 3235 }, { "epoch": 0.25, "learning_rate": 0.0002946992398692977, "loss": 1.912, "step": 3236 }, { "epoch": 0.25, "learning_rate": 0.00029469598269257546, "loss": 1.9163, "step": 3237 }, { "epoch": 0.25, "learning_rate": 0.0002946927245334472, "loss": 1.9518, "step": 3238 }, { "epoch": 0.25, "learning_rate": 0.0002946894653919353, "loss": 1.9013, "step": 3239 }, { "epoch": 0.25, "learning_rate": 0.0002946862052680617, "loss": 1.9324, "step": 3240 }, { "epoch": 0.26, "learning_rate": 0.0002946829441618487, "loss": 1.8947, "step": 3241 }, { "epoch": 0.26, "learning_rate": 0.0002946796820733183, "loss": 1.9273, "step": 3242 }, { "epoch": 0.26, "learning_rate": 0.0002946764190024927, "loss": 1.9069, "step": 3243 }, { "epoch": 0.26, "learning_rate": 0.0002946731549493941, "loss": 1.9343, "step": 3244 }, { "epoch": 0.26, "learning_rate": 0.00029466988991404453, "loss": 1.9035, "step": 3245 }, { "epoch": 0.26, "learning_rate": 0.0002946666238964663, "loss": 1.9506, "step": 3246 }, { "epoch": 0.26, "learning_rate": 0.0002946633568966815, "loss": 1.8922, "step": 3247 }, { "epoch": 0.26, "learning_rate": 0.00029466008891471237, "loss": 1.8763, "step": 3248 }, { "epoch": 0.26, "learning_rate": 0.0002946568199505811, "loss": 1.8464, "step": 3249 }, { "epoch": 0.26, "learning_rate": 0.00029465355000430975, "loss": 1.8973, "step": 3250 }, { "epoch": 0.26, "learning_rate": 0.00029465027907592066, "loss": 1.8987, "step": 3251 }, { "epoch": 0.26, "learning_rate": 0.00029464700716543604, "loss": 1.8277, "step": 3252 }, { "epoch": 0.26, "learning_rate": 0.000294643734272878, "loss": 1.8928, "step": 3253 }, { "epoch": 0.26, "learning_rate": 0.0002946404603982689, "loss": 1.926, "step": 3254 }, { "epoch": 0.26, "learning_rate": 0.0002946371855416309, "loss": 1.9245, "step": 3255 }, { "epoch": 0.26, "learning_rate": 0.0002946339097029861, "loss": 1.9048, "step": 3256 }, { "epoch": 0.26, "learning_rate": 0.00029463063288235697, "loss": 1.8699, "step": 3257 }, { "epoch": 0.26, "learning_rate": 0.00029462735507976566, "loss": 1.9063, "step": 3258 }, { "epoch": 0.26, "learning_rate": 0.0002946240762952344, "loss": 1.9673, "step": 3259 }, { "epoch": 0.26, "learning_rate": 0.00029462079652878547, "loss": 1.9287, "step": 3260 }, { "epoch": 0.26, "learning_rate": 0.00029461751578044115, "loss": 1.9137, "step": 3261 }, { "epoch": 0.26, "learning_rate": 0.00029461423405022366, "loss": 1.8875, "step": 3262 }, { "epoch": 0.26, "learning_rate": 0.0002946109513381554, "loss": 1.8623, "step": 3263 }, { "epoch": 0.26, "learning_rate": 0.0002946076676442585, "loss": 1.8767, "step": 3264 }, { "epoch": 0.26, "learning_rate": 0.0002946043829685554, "loss": 1.9078, "step": 3265 }, { "epoch": 0.26, "learning_rate": 0.0002946010973110683, "loss": 1.8734, "step": 3266 }, { "epoch": 0.26, "learning_rate": 0.0002945978106718196, "loss": 1.9253, "step": 3267 }, { "epoch": 0.26, "learning_rate": 0.0002945945230508315, "loss": 1.8997, "step": 3268 }, { "epoch": 0.26, "learning_rate": 0.0002945912344481264, "loss": 1.8574, "step": 3269 }, { "epoch": 0.26, "learning_rate": 0.00029458794486372666, "loss": 1.8936, "step": 3270 }, { "epoch": 0.26, "learning_rate": 0.00029458465429765455, "loss": 1.9375, "step": 3271 }, { "epoch": 0.26, "learning_rate": 0.0002945813627499324, "loss": 1.8769, "step": 3272 }, { "epoch": 0.26, "learning_rate": 0.0002945780702205826, "loss": 1.8702, "step": 3273 }, { "epoch": 0.26, "learning_rate": 0.00029457477670962747, "loss": 1.9111, "step": 3274 }, { "epoch": 0.26, "learning_rate": 0.0002945714822170894, "loss": 1.8927, "step": 3275 }, { "epoch": 0.26, "learning_rate": 0.0002945681867429907, "loss": 1.8607, "step": 3276 }, { "epoch": 0.26, "learning_rate": 0.00029456489028735386, "loss": 1.8996, "step": 3277 }, { "epoch": 0.26, "learning_rate": 0.00029456159285020116, "loss": 1.8994, "step": 3278 }, { "epoch": 0.26, "learning_rate": 0.00029455829443155503, "loss": 1.9765, "step": 3279 }, { "epoch": 0.26, "learning_rate": 0.00029455499503143787, "loss": 1.831, "step": 3280 }, { "epoch": 0.26, "learning_rate": 0.000294551694649872, "loss": 1.959, "step": 3281 }, { "epoch": 0.26, "learning_rate": 0.00029454839328687995, "loss": 1.8721, "step": 3282 }, { "epoch": 0.26, "learning_rate": 0.00029454509094248407, "loss": 1.9269, "step": 3283 }, { "epoch": 0.26, "learning_rate": 0.00029454178761670677, "loss": 1.9417, "step": 3284 }, { "epoch": 0.26, "learning_rate": 0.00029453848330957054, "loss": 1.917, "step": 3285 }, { "epoch": 0.26, "learning_rate": 0.0002945351780210977, "loss": 1.9386, "step": 3286 }, { "epoch": 0.26, "learning_rate": 0.00029453187175131084, "loss": 1.9294, "step": 3287 }, { "epoch": 0.26, "learning_rate": 0.00029452856450023227, "loss": 1.9278, "step": 3288 }, { "epoch": 0.26, "learning_rate": 0.00029452525626788453, "loss": 1.9549, "step": 3289 }, { "epoch": 0.26, "learning_rate": 0.00029452194705429003, "loss": 1.9348, "step": 3290 }, { "epoch": 0.26, "learning_rate": 0.0002945186368594713, "loss": 1.8755, "step": 3291 }, { "epoch": 0.26, "learning_rate": 0.00029451532568345077, "loss": 1.9236, "step": 3292 }, { "epoch": 0.26, "learning_rate": 0.00029451201352625095, "loss": 1.9201, "step": 3293 }, { "epoch": 0.26, "learning_rate": 0.00029450870038789424, "loss": 1.898, "step": 3294 }, { "epoch": 0.26, "learning_rate": 0.00029450538626840325, "loss": 1.8375, "step": 3295 }, { "epoch": 0.26, "learning_rate": 0.0002945020711678004, "loss": 1.8723, "step": 3296 }, { "epoch": 0.26, "learning_rate": 0.0002944987550861083, "loss": 1.8253, "step": 3297 }, { "epoch": 0.26, "learning_rate": 0.00029449543802334934, "loss": 1.9144, "step": 3298 }, { "epoch": 0.26, "learning_rate": 0.0002944921199795461, "loss": 1.8857, "step": 3299 }, { "epoch": 0.26, "learning_rate": 0.0002944888009547211, "loss": 1.9143, "step": 3300 }, { "epoch": 0.26, "learning_rate": 0.0002944854809488969, "loss": 1.9129, "step": 3301 }, { "epoch": 0.26, "learning_rate": 0.000294482159962096, "loss": 1.9294, "step": 3302 }, { "epoch": 0.26, "learning_rate": 0.00029447883799434095, "loss": 1.9072, "step": 3303 }, { "epoch": 0.26, "learning_rate": 0.00029447551504565433, "loss": 1.9835, "step": 3304 }, { "epoch": 0.26, "learning_rate": 0.0002944721911160587, "loss": 1.8865, "step": 3305 }, { "epoch": 0.26, "learning_rate": 0.00029446886620557665, "loss": 1.9332, "step": 3306 }, { "epoch": 0.26, "learning_rate": 0.0002944655403142307, "loss": 1.9307, "step": 3307 }, { "epoch": 0.26, "learning_rate": 0.00029446221344204345, "loss": 1.9389, "step": 3308 }, { "epoch": 0.26, "learning_rate": 0.0002944588855890375, "loss": 1.8921, "step": 3309 }, { "epoch": 0.26, "learning_rate": 0.0002944555567552354, "loss": 1.9529, "step": 3310 }, { "epoch": 0.26, "learning_rate": 0.0002944522269406598, "loss": 1.896, "step": 3311 }, { "epoch": 0.26, "learning_rate": 0.0002944488961453333, "loss": 1.8985, "step": 3312 }, { "epoch": 0.26, "learning_rate": 0.0002944455643692785, "loss": 1.9344, "step": 3313 }, { "epoch": 0.26, "learning_rate": 0.000294442231612518, "loss": 1.9506, "step": 3314 }, { "epoch": 0.26, "learning_rate": 0.00029443889787507453, "loss": 1.8878, "step": 3315 }, { "epoch": 0.26, "learning_rate": 0.0002944355631569706, "loss": 1.8725, "step": 3316 }, { "epoch": 0.26, "learning_rate": 0.0002944322274582289, "loss": 1.9367, "step": 3317 }, { "epoch": 0.26, "learning_rate": 0.0002944288907788721, "loss": 1.9069, "step": 3318 }, { "epoch": 0.26, "learning_rate": 0.0002944255531189229, "loss": 1.9106, "step": 3319 }, { "epoch": 0.26, "learning_rate": 0.0002944222144784038, "loss": 1.9446, "step": 3320 }, { "epoch": 0.26, "learning_rate": 0.00029441887485733763, "loss": 1.9151, "step": 3321 }, { "epoch": 0.26, "learning_rate": 0.0002944155342557469, "loss": 1.9293, "step": 3322 }, { "epoch": 0.26, "learning_rate": 0.00029441219267365446, "loss": 1.9163, "step": 3323 }, { "epoch": 0.26, "learning_rate": 0.0002944088501110829, "loss": 1.8758, "step": 3324 }, { "epoch": 0.26, "learning_rate": 0.000294405506568055, "loss": 1.9934, "step": 3325 }, { "epoch": 0.26, "learning_rate": 0.0002944021620445933, "loss": 1.9279, "step": 3326 }, { "epoch": 0.26, "learning_rate": 0.0002943988165407207, "loss": 1.909, "step": 3327 }, { "epoch": 0.26, "learning_rate": 0.00029439547005645977, "loss": 1.8924, "step": 3328 }, { "epoch": 0.26, "learning_rate": 0.0002943921225918333, "loss": 1.9478, "step": 3329 }, { "epoch": 0.26, "learning_rate": 0.000294388774146864, "loss": 1.8765, "step": 3330 }, { "epoch": 0.26, "learning_rate": 0.00029438542472157457, "loss": 1.8346, "step": 3331 }, { "epoch": 0.26, "learning_rate": 0.0002943820743159878, "loss": 1.9355, "step": 3332 }, { "epoch": 0.26, "learning_rate": 0.00029437872293012644, "loss": 1.9302, "step": 3333 }, { "epoch": 0.26, "learning_rate": 0.0002943753705640132, "loss": 1.9188, "step": 3334 }, { "epoch": 0.26, "learning_rate": 0.0002943720172176709, "loss": 1.9095, "step": 3335 }, { "epoch": 0.26, "learning_rate": 0.00029436866289112224, "loss": 1.9501, "step": 3336 }, { "epoch": 0.26, "learning_rate": 0.0002943653075843901, "loss": 1.8645, "step": 3337 }, { "epoch": 0.26, "learning_rate": 0.00029436195129749714, "loss": 1.9047, "step": 3338 }, { "epoch": 0.26, "learning_rate": 0.00029435859403046614, "loss": 1.9049, "step": 3339 }, { "epoch": 0.26, "learning_rate": 0.00029435523578332006, "loss": 1.8794, "step": 3340 }, { "epoch": 0.26, "learning_rate": 0.0002943518765560815, "loss": 1.8991, "step": 3341 }, { "epoch": 0.26, "learning_rate": 0.0002943485163487734, "loss": 1.8827, "step": 3342 }, { "epoch": 0.26, "learning_rate": 0.0002943451551614185, "loss": 1.915, "step": 3343 }, { "epoch": 0.26, "learning_rate": 0.00029434179299403973, "loss": 1.8549, "step": 3344 }, { "epoch": 0.26, "learning_rate": 0.00029433842984665973, "loss": 1.8188, "step": 3345 }, { "epoch": 0.26, "learning_rate": 0.0002943350657193015, "loss": 1.8822, "step": 3346 }, { "epoch": 0.26, "learning_rate": 0.00029433170061198786, "loss": 1.8649, "step": 3347 }, { "epoch": 0.26, "learning_rate": 0.00029432833452474157, "loss": 1.8819, "step": 3348 }, { "epoch": 0.26, "learning_rate": 0.00029432496745758556, "loss": 1.8715, "step": 3349 }, { "epoch": 0.26, "learning_rate": 0.00029432159941054263, "loss": 1.9307, "step": 3350 }, { "epoch": 0.26, "learning_rate": 0.00029431823038363574, "loss": 1.9379, "step": 3351 }, { "epoch": 0.26, "learning_rate": 0.0002943148603768877, "loss": 1.8985, "step": 3352 }, { "epoch": 0.26, "learning_rate": 0.00029431148939032135, "loss": 1.8922, "step": 3353 }, { "epoch": 0.26, "learning_rate": 0.0002943081174239596, "loss": 1.8819, "step": 3354 }, { "epoch": 0.26, "learning_rate": 0.0002943047444778254, "loss": 1.9372, "step": 3355 }, { "epoch": 0.26, "learning_rate": 0.0002943013705519417, "loss": 1.8865, "step": 3356 }, { "epoch": 0.26, "learning_rate": 0.00029429799564633123, "loss": 1.8866, "step": 3357 }, { "epoch": 0.26, "learning_rate": 0.0002942946197610171, "loss": 1.8663, "step": 3358 }, { "epoch": 0.26, "learning_rate": 0.00029429124289602205, "loss": 1.9257, "step": 3359 }, { "epoch": 0.26, "learning_rate": 0.00029428786505136903, "loss": 1.8568, "step": 3360 }, { "epoch": 0.26, "learning_rate": 0.0002942844862270812, "loss": 1.8761, "step": 3361 }, { "epoch": 0.26, "learning_rate": 0.00029428110642318116, "loss": 1.8608, "step": 3362 }, { "epoch": 0.26, "learning_rate": 0.0002942777256396921, "loss": 1.8626, "step": 3363 }, { "epoch": 0.26, "learning_rate": 0.00029427434387663693, "loss": 1.8968, "step": 3364 }, { "epoch": 0.26, "learning_rate": 0.0002942709611340386, "loss": 1.8696, "step": 3365 }, { "epoch": 0.26, "learning_rate": 0.00029426757741191995, "loss": 1.8726, "step": 3366 }, { "epoch": 0.26, "learning_rate": 0.0002942641927103041, "loss": 1.8866, "step": 3367 }, { "epoch": 0.26, "learning_rate": 0.00029426080702921404, "loss": 1.8828, "step": 3368 }, { "epoch": 0.27, "learning_rate": 0.00029425742036867273, "loss": 1.8992, "step": 3369 }, { "epoch": 0.27, "learning_rate": 0.0002942540327287031, "loss": 1.8505, "step": 3370 }, { "epoch": 0.27, "learning_rate": 0.0002942506441093282, "loss": 1.8081, "step": 3371 }, { "epoch": 0.27, "learning_rate": 0.000294247254510571, "loss": 1.9217, "step": 3372 }, { "epoch": 0.27, "learning_rate": 0.0002942438639324546, "loss": 1.8956, "step": 3373 }, { "epoch": 0.27, "learning_rate": 0.00029424047237500194, "loss": 1.9423, "step": 3374 }, { "epoch": 0.27, "learning_rate": 0.00029423707983823605, "loss": 1.9502, "step": 3375 }, { "epoch": 0.27, "learning_rate": 0.00029423368632218, "loss": 1.96, "step": 3376 }, { "epoch": 0.27, "learning_rate": 0.0002942302918268568, "loss": 1.8417, "step": 3377 }, { "epoch": 0.27, "learning_rate": 0.00029422689635228956, "loss": 1.9154, "step": 3378 }, { "epoch": 0.27, "learning_rate": 0.0002942234998985012, "loss": 1.8254, "step": 3379 }, { "epoch": 0.27, "learning_rate": 0.00029422010246551495, "loss": 1.9248, "step": 3380 }, { "epoch": 0.27, "learning_rate": 0.0002942167040533538, "loss": 1.8601, "step": 3381 }, { "epoch": 0.27, "learning_rate": 0.00029421330466204075, "loss": 1.8962, "step": 3382 }, { "epoch": 0.27, "learning_rate": 0.00029420990429159893, "loss": 1.947, "step": 3383 }, { "epoch": 0.27, "learning_rate": 0.00029420650294205154, "loss": 1.9282, "step": 3384 }, { "epoch": 0.27, "learning_rate": 0.0002942031006134215, "loss": 1.9087, "step": 3385 }, { "epoch": 0.27, "learning_rate": 0.00029419969730573196, "loss": 1.8461, "step": 3386 }, { "epoch": 0.27, "learning_rate": 0.0002941962930190061, "loss": 1.8558, "step": 3387 }, { "epoch": 0.27, "learning_rate": 0.000294192887753267, "loss": 1.8868, "step": 3388 }, { "epoch": 0.27, "learning_rate": 0.0002941894815085377, "loss": 1.9549, "step": 3389 }, { "epoch": 0.27, "learning_rate": 0.00029418607428484145, "loss": 1.8848, "step": 3390 }, { "epoch": 0.27, "learning_rate": 0.0002941826660822013, "loss": 1.8639, "step": 3391 }, { "epoch": 0.27, "learning_rate": 0.00029417925690064045, "loss": 1.8139, "step": 3392 }, { "epoch": 0.27, "learning_rate": 0.00029417584674018197, "loss": 1.886, "step": 3393 }, { "epoch": 0.27, "learning_rate": 0.00029417243560084905, "loss": 1.8715, "step": 3394 }, { "epoch": 0.27, "learning_rate": 0.00029416902348266486, "loss": 1.908, "step": 3395 }, { "epoch": 0.27, "learning_rate": 0.0002941656103856526, "loss": 1.9148, "step": 3396 }, { "epoch": 0.27, "learning_rate": 0.00029416219630983535, "loss": 1.859, "step": 3397 }, { "epoch": 0.27, "learning_rate": 0.0002941587812552364, "loss": 1.8007, "step": 3398 }, { "epoch": 0.27, "learning_rate": 0.0002941553652218788, "loss": 1.9247, "step": 3399 }, { "epoch": 0.27, "learning_rate": 0.00029415194820978585, "loss": 1.9071, "step": 3400 }, { "epoch": 0.27, "learning_rate": 0.00029414853021898074, "loss": 1.9396, "step": 3401 }, { "epoch": 0.27, "learning_rate": 0.0002941451112494866, "loss": 1.8785, "step": 3402 }, { "epoch": 0.27, "learning_rate": 0.0002941416913013268, "loss": 1.8548, "step": 3403 }, { "epoch": 0.27, "learning_rate": 0.0002941382703745244, "loss": 1.9128, "step": 3404 }, { "epoch": 0.27, "learning_rate": 0.0002941348484691027, "loss": 1.9228, "step": 3405 }, { "epoch": 0.27, "learning_rate": 0.0002941314255850849, "loss": 1.8807, "step": 3406 }, { "epoch": 0.27, "learning_rate": 0.00029412800172249427, "loss": 1.918, "step": 3407 }, { "epoch": 0.27, "learning_rate": 0.0002941245768813541, "loss": 1.8916, "step": 3408 }, { "epoch": 0.27, "learning_rate": 0.0002941211510616875, "loss": 1.9117, "step": 3409 }, { "epoch": 0.27, "learning_rate": 0.00029411772426351786, "loss": 1.9661, "step": 3410 }, { "epoch": 0.27, "learning_rate": 0.00029411429648686836, "loss": 1.8503, "step": 3411 }, { "epoch": 0.27, "learning_rate": 0.0002941108677317624, "loss": 1.8941, "step": 3412 }, { "epoch": 0.27, "learning_rate": 0.0002941074379982231, "loss": 1.886, "step": 3413 }, { "epoch": 0.27, "learning_rate": 0.00029410400728627385, "loss": 1.8502, "step": 3414 }, { "epoch": 0.27, "learning_rate": 0.00029410057559593793, "loss": 1.8735, "step": 3415 }, { "epoch": 0.27, "learning_rate": 0.00029409714292723857, "loss": 1.8865, "step": 3416 }, { "epoch": 0.27, "learning_rate": 0.0002940937092801992, "loss": 1.9119, "step": 3417 }, { "epoch": 0.27, "learning_rate": 0.00029409027465484303, "loss": 1.8924, "step": 3418 }, { "epoch": 0.27, "learning_rate": 0.00029408683905119337, "loss": 1.886, "step": 3419 }, { "epoch": 0.27, "learning_rate": 0.0002940834024692736, "loss": 1.8929, "step": 3420 }, { "epoch": 0.27, "learning_rate": 0.0002940799649091071, "loss": 1.9259, "step": 3421 }, { "epoch": 0.27, "learning_rate": 0.00029407652637071714, "loss": 1.8967, "step": 3422 }, { "epoch": 0.27, "learning_rate": 0.00029407308685412703, "loss": 1.8536, "step": 3423 }, { "epoch": 0.27, "learning_rate": 0.0002940696463593602, "loss": 1.8668, "step": 3424 }, { "epoch": 0.27, "learning_rate": 0.0002940662048864399, "loss": 1.9217, "step": 3425 }, { "epoch": 0.27, "learning_rate": 0.00029406276243538966, "loss": 1.9107, "step": 3426 }, { "epoch": 0.27, "learning_rate": 0.0002940593190062327, "loss": 1.9356, "step": 3427 }, { "epoch": 0.27, "learning_rate": 0.0002940558745989925, "loss": 1.8852, "step": 3428 }, { "epoch": 0.27, "learning_rate": 0.0002940524292136924, "loss": 1.9408, "step": 3429 }, { "epoch": 0.27, "learning_rate": 0.0002940489828503558, "loss": 1.8319, "step": 3430 }, { "epoch": 0.27, "learning_rate": 0.0002940455355090061, "loss": 1.8672, "step": 3431 }, { "epoch": 0.27, "learning_rate": 0.00029404208718966673, "loss": 1.9145, "step": 3432 }, { "epoch": 0.27, "learning_rate": 0.000294038637892361, "loss": 1.8757, "step": 3433 }, { "epoch": 0.27, "learning_rate": 0.0002940351876171125, "loss": 1.8588, "step": 3434 }, { "epoch": 0.27, "learning_rate": 0.00029403173636394453, "loss": 1.8544, "step": 3435 }, { "epoch": 0.27, "learning_rate": 0.0002940282841328805, "loss": 1.9026, "step": 3436 }, { "epoch": 0.27, "learning_rate": 0.00029402483092394395, "loss": 1.828, "step": 3437 }, { "epoch": 0.27, "learning_rate": 0.0002940213767371583, "loss": 1.9297, "step": 3438 }, { "epoch": 0.27, "learning_rate": 0.00029401792157254694, "loss": 1.7984, "step": 3439 }, { "epoch": 0.27, "learning_rate": 0.00029401446543013334, "loss": 1.8732, "step": 3440 }, { "epoch": 0.27, "learning_rate": 0.00029401100830994106, "loss": 1.9118, "step": 3441 }, { "epoch": 0.27, "learning_rate": 0.00029400755021199347, "loss": 1.865, "step": 3442 }, { "epoch": 0.27, "learning_rate": 0.0002940040911363141, "loss": 1.8978, "step": 3443 }, { "epoch": 0.27, "learning_rate": 0.0002940006310829264, "loss": 1.9485, "step": 3444 }, { "epoch": 0.27, "learning_rate": 0.0002939971700518539, "loss": 1.8739, "step": 3445 }, { "epoch": 0.27, "learning_rate": 0.0002939937080431201, "loss": 1.8548, "step": 3446 }, { "epoch": 0.27, "learning_rate": 0.0002939902450567485, "loss": 1.8391, "step": 3447 }, { "epoch": 0.27, "learning_rate": 0.0002939867810927625, "loss": 1.8905, "step": 3448 }, { "epoch": 0.27, "learning_rate": 0.00029398331615118574, "loss": 1.8502, "step": 3449 }, { "epoch": 0.27, "learning_rate": 0.00029397985023204177, "loss": 1.9434, "step": 3450 }, { "epoch": 0.27, "learning_rate": 0.00029397638333535407, "loss": 1.8861, "step": 3451 }, { "epoch": 0.27, "learning_rate": 0.00029397291546114616, "loss": 1.8416, "step": 3452 }, { "epoch": 0.27, "learning_rate": 0.0002939694466094416, "loss": 1.9213, "step": 3453 }, { "epoch": 0.27, "learning_rate": 0.00029396597678026397, "loss": 1.8575, "step": 3454 }, { "epoch": 0.27, "learning_rate": 0.00029396250597363673, "loss": 1.9116, "step": 3455 }, { "epoch": 0.27, "learning_rate": 0.0002939590341895836, "loss": 1.8401, "step": 3456 }, { "epoch": 0.27, "learning_rate": 0.00029395556142812804, "loss": 1.8916, "step": 3457 }, { "epoch": 0.27, "learning_rate": 0.0002939520876892937, "loss": 1.914, "step": 3458 }, { "epoch": 0.27, "learning_rate": 0.00029394861297310406, "loss": 1.9689, "step": 3459 }, { "epoch": 0.27, "learning_rate": 0.00029394513727958277, "loss": 1.8979, "step": 3460 }, { "epoch": 0.27, "learning_rate": 0.0002939416606087535, "loss": 1.8956, "step": 3461 }, { "epoch": 0.27, "learning_rate": 0.00029393818296063974, "loss": 1.9295, "step": 3462 }, { "epoch": 0.27, "learning_rate": 0.00029393470433526517, "loss": 1.8495, "step": 3463 }, { "epoch": 0.27, "learning_rate": 0.00029393122473265343, "loss": 1.8916, "step": 3464 }, { "epoch": 0.27, "learning_rate": 0.00029392774415282804, "loss": 1.8679, "step": 3465 }, { "epoch": 0.27, "learning_rate": 0.0002939242625958127, "loss": 1.816, "step": 3466 }, { "epoch": 0.27, "learning_rate": 0.00029392078006163104, "loss": 1.8988, "step": 3467 }, { "epoch": 0.27, "learning_rate": 0.0002939172965503067, "loss": 1.9046, "step": 3468 }, { "epoch": 0.27, "learning_rate": 0.00029391381206186337, "loss": 1.891, "step": 3469 }, { "epoch": 0.27, "learning_rate": 0.0002939103265963246, "loss": 1.9038, "step": 3470 }, { "epoch": 0.27, "learning_rate": 0.0002939068401537142, "loss": 1.8665, "step": 3471 }, { "epoch": 0.27, "learning_rate": 0.00029390335273405576, "loss": 1.8903, "step": 3472 }, { "epoch": 0.27, "learning_rate": 0.00029389986433737297, "loss": 1.8913, "step": 3473 }, { "epoch": 0.27, "learning_rate": 0.0002938963749636895, "loss": 1.8979, "step": 3474 }, { "epoch": 0.27, "learning_rate": 0.00029389288461302907, "loss": 1.9142, "step": 3475 }, { "epoch": 0.27, "learning_rate": 0.00029388939328541533, "loss": 1.8765, "step": 3476 }, { "epoch": 0.27, "learning_rate": 0.000293885900980872, "loss": 1.8712, "step": 3477 }, { "epoch": 0.27, "learning_rate": 0.00029388240769942286, "loss": 1.8507, "step": 3478 }, { "epoch": 0.27, "learning_rate": 0.00029387891344109156, "loss": 1.8951, "step": 3479 }, { "epoch": 0.27, "learning_rate": 0.00029387541820590185, "loss": 1.8792, "step": 3480 }, { "epoch": 0.27, "learning_rate": 0.00029387192199387737, "loss": 1.8914, "step": 3481 }, { "epoch": 0.27, "learning_rate": 0.00029386842480504197, "loss": 1.8681, "step": 3482 }, { "epoch": 0.27, "learning_rate": 0.0002938649266394194, "loss": 1.8727, "step": 3483 }, { "epoch": 0.27, "learning_rate": 0.00029386142749703335, "loss": 1.9193, "step": 3484 }, { "epoch": 0.27, "learning_rate": 0.0002938579273779076, "loss": 1.9174, "step": 3485 }, { "epoch": 0.27, "learning_rate": 0.0002938544262820659, "loss": 1.8653, "step": 3486 }, { "epoch": 0.27, "learning_rate": 0.000293850924209532, "loss": 1.9053, "step": 3487 }, { "epoch": 0.27, "learning_rate": 0.0002938474211603298, "loss": 1.9031, "step": 3488 }, { "epoch": 0.27, "learning_rate": 0.0002938439171344829, "loss": 1.9413, "step": 3489 }, { "epoch": 0.27, "learning_rate": 0.0002938404121320152, "loss": 1.8723, "step": 3490 }, { "epoch": 0.27, "learning_rate": 0.0002938369061529505, "loss": 1.925, "step": 3491 }, { "epoch": 0.27, "learning_rate": 0.0002938333991973126, "loss": 1.912, "step": 3492 }, { "epoch": 0.27, "learning_rate": 0.00029382989126512524, "loss": 1.9055, "step": 3493 }, { "epoch": 0.27, "learning_rate": 0.00029382638235641234, "loss": 1.8252, "step": 3494 }, { "epoch": 0.27, "learning_rate": 0.0002938228724711976, "loss": 1.8963, "step": 3495 }, { "epoch": 0.28, "learning_rate": 0.00029381936160950505, "loss": 1.8776, "step": 3496 }, { "epoch": 0.28, "learning_rate": 0.0002938158497713583, "loss": 1.9174, "step": 3497 }, { "epoch": 0.28, "learning_rate": 0.00029381233695678134, "loss": 1.8829, "step": 3498 }, { "epoch": 0.28, "learning_rate": 0.00029380882316579795, "loss": 1.8521, "step": 3499 }, { "epoch": 0.28, "learning_rate": 0.000293805308398432, "loss": 1.9833, "step": 3500 }, { "epoch": 0.28, "learning_rate": 0.0002938017926547074, "loss": 1.8689, "step": 3501 }, { "epoch": 0.28, "learning_rate": 0.00029379827593464797, "loss": 1.9059, "step": 3502 }, { "epoch": 0.28, "learning_rate": 0.00029379475823827756, "loss": 1.8841, "step": 3503 }, { "epoch": 0.28, "learning_rate": 0.0002937912395656201, "loss": 1.8644, "step": 3504 }, { "epoch": 0.28, "learning_rate": 0.00029378771991669955, "loss": 1.8723, "step": 3505 }, { "epoch": 0.28, "learning_rate": 0.0002937841992915397, "loss": 1.8964, "step": 3506 }, { "epoch": 0.28, "learning_rate": 0.00029378067769016445, "loss": 1.8524, "step": 3507 }, { "epoch": 0.28, "learning_rate": 0.0002937771551125978, "loss": 1.851, "step": 3508 }, { "epoch": 0.28, "learning_rate": 0.0002937736315588636, "loss": 1.8929, "step": 3509 }, { "epoch": 0.28, "learning_rate": 0.0002937701070289857, "loss": 1.8456, "step": 3510 }, { "epoch": 0.28, "learning_rate": 0.0002937665815229882, "loss": 1.906, "step": 3511 }, { "epoch": 0.28, "learning_rate": 0.00029376305504089486, "loss": 1.8846, "step": 3512 }, { "epoch": 0.28, "learning_rate": 0.00029375952758272977, "loss": 1.8543, "step": 3513 }, { "epoch": 0.28, "learning_rate": 0.00029375599914851683, "loss": 1.8576, "step": 3514 }, { "epoch": 0.28, "learning_rate": 0.00029375246973828, "loss": 1.8287, "step": 3515 }, { "epoch": 0.28, "learning_rate": 0.0002937489393520432, "loss": 1.9086, "step": 3516 }, { "epoch": 0.28, "learning_rate": 0.00029374540798983044, "loss": 1.9039, "step": 3517 }, { "epoch": 0.28, "learning_rate": 0.00029374187565166563, "loss": 1.8332, "step": 3518 }, { "epoch": 0.28, "learning_rate": 0.0002937383423375729, "loss": 1.8905, "step": 3519 }, { "epoch": 0.28, "learning_rate": 0.0002937348080475761, "loss": 1.9213, "step": 3520 }, { "epoch": 0.28, "learning_rate": 0.00029373127278169923, "loss": 1.8716, "step": 3521 }, { "epoch": 0.28, "learning_rate": 0.0002937277365399664, "loss": 1.8542, "step": 3522 }, { "epoch": 0.28, "learning_rate": 0.00029372419932240156, "loss": 1.9162, "step": 3523 }, { "epoch": 0.28, "learning_rate": 0.00029372066112902867, "loss": 1.8808, "step": 3524 }, { "epoch": 0.28, "learning_rate": 0.00029371712195987187, "loss": 1.8773, "step": 3525 }, { "epoch": 0.28, "learning_rate": 0.000293713581814955, "loss": 1.8895, "step": 3526 }, { "epoch": 0.28, "learning_rate": 0.00029371004069430234, "loss": 1.8561, "step": 3527 }, { "epoch": 0.28, "learning_rate": 0.00029370649859793775, "loss": 1.9307, "step": 3528 }, { "epoch": 0.28, "learning_rate": 0.00029370295552588537, "loss": 1.8744, "step": 3529 }, { "epoch": 0.28, "learning_rate": 0.0002936994114781692, "loss": 1.9115, "step": 3530 }, { "epoch": 0.28, "learning_rate": 0.00029369586645481335, "loss": 1.85, "step": 3531 }, { "epoch": 0.28, "learning_rate": 0.0002936923204558418, "loss": 1.876, "step": 3532 }, { "epoch": 0.28, "learning_rate": 0.00029368877348127877, "loss": 1.8764, "step": 3533 }, { "epoch": 0.28, "learning_rate": 0.00029368522553114825, "loss": 1.949, "step": 3534 }, { "epoch": 0.28, "learning_rate": 0.00029368167660547435, "loss": 1.8902, "step": 3535 }, { "epoch": 0.28, "learning_rate": 0.00029367812670428104, "loss": 1.8911, "step": 3536 }, { "epoch": 0.28, "learning_rate": 0.00029367457582759265, "loss": 1.8589, "step": 3537 }, { "epoch": 0.28, "learning_rate": 0.0002936710239754332, "loss": 1.93, "step": 3538 }, { "epoch": 0.28, "learning_rate": 0.0002936674711478267, "loss": 1.9006, "step": 3539 }, { "epoch": 0.28, "learning_rate": 0.0002936639173447974, "loss": 1.8288, "step": 3540 }, { "epoch": 0.28, "learning_rate": 0.00029366036256636935, "loss": 1.8171, "step": 3541 }, { "epoch": 0.28, "learning_rate": 0.00029365680681256673, "loss": 1.882, "step": 3542 }, { "epoch": 0.28, "learning_rate": 0.00029365325008341367, "loss": 1.8096, "step": 3543 }, { "epoch": 0.28, "learning_rate": 0.00029364969237893434, "loss": 1.859, "step": 3544 }, { "epoch": 0.28, "learning_rate": 0.0002936461336991529, "loss": 1.8554, "step": 3545 }, { "epoch": 0.28, "learning_rate": 0.00029364257404409334, "loss": 1.8722, "step": 3546 }, { "epoch": 0.28, "learning_rate": 0.00029363901341378007, "loss": 1.8734, "step": 3547 }, { "epoch": 0.28, "learning_rate": 0.0002936354518082372, "loss": 1.8706, "step": 3548 }, { "epoch": 0.28, "learning_rate": 0.0002936318892274888, "loss": 1.8487, "step": 3549 }, { "epoch": 0.28, "learning_rate": 0.0002936283256715592, "loss": 1.867, "step": 3550 }, { "epoch": 0.28, "learning_rate": 0.00029362476114047246, "loss": 1.8713, "step": 3551 }, { "epoch": 0.28, "learning_rate": 0.0002936211956342529, "loss": 1.8761, "step": 3552 }, { "epoch": 0.28, "learning_rate": 0.00029361762915292467, "loss": 1.8966, "step": 3553 }, { "epoch": 0.28, "learning_rate": 0.000293614061696512, "loss": 1.8707, "step": 3554 }, { "epoch": 0.28, "learning_rate": 0.0002936104932650391, "loss": 1.886, "step": 3555 }, { "epoch": 0.28, "learning_rate": 0.00029360692385853017, "loss": 1.856, "step": 3556 }, { "epoch": 0.28, "learning_rate": 0.0002936033534770095, "loss": 1.8474, "step": 3557 }, { "epoch": 0.28, "learning_rate": 0.00029359978212050136, "loss": 1.8249, "step": 3558 }, { "epoch": 0.28, "learning_rate": 0.00029359620978902987, "loss": 1.8907, "step": 3559 }, { "epoch": 0.28, "learning_rate": 0.0002935926364826194, "loss": 1.943, "step": 3560 }, { "epoch": 0.28, "learning_rate": 0.0002935890622012941, "loss": 1.9245, "step": 3561 }, { "epoch": 0.28, "learning_rate": 0.0002935854869450784, "loss": 1.7807, "step": 3562 }, { "epoch": 0.28, "learning_rate": 0.00029358191071399646, "loss": 1.855, "step": 3563 }, { "epoch": 0.28, "learning_rate": 0.00029357833350807257, "loss": 1.881, "step": 3564 }, { "epoch": 0.28, "learning_rate": 0.000293574755327331, "loss": 1.9171, "step": 3565 }, { "epoch": 0.28, "learning_rate": 0.0002935711761717961, "loss": 1.8709, "step": 3566 }, { "epoch": 0.28, "learning_rate": 0.0002935675960414921, "loss": 1.8531, "step": 3567 }, { "epoch": 0.28, "learning_rate": 0.00029356401493644337, "loss": 1.9297, "step": 3568 }, { "epoch": 0.28, "learning_rate": 0.0002935604328566743, "loss": 1.8881, "step": 3569 }, { "epoch": 0.28, "learning_rate": 0.000293556849802209, "loss": 1.8073, "step": 3570 }, { "epoch": 0.28, "learning_rate": 0.0002935532657730719, "loss": 1.8636, "step": 3571 }, { "epoch": 0.28, "learning_rate": 0.0002935496807692874, "loss": 1.8742, "step": 3572 }, { "epoch": 0.28, "learning_rate": 0.0002935460947908798, "loss": 1.9165, "step": 3573 }, { "epoch": 0.28, "learning_rate": 0.00029354250783787336, "loss": 1.8862, "step": 3574 }, { "epoch": 0.28, "learning_rate": 0.00029353891991029256, "loss": 1.8849, "step": 3575 }, { "epoch": 0.28, "learning_rate": 0.0002935353310081617, "loss": 1.9108, "step": 3576 }, { "epoch": 0.28, "learning_rate": 0.0002935317411315051, "loss": 1.8664, "step": 3577 }, { "epoch": 0.28, "learning_rate": 0.0002935281502803473, "loss": 1.8549, "step": 3578 }, { "epoch": 0.28, "learning_rate": 0.00029352455845471246, "loss": 1.954, "step": 3579 }, { "epoch": 0.28, "learning_rate": 0.00029352096565462513, "loss": 1.8654, "step": 3580 }, { "epoch": 0.28, "learning_rate": 0.00029351737188010963, "loss": 1.8706, "step": 3581 }, { "epoch": 0.28, "learning_rate": 0.00029351377713119037, "loss": 1.8968, "step": 3582 }, { "epoch": 0.28, "learning_rate": 0.0002935101814078917, "loss": 1.8826, "step": 3583 }, { "epoch": 0.28, "learning_rate": 0.0002935065847102382, "loss": 1.8131, "step": 3584 }, { "epoch": 0.28, "learning_rate": 0.00029350298703825415, "loss": 1.8454, "step": 3585 }, { "epoch": 0.28, "learning_rate": 0.00029349938839196395, "loss": 1.8342, "step": 3586 }, { "epoch": 0.28, "learning_rate": 0.0002934957887713922, "loss": 1.8015, "step": 3587 }, { "epoch": 0.28, "learning_rate": 0.0002934921881765631, "loss": 1.8381, "step": 3588 }, { "epoch": 0.28, "learning_rate": 0.0002934885866075013, "loss": 1.8396, "step": 3589 }, { "epoch": 0.28, "learning_rate": 0.0002934849840642312, "loss": 1.8862, "step": 3590 }, { "epoch": 0.28, "learning_rate": 0.0002934813805467772, "loss": 1.9199, "step": 3591 }, { "epoch": 0.28, "learning_rate": 0.0002934777760551638, "loss": 1.914, "step": 3592 }, { "epoch": 0.28, "learning_rate": 0.00029347417058941553, "loss": 1.8664, "step": 3593 }, { "epoch": 0.28, "learning_rate": 0.0002934705641495568, "loss": 1.9168, "step": 3594 }, { "epoch": 0.28, "learning_rate": 0.00029346695673561205, "loss": 1.9159, "step": 3595 }, { "epoch": 0.28, "learning_rate": 0.00029346334834760596, "loss": 1.8855, "step": 3596 }, { "epoch": 0.28, "learning_rate": 0.0002934597389855628, "loss": 1.8723, "step": 3597 }, { "epoch": 0.28, "learning_rate": 0.00029345612864950716, "loss": 1.8678, "step": 3598 }, { "epoch": 0.28, "learning_rate": 0.0002934525173394637, "loss": 1.8975, "step": 3599 }, { "epoch": 0.28, "learning_rate": 0.0002934489050554567, "loss": 1.8561, "step": 3600 }, { "epoch": 0.28, "learning_rate": 0.00029344529179751083, "loss": 1.9043, "step": 3601 }, { "epoch": 0.28, "learning_rate": 0.0002934416775656506, "loss": 1.8986, "step": 3602 }, { "epoch": 0.28, "learning_rate": 0.00029343806235990053, "loss": 1.8334, "step": 3603 }, { "epoch": 0.28, "learning_rate": 0.0002934344461802851, "loss": 1.8342, "step": 3604 }, { "epoch": 0.28, "learning_rate": 0.000293430829026829, "loss": 1.8611, "step": 3605 }, { "epoch": 0.28, "learning_rate": 0.00029342721089955674, "loss": 1.9098, "step": 3606 }, { "epoch": 0.28, "learning_rate": 0.0002934235917984929, "loss": 1.8532, "step": 3607 }, { "epoch": 0.28, "learning_rate": 0.000293419971723662, "loss": 1.8854, "step": 3608 }, { "epoch": 0.28, "learning_rate": 0.0002934163506750886, "loss": 1.8979, "step": 3609 }, { "epoch": 0.28, "learning_rate": 0.0002934127286527973, "loss": 1.8554, "step": 3610 }, { "epoch": 0.28, "learning_rate": 0.00029340910565681274, "loss": 1.8685, "step": 3611 }, { "epoch": 0.28, "learning_rate": 0.0002934054816871595, "loss": 1.8516, "step": 3612 }, { "epoch": 0.28, "learning_rate": 0.00029340185674386215, "loss": 1.8039, "step": 3613 }, { "epoch": 0.28, "learning_rate": 0.0002933982308269454, "loss": 1.8595, "step": 3614 }, { "epoch": 0.28, "learning_rate": 0.00029339460393643373, "loss": 1.8485, "step": 3615 }, { "epoch": 0.28, "learning_rate": 0.00029339097607235183, "loss": 1.8735, "step": 3616 }, { "epoch": 0.28, "learning_rate": 0.00029338734723472436, "loss": 1.8313, "step": 3617 }, { "epoch": 0.28, "learning_rate": 0.00029338371742357593, "loss": 1.8642, "step": 3618 }, { "epoch": 0.28, "learning_rate": 0.00029338008663893115, "loss": 1.8645, "step": 3619 }, { "epoch": 0.28, "learning_rate": 0.00029337645488081474, "loss": 1.8799, "step": 3620 }, { "epoch": 0.28, "learning_rate": 0.0002933728221492513, "loss": 1.9521, "step": 3621 }, { "epoch": 0.28, "learning_rate": 0.00029336918844426554, "loss": 1.8684, "step": 3622 }, { "epoch": 0.29, "learning_rate": 0.00029336555376588213, "loss": 1.8584, "step": 3623 }, { "epoch": 0.29, "learning_rate": 0.0002933619181141257, "loss": 1.8763, "step": 3624 }, { "epoch": 0.29, "learning_rate": 0.0002933582814890209, "loss": 1.8755, "step": 3625 }, { "epoch": 0.29, "learning_rate": 0.0002933546438905926, "loss": 1.8664, "step": 3626 }, { "epoch": 0.29, "learning_rate": 0.0002933510053188653, "loss": 1.9342, "step": 3627 }, { "epoch": 0.29, "learning_rate": 0.0002933473657738638, "loss": 1.8484, "step": 3628 }, { "epoch": 0.29, "learning_rate": 0.0002933437252556128, "loss": 1.8537, "step": 3629 }, { "epoch": 0.29, "learning_rate": 0.00029334008376413696, "loss": 1.9305, "step": 3630 }, { "epoch": 0.29, "learning_rate": 0.0002933364412994611, "loss": 1.9227, "step": 3631 }, { "epoch": 0.29, "learning_rate": 0.0002933327978616099, "loss": 1.8584, "step": 3632 }, { "epoch": 0.29, "learning_rate": 0.00029332915345060807, "loss": 1.913, "step": 3633 }, { "epoch": 0.29, "learning_rate": 0.0002933255080664804, "loss": 1.8732, "step": 3634 }, { "epoch": 0.29, "learning_rate": 0.0002933218617092517, "loss": 1.8914, "step": 3635 }, { "epoch": 0.29, "learning_rate": 0.00029331821437894655, "loss": 1.8562, "step": 3636 }, { "epoch": 0.29, "learning_rate": 0.0002933145660755898, "loss": 1.843, "step": 3637 }, { "epoch": 0.29, "learning_rate": 0.0002933109167992063, "loss": 1.8681, "step": 3638 }, { "epoch": 0.29, "learning_rate": 0.00029330726654982076, "loss": 1.8742, "step": 3639 }, { "epoch": 0.29, "learning_rate": 0.0002933036153274579, "loss": 1.8609, "step": 3640 }, { "epoch": 0.29, "learning_rate": 0.00029329996313214263, "loss": 1.8629, "step": 3641 }, { "epoch": 0.29, "learning_rate": 0.0002932963099638997, "loss": 1.8523, "step": 3642 }, { "epoch": 0.29, "learning_rate": 0.00029329265582275386, "loss": 1.8933, "step": 3643 }, { "epoch": 0.29, "learning_rate": 0.00029328900070872997, "loss": 1.9499, "step": 3644 }, { "epoch": 0.29, "learning_rate": 0.0002932853446218529, "loss": 1.8951, "step": 3645 }, { "epoch": 0.29, "learning_rate": 0.00029328168756214735, "loss": 1.8678, "step": 3646 }, { "epoch": 0.29, "learning_rate": 0.0002932780295296382, "loss": 1.9005, "step": 3647 }, { "epoch": 0.29, "learning_rate": 0.0002932743705243503, "loss": 1.8513, "step": 3648 }, { "epoch": 0.29, "learning_rate": 0.0002932707105463085, "loss": 1.871, "step": 3649 }, { "epoch": 0.29, "learning_rate": 0.00029326704959553763, "loss": 1.8629, "step": 3650 }, { "epoch": 0.29, "learning_rate": 0.00029326338767206257, "loss": 1.807, "step": 3651 }, { "epoch": 0.29, "learning_rate": 0.0002932597247759082, "loss": 1.8229, "step": 3652 }, { "epoch": 0.29, "learning_rate": 0.00029325606090709934, "loss": 1.8936, "step": 3653 }, { "epoch": 0.29, "learning_rate": 0.0002932523960656609, "loss": 1.9024, "step": 3654 }, { "epoch": 0.29, "learning_rate": 0.00029324873025161766, "loss": 1.8447, "step": 3655 }, { "epoch": 0.29, "learning_rate": 0.00029324506346499463, "loss": 1.9601, "step": 3656 }, { "epoch": 0.29, "learning_rate": 0.0002932413957058167, "loss": 1.8687, "step": 3657 }, { "epoch": 0.29, "learning_rate": 0.0002932377269741087, "loss": 1.9304, "step": 3658 }, { "epoch": 0.29, "learning_rate": 0.0002932340572698956, "loss": 1.9485, "step": 3659 }, { "epoch": 0.29, "learning_rate": 0.0002932303865932023, "loss": 1.8999, "step": 3660 }, { "epoch": 0.29, "learning_rate": 0.0002932267149440537, "loss": 1.8835, "step": 3661 }, { "epoch": 0.29, "learning_rate": 0.00029322304232247474, "loss": 1.8453, "step": 3662 }, { "epoch": 0.29, "learning_rate": 0.0002932193687284904, "loss": 1.9024, "step": 3663 }, { "epoch": 0.29, "learning_rate": 0.00029321569416212556, "loss": 1.9196, "step": 3664 }, { "epoch": 0.29, "learning_rate": 0.00029321201862340517, "loss": 1.8549, "step": 3665 }, { "epoch": 0.29, "learning_rate": 0.0002932083421123542, "loss": 1.846, "step": 3666 }, { "epoch": 0.29, "learning_rate": 0.00029320466462899765, "loss": 1.8995, "step": 3667 }, { "epoch": 0.29, "learning_rate": 0.00029320098617336045, "loss": 1.8672, "step": 3668 }, { "epoch": 0.29, "learning_rate": 0.0002931973067454676, "loss": 1.8632, "step": 3669 }, { "epoch": 0.29, "learning_rate": 0.000293193626345344, "loss": 1.8765, "step": 3670 }, { "epoch": 0.29, "learning_rate": 0.00029318994497301473, "loss": 1.8119, "step": 3671 }, { "epoch": 0.29, "learning_rate": 0.00029318626262850474, "loss": 1.9098, "step": 3672 }, { "epoch": 0.29, "learning_rate": 0.000293182579311839, "loss": 1.8964, "step": 3673 }, { "epoch": 0.29, "learning_rate": 0.00029317889502304266, "loss": 1.8739, "step": 3674 }, { "epoch": 0.29, "learning_rate": 0.0002931752097621406, "loss": 1.8737, "step": 3675 }, { "epoch": 0.29, "learning_rate": 0.0002931715235291579, "loss": 1.9244, "step": 3676 }, { "epoch": 0.29, "learning_rate": 0.0002931678363241195, "loss": 1.8508, "step": 3677 }, { "epoch": 0.29, "learning_rate": 0.0002931641481470505, "loss": 1.8727, "step": 3678 }, { "epoch": 0.29, "learning_rate": 0.000293160458997976, "loss": 1.8213, "step": 3679 }, { "epoch": 0.29, "learning_rate": 0.00029315676887692094, "loss": 1.8888, "step": 3680 }, { "epoch": 0.29, "learning_rate": 0.00029315307778391043, "loss": 1.868, "step": 3681 }, { "epoch": 0.29, "learning_rate": 0.0002931493857189695, "loss": 1.8432, "step": 3682 }, { "epoch": 0.29, "learning_rate": 0.0002931456926821233, "loss": 1.8404, "step": 3683 }, { "epoch": 0.29, "learning_rate": 0.00029314199867339676, "loss": 1.8627, "step": 3684 }, { "epoch": 0.29, "learning_rate": 0.00029313830369281506, "loss": 1.8389, "step": 3685 }, { "epoch": 0.29, "learning_rate": 0.0002931346077404033, "loss": 1.8675, "step": 3686 }, { "epoch": 0.29, "learning_rate": 0.00029313091081618653, "loss": 1.9284, "step": 3687 }, { "epoch": 0.29, "learning_rate": 0.0002931272129201899, "loss": 1.8324, "step": 3688 }, { "epoch": 0.29, "learning_rate": 0.0002931235140524384, "loss": 1.8801, "step": 3689 }, { "epoch": 0.29, "learning_rate": 0.0002931198142129573, "loss": 1.849, "step": 3690 }, { "epoch": 0.29, "learning_rate": 0.0002931161134017716, "loss": 1.8711, "step": 3691 }, { "epoch": 0.29, "learning_rate": 0.0002931124116189065, "loss": 1.8488, "step": 3692 }, { "epoch": 0.29, "learning_rate": 0.00029310870886438704, "loss": 1.8538, "step": 3693 }, { "epoch": 0.29, "learning_rate": 0.00029310500513823846, "loss": 1.8574, "step": 3694 }, { "epoch": 0.29, "learning_rate": 0.00029310130044048584, "loss": 1.8426, "step": 3695 }, { "epoch": 0.29, "learning_rate": 0.0002930975947711544, "loss": 1.8836, "step": 3696 }, { "epoch": 0.29, "learning_rate": 0.0002930938881302692, "loss": 1.8923, "step": 3697 }, { "epoch": 0.29, "learning_rate": 0.0002930901805178555, "loss": 1.7752, "step": 3698 }, { "epoch": 0.29, "learning_rate": 0.0002930864719339385, "loss": 1.8493, "step": 3699 }, { "epoch": 0.29, "learning_rate": 0.0002930827623785432, "loss": 1.9699, "step": 3700 }, { "epoch": 0.29, "learning_rate": 0.000293079051851695, "loss": 1.9114, "step": 3701 }, { "epoch": 0.29, "learning_rate": 0.00029307534035341896, "loss": 1.817, "step": 3702 }, { "epoch": 0.29, "learning_rate": 0.00029307162788374033, "loss": 1.8532, "step": 3703 }, { "epoch": 0.29, "learning_rate": 0.00029306791444268427, "loss": 1.8903, "step": 3704 }, { "epoch": 0.29, "learning_rate": 0.00029306420003027603, "loss": 1.8512, "step": 3705 }, { "epoch": 0.29, "learning_rate": 0.0002930604846465408, "loss": 1.8428, "step": 3706 }, { "epoch": 0.29, "learning_rate": 0.0002930567682915039, "loss": 1.8498, "step": 3707 }, { "epoch": 0.29, "learning_rate": 0.00029305305096519044, "loss": 1.8865, "step": 3708 }, { "epoch": 0.29, "learning_rate": 0.00029304933266762574, "loss": 1.8317, "step": 3709 }, { "epoch": 0.29, "learning_rate": 0.00029304561339883495, "loss": 1.9021, "step": 3710 }, { "epoch": 0.29, "learning_rate": 0.00029304189315884345, "loss": 1.8995, "step": 3711 }, { "epoch": 0.29, "learning_rate": 0.00029303817194767633, "loss": 1.8306, "step": 3712 }, { "epoch": 0.29, "learning_rate": 0.0002930344497653591, "loss": 1.8712, "step": 3713 }, { "epoch": 0.29, "learning_rate": 0.0002930307266119168, "loss": 1.829, "step": 3714 }, { "epoch": 0.29, "learning_rate": 0.00029302700248737474, "loss": 1.8647, "step": 3715 }, { "epoch": 0.29, "learning_rate": 0.0002930232773917584, "loss": 1.904, "step": 3716 }, { "epoch": 0.29, "learning_rate": 0.00029301955132509283, "loss": 1.9531, "step": 3717 }, { "epoch": 0.29, "learning_rate": 0.00029301582428740346, "loss": 1.8748, "step": 3718 }, { "epoch": 0.29, "learning_rate": 0.00029301209627871557, "loss": 1.8884, "step": 3719 }, { "epoch": 0.29, "learning_rate": 0.0002930083672990545, "loss": 1.856, "step": 3720 }, { "epoch": 0.29, "learning_rate": 0.0002930046373484455, "loss": 1.8899, "step": 3721 }, { "epoch": 0.29, "learning_rate": 0.00029300090642691396, "loss": 1.8595, "step": 3722 }, { "epoch": 0.29, "learning_rate": 0.00029299717453448514, "loss": 1.8795, "step": 3723 }, { "epoch": 0.29, "learning_rate": 0.0002929934416711844, "loss": 1.8924, "step": 3724 }, { "epoch": 0.29, "learning_rate": 0.00029298970783703715, "loss": 1.8829, "step": 3725 }, { "epoch": 0.29, "learning_rate": 0.00029298597303206866, "loss": 1.92, "step": 3726 }, { "epoch": 0.29, "learning_rate": 0.00029298223725630435, "loss": 1.869, "step": 3727 }, { "epoch": 0.29, "learning_rate": 0.00029297850050976953, "loss": 1.8094, "step": 3728 }, { "epoch": 0.29, "learning_rate": 0.0002929747627924896, "loss": 1.8565, "step": 3729 }, { "epoch": 0.29, "learning_rate": 0.00029297102410448994, "loss": 1.9086, "step": 3730 }, { "epoch": 0.29, "learning_rate": 0.0002929672844457959, "loss": 1.8268, "step": 3731 }, { "epoch": 0.29, "learning_rate": 0.00029296354381643295, "loss": 1.8803, "step": 3732 }, { "epoch": 0.29, "learning_rate": 0.00029295980221642634, "loss": 1.844, "step": 3733 }, { "epoch": 0.29, "learning_rate": 0.0002929560596458016, "loss": 1.8213, "step": 3734 }, { "epoch": 0.29, "learning_rate": 0.00029295231610458416, "loss": 1.8576, "step": 3735 }, { "epoch": 0.29, "learning_rate": 0.00029294857159279937, "loss": 1.8814, "step": 3736 }, { "epoch": 0.29, "learning_rate": 0.0002929448261104726, "loss": 1.8101, "step": 3737 }, { "epoch": 0.29, "learning_rate": 0.0002929410796576294, "loss": 1.874, "step": 3738 }, { "epoch": 0.29, "learning_rate": 0.00029293733223429515, "loss": 1.874, "step": 3739 }, { "epoch": 0.29, "learning_rate": 0.00029293358384049526, "loss": 1.862, "step": 3740 }, { "epoch": 0.29, "learning_rate": 0.0002929298344762552, "loss": 1.888, "step": 3741 }, { "epoch": 0.29, "learning_rate": 0.0002929260841416005, "loss": 1.8313, "step": 3742 }, { "epoch": 0.29, "learning_rate": 0.00029292233283655653, "loss": 1.8884, "step": 3743 }, { "epoch": 0.29, "learning_rate": 0.0002929185805611488, "loss": 1.7404, "step": 3744 }, { "epoch": 0.29, "learning_rate": 0.00029291482731540273, "loss": 1.8953, "step": 3745 }, { "epoch": 0.29, "learning_rate": 0.0002929110730993439, "loss": 1.8435, "step": 3746 }, { "epoch": 0.29, "learning_rate": 0.0002929073179129977, "loss": 1.8881, "step": 3747 }, { "epoch": 0.29, "learning_rate": 0.00029290356175638973, "loss": 1.8059, "step": 3748 }, { "epoch": 0.29, "learning_rate": 0.0002928998046295454, "loss": 1.8443, "step": 3749 }, { "epoch": 0.3, "learning_rate": 0.00029289604653249027, "loss": 1.8498, "step": 3750 }, { "epoch": 0.3, "learning_rate": 0.00029289228746524985, "loss": 1.8566, "step": 3751 }, { "epoch": 0.3, "learning_rate": 0.00029288852742784965, "loss": 1.8801, "step": 3752 }, { "epoch": 0.3, "learning_rate": 0.0002928847664203152, "loss": 1.8613, "step": 3753 }, { "epoch": 0.3, "learning_rate": 0.000292881004442672, "loss": 1.8941, "step": 3754 }, { "epoch": 0.3, "learning_rate": 0.0002928772414949457, "loss": 1.8492, "step": 3755 }, { "epoch": 0.3, "learning_rate": 0.0002928734775771617, "loss": 1.9005, "step": 3756 }, { "epoch": 0.3, "learning_rate": 0.0002928697126893457, "loss": 1.7973, "step": 3757 }, { "epoch": 0.3, "learning_rate": 0.0002928659468315232, "loss": 1.8703, "step": 3758 }, { "epoch": 0.3, "learning_rate": 0.0002928621800037197, "loss": 1.8873, "step": 3759 }, { "epoch": 0.3, "learning_rate": 0.00029285841220596083, "loss": 1.859, "step": 3760 }, { "epoch": 0.3, "learning_rate": 0.00029285464343827217, "loss": 1.8958, "step": 3761 }, { "epoch": 0.3, "learning_rate": 0.0002928508737006794, "loss": 1.8631, "step": 3762 }, { "epoch": 0.3, "learning_rate": 0.000292847102993208, "loss": 1.8544, "step": 3763 }, { "epoch": 0.3, "learning_rate": 0.00029284333131588357, "loss": 1.818, "step": 3764 }, { "epoch": 0.3, "learning_rate": 0.00029283955866873175, "loss": 1.8751, "step": 3765 }, { "epoch": 0.3, "learning_rate": 0.0002928357850517781, "loss": 1.8155, "step": 3766 }, { "epoch": 0.3, "learning_rate": 0.0002928320104650484, "loss": 1.8479, "step": 3767 }, { "epoch": 0.3, "learning_rate": 0.0002928282349085681, "loss": 1.8124, "step": 3768 }, { "epoch": 0.3, "learning_rate": 0.00029282445838236295, "loss": 1.8426, "step": 3769 }, { "epoch": 0.3, "learning_rate": 0.0002928206808864585, "loss": 1.8849, "step": 3770 }, { "epoch": 0.3, "learning_rate": 0.0002928169024208805, "loss": 1.9025, "step": 3771 }, { "epoch": 0.3, "learning_rate": 0.00029281312298565443, "loss": 1.862, "step": 3772 }, { "epoch": 0.3, "learning_rate": 0.00029280934258080617, "loss": 1.8482, "step": 3773 }, { "epoch": 0.3, "learning_rate": 0.00029280556120636126, "loss": 1.8786, "step": 3774 }, { "epoch": 0.3, "learning_rate": 0.0002928017788623454, "loss": 1.8973, "step": 3775 }, { "epoch": 0.3, "learning_rate": 0.0002927979955487843, "loss": 1.8699, "step": 3776 }, { "epoch": 0.3, "learning_rate": 0.00029279421126570353, "loss": 1.9402, "step": 3777 }, { "epoch": 0.3, "learning_rate": 0.0002927904260131289, "loss": 1.8483, "step": 3778 }, { "epoch": 0.3, "learning_rate": 0.00029278663979108606, "loss": 1.8662, "step": 3779 }, { "epoch": 0.3, "learning_rate": 0.0002927828525996008, "loss": 1.8614, "step": 3780 }, { "epoch": 0.3, "learning_rate": 0.0002927790644386987, "loss": 1.8215, "step": 3781 }, { "epoch": 0.3, "learning_rate": 0.0002927752753084055, "loss": 1.8448, "step": 3782 }, { "epoch": 0.3, "learning_rate": 0.0002927714852087471, "loss": 1.8519, "step": 3783 }, { "epoch": 0.3, "learning_rate": 0.00029276769413974903, "loss": 1.872, "step": 3784 }, { "epoch": 0.3, "learning_rate": 0.0002927639021014371, "loss": 1.8297, "step": 3785 }, { "epoch": 0.3, "learning_rate": 0.0002927601090938371, "loss": 1.8768, "step": 3786 }, { "epoch": 0.3, "learning_rate": 0.00029275631511697464, "loss": 1.7995, "step": 3787 }, { "epoch": 0.3, "learning_rate": 0.0002927525201708757, "loss": 1.8407, "step": 3788 }, { "epoch": 0.3, "learning_rate": 0.00029274872425556585, "loss": 1.8582, "step": 3789 }, { "epoch": 0.3, "learning_rate": 0.000292744927371071, "loss": 1.8628, "step": 3790 }, { "epoch": 0.3, "learning_rate": 0.00029274112951741676, "loss": 1.9647, "step": 3791 }, { "epoch": 0.3, "learning_rate": 0.0002927373306946291, "loss": 1.868, "step": 3792 }, { "epoch": 0.3, "learning_rate": 0.0002927335309027337, "loss": 1.8726, "step": 3793 }, { "epoch": 0.3, "learning_rate": 0.00029272973014175644, "loss": 1.9098, "step": 3794 }, { "epoch": 0.3, "learning_rate": 0.00029272592841172307, "loss": 1.8364, "step": 3795 }, { "epoch": 0.3, "learning_rate": 0.0002927221257126594, "loss": 1.8256, "step": 3796 }, { "epoch": 0.3, "learning_rate": 0.0002927183220445912, "loss": 1.8944, "step": 3797 }, { "epoch": 0.3, "learning_rate": 0.0002927145174075444, "loss": 1.8338, "step": 3798 }, { "epoch": 0.3, "learning_rate": 0.0002927107118015448, "loss": 1.8852, "step": 3799 }, { "epoch": 0.3, "learning_rate": 0.0002927069052266182, "loss": 1.8298, "step": 3800 }, { "epoch": 0.3, "learning_rate": 0.00029270309768279046, "loss": 1.9146, "step": 3801 }, { "epoch": 0.3, "learning_rate": 0.00029269928917008745, "loss": 1.8635, "step": 3802 }, { "epoch": 0.3, "learning_rate": 0.00029269547968853503, "loss": 1.8426, "step": 3803 }, { "epoch": 0.3, "learning_rate": 0.000292691669238159, "loss": 1.8323, "step": 3804 }, { "epoch": 0.3, "learning_rate": 0.00029268785781898536, "loss": 1.8685, "step": 3805 }, { "epoch": 0.3, "learning_rate": 0.0002926840454310398, "loss": 1.891, "step": 3806 }, { "epoch": 0.3, "learning_rate": 0.00029268023207434837, "loss": 1.8702, "step": 3807 }, { "epoch": 0.3, "learning_rate": 0.0002926764177489369, "loss": 1.8591, "step": 3808 }, { "epoch": 0.3, "learning_rate": 0.0002926726024548313, "loss": 1.8911, "step": 3809 }, { "epoch": 0.3, "learning_rate": 0.00029266878619205747, "loss": 1.8056, "step": 3810 }, { "epoch": 0.3, "learning_rate": 0.00029266496896064126, "loss": 1.8174, "step": 3811 }, { "epoch": 0.3, "learning_rate": 0.00029266115076060874, "loss": 1.8177, "step": 3812 }, { "epoch": 0.3, "learning_rate": 0.0002926573315919856, "loss": 1.8485, "step": 3813 }, { "epoch": 0.3, "learning_rate": 0.000292653511454798, "loss": 1.8721, "step": 3814 }, { "epoch": 0.3, "learning_rate": 0.00029264969034907177, "loss": 1.8445, "step": 3815 }, { "epoch": 0.3, "learning_rate": 0.0002926458682748328, "loss": 1.8361, "step": 3816 }, { "epoch": 0.3, "learning_rate": 0.00029264204523210714, "loss": 1.8296, "step": 3817 }, { "epoch": 0.3, "learning_rate": 0.00029263822122092077, "loss": 1.855, "step": 3818 }, { "epoch": 0.3, "learning_rate": 0.00029263439624129954, "loss": 1.8652, "step": 3819 }, { "epoch": 0.3, "learning_rate": 0.0002926305702932694, "loss": 1.8488, "step": 3820 }, { "epoch": 0.3, "learning_rate": 0.0002926267433768565, "loss": 1.8527, "step": 3821 }, { "epoch": 0.3, "learning_rate": 0.0002926229154920867, "loss": 1.8861, "step": 3822 }, { "epoch": 0.3, "learning_rate": 0.00029261908663898595, "loss": 1.8709, "step": 3823 }, { "epoch": 0.3, "learning_rate": 0.0002926152568175804, "loss": 1.8831, "step": 3824 }, { "epoch": 0.3, "learning_rate": 0.00029261142602789587, "loss": 1.8761, "step": 3825 }, { "epoch": 0.3, "learning_rate": 0.00029260759426995856, "loss": 1.8517, "step": 3826 }, { "epoch": 0.3, "learning_rate": 0.0002926037615437943, "loss": 1.9022, "step": 3827 }, { "epoch": 0.3, "learning_rate": 0.00029259992784942923, "loss": 1.806, "step": 3828 }, { "epoch": 0.3, "learning_rate": 0.0002925960931868893, "loss": 1.8691, "step": 3829 }, { "epoch": 0.3, "learning_rate": 0.0002925922575562006, "loss": 1.8473, "step": 3830 }, { "epoch": 0.3, "learning_rate": 0.0002925884209573892, "loss": 1.8514, "step": 3831 }, { "epoch": 0.3, "learning_rate": 0.0002925845833904811, "loss": 1.8955, "step": 3832 }, { "epoch": 0.3, "learning_rate": 0.0002925807448555023, "loss": 1.8709, "step": 3833 }, { "epoch": 0.3, "learning_rate": 0.000292576905352479, "loss": 1.8448, "step": 3834 }, { "epoch": 0.3, "learning_rate": 0.00029257306488143716, "loss": 1.8075, "step": 3835 }, { "epoch": 0.3, "learning_rate": 0.0002925692234424029, "loss": 1.8762, "step": 3836 }, { "epoch": 0.3, "learning_rate": 0.00029256538103540223, "loss": 1.8292, "step": 3837 }, { "epoch": 0.3, "learning_rate": 0.00029256153766046134, "loss": 1.9507, "step": 3838 }, { "epoch": 0.3, "learning_rate": 0.0002925576933176063, "loss": 1.8035, "step": 3839 }, { "epoch": 0.3, "learning_rate": 0.0002925538480068632, "loss": 1.8466, "step": 3840 }, { "epoch": 0.3, "learning_rate": 0.00029255000172825814, "loss": 1.8564, "step": 3841 }, { "epoch": 0.3, "learning_rate": 0.00029254615448181723, "loss": 1.9127, "step": 3842 }, { "epoch": 0.3, "learning_rate": 0.00029254230626756656, "loss": 1.9008, "step": 3843 }, { "epoch": 0.3, "learning_rate": 0.0002925384570855323, "loss": 1.891, "step": 3844 }, { "epoch": 0.3, "learning_rate": 0.0002925346069357406, "loss": 1.8517, "step": 3845 }, { "epoch": 0.3, "learning_rate": 0.0002925307558182175, "loss": 1.8328, "step": 3846 }, { "epoch": 0.3, "learning_rate": 0.00029252690373298936, "loss": 1.8778, "step": 3847 }, { "epoch": 0.3, "learning_rate": 0.0002925230506800821, "loss": 1.849, "step": 3848 }, { "epoch": 0.3, "learning_rate": 0.000292519196659522, "loss": 1.7949, "step": 3849 }, { "epoch": 0.3, "learning_rate": 0.0002925153416713352, "loss": 1.8621, "step": 3850 }, { "epoch": 0.3, "learning_rate": 0.0002925114857155479, "loss": 1.8169, "step": 3851 }, { "epoch": 0.3, "learning_rate": 0.00029250762879218624, "loss": 1.8617, "step": 3852 }, { "epoch": 0.3, "learning_rate": 0.0002925037709012764, "loss": 1.8635, "step": 3853 }, { "epoch": 0.3, "learning_rate": 0.0002924999120428446, "loss": 1.7654, "step": 3854 }, { "epoch": 0.3, "learning_rate": 0.00029249605221691704, "loss": 1.9275, "step": 3855 }, { "epoch": 0.3, "learning_rate": 0.00029249219142351993, "loss": 1.827, "step": 3856 }, { "epoch": 0.3, "learning_rate": 0.00029248832966267946, "loss": 1.8968, "step": 3857 }, { "epoch": 0.3, "learning_rate": 0.0002924844669344219, "loss": 1.8314, "step": 3858 }, { "epoch": 0.3, "learning_rate": 0.0002924806032387734, "loss": 1.8248, "step": 3859 }, { "epoch": 0.3, "learning_rate": 0.00029247673857576024, "loss": 1.8873, "step": 3860 }, { "epoch": 0.3, "learning_rate": 0.0002924728729454087, "loss": 1.9098, "step": 3861 }, { "epoch": 0.3, "learning_rate": 0.00029246900634774493, "loss": 1.8833, "step": 3862 }, { "epoch": 0.3, "learning_rate": 0.0002924651387827952, "loss": 1.7776, "step": 3863 }, { "epoch": 0.3, "learning_rate": 0.00029246127025058584, "loss": 1.8054, "step": 3864 }, { "epoch": 0.3, "learning_rate": 0.0002924574007511431, "loss": 1.8603, "step": 3865 }, { "epoch": 0.3, "learning_rate": 0.00029245353028449316, "loss": 1.8335, "step": 3866 }, { "epoch": 0.3, "learning_rate": 0.00029244965885066236, "loss": 1.8673, "step": 3867 }, { "epoch": 0.3, "learning_rate": 0.00029244578644967704, "loss": 1.8386, "step": 3868 }, { "epoch": 0.3, "learning_rate": 0.0002924419130815634, "loss": 1.8698, "step": 3869 }, { "epoch": 0.3, "learning_rate": 0.00029243803874634777, "loss": 1.8466, "step": 3870 }, { "epoch": 0.3, "learning_rate": 0.00029243416344405647, "loss": 1.8565, "step": 3871 }, { "epoch": 0.3, "learning_rate": 0.0002924302871747158, "loss": 1.8851, "step": 3872 }, { "epoch": 0.3, "learning_rate": 0.0002924264099383521, "loss": 1.867, "step": 3873 }, { "epoch": 0.3, "learning_rate": 0.0002924225317349917, "loss": 1.8581, "step": 3874 }, { "epoch": 0.3, "learning_rate": 0.00029241865256466085, "loss": 1.7993, "step": 3875 }, { "epoch": 0.3, "learning_rate": 0.00029241477242738595, "loss": 1.8271, "step": 3876 }, { "epoch": 0.31, "learning_rate": 0.0002924108913231933, "loss": 1.8794, "step": 3877 }, { "epoch": 0.31, "learning_rate": 0.0002924070092521094, "loss": 1.825, "step": 3878 }, { "epoch": 0.31, "learning_rate": 0.00029240312621416043, "loss": 1.8561, "step": 3879 }, { "epoch": 0.31, "learning_rate": 0.0002923992422093728, "loss": 1.8898, "step": 3880 }, { "epoch": 0.31, "learning_rate": 0.0002923953572377729, "loss": 1.8193, "step": 3881 }, { "epoch": 0.31, "learning_rate": 0.0002923914712993871, "loss": 1.8735, "step": 3882 }, { "epoch": 0.31, "learning_rate": 0.0002923875843942418, "loss": 1.8743, "step": 3883 }, { "epoch": 0.31, "learning_rate": 0.0002923836965223634, "loss": 1.8592, "step": 3884 }, { "epoch": 0.31, "learning_rate": 0.00029237980768377826, "loss": 1.836, "step": 3885 }, { "epoch": 0.31, "learning_rate": 0.00029237591787851277, "loss": 1.8578, "step": 3886 }, { "epoch": 0.31, "learning_rate": 0.0002923720271065934, "loss": 1.9073, "step": 3887 }, { "epoch": 0.31, "learning_rate": 0.0002923681353680465, "loss": 1.8586, "step": 3888 }, { "epoch": 0.31, "learning_rate": 0.00029236424266289855, "loss": 1.8829, "step": 3889 }, { "epoch": 0.31, "learning_rate": 0.000292360348991176, "loss": 1.8403, "step": 3890 }, { "epoch": 0.31, "learning_rate": 0.00029235645435290514, "loss": 1.8738, "step": 3891 }, { "epoch": 0.31, "learning_rate": 0.0002923525587481126, "loss": 1.8652, "step": 3892 }, { "epoch": 0.31, "learning_rate": 0.0002923486621768247, "loss": 1.8696, "step": 3893 }, { "epoch": 0.31, "learning_rate": 0.000292344764639068, "loss": 1.8699, "step": 3894 }, { "epoch": 0.31, "learning_rate": 0.00029234086613486883, "loss": 1.8729, "step": 3895 }, { "epoch": 0.31, "learning_rate": 0.0002923369666642537, "loss": 1.8534, "step": 3896 }, { "epoch": 0.31, "learning_rate": 0.0002923330662272492, "loss": 1.8687, "step": 3897 }, { "epoch": 0.31, "learning_rate": 0.0002923291648238817, "loss": 1.8479, "step": 3898 }, { "epoch": 0.31, "learning_rate": 0.0002923252624541777, "loss": 1.8802, "step": 3899 }, { "epoch": 0.31, "learning_rate": 0.0002923213591181637, "loss": 1.9133, "step": 3900 }, { "epoch": 0.31, "learning_rate": 0.00029231745481586623, "loss": 1.8672, "step": 3901 }, { "epoch": 0.31, "learning_rate": 0.0002923135495473118, "loss": 1.8673, "step": 3902 }, { "epoch": 0.31, "learning_rate": 0.0002923096433125269, "loss": 1.836, "step": 3903 }, { "epoch": 0.31, "learning_rate": 0.00029230573611153796, "loss": 1.8305, "step": 3904 }, { "epoch": 0.31, "learning_rate": 0.0002923018279443717, "loss": 1.8459, "step": 3905 }, { "epoch": 0.31, "learning_rate": 0.00029229791881105454, "loss": 1.8325, "step": 3906 }, { "epoch": 0.31, "learning_rate": 0.00029229400871161305, "loss": 1.8472, "step": 3907 }, { "epoch": 0.31, "learning_rate": 0.00029229009764607374, "loss": 1.902, "step": 3908 }, { "epoch": 0.31, "learning_rate": 0.0002922861856144632, "loss": 1.8051, "step": 3909 }, { "epoch": 0.31, "learning_rate": 0.00029228227261680797, "loss": 1.8509, "step": 3910 }, { "epoch": 0.31, "learning_rate": 0.0002922783586531346, "loss": 1.813, "step": 3911 }, { "epoch": 0.31, "learning_rate": 0.0002922744437234698, "loss": 1.8315, "step": 3912 }, { "epoch": 0.31, "learning_rate": 0.00029227052782783994, "loss": 1.8752, "step": 3913 }, { "epoch": 0.31, "learning_rate": 0.0002922666109662717, "loss": 1.8564, "step": 3914 }, { "epoch": 0.31, "learning_rate": 0.00029226269313879175, "loss": 1.8519, "step": 3915 }, { "epoch": 0.31, "learning_rate": 0.00029225877434542653, "loss": 1.8184, "step": 3916 }, { "epoch": 0.31, "learning_rate": 0.0002922548545862028, "loss": 1.8716, "step": 3917 }, { "epoch": 0.31, "learning_rate": 0.00029225093386114713, "loss": 1.8202, "step": 3918 }, { "epoch": 0.31, "learning_rate": 0.00029224701217028603, "loss": 1.8966, "step": 3919 }, { "epoch": 0.31, "learning_rate": 0.0002922430895136463, "loss": 1.8506, "step": 3920 }, { "epoch": 0.31, "learning_rate": 0.0002922391658912545, "loss": 1.8691, "step": 3921 }, { "epoch": 0.31, "learning_rate": 0.0002922352413031372, "loss": 1.8436, "step": 3922 }, { "epoch": 0.31, "learning_rate": 0.0002922313157493211, "loss": 1.792, "step": 3923 }, { "epoch": 0.31, "learning_rate": 0.00029222738922983293, "loss": 1.7931, "step": 3924 }, { "epoch": 0.31, "learning_rate": 0.0002922234617446992, "loss": 1.754, "step": 3925 }, { "epoch": 0.31, "learning_rate": 0.0002922195332939467, "loss": 1.8874, "step": 3926 }, { "epoch": 0.31, "learning_rate": 0.00029221560387760197, "loss": 1.8813, "step": 3927 }, { "epoch": 0.31, "learning_rate": 0.00029221167349569185, "loss": 1.9105, "step": 3928 }, { "epoch": 0.31, "learning_rate": 0.00029220774214824293, "loss": 1.856, "step": 3929 }, { "epoch": 0.31, "learning_rate": 0.0002922038098352819, "loss": 1.844, "step": 3930 }, { "epoch": 0.31, "learning_rate": 0.00029219987655683546, "loss": 1.7764, "step": 3931 }, { "epoch": 0.31, "learning_rate": 0.0002921959423129304, "loss": 1.8349, "step": 3932 }, { "epoch": 0.31, "learning_rate": 0.0002921920071035933, "loss": 1.8148, "step": 3933 }, { "epoch": 0.31, "learning_rate": 0.00029218807092885093, "loss": 1.8308, "step": 3934 }, { "epoch": 0.31, "learning_rate": 0.0002921841337887301, "loss": 1.8505, "step": 3935 }, { "epoch": 0.31, "learning_rate": 0.0002921801956832574, "loss": 1.8759, "step": 3936 }, { "epoch": 0.31, "learning_rate": 0.00029217625661245964, "loss": 1.8894, "step": 3937 }, { "epoch": 0.31, "learning_rate": 0.0002921723165763636, "loss": 1.8152, "step": 3938 }, { "epoch": 0.31, "learning_rate": 0.00029216837557499595, "loss": 1.8482, "step": 3939 }, { "epoch": 0.31, "learning_rate": 0.00029216443360838344, "loss": 1.8373, "step": 3940 }, { "epoch": 0.31, "learning_rate": 0.00029216049067655296, "loss": 1.8775, "step": 3941 }, { "epoch": 0.31, "learning_rate": 0.0002921565467795312, "loss": 1.8865, "step": 3942 }, { "epoch": 0.31, "learning_rate": 0.0002921526019173449, "loss": 1.8498, "step": 3943 }, { "epoch": 0.31, "learning_rate": 0.00029214865609002085, "loss": 1.8118, "step": 3944 }, { "epoch": 0.31, "learning_rate": 0.00029214470929758593, "loss": 1.7787, "step": 3945 }, { "epoch": 0.31, "learning_rate": 0.0002921407615400668, "loss": 1.7834, "step": 3946 }, { "epoch": 0.31, "learning_rate": 0.0002921368128174904, "loss": 1.8167, "step": 3947 }, { "epoch": 0.31, "learning_rate": 0.0002921328631298835, "loss": 1.8576, "step": 3948 }, { "epoch": 0.31, "learning_rate": 0.00029212891247727284, "loss": 1.9214, "step": 3949 }, { "epoch": 0.31, "learning_rate": 0.0002921249608596853, "loss": 1.7998, "step": 3950 }, { "epoch": 0.31, "learning_rate": 0.00029212100827714774, "loss": 1.8263, "step": 3951 }, { "epoch": 0.31, "learning_rate": 0.0002921170547296869, "loss": 1.8745, "step": 3952 }, { "epoch": 0.31, "learning_rate": 0.0002921131002173298, "loss": 1.8482, "step": 3953 }, { "epoch": 0.31, "learning_rate": 0.00029210914474010307, "loss": 1.812, "step": 3954 }, { "epoch": 0.31, "learning_rate": 0.0002921051882980337, "loss": 1.866, "step": 3955 }, { "epoch": 0.31, "learning_rate": 0.0002921012308911486, "loss": 1.8698, "step": 3956 }, { "epoch": 0.31, "learning_rate": 0.00029209727251947444, "loss": 1.788, "step": 3957 }, { "epoch": 0.31, "learning_rate": 0.00029209331318303826, "loss": 1.893, "step": 3958 }, { "epoch": 0.31, "learning_rate": 0.0002920893528818669, "loss": 1.8802, "step": 3959 }, { "epoch": 0.31, "learning_rate": 0.00029208539161598723, "loss": 1.8526, "step": 3960 }, { "epoch": 0.31, "learning_rate": 0.0002920814293854262, "loss": 1.8823, "step": 3961 }, { "epoch": 0.31, "learning_rate": 0.00029207746619021064, "loss": 1.7869, "step": 3962 }, { "epoch": 0.31, "learning_rate": 0.00029207350203036753, "loss": 1.8271, "step": 3963 }, { "epoch": 0.31, "learning_rate": 0.0002920695369059237, "loss": 1.8507, "step": 3964 }, { "epoch": 0.31, "learning_rate": 0.0002920655708169061, "loss": 1.8458, "step": 3965 }, { "epoch": 0.31, "learning_rate": 0.0002920616037633417, "loss": 1.8248, "step": 3966 }, { "epoch": 0.31, "learning_rate": 0.0002920576357452574, "loss": 1.8375, "step": 3967 }, { "epoch": 0.31, "learning_rate": 0.0002920536667626802, "loss": 1.8705, "step": 3968 }, { "epoch": 0.31, "learning_rate": 0.0002920496968156369, "loss": 1.8758, "step": 3969 }, { "epoch": 0.31, "learning_rate": 0.0002920457259041546, "loss": 1.9331, "step": 3970 }, { "epoch": 0.31, "learning_rate": 0.00029204175402826023, "loss": 1.88, "step": 3971 }, { "epoch": 0.31, "learning_rate": 0.00029203778118798066, "loss": 1.8081, "step": 3972 }, { "epoch": 0.31, "learning_rate": 0.00029203380738334304, "loss": 1.8194, "step": 3973 }, { "epoch": 0.31, "learning_rate": 0.00029202983261437417, "loss": 1.766, "step": 3974 }, { "epoch": 0.31, "learning_rate": 0.0002920258568811012, "loss": 1.8967, "step": 3975 }, { "epoch": 0.31, "learning_rate": 0.0002920218801835509, "loss": 1.841, "step": 3976 }, { "epoch": 0.31, "learning_rate": 0.0002920179025217505, "loss": 1.8461, "step": 3977 }, { "epoch": 0.31, "learning_rate": 0.0002920139238957269, "loss": 1.8234, "step": 3978 }, { "epoch": 0.31, "learning_rate": 0.0002920099443055071, "loss": 1.836, "step": 3979 }, { "epoch": 0.31, "learning_rate": 0.0002920059637511182, "loss": 1.8956, "step": 3980 }, { "epoch": 0.31, "learning_rate": 0.0002920019822325871, "loss": 1.8424, "step": 3981 }, { "epoch": 0.31, "learning_rate": 0.000291997999749941, "loss": 1.9107, "step": 3982 }, { "epoch": 0.31, "learning_rate": 0.0002919940163032068, "loss": 1.8974, "step": 3983 }, { "epoch": 0.31, "learning_rate": 0.00029199003189241156, "loss": 1.8247, "step": 3984 }, { "epoch": 0.31, "learning_rate": 0.00029198604651758237, "loss": 1.8514, "step": 3985 }, { "epoch": 0.31, "learning_rate": 0.0002919820601787463, "loss": 1.8121, "step": 3986 }, { "epoch": 0.31, "learning_rate": 0.00029197807287593036, "loss": 1.8386, "step": 3987 }, { "epoch": 0.31, "learning_rate": 0.0002919740846091617, "loss": 1.8565, "step": 3988 }, { "epoch": 0.31, "learning_rate": 0.00029197009537846734, "loss": 1.8284, "step": 3989 }, { "epoch": 0.31, "learning_rate": 0.00029196610518387436, "loss": 1.8269, "step": 3990 }, { "epoch": 0.31, "learning_rate": 0.0002919621140254099, "loss": 1.8224, "step": 3991 }, { "epoch": 0.31, "learning_rate": 0.00029195812190310093, "loss": 1.9385, "step": 3992 }, { "epoch": 0.31, "learning_rate": 0.00029195412881697475, "loss": 1.8048, "step": 3993 }, { "epoch": 0.31, "learning_rate": 0.0002919501347670583, "loss": 1.8459, "step": 3994 }, { "epoch": 0.31, "learning_rate": 0.00029194613975337886, "loss": 1.8197, "step": 3995 }, { "epoch": 0.31, "learning_rate": 0.0002919421437759634, "loss": 1.8354, "step": 3996 }, { "epoch": 0.31, "learning_rate": 0.00029193814683483915, "loss": 1.9004, "step": 3997 }, { "epoch": 0.31, "learning_rate": 0.00029193414893003317, "loss": 1.7746, "step": 3998 }, { "epoch": 0.31, "learning_rate": 0.0002919301500615727, "loss": 1.8108, "step": 3999 }, { "epoch": 0.31, "learning_rate": 0.0002919261502294848, "loss": 1.8784, "step": 4000 }, { "epoch": 0.31, "learning_rate": 0.0002919221494337967, "loss": 1.8941, "step": 4001 }, { "epoch": 0.31, "learning_rate": 0.0002919181476745355, "loss": 1.8358, "step": 4002 }, { "epoch": 0.31, "learning_rate": 0.0002919141449517283, "loss": 1.8212, "step": 4003 }, { "epoch": 0.32, "learning_rate": 0.0002919101412654025, "loss": 1.8864, "step": 4004 }, { "epoch": 0.32, "learning_rate": 0.0002919061366155851, "loss": 1.7775, "step": 4005 }, { "epoch": 0.32, "learning_rate": 0.0002919021310023034, "loss": 1.8573, "step": 4006 }, { "epoch": 0.32, "learning_rate": 0.00029189812442558444, "loss": 1.8247, "step": 4007 }, { "epoch": 0.32, "learning_rate": 0.00029189411688545553, "loss": 1.8642, "step": 4008 }, { "epoch": 0.32, "learning_rate": 0.00029189010838194393, "loss": 1.841, "step": 4009 }, { "epoch": 0.32, "learning_rate": 0.00029188609891507675, "loss": 1.831, "step": 4010 }, { "epoch": 0.32, "learning_rate": 0.0002918820884848813, "loss": 1.8106, "step": 4011 }, { "epoch": 0.32, "learning_rate": 0.0002918780770913848, "loss": 1.8883, "step": 4012 }, { "epoch": 0.32, "learning_rate": 0.0002918740647346144, "loss": 1.8233, "step": 4013 }, { "epoch": 0.32, "learning_rate": 0.00029187005141459736, "loss": 1.883, "step": 4014 }, { "epoch": 0.32, "learning_rate": 0.000291866037131361, "loss": 1.8002, "step": 4015 }, { "epoch": 0.32, "learning_rate": 0.0002918620218849325, "loss": 1.8493, "step": 4016 }, { "epoch": 0.32, "learning_rate": 0.0002918580056753392, "loss": 1.9019, "step": 4017 }, { "epoch": 0.32, "learning_rate": 0.00029185398850260834, "loss": 1.7938, "step": 4018 }, { "epoch": 0.32, "learning_rate": 0.00029184997036676714, "loss": 1.8758, "step": 4019 }, { "epoch": 0.32, "learning_rate": 0.0002918459512678429, "loss": 1.8069, "step": 4020 }, { "epoch": 0.32, "learning_rate": 0.00029184193120586295, "loss": 1.8404, "step": 4021 }, { "epoch": 0.32, "learning_rate": 0.0002918379101808546, "loss": 1.8332, "step": 4022 }, { "epoch": 0.32, "learning_rate": 0.0002918338881928451, "loss": 1.8537, "step": 4023 }, { "epoch": 0.32, "learning_rate": 0.00029182986524186173, "loss": 1.8362, "step": 4024 }, { "epoch": 0.32, "learning_rate": 0.0002918258413279319, "loss": 1.8644, "step": 4025 }, { "epoch": 0.32, "learning_rate": 0.00029182181645108284, "loss": 1.8967, "step": 4026 }, { "epoch": 0.32, "learning_rate": 0.0002918177906113419, "loss": 1.8725, "step": 4027 }, { "epoch": 0.32, "learning_rate": 0.0002918137638087364, "loss": 1.8226, "step": 4028 }, { "epoch": 0.32, "learning_rate": 0.0002918097360432938, "loss": 1.8286, "step": 4029 }, { "epoch": 0.32, "learning_rate": 0.00029180570731504124, "loss": 1.8321, "step": 4030 }, { "epoch": 0.32, "learning_rate": 0.0002918016776240063, "loss": 1.8105, "step": 4031 }, { "epoch": 0.32, "learning_rate": 0.0002917976469702161, "loss": 1.8254, "step": 4032 }, { "epoch": 0.32, "learning_rate": 0.00029179361535369816, "loss": 1.8631, "step": 4033 }, { "epoch": 0.32, "learning_rate": 0.00029178958277447986, "loss": 1.8273, "step": 4034 }, { "epoch": 0.32, "learning_rate": 0.0002917855492325885, "loss": 1.9059, "step": 4035 }, { "epoch": 0.32, "learning_rate": 0.00029178151472805154, "loss": 1.8697, "step": 4036 }, { "epoch": 0.32, "learning_rate": 0.0002917774792608963, "loss": 1.8206, "step": 4037 }, { "epoch": 0.32, "learning_rate": 0.0002917734428311503, "loss": 1.9014, "step": 4038 }, { "epoch": 0.32, "learning_rate": 0.0002917694054388407, "loss": 1.8889, "step": 4039 }, { "epoch": 0.32, "learning_rate": 0.0002917653670839952, "loss": 1.9107, "step": 4040 }, { "epoch": 0.32, "learning_rate": 0.00029176132776664106, "loss": 1.8929, "step": 4041 }, { "epoch": 0.32, "learning_rate": 0.0002917572874868057, "loss": 1.869, "step": 4042 }, { "epoch": 0.32, "learning_rate": 0.0002917532462445166, "loss": 1.7673, "step": 4043 }, { "epoch": 0.32, "learning_rate": 0.0002917492040398012, "loss": 1.8571, "step": 4044 }, { "epoch": 0.32, "learning_rate": 0.00029174516087268696, "loss": 1.8239, "step": 4045 }, { "epoch": 0.32, "learning_rate": 0.00029174111674320124, "loss": 1.8069, "step": 4046 }, { "epoch": 0.32, "learning_rate": 0.00029173707165137166, "loss": 1.8707, "step": 4047 }, { "epoch": 0.32, "learning_rate": 0.0002917330255972254, "loss": 1.7801, "step": 4048 }, { "epoch": 0.32, "learning_rate": 0.0002917289785807903, "loss": 1.8641, "step": 4049 }, { "epoch": 0.32, "learning_rate": 0.00029172493060209353, "loss": 1.8494, "step": 4050 }, { "epoch": 0.32, "learning_rate": 0.00029172088166116273, "loss": 1.869, "step": 4051 }, { "epoch": 0.32, "learning_rate": 0.0002917168317580253, "loss": 1.8661, "step": 4052 }, { "epoch": 0.32, "learning_rate": 0.00029171278089270886, "loss": 1.8223, "step": 4053 }, { "epoch": 0.32, "learning_rate": 0.00029170872906524086, "loss": 1.8009, "step": 4054 }, { "epoch": 0.32, "learning_rate": 0.0002917046762756487, "loss": 1.8605, "step": 4055 }, { "epoch": 0.32, "learning_rate": 0.00029170062252396005, "loss": 1.801, "step": 4056 }, { "epoch": 0.32, "learning_rate": 0.0002916965678102024, "loss": 1.7711, "step": 4057 }, { "epoch": 0.32, "learning_rate": 0.00029169251213440316, "loss": 1.8264, "step": 4058 }, { "epoch": 0.32, "learning_rate": 0.00029168845549659, "loss": 1.8734, "step": 4059 }, { "epoch": 0.32, "learning_rate": 0.00029168439789679045, "loss": 1.8102, "step": 4060 }, { "epoch": 0.32, "learning_rate": 0.00029168033933503197, "loss": 1.8516, "step": 4061 }, { "epoch": 0.32, "learning_rate": 0.00029167627981134216, "loss": 1.8598, "step": 4062 }, { "epoch": 0.32, "learning_rate": 0.0002916722193257487, "loss": 1.8482, "step": 4063 }, { "epoch": 0.32, "learning_rate": 0.00029166815787827895, "loss": 1.8691, "step": 4064 }, { "epoch": 0.32, "learning_rate": 0.0002916640954689606, "loss": 1.831, "step": 4065 }, { "epoch": 0.32, "learning_rate": 0.0002916600320978212, "loss": 1.8533, "step": 4066 }, { "epoch": 0.32, "learning_rate": 0.0002916559677648884, "loss": 1.8217, "step": 4067 }, { "epoch": 0.32, "learning_rate": 0.00029165190247018975, "loss": 1.8062, "step": 4068 }, { "epoch": 0.32, "learning_rate": 0.00029164783621375283, "loss": 1.8218, "step": 4069 }, { "epoch": 0.32, "learning_rate": 0.0002916437689956053, "loss": 1.8081, "step": 4070 }, { "epoch": 0.32, "learning_rate": 0.0002916397008157747, "loss": 1.8535, "step": 4071 }, { "epoch": 0.32, "learning_rate": 0.0002916356316742887, "loss": 1.8399, "step": 4072 }, { "epoch": 0.32, "learning_rate": 0.000291631561571175, "loss": 1.8312, "step": 4073 }, { "epoch": 0.32, "learning_rate": 0.0002916274905064611, "loss": 1.8797, "step": 4074 }, { "epoch": 0.32, "learning_rate": 0.0002916234184801747, "loss": 1.829, "step": 4075 }, { "epoch": 0.32, "learning_rate": 0.0002916193454923434, "loss": 1.8422, "step": 4076 }, { "epoch": 0.32, "learning_rate": 0.00029161527154299496, "loss": 1.829, "step": 4077 }, { "epoch": 0.32, "learning_rate": 0.00029161119663215695, "loss": 1.8705, "step": 4078 }, { "epoch": 0.32, "learning_rate": 0.00029160712075985707, "loss": 1.8188, "step": 4079 }, { "epoch": 0.32, "learning_rate": 0.00029160304392612297, "loss": 1.8445, "step": 4080 }, { "epoch": 0.32, "learning_rate": 0.00029159896613098235, "loss": 1.8625, "step": 4081 }, { "epoch": 0.32, "learning_rate": 0.0002915948873744629, "loss": 1.861, "step": 4082 }, { "epoch": 0.32, "learning_rate": 0.0002915908076565923, "loss": 1.7897, "step": 4083 }, { "epoch": 0.32, "learning_rate": 0.00029158672697739824, "loss": 1.8442, "step": 4084 }, { "epoch": 0.32, "learning_rate": 0.00029158264533690845, "loss": 1.8126, "step": 4085 }, { "epoch": 0.32, "learning_rate": 0.00029157856273515065, "loss": 1.831, "step": 4086 }, { "epoch": 0.32, "learning_rate": 0.0002915744791721525, "loss": 1.825, "step": 4087 }, { "epoch": 0.32, "learning_rate": 0.00029157039464794177, "loss": 1.7813, "step": 4088 }, { "epoch": 0.32, "learning_rate": 0.0002915663091625462, "loss": 1.8904, "step": 4089 }, { "epoch": 0.32, "learning_rate": 0.00029156222271599347, "loss": 1.8006, "step": 4090 }, { "epoch": 0.32, "learning_rate": 0.00029155813530831146, "loss": 1.854, "step": 4091 }, { "epoch": 0.32, "learning_rate": 0.0002915540469395278, "loss": 1.8102, "step": 4092 }, { "epoch": 0.32, "learning_rate": 0.0002915499576096702, "loss": 1.8208, "step": 4093 }, { "epoch": 0.32, "learning_rate": 0.0002915458673187666, "loss": 1.8729, "step": 4094 }, { "epoch": 0.32, "learning_rate": 0.0002915417760668446, "loss": 1.8474, "step": 4095 }, { "epoch": 0.32, "learning_rate": 0.0002915376838539321, "loss": 1.8308, "step": 4096 }, { "epoch": 0.32, "learning_rate": 0.0002915335906800568, "loss": 1.8787, "step": 4097 }, { "epoch": 0.32, "learning_rate": 0.00029152949654524655, "loss": 1.8052, "step": 4098 }, { "epoch": 0.32, "learning_rate": 0.0002915254014495291, "loss": 1.8795, "step": 4099 }, { "epoch": 0.32, "learning_rate": 0.00029152130539293223, "loss": 1.843, "step": 4100 }, { "epoch": 0.32, "learning_rate": 0.0002915172083754839, "loss": 1.7879, "step": 4101 }, { "epoch": 0.32, "learning_rate": 0.00029151311039721174, "loss": 1.8492, "step": 4102 }, { "epoch": 0.32, "learning_rate": 0.0002915090114581437, "loss": 1.7961, "step": 4103 }, { "epoch": 0.32, "learning_rate": 0.0002915049115583075, "loss": 1.7987, "step": 4104 }, { "epoch": 0.32, "learning_rate": 0.0002915008106977311, "loss": 1.8618, "step": 4105 }, { "epoch": 0.32, "learning_rate": 0.0002914967088764423, "loss": 1.7986, "step": 4106 }, { "epoch": 0.32, "learning_rate": 0.00029149260609446885, "loss": 1.8141, "step": 4107 }, { "epoch": 0.32, "learning_rate": 0.00029148850235183874, "loss": 1.8139, "step": 4108 }, { "epoch": 0.32, "learning_rate": 0.00029148439764857976, "loss": 1.8282, "step": 4109 }, { "epoch": 0.32, "learning_rate": 0.00029148029198471987, "loss": 1.8518, "step": 4110 }, { "epoch": 0.32, "learning_rate": 0.0002914761853602868, "loss": 1.8444, "step": 4111 }, { "epoch": 0.32, "learning_rate": 0.00029147207777530847, "loss": 1.8058, "step": 4112 }, { "epoch": 0.32, "learning_rate": 0.00029146796922981284, "loss": 1.8284, "step": 4113 }, { "epoch": 0.32, "learning_rate": 0.00029146385972382777, "loss": 1.8588, "step": 4114 }, { "epoch": 0.32, "learning_rate": 0.00029145974925738117, "loss": 1.8134, "step": 4115 }, { "epoch": 0.32, "learning_rate": 0.00029145563783050096, "loss": 1.8373, "step": 4116 }, { "epoch": 0.32, "learning_rate": 0.000291451525443215, "loss": 1.8968, "step": 4117 }, { "epoch": 0.32, "learning_rate": 0.0002914474120955512, "loss": 1.799, "step": 4118 }, { "epoch": 0.32, "learning_rate": 0.0002914432977875376, "loss": 1.7743, "step": 4119 }, { "epoch": 0.32, "learning_rate": 0.000291439182519202, "loss": 1.8609, "step": 4120 }, { "epoch": 0.32, "learning_rate": 0.00029143506629057247, "loss": 1.8867, "step": 4121 }, { "epoch": 0.32, "learning_rate": 0.0002914309491016769, "loss": 1.8184, "step": 4122 }, { "epoch": 0.32, "learning_rate": 0.0002914268309525431, "loss": 1.8403, "step": 4123 }, { "epoch": 0.32, "learning_rate": 0.0002914227118431993, "loss": 1.8511, "step": 4124 }, { "epoch": 0.32, "learning_rate": 0.0002914185917736733, "loss": 1.8529, "step": 4125 }, { "epoch": 0.32, "learning_rate": 0.0002914144707439931, "loss": 1.7788, "step": 4126 }, { "epoch": 0.32, "learning_rate": 0.00029141034875418664, "loss": 1.8259, "step": 4127 }, { "epoch": 0.32, "learning_rate": 0.000291406225804282, "loss": 1.8663, "step": 4128 }, { "epoch": 0.32, "learning_rate": 0.0002914021018943071, "loss": 1.8524, "step": 4129 }, { "epoch": 0.32, "learning_rate": 0.00029139797702428997, "loss": 1.8832, "step": 4130 }, { "epoch": 0.33, "learning_rate": 0.0002913938511942586, "loss": 1.8616, "step": 4131 }, { "epoch": 0.33, "learning_rate": 0.000291389724404241, "loss": 1.796, "step": 4132 }, { "epoch": 0.33, "learning_rate": 0.0002913855966542652, "loss": 1.8471, "step": 4133 }, { "epoch": 0.33, "learning_rate": 0.0002913814679443592, "loss": 1.8312, "step": 4134 }, { "epoch": 0.33, "learning_rate": 0.00029137733827455106, "loss": 1.8372, "step": 4135 }, { "epoch": 0.33, "learning_rate": 0.00029137320764486885, "loss": 1.8746, "step": 4136 }, { "epoch": 0.33, "learning_rate": 0.00029136907605534055, "loss": 1.8767, "step": 4137 }, { "epoch": 0.33, "learning_rate": 0.00029136494350599426, "loss": 1.848, "step": 4138 }, { "epoch": 0.33, "learning_rate": 0.000291360809996858, "loss": 1.8281, "step": 4139 }, { "epoch": 0.33, "learning_rate": 0.00029135667552795984, "loss": 1.8494, "step": 4140 }, { "epoch": 0.33, "learning_rate": 0.0002913525400993279, "loss": 1.8843, "step": 4141 }, { "epoch": 0.33, "learning_rate": 0.0002913484037109902, "loss": 1.818, "step": 4142 }, { "epoch": 0.33, "learning_rate": 0.0002913442663629748, "loss": 1.8777, "step": 4143 }, { "epoch": 0.33, "learning_rate": 0.0002913401280553098, "loss": 1.8435, "step": 4144 }, { "epoch": 0.33, "learning_rate": 0.0002913359887880234, "loss": 1.8298, "step": 4145 }, { "epoch": 0.33, "learning_rate": 0.00029133184856114364, "loss": 1.874, "step": 4146 }, { "epoch": 0.33, "learning_rate": 0.0002913277073746986, "loss": 1.8049, "step": 4147 }, { "epoch": 0.33, "learning_rate": 0.00029132356522871644, "loss": 1.8207, "step": 4148 }, { "epoch": 0.33, "learning_rate": 0.0002913194221232252, "loss": 1.7602, "step": 4149 }, { "epoch": 0.33, "learning_rate": 0.0002913152780582531, "loss": 1.8272, "step": 4150 }, { "epoch": 0.33, "learning_rate": 0.0002913111330338283, "loss": 1.8178, "step": 4151 }, { "epoch": 0.33, "learning_rate": 0.00029130698704997877, "loss": 1.8068, "step": 4152 }, { "epoch": 0.33, "learning_rate": 0.0002913028401067329, "loss": 1.858, "step": 4153 }, { "epoch": 0.33, "learning_rate": 0.0002912986922041187, "loss": 1.8408, "step": 4154 }, { "epoch": 0.33, "learning_rate": 0.0002912945433421643, "loss": 1.8582, "step": 4155 }, { "epoch": 0.33, "learning_rate": 0.0002912903935208979, "loss": 1.8121, "step": 4156 }, { "epoch": 0.33, "learning_rate": 0.0002912862427403478, "loss": 1.8696, "step": 4157 }, { "epoch": 0.33, "learning_rate": 0.00029128209100054203, "loss": 1.8336, "step": 4158 }, { "epoch": 0.33, "learning_rate": 0.0002912779383015088, "loss": 1.8118, "step": 4159 }, { "epoch": 0.33, "learning_rate": 0.0002912737846432764, "loss": 1.7618, "step": 4160 }, { "epoch": 0.33, "learning_rate": 0.0002912696300258729, "loss": 1.8081, "step": 4161 }, { "epoch": 0.33, "learning_rate": 0.0002912654744493266, "loss": 1.8034, "step": 4162 }, { "epoch": 0.33, "learning_rate": 0.0002912613179136657, "loss": 1.8218, "step": 4163 }, { "epoch": 0.33, "learning_rate": 0.0002912571604189184, "loss": 1.8221, "step": 4164 }, { "epoch": 0.33, "learning_rate": 0.0002912530019651129, "loss": 1.8499, "step": 4165 }, { "epoch": 0.33, "learning_rate": 0.0002912488425522775, "loss": 1.8563, "step": 4166 }, { "epoch": 0.33, "learning_rate": 0.00029124468218044036, "loss": 1.7936, "step": 4167 }, { "epoch": 0.33, "learning_rate": 0.0002912405208496298, "loss": 1.805, "step": 4168 }, { "epoch": 0.33, "learning_rate": 0.00029123635855987407, "loss": 1.7759, "step": 4169 }, { "epoch": 0.33, "learning_rate": 0.0002912321953112014, "loss": 1.8069, "step": 4170 }, { "epoch": 0.33, "learning_rate": 0.00029122803110364005, "loss": 1.8892, "step": 4171 }, { "epoch": 0.33, "learning_rate": 0.00029122386593721827, "loss": 1.8237, "step": 4172 }, { "epoch": 0.33, "learning_rate": 0.00029121969981196446, "loss": 1.7786, "step": 4173 }, { "epoch": 0.33, "learning_rate": 0.00029121553272790676, "loss": 1.8107, "step": 4174 }, { "epoch": 0.33, "learning_rate": 0.0002912113646850735, "loss": 1.8354, "step": 4175 }, { "epoch": 0.33, "learning_rate": 0.00029120719568349304, "loss": 1.86, "step": 4176 }, { "epoch": 0.33, "learning_rate": 0.00029120302572319367, "loss": 1.8529, "step": 4177 }, { "epoch": 0.33, "learning_rate": 0.0002911988548042036, "loss": 1.7874, "step": 4178 }, { "epoch": 0.33, "learning_rate": 0.0002911946829265513, "loss": 1.836, "step": 4179 }, { "epoch": 0.33, "learning_rate": 0.000291190510090265, "loss": 1.8618, "step": 4180 }, { "epoch": 0.33, "learning_rate": 0.00029118633629537303, "loss": 1.8012, "step": 4181 }, { "epoch": 0.33, "learning_rate": 0.00029118216154190373, "loss": 1.8393, "step": 4182 }, { "epoch": 0.33, "learning_rate": 0.0002911779858298855, "loss": 1.8042, "step": 4183 }, { "epoch": 0.33, "learning_rate": 0.0002911738091593467, "loss": 1.8809, "step": 4184 }, { "epoch": 0.33, "learning_rate": 0.0002911696315303156, "loss": 1.8068, "step": 4185 }, { "epoch": 0.33, "learning_rate": 0.0002911654529428206, "loss": 1.8328, "step": 4186 }, { "epoch": 0.33, "learning_rate": 0.0002911612733968901, "loss": 1.8476, "step": 4187 }, { "epoch": 0.33, "learning_rate": 0.0002911570928925524, "loss": 1.8387, "step": 4188 }, { "epoch": 0.33, "learning_rate": 0.000291152911429836, "loss": 1.8801, "step": 4189 }, { "epoch": 0.33, "learning_rate": 0.0002911487290087692, "loss": 1.8209, "step": 4190 }, { "epoch": 0.33, "learning_rate": 0.00029114454562938034, "loss": 1.7969, "step": 4191 }, { "epoch": 0.33, "learning_rate": 0.00029114036129169796, "loss": 1.8709, "step": 4192 }, { "epoch": 0.33, "learning_rate": 0.00029113617599575047, "loss": 1.8111, "step": 4193 }, { "epoch": 0.33, "learning_rate": 0.0002911319897415662, "loss": 1.8563, "step": 4194 }, { "epoch": 0.33, "learning_rate": 0.00029112780252917356, "loss": 1.8322, "step": 4195 }, { "epoch": 0.33, "learning_rate": 0.0002911236143586011, "loss": 1.8328, "step": 4196 }, { "epoch": 0.33, "learning_rate": 0.00029111942522987714, "loss": 1.7964, "step": 4197 }, { "epoch": 0.33, "learning_rate": 0.00029111523514303015, "loss": 1.8114, "step": 4198 }, { "epoch": 0.33, "learning_rate": 0.00029111104409808856, "loss": 1.7836, "step": 4199 }, { "epoch": 0.33, "learning_rate": 0.00029110685209508087, "loss": 1.8988, "step": 4200 }, { "epoch": 0.33, "learning_rate": 0.0002911026591340356, "loss": 1.857, "step": 4201 }, { "epoch": 0.33, "learning_rate": 0.00029109846521498106, "loss": 1.8582, "step": 4202 }, { "epoch": 0.33, "learning_rate": 0.0002910942703379458, "loss": 1.8068, "step": 4203 }, { "epoch": 0.33, "learning_rate": 0.00029109007450295836, "loss": 1.855, "step": 4204 }, { "epoch": 0.33, "learning_rate": 0.0002910858777100471, "loss": 1.8123, "step": 4205 }, { "epoch": 0.33, "learning_rate": 0.00029108167995924066, "loss": 1.7877, "step": 4206 }, { "epoch": 0.33, "learning_rate": 0.00029107748125056744, "loss": 1.8181, "step": 4207 }, { "epoch": 0.33, "learning_rate": 0.00029107328158405597, "loss": 1.7782, "step": 4208 }, { "epoch": 0.33, "learning_rate": 0.00029106908095973477, "loss": 1.8343, "step": 4209 }, { "epoch": 0.33, "learning_rate": 0.00029106487937763235, "loss": 1.8644, "step": 4210 }, { "epoch": 0.33, "learning_rate": 0.0002910606768377772, "loss": 1.8457, "step": 4211 }, { "epoch": 0.33, "learning_rate": 0.000291056473340198, "loss": 1.8691, "step": 4212 }, { "epoch": 0.33, "learning_rate": 0.00029105226888492315, "loss": 1.807, "step": 4213 }, { "epoch": 0.33, "learning_rate": 0.0002910480634719813, "loss": 1.7869, "step": 4214 }, { "epoch": 0.33, "learning_rate": 0.0002910438571014008, "loss": 1.8054, "step": 4215 }, { "epoch": 0.33, "learning_rate": 0.00029103964977321043, "loss": 1.8824, "step": 4216 }, { "epoch": 0.33, "learning_rate": 0.00029103544148743866, "loss": 1.8224, "step": 4217 }, { "epoch": 0.33, "learning_rate": 0.00029103123224411405, "loss": 1.7749, "step": 4218 }, { "epoch": 0.33, "learning_rate": 0.00029102702204326523, "loss": 1.8223, "step": 4219 }, { "epoch": 0.33, "learning_rate": 0.0002910228108849207, "loss": 1.8212, "step": 4220 }, { "epoch": 0.33, "learning_rate": 0.00029101859876910915, "loss": 1.8501, "step": 4221 }, { "epoch": 0.33, "learning_rate": 0.0002910143856958591, "loss": 1.8461, "step": 4222 }, { "epoch": 0.33, "learning_rate": 0.0002910101716651992, "loss": 1.8615, "step": 4223 }, { "epoch": 0.33, "learning_rate": 0.0002910059566771581, "loss": 1.8132, "step": 4224 }, { "epoch": 0.33, "learning_rate": 0.0002910017407317644, "loss": 1.7694, "step": 4225 }, { "epoch": 0.33, "learning_rate": 0.0002909975238290466, "loss": 1.7711, "step": 4226 }, { "epoch": 0.33, "learning_rate": 0.00029099330596903345, "loss": 1.7787, "step": 4227 }, { "epoch": 0.33, "learning_rate": 0.0002909890871517535, "loss": 1.7833, "step": 4228 }, { "epoch": 0.33, "learning_rate": 0.0002909848673772355, "loss": 1.8842, "step": 4229 }, { "epoch": 0.33, "learning_rate": 0.0002909806466455081, "loss": 1.8106, "step": 4230 }, { "epoch": 0.33, "learning_rate": 0.00029097642495659983, "loss": 1.7507, "step": 4231 }, { "epoch": 0.33, "learning_rate": 0.0002909722023105395, "loss": 1.844, "step": 4232 }, { "epoch": 0.33, "learning_rate": 0.0002909679787073557, "loss": 1.7649, "step": 4233 }, { "epoch": 0.33, "learning_rate": 0.00029096375414707713, "loss": 1.8291, "step": 4234 }, { "epoch": 0.33, "learning_rate": 0.0002909595286297324, "loss": 1.8187, "step": 4235 }, { "epoch": 0.33, "learning_rate": 0.0002909553021553503, "loss": 1.8326, "step": 4236 }, { "epoch": 0.33, "learning_rate": 0.00029095107472395946, "loss": 1.8635, "step": 4237 }, { "epoch": 0.33, "learning_rate": 0.0002909468463355886, "loss": 1.7067, "step": 4238 }, { "epoch": 0.33, "learning_rate": 0.0002909426169902665, "loss": 1.8186, "step": 4239 }, { "epoch": 0.33, "learning_rate": 0.00029093838668802174, "loss": 1.7843, "step": 4240 }, { "epoch": 0.33, "learning_rate": 0.0002909341554288831, "loss": 1.8909, "step": 4241 }, { "epoch": 0.33, "learning_rate": 0.0002909299232128794, "loss": 1.8162, "step": 4242 }, { "epoch": 0.33, "learning_rate": 0.00029092569004003925, "loss": 1.7874, "step": 4243 }, { "epoch": 0.33, "learning_rate": 0.00029092145591039145, "loss": 1.8336, "step": 4244 }, { "epoch": 0.33, "learning_rate": 0.00029091722082396466, "loss": 1.8947, "step": 4245 }, { "epoch": 0.33, "learning_rate": 0.0002909129847807878, "loss": 1.858, "step": 4246 }, { "epoch": 0.33, "learning_rate": 0.00029090874778088944, "loss": 1.842, "step": 4247 }, { "epoch": 0.33, "learning_rate": 0.00029090450982429853, "loss": 1.8506, "step": 4248 }, { "epoch": 0.33, "learning_rate": 0.00029090027091104373, "loss": 1.8735, "step": 4249 }, { "epoch": 0.33, "learning_rate": 0.0002908960310411538, "loss": 1.8324, "step": 4250 }, { "epoch": 0.33, "learning_rate": 0.00029089179021465764, "loss": 1.8641, "step": 4251 }, { "epoch": 0.33, "learning_rate": 0.00029088754843158393, "loss": 1.8438, "step": 4252 }, { "epoch": 0.33, "learning_rate": 0.0002908833056919615, "loss": 1.8297, "step": 4253 }, { "epoch": 0.33, "learning_rate": 0.0002908790619958192, "loss": 1.7755, "step": 4254 }, { "epoch": 0.33, "learning_rate": 0.0002908748173431858, "loss": 1.8098, "step": 4255 }, { "epoch": 0.33, "learning_rate": 0.0002908705717340902, "loss": 1.7578, "step": 4256 }, { "epoch": 0.33, "learning_rate": 0.00029086632516856105, "loss": 1.8138, "step": 4257 }, { "epoch": 0.34, "learning_rate": 0.0002908620776466273, "loss": 1.7897, "step": 4258 }, { "epoch": 0.34, "learning_rate": 0.0002908578291683178, "loss": 1.8412, "step": 4259 }, { "epoch": 0.34, "learning_rate": 0.0002908535797336614, "loss": 1.8229, "step": 4260 }, { "epoch": 0.34, "learning_rate": 0.00029084932934268694, "loss": 1.7633, "step": 4261 }, { "epoch": 0.34, "learning_rate": 0.0002908450779954232, "loss": 1.8273, "step": 4262 }, { "epoch": 0.34, "learning_rate": 0.0002908408256918992, "loss": 1.7431, "step": 4263 }, { "epoch": 0.34, "learning_rate": 0.00029083657243214356, "loss": 1.7959, "step": 4264 }, { "epoch": 0.34, "learning_rate": 0.0002908323182161855, "loss": 1.8496, "step": 4265 }, { "epoch": 0.34, "learning_rate": 0.00029082806304405357, "loss": 1.846, "step": 4266 }, { "epoch": 0.34, "learning_rate": 0.0002908238069157769, "loss": 1.8265, "step": 4267 }, { "epoch": 0.34, "learning_rate": 0.0002908195498313842, "loss": 1.8703, "step": 4268 }, { "epoch": 0.34, "learning_rate": 0.0002908152917909045, "loss": 1.8498, "step": 4269 }, { "epoch": 0.34, "learning_rate": 0.0002908110327943667, "loss": 1.9118, "step": 4270 }, { "epoch": 0.34, "learning_rate": 0.00029080677284179973, "loss": 1.8045, "step": 4271 }, { "epoch": 0.34, "learning_rate": 0.0002908025119332324, "loss": 1.8028, "step": 4272 }, { "epoch": 0.34, "learning_rate": 0.00029079825006869377, "loss": 1.8086, "step": 4273 }, { "epoch": 0.34, "learning_rate": 0.00029079398724821267, "loss": 1.8655, "step": 4274 }, { "epoch": 0.34, "learning_rate": 0.00029078972347181816, "loss": 1.7985, "step": 4275 }, { "epoch": 0.34, "learning_rate": 0.00029078545873953903, "loss": 1.7913, "step": 4276 }, { "epoch": 0.34, "learning_rate": 0.00029078119305140445, "loss": 1.8178, "step": 4277 }, { "epoch": 0.34, "learning_rate": 0.00029077692640744313, "loss": 1.8005, "step": 4278 }, { "epoch": 0.34, "learning_rate": 0.00029077265880768426, "loss": 1.7737, "step": 4279 }, { "epoch": 0.34, "learning_rate": 0.0002907683902521567, "loss": 1.8526, "step": 4280 }, { "epoch": 0.34, "learning_rate": 0.00029076412074088945, "loss": 1.8613, "step": 4281 }, { "epoch": 0.34, "learning_rate": 0.00029075985027391147, "loss": 1.8026, "step": 4282 }, { "epoch": 0.34, "learning_rate": 0.00029075557885125183, "loss": 1.8271, "step": 4283 }, { "epoch": 0.34, "learning_rate": 0.00029075130647293943, "loss": 1.9011, "step": 4284 }, { "epoch": 0.34, "learning_rate": 0.00029074703313900337, "loss": 1.8414, "step": 4285 }, { "epoch": 0.34, "learning_rate": 0.0002907427588494726, "loss": 1.8564, "step": 4286 }, { "epoch": 0.34, "learning_rate": 0.0002907384836043762, "loss": 1.799, "step": 4287 }, { "epoch": 0.34, "learning_rate": 0.0002907342074037431, "loss": 1.8486, "step": 4288 }, { "epoch": 0.34, "learning_rate": 0.00029072993024760246, "loss": 1.7983, "step": 4289 }, { "epoch": 0.34, "learning_rate": 0.00029072565213598327, "loss": 1.8479, "step": 4290 }, { "epoch": 0.34, "learning_rate": 0.00029072137306891454, "loss": 1.7729, "step": 4291 }, { "epoch": 0.34, "learning_rate": 0.00029071709304642534, "loss": 1.8505, "step": 4292 }, { "epoch": 0.34, "learning_rate": 0.00029071281206854467, "loss": 1.8609, "step": 4293 }, { "epoch": 0.34, "learning_rate": 0.00029070853013530174, "loss": 1.8116, "step": 4294 }, { "epoch": 0.34, "learning_rate": 0.0002907042472467255, "loss": 1.788, "step": 4295 }, { "epoch": 0.34, "learning_rate": 0.0002906999634028451, "loss": 1.8235, "step": 4296 }, { "epoch": 0.34, "learning_rate": 0.00029069567860368957, "loss": 1.8611, "step": 4297 }, { "epoch": 0.34, "learning_rate": 0.000290691392849288, "loss": 1.8175, "step": 4298 }, { "epoch": 0.34, "learning_rate": 0.00029068710613966957, "loss": 1.8355, "step": 4299 }, { "epoch": 0.34, "learning_rate": 0.0002906828184748633, "loss": 1.8283, "step": 4300 }, { "epoch": 0.34, "learning_rate": 0.0002906785298548983, "loss": 1.8826, "step": 4301 }, { "epoch": 0.34, "learning_rate": 0.00029067424027980375, "loss": 1.8129, "step": 4302 }, { "epoch": 0.34, "learning_rate": 0.00029066994974960873, "loss": 1.8166, "step": 4303 }, { "epoch": 0.34, "learning_rate": 0.00029066565826434235, "loss": 1.8549, "step": 4304 }, { "epoch": 0.34, "learning_rate": 0.0002906613658240338, "loss": 1.8174, "step": 4305 }, { "epoch": 0.34, "learning_rate": 0.0002906570724287122, "loss": 1.8106, "step": 4306 }, { "epoch": 0.34, "learning_rate": 0.00029065277807840674, "loss": 1.8004, "step": 4307 }, { "epoch": 0.34, "learning_rate": 0.0002906484827731465, "loss": 1.8082, "step": 4308 }, { "epoch": 0.34, "learning_rate": 0.0002906441865129607, "loss": 1.886, "step": 4309 }, { "epoch": 0.34, "learning_rate": 0.0002906398892978784, "loss": 1.8306, "step": 4310 }, { "epoch": 0.34, "learning_rate": 0.00029063559112792897, "loss": 1.8504, "step": 4311 }, { "epoch": 0.34, "learning_rate": 0.0002906312920031414, "loss": 1.8163, "step": 4312 }, { "epoch": 0.34, "learning_rate": 0.00029062699192354503, "loss": 1.8453, "step": 4313 }, { "epoch": 0.34, "learning_rate": 0.00029062269088916894, "loss": 1.8644, "step": 4314 }, { "epoch": 0.34, "learning_rate": 0.0002906183889000424, "loss": 1.8102, "step": 4315 }, { "epoch": 0.34, "learning_rate": 0.00029061408595619466, "loss": 1.833, "step": 4316 }, { "epoch": 0.34, "learning_rate": 0.0002906097820576548, "loss": 1.8353, "step": 4317 }, { "epoch": 0.34, "learning_rate": 0.00029060547720445216, "loss": 1.8224, "step": 4318 }, { "epoch": 0.34, "learning_rate": 0.00029060117139661584, "loss": 1.8289, "step": 4319 }, { "epoch": 0.34, "learning_rate": 0.00029059686463417525, "loss": 1.8421, "step": 4320 }, { "epoch": 0.34, "learning_rate": 0.00029059255691715947, "loss": 1.828, "step": 4321 }, { "epoch": 0.34, "learning_rate": 0.0002905882482455979, "loss": 1.8768, "step": 4322 }, { "epoch": 0.34, "learning_rate": 0.0002905839386195196, "loss": 1.801, "step": 4323 }, { "epoch": 0.34, "learning_rate": 0.000290579628038954, "loss": 1.875, "step": 4324 }, { "epoch": 0.34, "learning_rate": 0.0002905753165039303, "loss": 1.7887, "step": 4325 }, { "epoch": 0.34, "learning_rate": 0.00029057100401447776, "loss": 1.8601, "step": 4326 }, { "epoch": 0.34, "learning_rate": 0.00029056669057062566, "loss": 1.8253, "step": 4327 }, { "epoch": 0.34, "learning_rate": 0.00029056237617240335, "loss": 1.8401, "step": 4328 }, { "epoch": 0.34, "learning_rate": 0.00029055806081984006, "loss": 1.8147, "step": 4329 }, { "epoch": 0.34, "learning_rate": 0.0002905537445129651, "loss": 1.7512, "step": 4330 }, { "epoch": 0.34, "learning_rate": 0.00029054942725180774, "loss": 1.8362, "step": 4331 }, { "epoch": 0.34, "learning_rate": 0.0002905451090363974, "loss": 1.7945, "step": 4332 }, { "epoch": 0.34, "learning_rate": 0.0002905407898667633, "loss": 1.8427, "step": 4333 }, { "epoch": 0.34, "learning_rate": 0.0002905364697429348, "loss": 1.876, "step": 4334 }, { "epoch": 0.34, "learning_rate": 0.0002905321486649412, "loss": 1.7892, "step": 4335 }, { "epoch": 0.34, "learning_rate": 0.00029052782663281185, "loss": 1.8326, "step": 4336 }, { "epoch": 0.34, "learning_rate": 0.00029052350364657616, "loss": 1.8425, "step": 4337 }, { "epoch": 0.34, "learning_rate": 0.00029051917970626337, "loss": 1.8235, "step": 4338 }, { "epoch": 0.34, "learning_rate": 0.0002905148548119029, "loss": 1.8193, "step": 4339 }, { "epoch": 0.34, "learning_rate": 0.0002905105289635242, "loss": 1.8139, "step": 4340 }, { "epoch": 0.34, "learning_rate": 0.00029050620216115647, "loss": 1.8453, "step": 4341 }, { "epoch": 0.34, "learning_rate": 0.0002905018744048291, "loss": 1.8247, "step": 4342 }, { "epoch": 0.34, "learning_rate": 0.0002904975456945717, "loss": 1.8265, "step": 4343 }, { "epoch": 0.34, "learning_rate": 0.00029049321603041335, "loss": 1.8214, "step": 4344 }, { "epoch": 0.34, "learning_rate": 0.0002904888854123837, "loss": 1.8205, "step": 4345 }, { "epoch": 0.34, "learning_rate": 0.00029048455384051195, "loss": 1.8065, "step": 4346 }, { "epoch": 0.34, "learning_rate": 0.0002904802213148277, "loss": 1.8372, "step": 4347 }, { "epoch": 0.34, "learning_rate": 0.00029047588783536024, "loss": 1.8195, "step": 4348 }, { "epoch": 0.34, "learning_rate": 0.000290471553402139, "loss": 1.7637, "step": 4349 }, { "epoch": 0.34, "learning_rate": 0.00029046721801519345, "loss": 1.7428, "step": 4350 }, { "epoch": 0.34, "learning_rate": 0.00029046288167455293, "loss": 1.8191, "step": 4351 }, { "epoch": 0.34, "learning_rate": 0.00029045854438024705, "loss": 1.8405, "step": 4352 }, { "epoch": 0.34, "learning_rate": 0.0002904542061323051, "loss": 1.7779, "step": 4353 }, { "epoch": 0.34, "learning_rate": 0.00029044986693075664, "loss": 1.7796, "step": 4354 }, { "epoch": 0.34, "learning_rate": 0.0002904455267756311, "loss": 1.8294, "step": 4355 }, { "epoch": 0.34, "learning_rate": 0.000290441185666958, "loss": 1.8504, "step": 4356 }, { "epoch": 0.34, "learning_rate": 0.00029043684360476665, "loss": 1.7972, "step": 4357 }, { "epoch": 0.34, "learning_rate": 0.00029043250058908665, "loss": 1.8274, "step": 4358 }, { "epoch": 0.34, "learning_rate": 0.00029042815661994744, "loss": 1.836, "step": 4359 }, { "epoch": 0.34, "learning_rate": 0.00029042381169737863, "loss": 1.844, "step": 4360 }, { "epoch": 0.34, "learning_rate": 0.00029041946582140953, "loss": 1.7835, "step": 4361 }, { "epoch": 0.34, "learning_rate": 0.0002904151189920698, "loss": 1.8213, "step": 4362 }, { "epoch": 0.34, "learning_rate": 0.0002904107712093889, "loss": 1.801, "step": 4363 }, { "epoch": 0.34, "learning_rate": 0.0002904064224733963, "loss": 1.7486, "step": 4364 }, { "epoch": 0.34, "learning_rate": 0.00029040207278412165, "loss": 1.7416, "step": 4365 }, { "epoch": 0.34, "learning_rate": 0.0002903977221415944, "loss": 1.8044, "step": 4366 }, { "epoch": 0.34, "learning_rate": 0.00029039337054584407, "loss": 1.877, "step": 4367 }, { "epoch": 0.34, "learning_rate": 0.00029038901799690025, "loss": 1.7891, "step": 4368 }, { "epoch": 0.34, "learning_rate": 0.0002903846644947924, "loss": 1.7928, "step": 4369 }, { "epoch": 0.34, "learning_rate": 0.0002903803100395502, "loss": 1.8563, "step": 4370 }, { "epoch": 0.34, "learning_rate": 0.00029037595463120313, "loss": 1.822, "step": 4371 }, { "epoch": 0.34, "learning_rate": 0.00029037159826978087, "loss": 1.8729, "step": 4372 }, { "epoch": 0.34, "learning_rate": 0.00029036724095531287, "loss": 1.8112, "step": 4373 }, { "epoch": 0.34, "learning_rate": 0.00029036288268782876, "loss": 1.8138, "step": 4374 }, { "epoch": 0.34, "learning_rate": 0.00029035852346735817, "loss": 1.8231, "step": 4375 }, { "epoch": 0.34, "learning_rate": 0.0002903541632939306, "loss": 1.855, "step": 4376 }, { "epoch": 0.34, "learning_rate": 0.0002903498021675758, "loss": 1.7896, "step": 4377 }, { "epoch": 0.34, "learning_rate": 0.0002903454400883232, "loss": 1.8336, "step": 4378 }, { "epoch": 0.34, "learning_rate": 0.0002903410770562026, "loss": 1.8509, "step": 4379 }, { "epoch": 0.34, "learning_rate": 0.00029033671307124347, "loss": 1.8893, "step": 4380 }, { "epoch": 0.34, "learning_rate": 0.0002903323481334755, "loss": 1.8421, "step": 4381 }, { "epoch": 0.34, "learning_rate": 0.0002903279822429284, "loss": 1.7667, "step": 4382 }, { "epoch": 0.34, "learning_rate": 0.0002903236153996317, "loss": 1.8449, "step": 4383 }, { "epoch": 0.34, "learning_rate": 0.00029031924760361506, "loss": 1.8521, "step": 4384 }, { "epoch": 0.35, "learning_rate": 0.0002903148788549082, "loss": 1.8097, "step": 4385 }, { "epoch": 0.35, "learning_rate": 0.00029031050915354073, "loss": 1.8334, "step": 4386 }, { "epoch": 0.35, "learning_rate": 0.00029030613849954234, "loss": 1.7868, "step": 4387 }, { "epoch": 0.35, "learning_rate": 0.0002903017668929427, "loss": 1.7973, "step": 4388 }, { "epoch": 0.35, "learning_rate": 0.00029029739433377144, "loss": 1.7876, "step": 4389 }, { "epoch": 0.35, "learning_rate": 0.00029029302082205833, "loss": 1.8485, "step": 4390 }, { "epoch": 0.35, "learning_rate": 0.000290288646357833, "loss": 1.7981, "step": 4391 }, { "epoch": 0.35, "learning_rate": 0.0002902842709411252, "loss": 1.8453, "step": 4392 }, { "epoch": 0.35, "learning_rate": 0.00029027989457196463, "loss": 1.7526, "step": 4393 }, { "epoch": 0.35, "learning_rate": 0.00029027551725038103, "loss": 1.8156, "step": 4394 }, { "epoch": 0.35, "learning_rate": 0.000290271138976404, "loss": 1.8532, "step": 4395 }, { "epoch": 0.35, "learning_rate": 0.0002902667597500634, "loss": 1.8518, "step": 4396 }, { "epoch": 0.35, "learning_rate": 0.00029026237957138887, "loss": 1.8095, "step": 4397 }, { "epoch": 0.35, "learning_rate": 0.0002902579984404102, "loss": 1.8127, "step": 4398 }, { "epoch": 0.35, "learning_rate": 0.0002902536163571571, "loss": 1.9227, "step": 4399 }, { "epoch": 0.35, "learning_rate": 0.0002902492333216594, "loss": 1.8515, "step": 4400 }, { "epoch": 0.35, "learning_rate": 0.0002902448493339467, "loss": 1.8317, "step": 4401 }, { "epoch": 0.35, "learning_rate": 0.00029024046439404897, "loss": 1.8082, "step": 4402 }, { "epoch": 0.35, "learning_rate": 0.00029023607850199584, "loss": 1.8391, "step": 4403 }, { "epoch": 0.35, "learning_rate": 0.00029023169165781713, "loss": 1.7857, "step": 4404 }, { "epoch": 0.35, "learning_rate": 0.0002902273038615426, "loss": 1.8148, "step": 4405 }, { "epoch": 0.35, "learning_rate": 0.0002902229151132021, "loss": 1.8373, "step": 4406 }, { "epoch": 0.35, "learning_rate": 0.00029021852541282535, "loss": 1.7664, "step": 4407 }, { "epoch": 0.35, "learning_rate": 0.0002902141347604422, "loss": 1.8428, "step": 4408 }, { "epoch": 0.35, "learning_rate": 0.00029020974315608245, "loss": 1.8387, "step": 4409 }, { "epoch": 0.35, "learning_rate": 0.0002902053505997759, "loss": 1.798, "step": 4410 }, { "epoch": 0.35, "learning_rate": 0.00029020095709155245, "loss": 1.8626, "step": 4411 }, { "epoch": 0.35, "learning_rate": 0.0002901965626314418, "loss": 1.8342, "step": 4412 }, { "epoch": 0.35, "learning_rate": 0.0002901921672194739, "loss": 1.8125, "step": 4413 }, { "epoch": 0.35, "learning_rate": 0.0002901877708556785, "loss": 1.8311, "step": 4414 }, { "epoch": 0.35, "learning_rate": 0.0002901833735400856, "loss": 1.8272, "step": 4415 }, { "epoch": 0.35, "learning_rate": 0.00029017897527272487, "loss": 1.794, "step": 4416 }, { "epoch": 0.35, "learning_rate": 0.00029017457605362627, "loss": 1.8291, "step": 4417 }, { "epoch": 0.35, "learning_rate": 0.00029017017588281967, "loss": 1.7967, "step": 4418 }, { "epoch": 0.35, "learning_rate": 0.00029016577476033493, "loss": 1.802, "step": 4419 }, { "epoch": 0.35, "learning_rate": 0.0002901613726862019, "loss": 1.7649, "step": 4420 }, { "epoch": 0.35, "learning_rate": 0.0002901569696604505, "loss": 1.8514, "step": 4421 }, { "epoch": 0.35, "learning_rate": 0.00029015256568311066, "loss": 1.8003, "step": 4422 }, { "epoch": 0.35, "learning_rate": 0.00029014816075421224, "loss": 1.8737, "step": 4423 }, { "epoch": 0.35, "learning_rate": 0.0002901437548737851, "loss": 1.8313, "step": 4424 }, { "epoch": 0.35, "learning_rate": 0.00029013934804185924, "loss": 1.8425, "step": 4425 }, { "epoch": 0.35, "learning_rate": 0.0002901349402584645, "loss": 1.8685, "step": 4426 }, { "epoch": 0.35, "learning_rate": 0.0002901305315236309, "loss": 1.7932, "step": 4427 }, { "epoch": 0.35, "learning_rate": 0.0002901261218373883, "loss": 1.827, "step": 4428 }, { "epoch": 0.35, "learning_rate": 0.0002901217111997666, "loss": 1.798, "step": 4429 }, { "epoch": 0.35, "learning_rate": 0.0002901172996107959, "loss": 1.8167, "step": 4430 }, { "epoch": 0.35, "learning_rate": 0.00029011288707050606, "loss": 1.7968, "step": 4431 }, { "epoch": 0.35, "learning_rate": 0.000290108473578927, "loss": 1.8145, "step": 4432 }, { "epoch": 0.35, "learning_rate": 0.0002901040591360887, "loss": 1.8101, "step": 4433 }, { "epoch": 0.35, "learning_rate": 0.0002900996437420212, "loss": 1.816, "step": 4434 }, { "epoch": 0.35, "learning_rate": 0.0002900952273967544, "loss": 1.8646, "step": 4435 }, { "epoch": 0.35, "learning_rate": 0.0002900908101003184, "loss": 1.8392, "step": 4436 }, { "epoch": 0.35, "learning_rate": 0.00029008639185274296, "loss": 1.8601, "step": 4437 }, { "epoch": 0.35, "learning_rate": 0.0002900819726540583, "loss": 1.8513, "step": 4438 }, { "epoch": 0.35, "learning_rate": 0.00029007755250429434, "loss": 1.8661, "step": 4439 }, { "epoch": 0.35, "learning_rate": 0.00029007313140348115, "loss": 1.7945, "step": 4440 }, { "epoch": 0.35, "learning_rate": 0.00029006870935164864, "loss": 1.8012, "step": 4441 }, { "epoch": 0.35, "learning_rate": 0.0002900642863488269, "loss": 1.7002, "step": 4442 }, { "epoch": 0.35, "learning_rate": 0.00029005986239504596, "loss": 1.82, "step": 4443 }, { "epoch": 0.35, "learning_rate": 0.00029005543749033584, "loss": 1.8443, "step": 4444 }, { "epoch": 0.35, "learning_rate": 0.0002900510116347266, "loss": 1.788, "step": 4445 }, { "epoch": 0.35, "learning_rate": 0.0002900465848282483, "loss": 1.776, "step": 4446 }, { "epoch": 0.35, "learning_rate": 0.0002900421570709309, "loss": 1.8162, "step": 4447 }, { "epoch": 0.35, "learning_rate": 0.0002900377283628046, "loss": 1.8688, "step": 4448 }, { "epoch": 0.35, "learning_rate": 0.0002900332987038994, "loss": 1.8331, "step": 4449 }, { "epoch": 0.35, "learning_rate": 0.00029002886809424537, "loss": 1.8305, "step": 4450 }, { "epoch": 0.35, "learning_rate": 0.0002900244365338725, "loss": 1.8656, "step": 4451 }, { "epoch": 0.35, "learning_rate": 0.0002900200040228111, "loss": 1.8262, "step": 4452 }, { "epoch": 0.35, "learning_rate": 0.0002900155705610911, "loss": 1.8736, "step": 4453 }, { "epoch": 0.35, "learning_rate": 0.0002900111361487427, "loss": 1.7943, "step": 4454 }, { "epoch": 0.35, "learning_rate": 0.0002900067007857959, "loss": 1.8375, "step": 4455 }, { "epoch": 0.35, "learning_rate": 0.00029000226447228086, "loss": 1.8563, "step": 4456 }, { "epoch": 0.35, "learning_rate": 0.0002899978272082277, "loss": 1.8595, "step": 4457 }, { "epoch": 0.35, "learning_rate": 0.0002899933889936666, "loss": 1.8222, "step": 4458 }, { "epoch": 0.35, "learning_rate": 0.00028998894982862756, "loss": 1.8462, "step": 4459 }, { "epoch": 0.35, "learning_rate": 0.00028998450971314086, "loss": 1.7499, "step": 4460 }, { "epoch": 0.35, "learning_rate": 0.00028998006864723656, "loss": 1.8201, "step": 4461 }, { "epoch": 0.35, "learning_rate": 0.0002899756266309449, "loss": 1.8202, "step": 4462 }, { "epoch": 0.35, "learning_rate": 0.00028997118366429594, "loss": 1.8549, "step": 4463 }, { "epoch": 0.35, "learning_rate": 0.00028996673974731983, "loss": 1.8552, "step": 4464 }, { "epoch": 0.35, "learning_rate": 0.00028996229488004687, "loss": 1.8207, "step": 4465 }, { "epoch": 0.35, "learning_rate": 0.0002899578490625072, "loss": 1.8095, "step": 4466 }, { "epoch": 0.35, "learning_rate": 0.00028995340229473086, "loss": 1.7914, "step": 4467 }, { "epoch": 0.35, "learning_rate": 0.0002899489545767482, "loss": 1.8257, "step": 4468 }, { "epoch": 0.35, "learning_rate": 0.0002899445059085894, "loss": 1.8829, "step": 4469 }, { "epoch": 0.35, "learning_rate": 0.0002899400562902846, "loss": 1.8567, "step": 4470 }, { "epoch": 0.35, "learning_rate": 0.00028993560572186406, "loss": 1.8018, "step": 4471 }, { "epoch": 0.35, "learning_rate": 0.000289931154203358, "loss": 1.8089, "step": 4472 }, { "epoch": 0.35, "learning_rate": 0.00028992670173479655, "loss": 1.7933, "step": 4473 }, { "epoch": 0.35, "learning_rate": 0.00028992224831621006, "loss": 1.8504, "step": 4474 }, { "epoch": 0.35, "learning_rate": 0.0002899177939476287, "loss": 1.8004, "step": 4475 }, { "epoch": 0.35, "learning_rate": 0.00028991333862908277, "loss": 1.9034, "step": 4476 }, { "epoch": 0.35, "learning_rate": 0.00028990888236060246, "loss": 1.7895, "step": 4477 }, { "epoch": 0.35, "learning_rate": 0.00028990442514221804, "loss": 1.8233, "step": 4478 }, { "epoch": 0.35, "learning_rate": 0.00028989996697395976, "loss": 1.827, "step": 4479 }, { "epoch": 0.35, "learning_rate": 0.000289895507855858, "loss": 1.8022, "step": 4480 }, { "epoch": 0.35, "learning_rate": 0.00028989104778794284, "loss": 1.7986, "step": 4481 }, { "epoch": 0.35, "learning_rate": 0.0002898865867702447, "loss": 1.8654, "step": 4482 }, { "epoch": 0.35, "learning_rate": 0.0002898821248027938, "loss": 1.8231, "step": 4483 }, { "epoch": 0.35, "learning_rate": 0.0002898776618856205, "loss": 1.8362, "step": 4484 }, { "epoch": 0.35, "learning_rate": 0.0002898731980187551, "loss": 1.7776, "step": 4485 }, { "epoch": 0.35, "learning_rate": 0.0002898687332022278, "loss": 1.823, "step": 4486 }, { "epoch": 0.35, "learning_rate": 0.00028986426743606903, "loss": 1.7367, "step": 4487 }, { "epoch": 0.35, "learning_rate": 0.00028985980072030907, "loss": 1.8646, "step": 4488 }, { "epoch": 0.35, "learning_rate": 0.00028985533305497823, "loss": 1.7639, "step": 4489 }, { "epoch": 0.35, "learning_rate": 0.00028985086444010687, "loss": 1.7981, "step": 4490 }, { "epoch": 0.35, "learning_rate": 0.00028984639487572534, "loss": 1.8374, "step": 4491 }, { "epoch": 0.35, "learning_rate": 0.0002898419243618639, "loss": 1.7646, "step": 4492 }, { "epoch": 0.35, "learning_rate": 0.000289837452898553, "loss": 1.8428, "step": 4493 }, { "epoch": 0.35, "learning_rate": 0.00028983298048582297, "loss": 1.8567, "step": 4494 }, { "epoch": 0.35, "learning_rate": 0.0002898285071237042, "loss": 1.8472, "step": 4495 }, { "epoch": 0.35, "learning_rate": 0.00028982403281222694, "loss": 1.7847, "step": 4496 }, { "epoch": 0.35, "learning_rate": 0.0002898195575514217, "loss": 1.816, "step": 4497 }, { "epoch": 0.35, "learning_rate": 0.00028981508134131884, "loss": 1.8446, "step": 4498 }, { "epoch": 0.35, "learning_rate": 0.0002898106041819487, "loss": 1.8945, "step": 4499 }, { "epoch": 0.35, "learning_rate": 0.00028980612607334174, "loss": 1.7909, "step": 4500 }, { "epoch": 0.35, "learning_rate": 0.00028980164701552835, "loss": 1.8029, "step": 4501 }, { "epoch": 0.35, "learning_rate": 0.00028979716700853895, "loss": 1.8006, "step": 4502 }, { "epoch": 0.35, "learning_rate": 0.0002897926860524039, "loss": 1.8389, "step": 4503 }, { "epoch": 0.35, "learning_rate": 0.0002897882041471536, "loss": 1.7869, "step": 4504 }, { "epoch": 0.35, "learning_rate": 0.0002897837212928186, "loss": 1.7976, "step": 4505 }, { "epoch": 0.35, "learning_rate": 0.00028977923748942926, "loss": 1.8237, "step": 4506 }, { "epoch": 0.35, "learning_rate": 0.000289774752737016, "loss": 1.8069, "step": 4507 }, { "epoch": 0.35, "learning_rate": 0.00028977026703560935, "loss": 1.8889, "step": 4508 }, { "epoch": 0.35, "learning_rate": 0.0002897657803852397, "loss": 1.818, "step": 4509 }, { "epoch": 0.35, "learning_rate": 0.00028976129278593756, "loss": 1.8583, "step": 4510 }, { "epoch": 0.35, "learning_rate": 0.0002897568042377333, "loss": 1.8407, "step": 4511 }, { "epoch": 0.36, "learning_rate": 0.00028975231474065753, "loss": 1.8175, "step": 4512 }, { "epoch": 0.36, "learning_rate": 0.0002897478242947406, "loss": 1.836, "step": 4513 }, { "epoch": 0.36, "learning_rate": 0.0002897433329000131, "loss": 1.8299, "step": 4514 }, { "epoch": 0.36, "learning_rate": 0.00028973884055650547, "loss": 1.8483, "step": 4515 }, { "epoch": 0.36, "learning_rate": 0.00028973434726424827, "loss": 1.7954, "step": 4516 }, { "epoch": 0.36, "learning_rate": 0.00028972985302327194, "loss": 1.8378, "step": 4517 }, { "epoch": 0.36, "learning_rate": 0.000289725357833607, "loss": 1.864, "step": 4518 }, { "epoch": 0.36, "learning_rate": 0.00028972086169528396, "loss": 1.7594, "step": 4519 }, { "epoch": 0.36, "learning_rate": 0.00028971636460833346, "loss": 1.8135, "step": 4520 }, { "epoch": 0.36, "learning_rate": 0.0002897118665727859, "loss": 1.8032, "step": 4521 }, { "epoch": 0.36, "learning_rate": 0.00028970736758867185, "loss": 1.8036, "step": 4522 }, { "epoch": 0.36, "learning_rate": 0.00028970286765602187, "loss": 1.8387, "step": 4523 }, { "epoch": 0.36, "learning_rate": 0.0002896983667748665, "loss": 1.8349, "step": 4524 }, { "epoch": 0.36, "learning_rate": 0.00028969386494523636, "loss": 1.8156, "step": 4525 }, { "epoch": 0.36, "learning_rate": 0.00028968936216716197, "loss": 1.82, "step": 4526 }, { "epoch": 0.36, "learning_rate": 0.00028968485844067386, "loss": 1.7895, "step": 4527 }, { "epoch": 0.36, "learning_rate": 0.0002896803537658027, "loss": 1.829, "step": 4528 }, { "epoch": 0.36, "learning_rate": 0.00028967584814257894, "loss": 1.8054, "step": 4529 }, { "epoch": 0.36, "learning_rate": 0.0002896713415710333, "loss": 1.8469, "step": 4530 }, { "epoch": 0.36, "learning_rate": 0.00028966683405119633, "loss": 1.8108, "step": 4531 }, { "epoch": 0.36, "learning_rate": 0.0002896623255830986, "loss": 1.861, "step": 4532 }, { "epoch": 0.36, "learning_rate": 0.0002896578161667708, "loss": 1.7818, "step": 4533 }, { "epoch": 0.36, "learning_rate": 0.00028965330580224346, "loss": 1.8417, "step": 4534 }, { "epoch": 0.36, "learning_rate": 0.0002896487944895473, "loss": 1.8002, "step": 4535 }, { "epoch": 0.36, "learning_rate": 0.00028964428222871277, "loss": 1.772, "step": 4536 }, { "epoch": 0.36, "learning_rate": 0.0002896397690197707, "loss": 1.8559, "step": 4537 }, { "epoch": 0.36, "learning_rate": 0.00028963525486275167, "loss": 1.8131, "step": 4538 }, { "epoch": 0.36, "learning_rate": 0.0002896307397576863, "loss": 1.8402, "step": 4539 }, { "epoch": 0.36, "learning_rate": 0.00028962622370460526, "loss": 1.8268, "step": 4540 }, { "epoch": 0.36, "learning_rate": 0.0002896217067035392, "loss": 1.7969, "step": 4541 }, { "epoch": 0.36, "learning_rate": 0.00028961718875451884, "loss": 1.7924, "step": 4542 }, { "epoch": 0.36, "learning_rate": 0.00028961266985757475, "loss": 1.806, "step": 4543 }, { "epoch": 0.36, "learning_rate": 0.00028960815001273776, "loss": 1.7866, "step": 4544 }, { "epoch": 0.36, "learning_rate": 0.0002896036292200384, "loss": 1.7923, "step": 4545 }, { "epoch": 0.36, "learning_rate": 0.0002895991074795075, "loss": 1.8208, "step": 4546 }, { "epoch": 0.36, "learning_rate": 0.0002895945847911756, "loss": 1.815, "step": 4547 }, { "epoch": 0.36, "learning_rate": 0.00028959006115507357, "loss": 1.8196, "step": 4548 }, { "epoch": 0.36, "learning_rate": 0.0002895855365712321, "loss": 1.7712, "step": 4549 }, { "epoch": 0.36, "learning_rate": 0.00028958101103968183, "loss": 1.7899, "step": 4550 }, { "epoch": 0.36, "learning_rate": 0.00028957648456045355, "loss": 1.7979, "step": 4551 }, { "epoch": 0.36, "learning_rate": 0.0002895719571335779, "loss": 1.7899, "step": 4552 }, { "epoch": 0.36, "learning_rate": 0.00028956742875908565, "loss": 1.8153, "step": 4553 }, { "epoch": 0.36, "learning_rate": 0.00028956289943700766, "loss": 1.8208, "step": 4554 }, { "epoch": 0.36, "learning_rate": 0.0002895583691673746, "loss": 1.814, "step": 4555 }, { "epoch": 0.36, "learning_rate": 0.0002895538379502172, "loss": 1.8142, "step": 4556 }, { "epoch": 0.36, "learning_rate": 0.00028954930578556625, "loss": 1.8736, "step": 4557 }, { "epoch": 0.36, "learning_rate": 0.0002895447726734526, "loss": 1.8615, "step": 4558 }, { "epoch": 0.36, "learning_rate": 0.0002895402386139068, "loss": 1.7768, "step": 4559 }, { "epoch": 0.36, "learning_rate": 0.0002895357036069599, "loss": 1.7577, "step": 4560 }, { "epoch": 0.36, "learning_rate": 0.00028953116765264257, "loss": 1.7988, "step": 4561 }, { "epoch": 0.36, "learning_rate": 0.0002895266307509856, "loss": 1.8349, "step": 4562 }, { "epoch": 0.36, "learning_rate": 0.00028952209290201975, "loss": 1.8125, "step": 4563 }, { "epoch": 0.36, "learning_rate": 0.00028951755410577595, "loss": 1.8001, "step": 4564 }, { "epoch": 0.36, "learning_rate": 0.00028951301436228494, "loss": 1.794, "step": 4565 }, { "epoch": 0.36, "learning_rate": 0.0002895084736715775, "loss": 1.8407, "step": 4566 }, { "epoch": 0.36, "learning_rate": 0.0002895039320336846, "loss": 1.9048, "step": 4567 }, { "epoch": 0.36, "learning_rate": 0.0002894993894486369, "loss": 1.8221, "step": 4568 }, { "epoch": 0.36, "learning_rate": 0.00028949484591646535, "loss": 1.8239, "step": 4569 }, { "epoch": 0.36, "learning_rate": 0.0002894903014372008, "loss": 1.8562, "step": 4570 }, { "epoch": 0.36, "learning_rate": 0.00028948575601087405, "loss": 1.8169, "step": 4571 }, { "epoch": 0.36, "learning_rate": 0.000289481209637516, "loss": 1.7939, "step": 4572 }, { "epoch": 0.36, "learning_rate": 0.00028947666231715754, "loss": 1.8155, "step": 4573 }, { "epoch": 0.36, "learning_rate": 0.00028947211404982946, "loss": 1.8777, "step": 4574 }, { "epoch": 0.36, "learning_rate": 0.0002894675648355628, "loss": 1.8058, "step": 4575 }, { "epoch": 0.36, "learning_rate": 0.00028946301467438817, "loss": 1.8301, "step": 4576 }, { "epoch": 0.36, "learning_rate": 0.00028945846356633677, "loss": 1.7487, "step": 4577 }, { "epoch": 0.36, "learning_rate": 0.0002894539115114393, "loss": 1.7915, "step": 4578 }, { "epoch": 0.36, "learning_rate": 0.0002894493585097268, "loss": 1.8113, "step": 4579 }, { "epoch": 0.36, "learning_rate": 0.00028944480456123, "loss": 1.7863, "step": 4580 }, { "epoch": 0.36, "learning_rate": 0.00028944024966598, "loss": 1.8151, "step": 4581 }, { "epoch": 0.36, "learning_rate": 0.00028943569382400763, "loss": 1.8631, "step": 4582 }, { "epoch": 0.36, "learning_rate": 0.00028943113703534383, "loss": 1.8099, "step": 4583 }, { "epoch": 0.36, "learning_rate": 0.0002894265793000196, "loss": 1.7975, "step": 4584 }, { "epoch": 0.36, "learning_rate": 0.0002894220206180658, "loss": 1.8831, "step": 4585 }, { "epoch": 0.36, "learning_rate": 0.0002894174609895135, "loss": 1.8068, "step": 4586 }, { "epoch": 0.36, "learning_rate": 0.00028941290041439345, "loss": 1.8035, "step": 4587 }, { "epoch": 0.36, "learning_rate": 0.0002894083388927368, "loss": 1.8669, "step": 4588 }, { "epoch": 0.36, "learning_rate": 0.00028940377642457446, "loss": 1.6967, "step": 4589 }, { "epoch": 0.36, "learning_rate": 0.0002893992130099374, "loss": 1.8192, "step": 4590 }, { "epoch": 0.36, "learning_rate": 0.0002893946486488567, "loss": 1.8273, "step": 4591 }, { "epoch": 0.36, "learning_rate": 0.00028939008334136315, "loss": 1.7473, "step": 4592 }, { "epoch": 0.36, "learning_rate": 0.00028938551708748787, "loss": 1.7773, "step": 4593 }, { "epoch": 0.36, "learning_rate": 0.00028938094988726184, "loss": 1.7582, "step": 4594 }, { "epoch": 0.36, "learning_rate": 0.0002893763817407161, "loss": 1.8074, "step": 4595 }, { "epoch": 0.36, "learning_rate": 0.0002893718126478817, "loss": 1.815, "step": 4596 }, { "epoch": 0.36, "learning_rate": 0.0002893672426087895, "loss": 1.8514, "step": 4597 }, { "epoch": 0.36, "learning_rate": 0.0002893626716234707, "loss": 1.7866, "step": 4598 }, { "epoch": 0.36, "learning_rate": 0.0002893580996919562, "loss": 1.8213, "step": 4599 }, { "epoch": 0.36, "learning_rate": 0.0002893535268142772, "loss": 1.8195, "step": 4600 }, { "epoch": 0.36, "learning_rate": 0.0002893489529904646, "loss": 1.7792, "step": 4601 }, { "epoch": 0.36, "learning_rate": 0.0002893443782205495, "loss": 1.7986, "step": 4602 }, { "epoch": 0.36, "learning_rate": 0.000289339802504563, "loss": 1.7646, "step": 4603 }, { "epoch": 0.36, "learning_rate": 0.0002893352258425361, "loss": 1.8399, "step": 4604 }, { "epoch": 0.36, "learning_rate": 0.00028933064823449996, "loss": 1.7845, "step": 4605 }, { "epoch": 0.36, "learning_rate": 0.00028932606968048557, "loss": 1.7479, "step": 4606 }, { "epoch": 0.36, "learning_rate": 0.00028932149018052404, "loss": 1.8055, "step": 4607 }, { "epoch": 0.36, "learning_rate": 0.0002893169097346465, "loss": 1.8764, "step": 4608 }, { "epoch": 0.36, "learning_rate": 0.00028931232834288403, "loss": 1.7993, "step": 4609 }, { "epoch": 0.36, "learning_rate": 0.00028930774600526775, "loss": 1.8492, "step": 4610 }, { "epoch": 0.36, "learning_rate": 0.0002893031627218287, "loss": 1.8131, "step": 4611 }, { "epoch": 0.36, "learning_rate": 0.00028929857849259807, "loss": 1.8208, "step": 4612 }, { "epoch": 0.36, "learning_rate": 0.0002892939933176069, "loss": 1.7508, "step": 4613 }, { "epoch": 0.36, "learning_rate": 0.0002892894071968865, "loss": 1.8266, "step": 4614 }, { "epoch": 0.36, "learning_rate": 0.00028928482013046783, "loss": 1.7404, "step": 4615 }, { "epoch": 0.36, "learning_rate": 0.00028928023211838213, "loss": 1.8314, "step": 4616 }, { "epoch": 0.36, "learning_rate": 0.0002892756431606605, "loss": 1.8392, "step": 4617 }, { "epoch": 0.36, "learning_rate": 0.00028927105325733405, "loss": 1.7772, "step": 4618 }, { "epoch": 0.36, "learning_rate": 0.00028926646240843407, "loss": 1.8255, "step": 4619 }, { "epoch": 0.36, "learning_rate": 0.0002892618706139917, "loss": 1.8164, "step": 4620 }, { "epoch": 0.36, "learning_rate": 0.000289257277874038, "loss": 1.7905, "step": 4621 }, { "epoch": 0.36, "learning_rate": 0.00028925268418860425, "loss": 1.8816, "step": 4622 }, { "epoch": 0.36, "learning_rate": 0.0002892480895577216, "loss": 1.8072, "step": 4623 }, { "epoch": 0.36, "learning_rate": 0.0002892434939814213, "loss": 1.833, "step": 4624 }, { "epoch": 0.36, "learning_rate": 0.00028923889745973455, "loss": 1.8335, "step": 4625 }, { "epoch": 0.36, "learning_rate": 0.0002892342999926925, "loss": 1.8101, "step": 4626 }, { "epoch": 0.36, "learning_rate": 0.00028922970158032634, "loss": 1.7816, "step": 4627 }, { "epoch": 0.36, "learning_rate": 0.0002892251022226674, "loss": 1.8268, "step": 4628 }, { "epoch": 0.36, "learning_rate": 0.0002892205019197468, "loss": 1.8517, "step": 4629 }, { "epoch": 0.36, "learning_rate": 0.00028921590067159585, "loss": 1.7647, "step": 4630 }, { "epoch": 0.36, "learning_rate": 0.00028921129847824575, "loss": 1.7684, "step": 4631 }, { "epoch": 0.36, "learning_rate": 0.0002892066953397277, "loss": 1.8452, "step": 4632 }, { "epoch": 0.36, "learning_rate": 0.00028920209125607313, "loss": 1.7859, "step": 4633 }, { "epoch": 0.36, "learning_rate": 0.00028919748622731307, "loss": 1.8552, "step": 4634 }, { "epoch": 0.36, "learning_rate": 0.00028919288025347896, "loss": 1.8553, "step": 4635 }, { "epoch": 0.36, "learning_rate": 0.000289188273334602, "loss": 1.7795, "step": 4636 }, { "epoch": 0.36, "learning_rate": 0.00028918366547071346, "loss": 1.8134, "step": 4637 }, { "epoch": 0.36, "learning_rate": 0.0002891790566618446, "loss": 1.7561, "step": 4638 }, { "epoch": 0.37, "learning_rate": 0.00028917444690802687, "loss": 1.8189, "step": 4639 }, { "epoch": 0.37, "learning_rate": 0.00028916983620929135, "loss": 1.7918, "step": 4640 }, { "epoch": 0.37, "learning_rate": 0.00028916522456566947, "loss": 1.826, "step": 4641 }, { "epoch": 0.37, "learning_rate": 0.0002891606119771925, "loss": 1.8461, "step": 4642 }, { "epoch": 0.37, "learning_rate": 0.0002891559984438918, "loss": 1.8024, "step": 4643 }, { "epoch": 0.37, "learning_rate": 0.0002891513839657986, "loss": 1.8398, "step": 4644 }, { "epoch": 0.37, "learning_rate": 0.0002891467685429443, "loss": 1.8423, "step": 4645 }, { "epoch": 0.37, "learning_rate": 0.0002891421521753603, "loss": 1.8324, "step": 4646 }, { "epoch": 0.37, "learning_rate": 0.00028913753486307784, "loss": 1.7454, "step": 4647 }, { "epoch": 0.37, "learning_rate": 0.00028913291660612823, "loss": 1.7958, "step": 4648 }, { "epoch": 0.37, "learning_rate": 0.000289128297404543, "loss": 1.7177, "step": 4649 }, { "epoch": 0.37, "learning_rate": 0.00028912367725835337, "loss": 1.841, "step": 4650 }, { "epoch": 0.37, "learning_rate": 0.00028911905616759077, "loss": 1.8075, "step": 4651 }, { "epoch": 0.37, "learning_rate": 0.00028911443413228647, "loss": 1.829, "step": 4652 }, { "epoch": 0.37, "learning_rate": 0.000289109811152472, "loss": 1.8292, "step": 4653 }, { "epoch": 0.37, "learning_rate": 0.00028910518722817866, "loss": 1.7714, "step": 4654 }, { "epoch": 0.37, "learning_rate": 0.00028910056235943786, "loss": 1.8173, "step": 4655 }, { "epoch": 0.37, "learning_rate": 0.000289095936546281, "loss": 1.7921, "step": 4656 }, { "epoch": 0.37, "learning_rate": 0.00028909130978873953, "loss": 1.8369, "step": 4657 }, { "epoch": 0.37, "learning_rate": 0.00028908668208684477, "loss": 1.8286, "step": 4658 }, { "epoch": 0.37, "learning_rate": 0.00028908205344062825, "loss": 1.8703, "step": 4659 }, { "epoch": 0.37, "learning_rate": 0.0002890774238501213, "loss": 1.7483, "step": 4660 }, { "epoch": 0.37, "learning_rate": 0.0002890727933153554, "loss": 1.772, "step": 4661 }, { "epoch": 0.37, "learning_rate": 0.00028906816183636193, "loss": 1.7914, "step": 4662 }, { "epoch": 0.37, "learning_rate": 0.0002890635294131725, "loss": 1.8308, "step": 4663 }, { "epoch": 0.37, "learning_rate": 0.00028905889604581835, "loss": 1.8577, "step": 4664 }, { "epoch": 0.37, "learning_rate": 0.0002890542617343311, "loss": 1.7471, "step": 4665 }, { "epoch": 0.37, "learning_rate": 0.0002890496264787421, "loss": 1.8125, "step": 4666 }, { "epoch": 0.37, "learning_rate": 0.0002890449902790829, "loss": 1.812, "step": 4667 }, { "epoch": 0.37, "learning_rate": 0.00028904035313538493, "loss": 1.826, "step": 4668 }, { "epoch": 0.37, "learning_rate": 0.00028903571504767964, "loss": 1.7648, "step": 4669 }, { "epoch": 0.37, "learning_rate": 0.0002890310760159986, "loss": 1.8471, "step": 4670 }, { "epoch": 0.37, "learning_rate": 0.00028902643604037336, "loss": 1.7101, "step": 4671 }, { "epoch": 0.37, "learning_rate": 0.00028902179512083526, "loss": 1.7512, "step": 4672 }, { "epoch": 0.37, "learning_rate": 0.0002890171532574159, "loss": 1.7263, "step": 4673 }, { "epoch": 0.37, "learning_rate": 0.00028901251045014684, "loss": 1.7857, "step": 4674 }, { "epoch": 0.37, "learning_rate": 0.0002890078666990595, "loss": 1.7938, "step": 4675 }, { "epoch": 0.37, "learning_rate": 0.00028900322200418546, "loss": 1.7827, "step": 4676 }, { "epoch": 0.37, "learning_rate": 0.00028899857636555625, "loss": 1.7885, "step": 4677 }, { "epoch": 0.37, "learning_rate": 0.0002889939297832034, "loss": 1.7916, "step": 4678 }, { "epoch": 0.37, "learning_rate": 0.0002889892822571585, "loss": 1.8203, "step": 4679 }, { "epoch": 0.37, "learning_rate": 0.000288984633787453, "loss": 1.7507, "step": 4680 }, { "epoch": 0.37, "learning_rate": 0.00028897998437411865, "loss": 1.8344, "step": 4681 }, { "epoch": 0.37, "learning_rate": 0.0002889753340171868, "loss": 1.822, "step": 4682 }, { "epoch": 0.37, "learning_rate": 0.00028897068271668916, "loss": 1.7815, "step": 4683 }, { "epoch": 0.37, "learning_rate": 0.0002889660304726573, "loss": 1.7893, "step": 4684 }, { "epoch": 0.37, "learning_rate": 0.0002889613772851228, "loss": 1.7628, "step": 4685 }, { "epoch": 0.37, "learning_rate": 0.0002889567231541172, "loss": 1.8182, "step": 4686 }, { "epoch": 0.37, "learning_rate": 0.0002889520680796721, "loss": 1.8701, "step": 4687 }, { "epoch": 0.37, "learning_rate": 0.0002889474120618192, "loss": 1.8303, "step": 4688 }, { "epoch": 0.37, "learning_rate": 0.00028894275510059, "loss": 1.8543, "step": 4689 }, { "epoch": 0.37, "learning_rate": 0.0002889380971960162, "loss": 1.8163, "step": 4690 }, { "epoch": 0.37, "learning_rate": 0.00028893343834812934, "loss": 1.7743, "step": 4691 }, { "epoch": 0.37, "learning_rate": 0.0002889287785569611, "loss": 1.712, "step": 4692 }, { "epoch": 0.37, "learning_rate": 0.0002889241178225432, "loss": 1.8191, "step": 4693 }, { "epoch": 0.37, "learning_rate": 0.0002889194561449072, "loss": 1.7361, "step": 4694 }, { "epoch": 0.37, "learning_rate": 0.00028891479352408474, "loss": 1.8117, "step": 4695 }, { "epoch": 0.37, "learning_rate": 0.0002889101299601075, "loss": 1.8042, "step": 4696 }, { "epoch": 0.37, "learning_rate": 0.00028890546545300703, "loss": 1.7966, "step": 4697 }, { "epoch": 0.37, "learning_rate": 0.0002889008000028152, "loss": 1.818, "step": 4698 }, { "epoch": 0.37, "learning_rate": 0.0002888961336095636, "loss": 1.7468, "step": 4699 }, { "epoch": 0.37, "learning_rate": 0.00028889146627328387, "loss": 1.7971, "step": 4700 }, { "epoch": 0.37, "learning_rate": 0.0002888867979940077, "loss": 1.7627, "step": 4701 }, { "epoch": 0.37, "learning_rate": 0.00028888212877176687, "loss": 1.842, "step": 4702 }, { "epoch": 0.37, "learning_rate": 0.000288877458606593, "loss": 1.8189, "step": 4703 }, { "epoch": 0.37, "learning_rate": 0.00028887278749851786, "loss": 1.7951, "step": 4704 }, { "epoch": 0.37, "learning_rate": 0.00028886811544757306, "loss": 1.8356, "step": 4705 }, { "epoch": 0.37, "learning_rate": 0.00028886344245379045, "loss": 1.8014, "step": 4706 }, { "epoch": 0.37, "learning_rate": 0.00028885876851720166, "loss": 1.7681, "step": 4707 }, { "epoch": 0.37, "learning_rate": 0.0002888540936378385, "loss": 1.7059, "step": 4708 }, { "epoch": 0.37, "learning_rate": 0.0002888494178157327, "loss": 1.7773, "step": 4709 }, { "epoch": 0.37, "learning_rate": 0.00028884474105091585, "loss": 1.8534, "step": 4710 }, { "epoch": 0.37, "learning_rate": 0.0002888400633434199, "loss": 1.8177, "step": 4711 }, { "epoch": 0.37, "learning_rate": 0.00028883538469327656, "loss": 1.8232, "step": 4712 }, { "epoch": 0.37, "learning_rate": 0.0002888307051005176, "loss": 1.7937, "step": 4713 }, { "epoch": 0.37, "learning_rate": 0.00028882602456517466, "loss": 1.7905, "step": 4714 }, { "epoch": 0.37, "learning_rate": 0.00028882134308727976, "loss": 1.7682, "step": 4715 }, { "epoch": 0.37, "learning_rate": 0.00028881666066686443, "loss": 1.8225, "step": 4716 }, { "epoch": 0.37, "learning_rate": 0.0002888119773039606, "loss": 1.7569, "step": 4717 }, { "epoch": 0.37, "learning_rate": 0.00028880729299860013, "loss": 1.8131, "step": 4718 }, { "epoch": 0.37, "learning_rate": 0.00028880260775081463, "loss": 1.8011, "step": 4719 }, { "epoch": 0.37, "learning_rate": 0.0002887979215606361, "loss": 1.7736, "step": 4720 }, { "epoch": 0.37, "learning_rate": 0.0002887932344280962, "loss": 1.8222, "step": 4721 }, { "epoch": 0.37, "learning_rate": 0.00028878854635322693, "loss": 1.7705, "step": 4722 }, { "epoch": 0.37, "learning_rate": 0.00028878385733606, "loss": 1.8099, "step": 4723 }, { "epoch": 0.37, "learning_rate": 0.0002887791673766272, "loss": 1.7923, "step": 4724 }, { "epoch": 0.37, "learning_rate": 0.00028877447647496045, "loss": 1.7516, "step": 4725 }, { "epoch": 0.37, "learning_rate": 0.0002887697846310916, "loss": 1.7975, "step": 4726 }, { "epoch": 0.37, "learning_rate": 0.0002887650918450525, "loss": 1.8161, "step": 4727 }, { "epoch": 0.37, "learning_rate": 0.00028876039811687507, "loss": 1.7986, "step": 4728 }, { "epoch": 0.37, "learning_rate": 0.00028875570344659104, "loss": 1.8068, "step": 4729 }, { "epoch": 0.37, "learning_rate": 0.00028875100783423235, "loss": 1.8103, "step": 4730 }, { "epoch": 0.37, "learning_rate": 0.0002887463112798309, "loss": 1.7722, "step": 4731 }, { "epoch": 0.37, "learning_rate": 0.0002887416137834186, "loss": 1.7677, "step": 4732 }, { "epoch": 0.37, "learning_rate": 0.00028873691534502725, "loss": 1.8155, "step": 4733 }, { "epoch": 0.37, "learning_rate": 0.00028873221596468877, "loss": 1.7977, "step": 4734 }, { "epoch": 0.37, "learning_rate": 0.0002887275156424352, "loss": 1.792, "step": 4735 }, { "epoch": 0.37, "learning_rate": 0.0002887228143782983, "loss": 1.7955, "step": 4736 }, { "epoch": 0.37, "learning_rate": 0.00028871811217231005, "loss": 1.7112, "step": 4737 }, { "epoch": 0.37, "learning_rate": 0.0002887134090245024, "loss": 1.8203, "step": 4738 }, { "epoch": 0.37, "learning_rate": 0.0002887087049349072, "loss": 1.806, "step": 4739 }, { "epoch": 0.37, "learning_rate": 0.00028870399990355646, "loss": 1.8295, "step": 4740 }, { "epoch": 0.37, "learning_rate": 0.0002886992939304821, "loss": 1.7846, "step": 4741 }, { "epoch": 0.37, "learning_rate": 0.0002886945870157161, "loss": 1.8022, "step": 4742 }, { "epoch": 0.37, "learning_rate": 0.00028868987915929036, "loss": 1.8358, "step": 4743 }, { "epoch": 0.37, "learning_rate": 0.0002886851703612369, "loss": 1.7986, "step": 4744 }, { "epoch": 0.37, "learning_rate": 0.0002886804606215877, "loss": 1.7864, "step": 4745 }, { "epoch": 0.37, "learning_rate": 0.0002886757499403747, "loss": 1.7876, "step": 4746 }, { "epoch": 0.37, "learning_rate": 0.0002886710383176298, "loss": 1.8322, "step": 4747 }, { "epoch": 0.37, "learning_rate": 0.00028866632575338507, "loss": 1.7673, "step": 4748 }, { "epoch": 0.37, "learning_rate": 0.0002886616122476726, "loss": 1.8106, "step": 4749 }, { "epoch": 0.37, "learning_rate": 0.0002886568978005243, "loss": 1.8079, "step": 4750 }, { "epoch": 0.37, "learning_rate": 0.0002886521824119721, "loss": 1.7671, "step": 4751 }, { "epoch": 0.37, "learning_rate": 0.0002886474660820482, "loss": 1.8391, "step": 4752 }, { "epoch": 0.37, "learning_rate": 0.0002886427488107844, "loss": 1.8542, "step": 4753 }, { "epoch": 0.37, "learning_rate": 0.0002886380305982129, "loss": 1.804, "step": 4754 }, { "epoch": 0.37, "learning_rate": 0.0002886333114443657, "loss": 1.7814, "step": 4755 }, { "epoch": 0.37, "learning_rate": 0.0002886285913492748, "loss": 1.7655, "step": 4756 }, { "epoch": 0.37, "learning_rate": 0.00028862387031297225, "loss": 1.7695, "step": 4757 }, { "epoch": 0.37, "learning_rate": 0.00028861914833549015, "loss": 1.8054, "step": 4758 }, { "epoch": 0.37, "learning_rate": 0.0002886144254168605, "loss": 1.7923, "step": 4759 }, { "epoch": 0.37, "learning_rate": 0.0002886097015571154, "loss": 1.7651, "step": 4760 }, { "epoch": 0.37, "learning_rate": 0.000288604976756287, "loss": 1.8352, "step": 4761 }, { "epoch": 0.37, "learning_rate": 0.0002886002510144072, "loss": 1.8203, "step": 4762 }, { "epoch": 0.37, "learning_rate": 0.0002885955243315082, "loss": 1.8422, "step": 4763 }, { "epoch": 0.37, "learning_rate": 0.00028859079670762205, "loss": 1.8041, "step": 4764 }, { "epoch": 0.37, "learning_rate": 0.00028858606814278093, "loss": 1.7881, "step": 4765 }, { "epoch": 0.37, "learning_rate": 0.00028858133863701686, "loss": 1.7745, "step": 4766 }, { "epoch": 0.38, "learning_rate": 0.0002885766081903619, "loss": 1.7966, "step": 4767 }, { "epoch": 0.38, "learning_rate": 0.00028857187680284837, "loss": 1.8001, "step": 4768 }, { "epoch": 0.38, "learning_rate": 0.00028856714447450825, "loss": 1.7806, "step": 4769 }, { "epoch": 0.38, "learning_rate": 0.00028856241120537365, "loss": 1.8594, "step": 4770 }, { "epoch": 0.38, "learning_rate": 0.0002885576769954767, "loss": 1.761, "step": 4771 }, { "epoch": 0.38, "learning_rate": 0.00028855294184484964, "loss": 1.77, "step": 4772 }, { "epoch": 0.38, "learning_rate": 0.0002885482057535246, "loss": 1.7815, "step": 4773 }, { "epoch": 0.38, "learning_rate": 0.00028854346872153364, "loss": 1.7617, "step": 4774 }, { "epoch": 0.38, "learning_rate": 0.000288538730748909, "loss": 1.8032, "step": 4775 }, { "epoch": 0.38, "learning_rate": 0.0002885339918356828, "loss": 1.801, "step": 4776 }, { "epoch": 0.38, "learning_rate": 0.0002885292519818873, "loss": 1.8203, "step": 4777 }, { "epoch": 0.38, "learning_rate": 0.00028852451118755454, "loss": 1.7875, "step": 4778 }, { "epoch": 0.38, "learning_rate": 0.0002885197694527169, "loss": 1.8158, "step": 4779 }, { "epoch": 0.38, "learning_rate": 0.0002885150267774064, "loss": 1.8066, "step": 4780 }, { "epoch": 0.38, "learning_rate": 0.0002885102831616553, "loss": 1.8133, "step": 4781 }, { "epoch": 0.38, "learning_rate": 0.00028850553860549586, "loss": 1.7745, "step": 4782 }, { "epoch": 0.38, "learning_rate": 0.0002885007931089602, "loss": 1.7416, "step": 4783 }, { "epoch": 0.38, "learning_rate": 0.0002884960466720806, "loss": 1.8859, "step": 4784 }, { "epoch": 0.38, "learning_rate": 0.0002884912992948893, "loss": 1.861, "step": 4785 }, { "epoch": 0.38, "learning_rate": 0.0002884865509774185, "loss": 1.7552, "step": 4786 }, { "epoch": 0.38, "learning_rate": 0.00028848180171970044, "loss": 1.7779, "step": 4787 }, { "epoch": 0.38, "learning_rate": 0.00028847705152176736, "loss": 1.778, "step": 4788 }, { "epoch": 0.38, "learning_rate": 0.0002884723003836515, "loss": 1.7081, "step": 4789 }, { "epoch": 0.38, "learning_rate": 0.00028846754830538513, "loss": 1.7803, "step": 4790 }, { "epoch": 0.38, "learning_rate": 0.0002884627952870006, "loss": 1.8038, "step": 4791 }, { "epoch": 0.38, "learning_rate": 0.00028845804132853, "loss": 1.7678, "step": 4792 }, { "epoch": 0.38, "learning_rate": 0.00028845328643000573, "loss": 1.7839, "step": 4793 }, { "epoch": 0.38, "learning_rate": 0.00028844853059146005, "loss": 1.8119, "step": 4794 }, { "epoch": 0.38, "learning_rate": 0.0002884437738129253, "loss": 1.8146, "step": 4795 }, { "epoch": 0.38, "learning_rate": 0.0002884390160944337, "loss": 1.7748, "step": 4796 }, { "epoch": 0.38, "learning_rate": 0.00028843425743601755, "loss": 1.755, "step": 4797 }, { "epoch": 0.38, "learning_rate": 0.0002884294978377092, "loss": 1.7539, "step": 4798 }, { "epoch": 0.38, "learning_rate": 0.000288424737299541, "loss": 1.7808, "step": 4799 }, { "epoch": 0.38, "learning_rate": 0.00028841997582154514, "loss": 1.7585, "step": 4800 }, { "epoch": 0.38, "learning_rate": 0.00028841521340375407, "loss": 1.8091, "step": 4801 }, { "epoch": 0.38, "learning_rate": 0.0002884104500462001, "loss": 1.8117, "step": 4802 }, { "epoch": 0.38, "learning_rate": 0.0002884056857489155, "loss": 1.777, "step": 4803 }, { "epoch": 0.38, "learning_rate": 0.00028840092051193275, "loss": 1.8239, "step": 4804 }, { "epoch": 0.38, "learning_rate": 0.00028839615433528404, "loss": 1.8121, "step": 4805 }, { "epoch": 0.38, "learning_rate": 0.00028839138721900186, "loss": 1.816, "step": 4806 }, { "epoch": 0.38, "learning_rate": 0.0002883866191631185, "loss": 1.7842, "step": 4807 }, { "epoch": 0.38, "learning_rate": 0.00028838185016766645, "loss": 1.769, "step": 4808 }, { "epoch": 0.38, "learning_rate": 0.00028837708023267796, "loss": 1.7576, "step": 4809 }, { "epoch": 0.38, "learning_rate": 0.00028837230935818545, "loss": 1.7769, "step": 4810 }, { "epoch": 0.38, "learning_rate": 0.0002883675375442213, "loss": 1.7792, "step": 4811 }, { "epoch": 0.38, "learning_rate": 0.00028836276479081793, "loss": 1.8199, "step": 4812 }, { "epoch": 0.38, "learning_rate": 0.00028835799109800774, "loss": 1.7742, "step": 4813 }, { "epoch": 0.38, "learning_rate": 0.0002883532164658232, "loss": 1.7833, "step": 4814 }, { "epoch": 0.38, "learning_rate": 0.00028834844089429667, "loss": 1.7666, "step": 4815 }, { "epoch": 0.38, "learning_rate": 0.0002883436643834605, "loss": 1.7969, "step": 4816 }, { "epoch": 0.38, "learning_rate": 0.0002883388869333472, "loss": 1.8637, "step": 4817 }, { "epoch": 0.38, "learning_rate": 0.00028833410854398923, "loss": 1.7467, "step": 4818 }, { "epoch": 0.38, "learning_rate": 0.000288329329215419, "loss": 1.8169, "step": 4819 }, { "epoch": 0.38, "learning_rate": 0.00028832454894766896, "loss": 1.7436, "step": 4820 }, { "epoch": 0.38, "learning_rate": 0.00028831976774077155, "loss": 1.7133, "step": 4821 }, { "epoch": 0.38, "learning_rate": 0.0002883149855947593, "loss": 1.7767, "step": 4822 }, { "epoch": 0.38, "learning_rate": 0.0002883102025096646, "loss": 1.7656, "step": 4823 }, { "epoch": 0.38, "learning_rate": 0.00028830541848551993, "loss": 1.7672, "step": 4824 }, { "epoch": 0.38, "learning_rate": 0.0002883006335223578, "loss": 1.7811, "step": 4825 }, { "epoch": 0.38, "learning_rate": 0.00028829584762021066, "loss": 1.7971, "step": 4826 }, { "epoch": 0.38, "learning_rate": 0.0002882910607791111, "loss": 1.7755, "step": 4827 }, { "epoch": 0.38, "learning_rate": 0.0002882862729990915, "loss": 1.7661, "step": 4828 }, { "epoch": 0.38, "learning_rate": 0.0002882814842801844, "loss": 1.8277, "step": 4829 }, { "epoch": 0.38, "learning_rate": 0.0002882766946224224, "loss": 1.775, "step": 4830 }, { "epoch": 0.38, "learning_rate": 0.0002882719040258379, "loss": 1.8319, "step": 4831 }, { "epoch": 0.38, "learning_rate": 0.00028826711249046354, "loss": 1.8119, "step": 4832 }, { "epoch": 0.38, "learning_rate": 0.0002882623200163317, "loss": 1.8511, "step": 4833 }, { "epoch": 0.38, "learning_rate": 0.00028825752660347506, "loss": 1.7976, "step": 4834 }, { "epoch": 0.38, "learning_rate": 0.0002882527322519261, "loss": 1.8648, "step": 4835 }, { "epoch": 0.38, "learning_rate": 0.0002882479369617174, "loss": 1.7874, "step": 4836 }, { "epoch": 0.38, "learning_rate": 0.0002882431407328815, "loss": 1.8605, "step": 4837 }, { "epoch": 0.38, "learning_rate": 0.00028823834356545095, "loss": 1.7908, "step": 4838 }, { "epoch": 0.38, "learning_rate": 0.0002882335454594583, "loss": 1.7928, "step": 4839 }, { "epoch": 0.38, "learning_rate": 0.00028822874641493617, "loss": 1.8122, "step": 4840 }, { "epoch": 0.38, "learning_rate": 0.0002882239464319172, "loss": 1.7979, "step": 4841 }, { "epoch": 0.38, "learning_rate": 0.0002882191455104338, "loss": 1.7467, "step": 4842 }, { "epoch": 0.38, "learning_rate": 0.0002882143436505188, "loss": 1.7766, "step": 4843 }, { "epoch": 0.38, "learning_rate": 0.00028820954085220465, "loss": 1.7871, "step": 4844 }, { "epoch": 0.38, "learning_rate": 0.0002882047371155239, "loss": 1.8, "step": 4845 }, { "epoch": 0.38, "learning_rate": 0.00028819993244050935, "loss": 1.8039, "step": 4846 }, { "epoch": 0.38, "learning_rate": 0.0002881951268271935, "loss": 1.75, "step": 4847 }, { "epoch": 0.38, "learning_rate": 0.000288190320275609, "loss": 1.7957, "step": 4848 }, { "epoch": 0.38, "learning_rate": 0.00028818551278578843, "loss": 1.7825, "step": 4849 }, { "epoch": 0.38, "learning_rate": 0.0002881807043577645, "loss": 1.8029, "step": 4850 }, { "epoch": 0.38, "learning_rate": 0.0002881758949915699, "loss": 1.8182, "step": 4851 }, { "epoch": 0.38, "learning_rate": 0.0002881710846872372, "loss": 1.8009, "step": 4852 }, { "epoch": 0.38, "learning_rate": 0.00028816627344479905, "loss": 1.8021, "step": 4853 }, { "epoch": 0.38, "learning_rate": 0.0002881614612642882, "loss": 1.8097, "step": 4854 }, { "epoch": 0.38, "learning_rate": 0.00028815664814573725, "loss": 1.7896, "step": 4855 }, { "epoch": 0.38, "learning_rate": 0.00028815183408917886, "loss": 1.8043, "step": 4856 }, { "epoch": 0.38, "learning_rate": 0.00028814701909464583, "loss": 1.7569, "step": 4857 }, { "epoch": 0.38, "learning_rate": 0.00028814220316217076, "loss": 1.7645, "step": 4858 }, { "epoch": 0.38, "learning_rate": 0.0002881373862917863, "loss": 1.8029, "step": 4859 }, { "epoch": 0.38, "learning_rate": 0.0002881325684835253, "loss": 1.7755, "step": 4860 }, { "epoch": 0.38, "learning_rate": 0.00028812774973742037, "loss": 1.7902, "step": 4861 }, { "epoch": 0.38, "learning_rate": 0.0002881229300535042, "loss": 1.8395, "step": 4862 }, { "epoch": 0.38, "learning_rate": 0.00028811810943180956, "loss": 1.7544, "step": 4863 }, { "epoch": 0.38, "learning_rate": 0.0002881132878723692, "loss": 1.7848, "step": 4864 }, { "epoch": 0.38, "learning_rate": 0.0002881084653752158, "loss": 1.8153, "step": 4865 }, { "epoch": 0.38, "learning_rate": 0.0002881036419403822, "loss": 1.8466, "step": 4866 }, { "epoch": 0.38, "learning_rate": 0.00028809881756790105, "loss": 1.8011, "step": 4867 }, { "epoch": 0.38, "learning_rate": 0.00028809399225780517, "loss": 1.7682, "step": 4868 }, { "epoch": 0.38, "learning_rate": 0.00028808916601012725, "loss": 1.7618, "step": 4869 }, { "epoch": 0.38, "learning_rate": 0.0002880843388249001, "loss": 1.8203, "step": 4870 }, { "epoch": 0.38, "learning_rate": 0.00028807951070215646, "loss": 1.7621, "step": 4871 }, { "epoch": 0.38, "learning_rate": 0.00028807468164192924, "loss": 1.8405, "step": 4872 }, { "epoch": 0.38, "learning_rate": 0.000288069851644251, "loss": 1.7901, "step": 4873 }, { "epoch": 0.38, "learning_rate": 0.0002880650207091547, "loss": 1.7941, "step": 4874 }, { "epoch": 0.38, "learning_rate": 0.00028806018883667316, "loss": 1.8079, "step": 4875 }, { "epoch": 0.38, "learning_rate": 0.0002880553560268391, "loss": 1.8097, "step": 4876 }, { "epoch": 0.38, "learning_rate": 0.0002880505222796853, "loss": 1.8092, "step": 4877 }, { "epoch": 0.38, "learning_rate": 0.00028804568759524475, "loss": 1.8661, "step": 4878 }, { "epoch": 0.38, "learning_rate": 0.00028804085197355007, "loss": 1.7284, "step": 4879 }, { "epoch": 0.38, "learning_rate": 0.00028803601541463423, "loss": 1.7954, "step": 4880 }, { "epoch": 0.38, "learning_rate": 0.00028803117791852996, "loss": 1.8159, "step": 4881 }, { "epoch": 0.38, "learning_rate": 0.0002880263394852702, "loss": 1.8074, "step": 4882 }, { "epoch": 0.38, "learning_rate": 0.0002880215001148878, "loss": 1.7905, "step": 4883 }, { "epoch": 0.38, "learning_rate": 0.0002880166598074155, "loss": 1.7942, "step": 4884 }, { "epoch": 0.38, "learning_rate": 0.00028801181856288633, "loss": 1.8394, "step": 4885 }, { "epoch": 0.38, "learning_rate": 0.000288006976381333, "loss": 1.7735, "step": 4886 }, { "epoch": 0.38, "learning_rate": 0.00028800213326278854, "loss": 1.7868, "step": 4887 }, { "epoch": 0.38, "learning_rate": 0.0002879972892072857, "loss": 1.773, "step": 4888 }, { "epoch": 0.38, "learning_rate": 0.0002879924442148574, "loss": 1.8594, "step": 4889 }, { "epoch": 0.38, "learning_rate": 0.00028798759828553653, "loss": 1.8087, "step": 4890 }, { "epoch": 0.38, "learning_rate": 0.0002879827514193561, "loss": 1.7892, "step": 4891 }, { "epoch": 0.38, "learning_rate": 0.00028797790361634887, "loss": 1.8169, "step": 4892 }, { "epoch": 0.38, "learning_rate": 0.0002879730548765478, "loss": 1.8144, "step": 4893 }, { "epoch": 0.39, "learning_rate": 0.0002879682051999859, "loss": 1.8025, "step": 4894 }, { "epoch": 0.39, "learning_rate": 0.000287963354586696, "loss": 1.7879, "step": 4895 }, { "epoch": 0.39, "learning_rate": 0.000287958503036711, "loss": 1.7033, "step": 4896 }, { "epoch": 0.39, "learning_rate": 0.000287953650550064, "loss": 1.7853, "step": 4897 }, { "epoch": 0.39, "learning_rate": 0.0002879487971267878, "loss": 1.8166, "step": 4898 }, { "epoch": 0.39, "learning_rate": 0.00028794394276691535, "loss": 1.8124, "step": 4899 }, { "epoch": 0.39, "learning_rate": 0.00028793908747047967, "loss": 1.7731, "step": 4900 }, { "epoch": 0.39, "learning_rate": 0.00028793423123751373, "loss": 1.8326, "step": 4901 }, { "epoch": 0.39, "learning_rate": 0.0002879293740680505, "loss": 1.7531, "step": 4902 }, { "epoch": 0.39, "learning_rate": 0.0002879245159621229, "loss": 1.7644, "step": 4903 }, { "epoch": 0.39, "learning_rate": 0.00028791965691976395, "loss": 1.8506, "step": 4904 }, { "epoch": 0.39, "learning_rate": 0.00028791479694100663, "loss": 1.8337, "step": 4905 }, { "epoch": 0.39, "learning_rate": 0.00028790993602588396, "loss": 1.8197, "step": 4906 }, { "epoch": 0.39, "learning_rate": 0.00028790507417442894, "loss": 1.7607, "step": 4907 }, { "epoch": 0.39, "learning_rate": 0.00028790021138667455, "loss": 1.8464, "step": 4908 }, { "epoch": 0.39, "learning_rate": 0.00028789534766265385, "loss": 1.7903, "step": 4909 }, { "epoch": 0.39, "learning_rate": 0.0002878904830023998, "loss": 1.7956, "step": 4910 }, { "epoch": 0.39, "learning_rate": 0.00028788561740594553, "loss": 1.8348, "step": 4911 }, { "epoch": 0.39, "learning_rate": 0.00028788075087332393, "loss": 1.7572, "step": 4912 }, { "epoch": 0.39, "learning_rate": 0.00028787588340456813, "loss": 1.8169, "step": 4913 }, { "epoch": 0.39, "learning_rate": 0.0002878710149997112, "loss": 1.7958, "step": 4914 }, { "epoch": 0.39, "learning_rate": 0.0002878661456587862, "loss": 1.7938, "step": 4915 }, { "epoch": 0.39, "learning_rate": 0.00028786127538182605, "loss": 1.8069, "step": 4916 }, { "epoch": 0.39, "learning_rate": 0.000287856404168864, "loss": 1.7881, "step": 4917 }, { "epoch": 0.39, "learning_rate": 0.000287851532019933, "loss": 1.8497, "step": 4918 }, { "epoch": 0.39, "learning_rate": 0.0002878466589350662, "loss": 1.8019, "step": 4919 }, { "epoch": 0.39, "learning_rate": 0.0002878417849142966, "loss": 1.7965, "step": 4920 }, { "epoch": 0.39, "learning_rate": 0.00028783690995765743, "loss": 1.8031, "step": 4921 }, { "epoch": 0.39, "learning_rate": 0.0002878320340651817, "loss": 1.7523, "step": 4922 }, { "epoch": 0.39, "learning_rate": 0.0002878271572369025, "loss": 1.7838, "step": 4923 }, { "epoch": 0.39, "learning_rate": 0.00028782227947285287, "loss": 1.821, "step": 4924 }, { "epoch": 0.39, "learning_rate": 0.0002878174007730661, "loss": 1.8081, "step": 4925 }, { "epoch": 0.39, "learning_rate": 0.00028781252113757523, "loss": 1.8133, "step": 4926 }, { "epoch": 0.39, "learning_rate": 0.0002878076405664134, "loss": 1.8079, "step": 4927 }, { "epoch": 0.39, "learning_rate": 0.00028780275905961375, "loss": 1.7654, "step": 4928 }, { "epoch": 0.39, "learning_rate": 0.0002877978766172094, "loss": 1.7837, "step": 4929 }, { "epoch": 0.39, "learning_rate": 0.00028779299323923347, "loss": 1.7296, "step": 4930 }, { "epoch": 0.39, "learning_rate": 0.0002877881089257192, "loss": 1.7745, "step": 4931 }, { "epoch": 0.39, "learning_rate": 0.0002877832236766997, "loss": 1.7196, "step": 4932 }, { "epoch": 0.39, "learning_rate": 0.00028777833749220815, "loss": 1.7784, "step": 4933 }, { "epoch": 0.39, "learning_rate": 0.0002877734503722777, "loss": 1.7748, "step": 4934 }, { "epoch": 0.39, "learning_rate": 0.0002877685623169416, "loss": 1.746, "step": 4935 }, { "epoch": 0.39, "learning_rate": 0.0002877636733262329, "loss": 1.7767, "step": 4936 }, { "epoch": 0.39, "learning_rate": 0.000287758783400185, "loss": 1.7796, "step": 4937 }, { "epoch": 0.39, "learning_rate": 0.0002877538925388309, "loss": 1.7607, "step": 4938 }, { "epoch": 0.39, "learning_rate": 0.0002877490007422039, "loss": 1.7866, "step": 4939 }, { "epoch": 0.39, "learning_rate": 0.0002877441080103372, "loss": 1.7853, "step": 4940 }, { "epoch": 0.39, "learning_rate": 0.000287739214343264, "loss": 1.784, "step": 4941 }, { "epoch": 0.39, "learning_rate": 0.0002877343197410176, "loss": 1.7738, "step": 4942 }, { "epoch": 0.39, "learning_rate": 0.0002877294242036311, "loss": 1.7849, "step": 4943 }, { "epoch": 0.39, "learning_rate": 0.0002877245277311379, "loss": 1.742, "step": 4944 }, { "epoch": 0.39, "learning_rate": 0.00028771963032357114, "loss": 1.7943, "step": 4945 }, { "epoch": 0.39, "learning_rate": 0.00028771473198096407, "loss": 1.8224, "step": 4946 }, { "epoch": 0.39, "learning_rate": 0.00028770983270335, "loss": 1.8021, "step": 4947 }, { "epoch": 0.39, "learning_rate": 0.00028770493249076213, "loss": 1.7702, "step": 4948 }, { "epoch": 0.39, "learning_rate": 0.0002877000313432337, "loss": 1.7285, "step": 4949 }, { "epoch": 0.39, "learning_rate": 0.00028769512926079817, "loss": 1.7677, "step": 4950 }, { "epoch": 0.39, "learning_rate": 0.00028769022624348863, "loss": 1.7977, "step": 4951 }, { "epoch": 0.39, "learning_rate": 0.00028768532229133845, "loss": 1.8346, "step": 4952 }, { "epoch": 0.39, "learning_rate": 0.0002876804174043809, "loss": 1.7731, "step": 4953 }, { "epoch": 0.39, "learning_rate": 0.00028767551158264933, "loss": 1.7777, "step": 4954 }, { "epoch": 0.39, "learning_rate": 0.00028767060482617695, "loss": 1.809, "step": 4955 }, { "epoch": 0.39, "learning_rate": 0.0002876656971349972, "loss": 1.7922, "step": 4956 }, { "epoch": 0.39, "learning_rate": 0.0002876607885091433, "loss": 1.7829, "step": 4957 }, { "epoch": 0.39, "learning_rate": 0.0002876558789486486, "loss": 1.7998, "step": 4958 }, { "epoch": 0.39, "learning_rate": 0.0002876509684535465, "loss": 1.7789, "step": 4959 }, { "epoch": 0.39, "learning_rate": 0.0002876460570238703, "loss": 1.7699, "step": 4960 }, { "epoch": 0.39, "learning_rate": 0.0002876411446596532, "loss": 1.7757, "step": 4961 }, { "epoch": 0.39, "learning_rate": 0.0002876362313609288, "loss": 1.8406, "step": 4962 }, { "epoch": 0.39, "learning_rate": 0.0002876313171277303, "loss": 1.7933, "step": 4963 }, { "epoch": 0.39, "learning_rate": 0.00028762640196009116, "loss": 1.7499, "step": 4964 }, { "epoch": 0.39, "learning_rate": 0.00028762148585804466, "loss": 1.748, "step": 4965 }, { "epoch": 0.39, "learning_rate": 0.0002876165688216242, "loss": 1.7864, "step": 4966 }, { "epoch": 0.39, "learning_rate": 0.00028761165085086323, "loss": 1.7634, "step": 4967 }, { "epoch": 0.39, "learning_rate": 0.00028760673194579503, "loss": 1.7976, "step": 4968 }, { "epoch": 0.39, "learning_rate": 0.0002876018121064531, "loss": 1.8359, "step": 4969 }, { "epoch": 0.39, "learning_rate": 0.0002875968913328708, "loss": 1.8033, "step": 4970 }, { "epoch": 0.39, "learning_rate": 0.0002875919696250815, "loss": 1.7293, "step": 4971 }, { "epoch": 0.39, "learning_rate": 0.00028758704698311874, "loss": 1.8518, "step": 4972 }, { "epoch": 0.39, "learning_rate": 0.00028758212340701577, "loss": 1.7522, "step": 4973 }, { "epoch": 0.39, "learning_rate": 0.00028757719889680616, "loss": 1.7683, "step": 4974 }, { "epoch": 0.39, "learning_rate": 0.00028757227345252326, "loss": 1.8087, "step": 4975 }, { "epoch": 0.39, "learning_rate": 0.00028756734707420056, "loss": 1.8332, "step": 4976 }, { "epoch": 0.39, "learning_rate": 0.00028756241976187147, "loss": 1.8648, "step": 4977 }, { "epoch": 0.39, "learning_rate": 0.0002875574915155695, "loss": 1.7956, "step": 4978 }, { "epoch": 0.39, "learning_rate": 0.000287552562335328, "loss": 1.7902, "step": 4979 }, { "epoch": 0.39, "learning_rate": 0.00028754763222118055, "loss": 1.7765, "step": 4980 }, { "epoch": 0.39, "learning_rate": 0.0002875427011731606, "loss": 1.7793, "step": 4981 }, { "epoch": 0.39, "learning_rate": 0.0002875377691913016, "loss": 1.7469, "step": 4982 }, { "epoch": 0.39, "learning_rate": 0.000287532836275637, "loss": 1.7882, "step": 4983 }, { "epoch": 0.39, "learning_rate": 0.00028752790242620043, "loss": 1.7714, "step": 4984 }, { "epoch": 0.39, "learning_rate": 0.0002875229676430253, "loss": 1.7446, "step": 4985 }, { "epoch": 0.39, "learning_rate": 0.00028751803192614506, "loss": 1.7489, "step": 4986 }, { "epoch": 0.39, "learning_rate": 0.0002875130952755933, "loss": 1.7698, "step": 4987 }, { "epoch": 0.39, "learning_rate": 0.0002875081576914034, "loss": 1.7588, "step": 4988 }, { "epoch": 0.39, "learning_rate": 0.0002875032191736091, "loss": 1.8215, "step": 4989 }, { "epoch": 0.39, "learning_rate": 0.0002874982797222438, "loss": 1.7644, "step": 4990 }, { "epoch": 0.39, "learning_rate": 0.00028749333933734104, "loss": 1.7709, "step": 4991 }, { "epoch": 0.39, "learning_rate": 0.0002874883980189344, "loss": 1.7327, "step": 4992 }, { "epoch": 0.39, "learning_rate": 0.00028748345576705745, "loss": 1.8171, "step": 4993 }, { "epoch": 0.39, "learning_rate": 0.0002874785125817437, "loss": 1.8141, "step": 4994 }, { "epoch": 0.39, "learning_rate": 0.0002874735684630266, "loss": 1.8399, "step": 4995 }, { "epoch": 0.39, "learning_rate": 0.00028746862341093993, "loss": 1.7655, "step": 4996 }, { "epoch": 0.39, "learning_rate": 0.00028746367742551717, "loss": 1.8171, "step": 4997 }, { "epoch": 0.39, "learning_rate": 0.00028745873050679187, "loss": 1.8, "step": 4998 }, { "epoch": 0.39, "learning_rate": 0.0002874537826547977, "loss": 1.7688, "step": 4999 }, { "epoch": 0.39, "learning_rate": 0.00028744883386956817, "loss": 1.8219, "step": 5000 }, { "epoch": 0.39, "learning_rate": 0.00028744388415113687, "loss": 1.7348, "step": 5001 }, { "epoch": 0.39, "learning_rate": 0.00028743893349953743, "loss": 1.7209, "step": 5002 }, { "epoch": 0.39, "learning_rate": 0.00028743398191480356, "loss": 1.7841, "step": 5003 }, { "epoch": 0.39, "learning_rate": 0.00028742902939696876, "loss": 1.7538, "step": 5004 }, { "epoch": 0.39, "learning_rate": 0.00028742407594606665, "loss": 1.7618, "step": 5005 }, { "epoch": 0.39, "learning_rate": 0.00028741912156213093, "loss": 1.7619, "step": 5006 }, { "epoch": 0.39, "learning_rate": 0.0002874141662451952, "loss": 1.8046, "step": 5007 }, { "epoch": 0.39, "learning_rate": 0.00028740920999529315, "loss": 1.8282, "step": 5008 }, { "epoch": 0.39, "learning_rate": 0.00028740425281245836, "loss": 1.8163, "step": 5009 }, { "epoch": 0.39, "learning_rate": 0.0002873992946967245, "loss": 1.7597, "step": 5010 }, { "epoch": 0.39, "learning_rate": 0.0002873943356481253, "loss": 1.7948, "step": 5011 }, { "epoch": 0.39, "learning_rate": 0.0002873893756666944, "loss": 1.7605, "step": 5012 }, { "epoch": 0.39, "learning_rate": 0.00028738441475246535, "loss": 1.7911, "step": 5013 }, { "epoch": 0.39, "learning_rate": 0.000287379452905472, "loss": 1.7897, "step": 5014 }, { "epoch": 0.39, "learning_rate": 0.00028737449012574806, "loss": 1.7753, "step": 5015 }, { "epoch": 0.39, "learning_rate": 0.00028736952641332704, "loss": 1.7807, "step": 5016 }, { "epoch": 0.39, "learning_rate": 0.00028736456176824273, "loss": 1.7865, "step": 5017 }, { "epoch": 0.39, "learning_rate": 0.0002873595961905289, "loss": 1.7954, "step": 5018 }, { "epoch": 0.39, "learning_rate": 0.00028735462968021923, "loss": 1.7662, "step": 5019 }, { "epoch": 0.39, "learning_rate": 0.0002873496622373474, "loss": 1.8498, "step": 5020 }, { "epoch": 0.4, "learning_rate": 0.00028734469386194715, "loss": 1.6987, "step": 5021 }, { "epoch": 0.4, "learning_rate": 0.0002873397245540522, "loss": 1.7412, "step": 5022 }, { "epoch": 0.4, "learning_rate": 0.00028733475431369634, "loss": 1.8328, "step": 5023 }, { "epoch": 0.4, "learning_rate": 0.0002873297831409133, "loss": 1.8273, "step": 5024 }, { "epoch": 0.4, "learning_rate": 0.00028732481103573677, "loss": 1.8212, "step": 5025 }, { "epoch": 0.4, "learning_rate": 0.0002873198379982006, "loss": 1.8613, "step": 5026 }, { "epoch": 0.4, "learning_rate": 0.00028731486402833845, "loss": 1.7316, "step": 5027 }, { "epoch": 0.4, "learning_rate": 0.0002873098891261842, "loss": 1.8405, "step": 5028 }, { "epoch": 0.4, "learning_rate": 0.00028730491329177164, "loss": 1.7525, "step": 5029 }, { "epoch": 0.4, "learning_rate": 0.0002872999365251344, "loss": 1.795, "step": 5030 }, { "epoch": 0.4, "learning_rate": 0.00028729495882630633, "loss": 1.7502, "step": 5031 }, { "epoch": 0.4, "learning_rate": 0.0002872899801953213, "loss": 1.8218, "step": 5032 }, { "epoch": 0.4, "learning_rate": 0.0002872850006322131, "loss": 1.75, "step": 5033 }, { "epoch": 0.4, "learning_rate": 0.0002872800201370155, "loss": 1.7791, "step": 5034 }, { "epoch": 0.4, "learning_rate": 0.00028727503870976226, "loss": 1.7304, "step": 5035 }, { "epoch": 0.4, "learning_rate": 0.0002872700563504873, "loss": 1.7654, "step": 5036 }, { "epoch": 0.4, "learning_rate": 0.0002872650730592244, "loss": 1.8018, "step": 5037 }, { "epoch": 0.4, "learning_rate": 0.0002872600888360074, "loss": 1.7871, "step": 5038 }, { "epoch": 0.4, "learning_rate": 0.0002872551036808702, "loss": 1.809, "step": 5039 }, { "epoch": 0.4, "learning_rate": 0.0002872501175938465, "loss": 1.8053, "step": 5040 }, { "epoch": 0.4, "learning_rate": 0.0002872451305749703, "loss": 1.76, "step": 5041 }, { "epoch": 0.4, "learning_rate": 0.00028724014262427537, "loss": 1.7399, "step": 5042 }, { "epoch": 0.4, "learning_rate": 0.00028723515374179566, "loss": 1.7887, "step": 5043 }, { "epoch": 0.4, "learning_rate": 0.00028723016392756496, "loss": 1.8079, "step": 5044 }, { "epoch": 0.4, "learning_rate": 0.0002872251731816171, "loss": 1.7979, "step": 5045 }, { "epoch": 0.4, "learning_rate": 0.00028722018150398613, "loss": 1.7651, "step": 5046 }, { "epoch": 0.4, "learning_rate": 0.0002872151888947059, "loss": 1.6973, "step": 5047 }, { "epoch": 0.4, "learning_rate": 0.0002872101953538102, "loss": 1.8021, "step": 5048 }, { "epoch": 0.4, "learning_rate": 0.0002872052008813329, "loss": 1.7737, "step": 5049 }, { "epoch": 0.4, "learning_rate": 0.00028720020547730817, "loss": 1.7758, "step": 5050 }, { "epoch": 0.4, "learning_rate": 0.0002871952091417697, "loss": 1.8059, "step": 5051 }, { "epoch": 0.4, "learning_rate": 0.0002871902118747514, "loss": 1.7646, "step": 5052 }, { "epoch": 0.4, "learning_rate": 0.0002871852136762873, "loss": 1.8582, "step": 5053 }, { "epoch": 0.4, "learning_rate": 0.00028718021454641134, "loss": 1.8179, "step": 5054 }, { "epoch": 0.4, "learning_rate": 0.00028717521448515736, "loss": 1.8118, "step": 5055 }, { "epoch": 0.4, "learning_rate": 0.0002871702134925594, "loss": 1.777, "step": 5056 }, { "epoch": 0.4, "learning_rate": 0.0002871652115686514, "loss": 1.8057, "step": 5057 }, { "epoch": 0.4, "learning_rate": 0.00028716020871346736, "loss": 1.7761, "step": 5058 }, { "epoch": 0.4, "learning_rate": 0.00028715520492704114, "loss": 1.7549, "step": 5059 }, { "epoch": 0.4, "learning_rate": 0.0002871502002094068, "loss": 1.7664, "step": 5060 }, { "epoch": 0.4, "learning_rate": 0.00028714519456059825, "loss": 1.8068, "step": 5061 }, { "epoch": 0.4, "learning_rate": 0.0002871401879806495, "loss": 1.8126, "step": 5062 }, { "epoch": 0.4, "learning_rate": 0.00028713518046959456, "loss": 1.8563, "step": 5063 }, { "epoch": 0.4, "learning_rate": 0.0002871301720274675, "loss": 1.7647, "step": 5064 }, { "epoch": 0.4, "learning_rate": 0.00028712516265430214, "loss": 1.8037, "step": 5065 }, { "epoch": 0.4, "learning_rate": 0.00028712015235013265, "loss": 1.7889, "step": 5066 }, { "epoch": 0.4, "learning_rate": 0.00028711514111499296, "loss": 1.7822, "step": 5067 }, { "epoch": 0.4, "learning_rate": 0.00028711012894891717, "loss": 1.7445, "step": 5068 }, { "epoch": 0.4, "learning_rate": 0.00028710511585193927, "loss": 1.7453, "step": 5069 }, { "epoch": 0.4, "learning_rate": 0.0002871001018240933, "loss": 1.7528, "step": 5070 }, { "epoch": 0.4, "learning_rate": 0.0002870950868654132, "loss": 1.8327, "step": 5071 }, { "epoch": 0.4, "learning_rate": 0.00028709007097593324, "loss": 1.7278, "step": 5072 }, { "epoch": 0.4, "learning_rate": 0.0002870850541556873, "loss": 1.7863, "step": 5073 }, { "epoch": 0.4, "learning_rate": 0.0002870800364047095, "loss": 1.8337, "step": 5074 }, { "epoch": 0.4, "learning_rate": 0.0002870750177230339, "loss": 1.7688, "step": 5075 }, { "epoch": 0.4, "learning_rate": 0.00028706999811069456, "loss": 1.8003, "step": 5076 }, { "epoch": 0.4, "learning_rate": 0.00028706497756772557, "loss": 1.7959, "step": 5077 }, { "epoch": 0.4, "learning_rate": 0.000287059956094161, "loss": 1.7479, "step": 5078 }, { "epoch": 0.4, "learning_rate": 0.00028705493369003503, "loss": 1.7948, "step": 5079 }, { "epoch": 0.4, "learning_rate": 0.0002870499103553816, "loss": 1.8292, "step": 5080 }, { "epoch": 0.4, "learning_rate": 0.000287044886090235, "loss": 1.8242, "step": 5081 }, { "epoch": 0.4, "learning_rate": 0.00028703986089462924, "loss": 1.7769, "step": 5082 }, { "epoch": 0.4, "learning_rate": 0.0002870348347685984, "loss": 1.7756, "step": 5083 }, { "epoch": 0.4, "learning_rate": 0.0002870298077121767, "loss": 1.8318, "step": 5084 }, { "epoch": 0.4, "learning_rate": 0.0002870247797253982, "loss": 1.8246, "step": 5085 }, { "epoch": 0.4, "learning_rate": 0.00028701975080829706, "loss": 1.7686, "step": 5086 }, { "epoch": 0.4, "learning_rate": 0.00028701472096090744, "loss": 1.7749, "step": 5087 }, { "epoch": 0.4, "learning_rate": 0.0002870096901832635, "loss": 1.8261, "step": 5088 }, { "epoch": 0.4, "learning_rate": 0.0002870046584753993, "loss": 1.7398, "step": 5089 }, { "epoch": 0.4, "learning_rate": 0.00028699962583734914, "loss": 1.7793, "step": 5090 }, { "epoch": 0.4, "learning_rate": 0.0002869945922691471, "loss": 1.8203, "step": 5091 }, { "epoch": 0.4, "learning_rate": 0.0002869895577708274, "loss": 1.7906, "step": 5092 }, { "epoch": 0.4, "learning_rate": 0.00028698452234242414, "loss": 1.7509, "step": 5093 }, { "epoch": 0.4, "learning_rate": 0.0002869794859839716, "loss": 1.8262, "step": 5094 }, { "epoch": 0.4, "learning_rate": 0.000286974448695504, "loss": 1.8095, "step": 5095 }, { "epoch": 0.4, "learning_rate": 0.00028696941047705543, "loss": 1.7394, "step": 5096 }, { "epoch": 0.4, "learning_rate": 0.0002869643713286601, "loss": 1.7691, "step": 5097 }, { "epoch": 0.4, "learning_rate": 0.00028695933125035233, "loss": 1.7925, "step": 5098 }, { "epoch": 0.4, "learning_rate": 0.00028695429024216626, "loss": 1.7781, "step": 5099 }, { "epoch": 0.4, "learning_rate": 0.00028694924830413614, "loss": 1.8364, "step": 5100 }, { "epoch": 0.4, "learning_rate": 0.0002869442054362962, "loss": 1.7683, "step": 5101 }, { "epoch": 0.4, "learning_rate": 0.00028693916163868074, "loss": 1.7797, "step": 5102 }, { "epoch": 0.4, "learning_rate": 0.00028693411691132386, "loss": 1.7223, "step": 5103 }, { "epoch": 0.4, "learning_rate": 0.0002869290712542599, "loss": 1.7508, "step": 5104 }, { "epoch": 0.4, "learning_rate": 0.00028692402466752316, "loss": 1.7255, "step": 5105 }, { "epoch": 0.4, "learning_rate": 0.0002869189771511478, "loss": 1.7461, "step": 5106 }, { "epoch": 0.4, "learning_rate": 0.0002869139287051682, "loss": 1.7666, "step": 5107 }, { "epoch": 0.4, "learning_rate": 0.0002869088793296185, "loss": 1.7804, "step": 5108 }, { "epoch": 0.4, "learning_rate": 0.00028690382902453313, "loss": 1.737, "step": 5109 }, { "epoch": 0.4, "learning_rate": 0.0002868987777899463, "loss": 1.7358, "step": 5110 }, { "epoch": 0.4, "learning_rate": 0.0002868937256258923, "loss": 1.768, "step": 5111 }, { "epoch": 0.4, "learning_rate": 0.0002868886725324054, "loss": 1.8124, "step": 5112 }, { "epoch": 0.4, "learning_rate": 0.00028688361850952006, "loss": 1.7219, "step": 5113 }, { "epoch": 0.4, "learning_rate": 0.0002868785635572704, "loss": 1.7367, "step": 5114 }, { "epoch": 0.4, "learning_rate": 0.00028687350767569086, "loss": 1.8006, "step": 5115 }, { "epoch": 0.4, "learning_rate": 0.00028686845086481577, "loss": 1.7572, "step": 5116 }, { "epoch": 0.4, "learning_rate": 0.0002868633931246794, "loss": 1.7994, "step": 5117 }, { "epoch": 0.4, "learning_rate": 0.0002868583344553161, "loss": 1.8174, "step": 5118 }, { "epoch": 0.4, "learning_rate": 0.00028685327485676024, "loss": 1.8445, "step": 5119 }, { "epoch": 0.4, "learning_rate": 0.0002868482143290462, "loss": 1.8135, "step": 5120 }, { "epoch": 0.4, "learning_rate": 0.0002868431528722083, "loss": 1.7811, "step": 5121 }, { "epoch": 0.4, "learning_rate": 0.0002868380904862809, "loss": 1.8013, "step": 5122 }, { "epoch": 0.4, "learning_rate": 0.0002868330271712983, "loss": 1.7718, "step": 5123 }, { "epoch": 0.4, "learning_rate": 0.00028682796292729505, "loss": 1.7952, "step": 5124 }, { "epoch": 0.4, "learning_rate": 0.0002868228977543054, "loss": 1.8517, "step": 5125 }, { "epoch": 0.4, "learning_rate": 0.00028681783165236376, "loss": 1.84, "step": 5126 }, { "epoch": 0.4, "learning_rate": 0.0002868127646215046, "loss": 1.7625, "step": 5127 }, { "epoch": 0.4, "learning_rate": 0.0002868076966617623, "loss": 1.7845, "step": 5128 }, { "epoch": 0.4, "learning_rate": 0.00028680262777317113, "loss": 1.8194, "step": 5129 }, { "epoch": 0.4, "learning_rate": 0.00028679755795576567, "loss": 1.7806, "step": 5130 }, { "epoch": 0.4, "learning_rate": 0.0002867924872095803, "loss": 1.8059, "step": 5131 }, { "epoch": 0.4, "learning_rate": 0.0002867874155346494, "loss": 1.7681, "step": 5132 }, { "epoch": 0.4, "learning_rate": 0.00028678234293100745, "loss": 1.8383, "step": 5133 }, { "epoch": 0.4, "learning_rate": 0.00028677726939868884, "loss": 1.7672, "step": 5134 }, { "epoch": 0.4, "learning_rate": 0.0002867721949377281, "loss": 1.7919, "step": 5135 }, { "epoch": 0.4, "learning_rate": 0.00028676711954815957, "loss": 1.716, "step": 5136 }, { "epoch": 0.4, "learning_rate": 0.00028676204323001785, "loss": 1.7588, "step": 5137 }, { "epoch": 0.4, "learning_rate": 0.00028675696598333726, "loss": 1.7852, "step": 5138 }, { "epoch": 0.4, "learning_rate": 0.00028675188780815237, "loss": 1.804, "step": 5139 }, { "epoch": 0.4, "learning_rate": 0.0002867468087044976, "loss": 1.7505, "step": 5140 }, { "epoch": 0.4, "learning_rate": 0.00028674172867240754, "loss": 1.7448, "step": 5141 }, { "epoch": 0.4, "learning_rate": 0.00028673664771191655, "loss": 1.7705, "step": 5142 }, { "epoch": 0.4, "learning_rate": 0.00028673156582305917, "loss": 1.787, "step": 5143 }, { "epoch": 0.4, "learning_rate": 0.0002867264830058699, "loss": 1.7888, "step": 5144 }, { "epoch": 0.4, "learning_rate": 0.0002867213992603833, "loss": 1.772, "step": 5145 }, { "epoch": 0.4, "learning_rate": 0.0002867163145866338, "loss": 1.7731, "step": 5146 }, { "epoch": 0.4, "learning_rate": 0.00028671122898465604, "loss": 1.7967, "step": 5147 }, { "epoch": 0.41, "learning_rate": 0.0002867061424544845, "loss": 1.7574, "step": 5148 }, { "epoch": 0.41, "learning_rate": 0.00028670105499615356, "loss": 1.8336, "step": 5149 }, { "epoch": 0.41, "learning_rate": 0.000286695966609698, "loss": 1.7346, "step": 5150 }, { "epoch": 0.41, "learning_rate": 0.00028669087729515225, "loss": 1.77, "step": 5151 }, { "epoch": 0.41, "learning_rate": 0.00028668578705255086, "loss": 1.7903, "step": 5152 }, { "epoch": 0.41, "learning_rate": 0.0002866806958819284, "loss": 1.7663, "step": 5153 }, { "epoch": 0.41, "learning_rate": 0.0002866756037833194, "loss": 1.7773, "step": 5154 }, { "epoch": 0.41, "learning_rate": 0.00028667051075675855, "loss": 1.7954, "step": 5155 }, { "epoch": 0.41, "learning_rate": 0.0002866654168022803, "loss": 1.7735, "step": 5156 }, { "epoch": 0.41, "learning_rate": 0.0002866603219199193, "loss": 1.7922, "step": 5157 }, { "epoch": 0.41, "learning_rate": 0.0002866552261097102, "loss": 1.8076, "step": 5158 }, { "epoch": 0.41, "learning_rate": 0.00028665012937168746, "loss": 1.8073, "step": 5159 }, { "epoch": 0.41, "learning_rate": 0.0002866450317058857, "loss": 1.7082, "step": 5160 }, { "epoch": 0.41, "learning_rate": 0.00028663993311233967, "loss": 1.7821, "step": 5161 }, { "epoch": 0.41, "learning_rate": 0.0002866348335910839, "loss": 1.768, "step": 5162 }, { "epoch": 0.41, "learning_rate": 0.00028662973314215294, "loss": 1.7245, "step": 5163 }, { "epoch": 0.41, "learning_rate": 0.0002866246317655815, "loss": 1.7772, "step": 5164 }, { "epoch": 0.41, "learning_rate": 0.0002866195294614043, "loss": 1.7526, "step": 5165 }, { "epoch": 0.41, "learning_rate": 0.00028661442622965577, "loss": 1.7753, "step": 5166 }, { "epoch": 0.41, "learning_rate": 0.00028660932207037076, "loss": 1.8182, "step": 5167 }, { "epoch": 0.41, "learning_rate": 0.0002866042169835838, "loss": 1.7516, "step": 5168 }, { "epoch": 0.41, "learning_rate": 0.00028659911096932966, "loss": 1.7636, "step": 5169 }, { "epoch": 0.41, "learning_rate": 0.00028659400402764284, "loss": 1.7672, "step": 5170 }, { "epoch": 0.41, "learning_rate": 0.0002865888961585581, "loss": 1.7824, "step": 5171 }, { "epoch": 0.41, "learning_rate": 0.0002865837873621103, "loss": 1.8158, "step": 5172 }, { "epoch": 0.41, "learning_rate": 0.00028657867763833374, "loss": 1.7887, "step": 5173 }, { "epoch": 0.41, "learning_rate": 0.00028657356698726344, "loss": 1.81, "step": 5174 }, { "epoch": 0.41, "learning_rate": 0.000286568455408934, "loss": 1.7677, "step": 5175 }, { "epoch": 0.41, "learning_rate": 0.0002865633429033801, "loss": 1.8336, "step": 5176 }, { "epoch": 0.41, "learning_rate": 0.0002865582294706364, "loss": 1.752, "step": 5177 }, { "epoch": 0.41, "learning_rate": 0.0002865531151107378, "loss": 1.7691, "step": 5178 }, { "epoch": 0.41, "learning_rate": 0.0002865479998237188, "loss": 1.7426, "step": 5179 }, { "epoch": 0.41, "learning_rate": 0.0002865428836096143, "loss": 1.8265, "step": 5180 }, { "epoch": 0.41, "learning_rate": 0.0002865377664684589, "loss": 1.7875, "step": 5181 }, { "epoch": 0.41, "learning_rate": 0.00028653264840028744, "loss": 1.805, "step": 5182 }, { "epoch": 0.41, "learning_rate": 0.0002865275294051347, "loss": 1.7871, "step": 5183 }, { "epoch": 0.41, "learning_rate": 0.00028652240948303536, "loss": 1.7659, "step": 5184 }, { "epoch": 0.41, "learning_rate": 0.00028651728863402415, "loss": 1.7531, "step": 5185 }, { "epoch": 0.41, "learning_rate": 0.0002865121668581359, "loss": 1.7512, "step": 5186 }, { "epoch": 0.41, "learning_rate": 0.0002865070441554054, "loss": 1.7357, "step": 5187 }, { "epoch": 0.41, "learning_rate": 0.0002865019205258674, "loss": 1.81, "step": 5188 }, { "epoch": 0.41, "learning_rate": 0.0002864967959695566, "loss": 1.7725, "step": 5189 }, { "epoch": 0.41, "learning_rate": 0.000286491670486508, "loss": 1.7357, "step": 5190 }, { "epoch": 0.41, "learning_rate": 0.0002864865440767562, "loss": 1.7566, "step": 5191 }, { "epoch": 0.41, "learning_rate": 0.00028648141674033614, "loss": 1.8229, "step": 5192 }, { "epoch": 0.41, "learning_rate": 0.00028647628847728256, "loss": 1.7403, "step": 5193 }, { "epoch": 0.41, "learning_rate": 0.0002864711592876303, "loss": 1.8231, "step": 5194 }, { "epoch": 0.41, "learning_rate": 0.0002864660291714142, "loss": 1.7895, "step": 5195 }, { "epoch": 0.41, "learning_rate": 0.00028646089812866903, "loss": 1.7552, "step": 5196 }, { "epoch": 0.41, "learning_rate": 0.00028645576615942965, "loss": 1.7638, "step": 5197 }, { "epoch": 0.41, "learning_rate": 0.00028645063326373095, "loss": 1.7812, "step": 5198 }, { "epoch": 0.41, "learning_rate": 0.0002864454994416077, "loss": 1.7022, "step": 5199 }, { "epoch": 0.41, "learning_rate": 0.00028644036469309484, "loss": 1.779, "step": 5200 }, { "epoch": 0.41, "learning_rate": 0.00028643522901822727, "loss": 1.7618, "step": 5201 }, { "epoch": 0.41, "learning_rate": 0.0002864300924170397, "loss": 1.7891, "step": 5202 }, { "epoch": 0.41, "learning_rate": 0.0002864249548895671, "loss": 1.7278, "step": 5203 }, { "epoch": 0.41, "learning_rate": 0.0002864198164358444, "loss": 1.8143, "step": 5204 }, { "epoch": 0.41, "learning_rate": 0.0002864146770559064, "loss": 1.7599, "step": 5205 }, { "epoch": 0.41, "learning_rate": 0.00028640953674978796, "loss": 1.8218, "step": 5206 }, { "epoch": 0.41, "learning_rate": 0.0002864043955175241, "loss": 1.7488, "step": 5207 }, { "epoch": 0.41, "learning_rate": 0.00028639925335914964, "loss": 1.7534, "step": 5208 }, { "epoch": 0.41, "learning_rate": 0.00028639411027469956, "loss": 1.7911, "step": 5209 }, { "epoch": 0.41, "learning_rate": 0.0002863889662642087, "loss": 1.738, "step": 5210 }, { "epoch": 0.41, "learning_rate": 0.0002863838213277121, "loss": 1.8333, "step": 5211 }, { "epoch": 0.41, "learning_rate": 0.00028637867546524456, "loss": 1.7458, "step": 5212 }, { "epoch": 0.41, "learning_rate": 0.00028637352867684105, "loss": 1.7433, "step": 5213 }, { "epoch": 0.41, "learning_rate": 0.0002863683809625366, "loss": 1.7387, "step": 5214 }, { "epoch": 0.41, "learning_rate": 0.000286363232322366, "loss": 1.7804, "step": 5215 }, { "epoch": 0.41, "learning_rate": 0.0002863580827563644, "loss": 1.7713, "step": 5216 }, { "epoch": 0.41, "learning_rate": 0.0002863529322645666, "loss": 1.7611, "step": 5217 }, { "epoch": 0.41, "learning_rate": 0.0002863477808470077, "loss": 1.7624, "step": 5218 }, { "epoch": 0.41, "learning_rate": 0.00028634262850372257, "loss": 1.7214, "step": 5219 }, { "epoch": 0.41, "learning_rate": 0.0002863374752347462, "loss": 1.7381, "step": 5220 }, { "epoch": 0.41, "learning_rate": 0.0002863323210401137, "loss": 1.7534, "step": 5221 }, { "epoch": 0.41, "learning_rate": 0.0002863271659198599, "loss": 1.8259, "step": 5222 }, { "epoch": 0.41, "learning_rate": 0.0002863220098740199, "loss": 1.8065, "step": 5223 }, { "epoch": 0.41, "learning_rate": 0.00028631685290262873, "loss": 1.7642, "step": 5224 }, { "epoch": 0.41, "learning_rate": 0.00028631169500572124, "loss": 1.7528, "step": 5225 }, { "epoch": 0.41, "learning_rate": 0.00028630653618333266, "loss": 1.7849, "step": 5226 }, { "epoch": 0.41, "learning_rate": 0.0002863013764354979, "loss": 1.8312, "step": 5227 }, { "epoch": 0.41, "learning_rate": 0.000286296215762252, "loss": 1.712, "step": 5228 }, { "epoch": 0.41, "learning_rate": 0.00028629105416363, "loss": 1.8153, "step": 5229 }, { "epoch": 0.41, "learning_rate": 0.00028628589163966694, "loss": 1.8157, "step": 5230 }, { "epoch": 0.41, "learning_rate": 0.00028628072819039793, "loss": 1.769, "step": 5231 }, { "epoch": 0.41, "learning_rate": 0.000286275563815858, "loss": 1.7769, "step": 5232 }, { "epoch": 0.41, "learning_rate": 0.00028627039851608215, "loss": 1.7471, "step": 5233 }, { "epoch": 0.41, "learning_rate": 0.00028626523229110547, "loss": 1.772, "step": 5234 }, { "epoch": 0.41, "learning_rate": 0.00028626006514096314, "loss": 1.7836, "step": 5235 }, { "epoch": 0.41, "learning_rate": 0.00028625489706569007, "loss": 1.8032, "step": 5236 }, { "epoch": 0.41, "learning_rate": 0.0002862497280653215, "loss": 1.7078, "step": 5237 }, { "epoch": 0.41, "learning_rate": 0.00028624455813989244, "loss": 1.7216, "step": 5238 }, { "epoch": 0.41, "learning_rate": 0.000286239387289438, "loss": 1.8074, "step": 5239 }, { "epoch": 0.41, "learning_rate": 0.0002862342155139933, "loss": 1.8136, "step": 5240 }, { "epoch": 0.41, "learning_rate": 0.00028622904281359353, "loss": 1.8197, "step": 5241 }, { "epoch": 0.41, "learning_rate": 0.00028622386918827366, "loss": 1.7926, "step": 5242 }, { "epoch": 0.41, "learning_rate": 0.00028621869463806894, "loss": 1.7396, "step": 5243 }, { "epoch": 0.41, "learning_rate": 0.00028621351916301445, "loss": 1.7375, "step": 5244 }, { "epoch": 0.41, "learning_rate": 0.0002862083427631453, "loss": 1.7534, "step": 5245 }, { "epoch": 0.41, "learning_rate": 0.00028620316543849673, "loss": 1.7555, "step": 5246 }, { "epoch": 0.41, "learning_rate": 0.00028619798718910376, "loss": 1.7413, "step": 5247 }, { "epoch": 0.41, "learning_rate": 0.0002861928080150017, "loss": 1.7935, "step": 5248 }, { "epoch": 0.41, "learning_rate": 0.00028618762791622556, "loss": 1.7482, "step": 5249 }, { "epoch": 0.41, "learning_rate": 0.0002861824468928106, "loss": 1.803, "step": 5250 }, { "epoch": 0.41, "learning_rate": 0.000286177264944792, "loss": 1.7508, "step": 5251 }, { "epoch": 0.41, "learning_rate": 0.0002861720820722049, "loss": 1.7834, "step": 5252 }, { "epoch": 0.41, "learning_rate": 0.00028616689827508444, "loss": 1.7677, "step": 5253 }, { "epoch": 0.41, "learning_rate": 0.00028616171355346593, "loss": 1.786, "step": 5254 }, { "epoch": 0.41, "learning_rate": 0.0002861565279073846, "loss": 1.7864, "step": 5255 }, { "epoch": 0.41, "learning_rate": 0.00028615134133687554, "loss": 1.8466, "step": 5256 }, { "epoch": 0.41, "learning_rate": 0.00028614615384197397, "loss": 1.7694, "step": 5257 }, { "epoch": 0.41, "learning_rate": 0.0002861409654227152, "loss": 1.7892, "step": 5258 }, { "epoch": 0.41, "learning_rate": 0.00028613577607913436, "loss": 1.7503, "step": 5259 }, { "epoch": 0.41, "learning_rate": 0.00028613058581126674, "loss": 1.8474, "step": 5260 }, { "epoch": 0.41, "learning_rate": 0.00028612539461914756, "loss": 1.7386, "step": 5261 }, { "epoch": 0.41, "learning_rate": 0.0002861202025028121, "loss": 1.7654, "step": 5262 }, { "epoch": 0.41, "learning_rate": 0.00028611500946229557, "loss": 1.8201, "step": 5263 }, { "epoch": 0.41, "learning_rate": 0.0002861098154976332, "loss": 1.7867, "step": 5264 }, { "epoch": 0.41, "learning_rate": 0.0002861046206088603, "loss": 1.7593, "step": 5265 }, { "epoch": 0.41, "learning_rate": 0.0002860994247960122, "loss": 1.7778, "step": 5266 }, { "epoch": 0.41, "learning_rate": 0.0002860942280591241, "loss": 1.7458, "step": 5267 }, { "epoch": 0.41, "learning_rate": 0.00028608903039823125, "loss": 1.8195, "step": 5268 }, { "epoch": 0.41, "learning_rate": 0.00028608383181336896, "loss": 1.7908, "step": 5269 }, { "epoch": 0.41, "learning_rate": 0.0002860786323045726, "loss": 1.7124, "step": 5270 }, { "epoch": 0.41, "learning_rate": 0.00028607343187187737, "loss": 1.8383, "step": 5271 }, { "epoch": 0.41, "learning_rate": 0.00028606823051531875, "loss": 1.7792, "step": 5272 }, { "epoch": 0.41, "learning_rate": 0.0002860630282349318, "loss": 1.7683, "step": 5273 }, { "epoch": 0.41, "learning_rate": 0.00028605782503075204, "loss": 1.785, "step": 5274 }, { "epoch": 0.42, "learning_rate": 0.0002860526209028147, "loss": 1.7586, "step": 5275 }, { "epoch": 0.42, "learning_rate": 0.00028604741585115515, "loss": 1.8067, "step": 5276 }, { "epoch": 0.42, "learning_rate": 0.00028604220987580876, "loss": 1.7819, "step": 5277 }, { "epoch": 0.42, "learning_rate": 0.0002860370029768108, "loss": 1.8147, "step": 5278 }, { "epoch": 0.42, "learning_rate": 0.0002860317951541967, "loss": 1.7689, "step": 5279 }, { "epoch": 0.42, "learning_rate": 0.00028602658640800174, "loss": 1.7261, "step": 5280 }, { "epoch": 0.42, "learning_rate": 0.0002860213767382613, "loss": 1.7918, "step": 5281 }, { "epoch": 0.42, "learning_rate": 0.0002860161661450109, "loss": 1.8202, "step": 5282 }, { "epoch": 0.42, "learning_rate": 0.00028601095462828566, "loss": 1.7486, "step": 5283 }, { "epoch": 0.42, "learning_rate": 0.00028600574218812117, "loss": 1.7372, "step": 5284 }, { "epoch": 0.42, "learning_rate": 0.0002860005288245527, "loss": 1.8298, "step": 5285 }, { "epoch": 0.42, "learning_rate": 0.0002859953145376157, "loss": 1.8113, "step": 5286 }, { "epoch": 0.42, "learning_rate": 0.0002859900993273456, "loss": 1.8106, "step": 5287 }, { "epoch": 0.42, "learning_rate": 0.00028598488319377775, "loss": 1.7415, "step": 5288 }, { "epoch": 0.42, "learning_rate": 0.00028597966613694753, "loss": 1.7283, "step": 5289 }, { "epoch": 0.42, "learning_rate": 0.0002859744481568905, "loss": 1.787, "step": 5290 }, { "epoch": 0.42, "learning_rate": 0.0002859692292536419, "loss": 1.8049, "step": 5291 }, { "epoch": 0.42, "learning_rate": 0.00028596400942723735, "loss": 1.7788, "step": 5292 }, { "epoch": 0.42, "learning_rate": 0.0002859587886777122, "loss": 1.8316, "step": 5293 }, { "epoch": 0.42, "learning_rate": 0.0002859535670051019, "loss": 1.6998, "step": 5294 }, { "epoch": 0.42, "learning_rate": 0.0002859483444094419, "loss": 1.7538, "step": 5295 }, { "epoch": 0.42, "learning_rate": 0.00028594312089076765, "loss": 1.7893, "step": 5296 }, { "epoch": 0.42, "learning_rate": 0.00028593789644911464, "loss": 1.8007, "step": 5297 }, { "epoch": 0.42, "learning_rate": 0.0002859326710845184, "loss": 1.789, "step": 5298 }, { "epoch": 0.42, "learning_rate": 0.0002859274447970142, "loss": 1.7597, "step": 5299 }, { "epoch": 0.42, "learning_rate": 0.00028592221758663776, "loss": 1.7418, "step": 5300 }, { "epoch": 0.42, "learning_rate": 0.0002859169894534244, "loss": 1.7365, "step": 5301 }, { "epoch": 0.42, "learning_rate": 0.00028591176039740977, "loss": 1.7535, "step": 5302 }, { "epoch": 0.42, "learning_rate": 0.00028590653041862926, "loss": 1.7362, "step": 5303 }, { "epoch": 0.42, "learning_rate": 0.0002859012995171184, "loss": 1.7626, "step": 5304 }, { "epoch": 0.42, "learning_rate": 0.0002858960676929127, "loss": 1.7725, "step": 5305 }, { "epoch": 0.42, "learning_rate": 0.0002858908349460477, "loss": 1.7693, "step": 5306 }, { "epoch": 0.42, "learning_rate": 0.0002858856012765589, "loss": 1.7346, "step": 5307 }, { "epoch": 0.42, "learning_rate": 0.0002858803666844819, "loss": 1.8291, "step": 5308 }, { "epoch": 0.42, "learning_rate": 0.00028587513116985216, "loss": 1.7628, "step": 5309 }, { "epoch": 0.42, "learning_rate": 0.00028586989473270525, "loss": 1.7922, "step": 5310 }, { "epoch": 0.42, "learning_rate": 0.00028586465737307675, "loss": 1.7141, "step": 5311 }, { "epoch": 0.42, "learning_rate": 0.0002858594190910022, "loss": 1.7533, "step": 5312 }, { "epoch": 0.42, "learning_rate": 0.0002858541798865172, "loss": 1.7816, "step": 5313 }, { "epoch": 0.42, "learning_rate": 0.0002858489397596573, "loss": 1.7814, "step": 5314 }, { "epoch": 0.42, "learning_rate": 0.000285843698710458, "loss": 1.7586, "step": 5315 }, { "epoch": 0.42, "learning_rate": 0.000285838456738955, "loss": 1.6995, "step": 5316 }, { "epoch": 0.42, "learning_rate": 0.00028583321384518384, "loss": 1.7469, "step": 5317 }, { "epoch": 0.42, "learning_rate": 0.0002858279700291801, "loss": 1.7228, "step": 5318 }, { "epoch": 0.42, "learning_rate": 0.0002858227252909794, "loss": 1.7466, "step": 5319 }, { "epoch": 0.42, "learning_rate": 0.00028581747963061735, "loss": 1.7603, "step": 5320 }, { "epoch": 0.42, "learning_rate": 0.00028581223304812955, "loss": 1.7831, "step": 5321 }, { "epoch": 0.42, "learning_rate": 0.00028580698554355166, "loss": 1.7946, "step": 5322 }, { "epoch": 0.42, "learning_rate": 0.00028580173711691923, "loss": 1.7855, "step": 5323 }, { "epoch": 0.42, "learning_rate": 0.00028579648776826805, "loss": 1.8172, "step": 5324 }, { "epoch": 0.42, "learning_rate": 0.00028579123749763357, "loss": 1.8387, "step": 5325 }, { "epoch": 0.42, "learning_rate": 0.00028578598630505156, "loss": 1.7711, "step": 5326 }, { "epoch": 0.42, "learning_rate": 0.00028578073419055765, "loss": 1.7273, "step": 5327 }, { "epoch": 0.42, "learning_rate": 0.00028577548115418745, "loss": 1.7554, "step": 5328 }, { "epoch": 0.42, "learning_rate": 0.00028577022719597663, "loss": 1.7882, "step": 5329 }, { "epoch": 0.42, "learning_rate": 0.00028576497231596096, "loss": 1.7631, "step": 5330 }, { "epoch": 0.42, "learning_rate": 0.000285759716514176, "loss": 1.6488, "step": 5331 }, { "epoch": 0.42, "learning_rate": 0.0002857544597906575, "loss": 1.8296, "step": 5332 }, { "epoch": 0.42, "learning_rate": 0.00028574920214544114, "loss": 1.8361, "step": 5333 }, { "epoch": 0.42, "learning_rate": 0.0002857439435785626, "loss": 1.7403, "step": 5334 }, { "epoch": 0.42, "learning_rate": 0.0002857386840900576, "loss": 1.8627, "step": 5335 }, { "epoch": 0.42, "learning_rate": 0.00028573342367996187, "loss": 1.8164, "step": 5336 }, { "epoch": 0.42, "learning_rate": 0.0002857281623483111, "loss": 1.8016, "step": 5337 }, { "epoch": 0.42, "learning_rate": 0.0002857229000951409, "loss": 1.7573, "step": 5338 }, { "epoch": 0.42, "learning_rate": 0.0002857176369204872, "loss": 1.7137, "step": 5339 }, { "epoch": 0.42, "learning_rate": 0.00028571237282438565, "loss": 1.7381, "step": 5340 }, { "epoch": 0.42, "learning_rate": 0.00028570710780687194, "loss": 1.7898, "step": 5341 }, { "epoch": 0.42, "learning_rate": 0.00028570184186798187, "loss": 1.7784, "step": 5342 }, { "epoch": 0.42, "learning_rate": 0.0002856965750077512, "loss": 1.8016, "step": 5343 }, { "epoch": 0.42, "learning_rate": 0.0002856913072262157, "loss": 1.7725, "step": 5344 }, { "epoch": 0.42, "learning_rate": 0.00028568603852341097, "loss": 1.775, "step": 5345 }, { "epoch": 0.42, "learning_rate": 0.00028568076889937306, "loss": 1.7429, "step": 5346 }, { "epoch": 0.42, "learning_rate": 0.00028567549835413757, "loss": 1.7592, "step": 5347 }, { "epoch": 0.42, "learning_rate": 0.0002856702268877402, "loss": 1.8076, "step": 5348 }, { "epoch": 0.42, "learning_rate": 0.000285664954500217, "loss": 1.7915, "step": 5349 }, { "epoch": 0.42, "learning_rate": 0.0002856596811916036, "loss": 1.7854, "step": 5350 }, { "epoch": 0.42, "learning_rate": 0.0002856544069619358, "loss": 1.7694, "step": 5351 }, { "epoch": 0.42, "learning_rate": 0.00028564913181124943, "loss": 1.768, "step": 5352 }, { "epoch": 0.42, "learning_rate": 0.00028564385573958035, "loss": 1.8167, "step": 5353 }, { "epoch": 0.42, "learning_rate": 0.0002856385787469643, "loss": 1.7779, "step": 5354 }, { "epoch": 0.42, "learning_rate": 0.0002856333008334372, "loss": 1.795, "step": 5355 }, { "epoch": 0.42, "learning_rate": 0.0002856280219990348, "loss": 1.7551, "step": 5356 }, { "epoch": 0.42, "learning_rate": 0.000285622742243793, "loss": 1.8142, "step": 5357 }, { "epoch": 0.42, "learning_rate": 0.00028561746156774756, "loss": 1.8006, "step": 5358 }, { "epoch": 0.42, "learning_rate": 0.00028561217997093445, "loss": 1.7735, "step": 5359 }, { "epoch": 0.42, "learning_rate": 0.0002856068974533895, "loss": 1.7413, "step": 5360 }, { "epoch": 0.42, "learning_rate": 0.0002856016140151485, "loss": 1.7811, "step": 5361 }, { "epoch": 0.42, "learning_rate": 0.0002855963296562474, "loss": 1.7915, "step": 5362 }, { "epoch": 0.42, "learning_rate": 0.000285591044376722, "loss": 1.7884, "step": 5363 }, { "epoch": 0.42, "learning_rate": 0.0002855857581766083, "loss": 1.7301, "step": 5364 }, { "epoch": 0.42, "learning_rate": 0.0002855804710559421, "loss": 1.7426, "step": 5365 }, { "epoch": 0.42, "learning_rate": 0.0002855751830147593, "loss": 1.7577, "step": 5366 }, { "epoch": 0.42, "learning_rate": 0.00028556989405309583, "loss": 1.8295, "step": 5367 }, { "epoch": 0.42, "learning_rate": 0.00028556460417098763, "loss": 1.7762, "step": 5368 }, { "epoch": 0.42, "learning_rate": 0.00028555931336847056, "loss": 1.7732, "step": 5369 }, { "epoch": 0.42, "learning_rate": 0.00028555402164558055, "loss": 1.7617, "step": 5370 }, { "epoch": 0.42, "learning_rate": 0.0002855487290023536, "loss": 1.8117, "step": 5371 }, { "epoch": 0.42, "learning_rate": 0.00028554343543882543, "loss": 1.7446, "step": 5372 }, { "epoch": 0.42, "learning_rate": 0.00028553814095503226, "loss": 1.7583, "step": 5373 }, { "epoch": 0.42, "learning_rate": 0.00028553284555100987, "loss": 1.7512, "step": 5374 }, { "epoch": 0.42, "learning_rate": 0.00028552754922679424, "loss": 1.7919, "step": 5375 }, { "epoch": 0.42, "learning_rate": 0.0002855222519824214, "loss": 1.8223, "step": 5376 }, { "epoch": 0.42, "learning_rate": 0.0002855169538179272, "loss": 1.7305, "step": 5377 }, { "epoch": 0.42, "learning_rate": 0.00028551165473334774, "loss": 1.7764, "step": 5378 }, { "epoch": 0.42, "learning_rate": 0.0002855063547287188, "loss": 1.734, "step": 5379 }, { "epoch": 0.42, "learning_rate": 0.00028550105380407655, "loss": 1.7133, "step": 5380 }, { "epoch": 0.42, "learning_rate": 0.00028549575195945697, "loss": 1.7846, "step": 5381 }, { "epoch": 0.42, "learning_rate": 0.00028549044919489597, "loss": 1.7865, "step": 5382 }, { "epoch": 0.42, "learning_rate": 0.0002854851455104296, "loss": 1.8001, "step": 5383 }, { "epoch": 0.42, "learning_rate": 0.00028547984090609383, "loss": 1.7215, "step": 5384 }, { "epoch": 0.42, "learning_rate": 0.00028547453538192475, "loss": 1.8184, "step": 5385 }, { "epoch": 0.42, "learning_rate": 0.00028546922893795827, "loss": 1.7833, "step": 5386 }, { "epoch": 0.42, "learning_rate": 0.0002854639215742305, "loss": 1.7822, "step": 5387 }, { "epoch": 0.42, "learning_rate": 0.0002854586132907775, "loss": 1.8311, "step": 5388 }, { "epoch": 0.42, "learning_rate": 0.00028545330408763525, "loss": 1.7938, "step": 5389 }, { "epoch": 0.42, "learning_rate": 0.0002854479939648398, "loss": 1.8029, "step": 5390 }, { "epoch": 0.42, "learning_rate": 0.0002854426829224272, "loss": 1.8155, "step": 5391 }, { "epoch": 0.42, "learning_rate": 0.0002854373709604336, "loss": 1.7583, "step": 5392 }, { "epoch": 0.42, "learning_rate": 0.0002854320580788949, "loss": 1.7514, "step": 5393 }, { "epoch": 0.42, "learning_rate": 0.00028542674427784734, "loss": 1.7528, "step": 5394 }, { "epoch": 0.42, "learning_rate": 0.0002854214295573269, "loss": 1.7312, "step": 5395 }, { "epoch": 0.42, "learning_rate": 0.00028541611391736966, "loss": 1.7452, "step": 5396 }, { "epoch": 0.42, "learning_rate": 0.00028541079735801175, "loss": 1.7372, "step": 5397 }, { "epoch": 0.42, "learning_rate": 0.00028540547987928927, "loss": 1.832, "step": 5398 }, { "epoch": 0.42, "learning_rate": 0.00028540016148123826, "loss": 1.7673, "step": 5399 }, { "epoch": 0.42, "learning_rate": 0.0002853948421638949, "loss": 1.7895, "step": 5400 }, { "epoch": 0.42, "learning_rate": 0.0002853895219272953, "loss": 1.7529, "step": 5401 }, { "epoch": 0.43, "learning_rate": 0.0002853842007714755, "loss": 1.7536, "step": 5402 }, { "epoch": 0.43, "learning_rate": 0.00028537887869647174, "loss": 1.7772, "step": 5403 }, { "epoch": 0.43, "learning_rate": 0.0002853735557023201, "loss": 1.7656, "step": 5404 }, { "epoch": 0.43, "learning_rate": 0.00028536823178905673, "loss": 1.7377, "step": 5405 }, { "epoch": 0.43, "learning_rate": 0.00028536290695671773, "loss": 1.7402, "step": 5406 }, { "epoch": 0.43, "learning_rate": 0.0002853575812053393, "loss": 1.765, "step": 5407 }, { "epoch": 0.43, "learning_rate": 0.00028535225453495757, "loss": 1.7293, "step": 5408 }, { "epoch": 0.43, "learning_rate": 0.0002853469269456088, "loss": 1.7529, "step": 5409 }, { "epoch": 0.43, "learning_rate": 0.00028534159843732903, "loss": 1.7844, "step": 5410 }, { "epoch": 0.43, "learning_rate": 0.0002853362690101545, "loss": 1.7208, "step": 5411 }, { "epoch": 0.43, "learning_rate": 0.0002853309386641214, "loss": 1.7058, "step": 5412 }, { "epoch": 0.43, "learning_rate": 0.00028532560739926593, "loss": 1.7506, "step": 5413 }, { "epoch": 0.43, "learning_rate": 0.0002853202752156242, "loss": 1.7777, "step": 5414 }, { "epoch": 0.43, "learning_rate": 0.00028531494211323253, "loss": 1.7935, "step": 5415 }, { "epoch": 0.43, "learning_rate": 0.00028530960809212703, "loss": 1.7833, "step": 5416 }, { "epoch": 0.43, "learning_rate": 0.000285304273152344, "loss": 1.7986, "step": 5417 }, { "epoch": 0.43, "learning_rate": 0.00028529893729391963, "loss": 1.7971, "step": 5418 }, { "epoch": 0.43, "learning_rate": 0.0002852936005168901, "loss": 1.7834, "step": 5419 }, { "epoch": 0.43, "learning_rate": 0.0002852882628212917, "loss": 1.7771, "step": 5420 }, { "epoch": 0.43, "learning_rate": 0.00028528292420716066, "loss": 1.8097, "step": 5421 }, { "epoch": 0.43, "learning_rate": 0.00028527758467453325, "loss": 1.7389, "step": 5422 }, { "epoch": 0.43, "learning_rate": 0.00028527224422344565, "loss": 1.7747, "step": 5423 }, { "epoch": 0.43, "learning_rate": 0.0002852669028539342, "loss": 1.7963, "step": 5424 }, { "epoch": 0.43, "learning_rate": 0.0002852615605660351, "loss": 1.7608, "step": 5425 }, { "epoch": 0.43, "learning_rate": 0.00028525621735978464, "loss": 1.7877, "step": 5426 }, { "epoch": 0.43, "learning_rate": 0.00028525087323521913, "loss": 1.7734, "step": 5427 }, { "epoch": 0.43, "learning_rate": 0.0002852455281923748, "loss": 1.7754, "step": 5428 }, { "epoch": 0.43, "learning_rate": 0.000285240182231288, "loss": 1.7534, "step": 5429 }, { "epoch": 0.43, "learning_rate": 0.0002852348353519949, "loss": 1.8209, "step": 5430 }, { "epoch": 0.43, "learning_rate": 0.00028522948755453203, "loss": 1.738, "step": 5431 }, { "epoch": 0.43, "learning_rate": 0.0002852241388389355, "loss": 1.7723, "step": 5432 }, { "epoch": 0.43, "learning_rate": 0.0002852187892052417, "loss": 1.7189, "step": 5433 }, { "epoch": 0.43, "learning_rate": 0.00028521343865348694, "loss": 1.7449, "step": 5434 }, { "epoch": 0.43, "learning_rate": 0.00028520808718370753, "loss": 1.7392, "step": 5435 }, { "epoch": 0.43, "learning_rate": 0.00028520273479593983, "loss": 1.838, "step": 5436 }, { "epoch": 0.43, "learning_rate": 0.0002851973814902202, "loss": 1.77, "step": 5437 }, { "epoch": 0.43, "learning_rate": 0.00028519202726658496, "loss": 1.7456, "step": 5438 }, { "epoch": 0.43, "learning_rate": 0.0002851866721250704, "loss": 1.7617, "step": 5439 }, { "epoch": 0.43, "learning_rate": 0.00028518131606571296, "loss": 1.8237, "step": 5440 }, { "epoch": 0.43, "learning_rate": 0.000285175959088549, "loss": 1.7948, "step": 5441 }, { "epoch": 0.43, "learning_rate": 0.0002851706011936149, "loss": 1.7875, "step": 5442 }, { "epoch": 0.43, "learning_rate": 0.00028516524238094695, "loss": 1.7442, "step": 5443 }, { "epoch": 0.43, "learning_rate": 0.00028515988265058164, "loss": 1.7516, "step": 5444 }, { "epoch": 0.43, "learning_rate": 0.0002851545220025553, "loss": 1.7531, "step": 5445 }, { "epoch": 0.43, "learning_rate": 0.0002851491604369044, "loss": 1.7123, "step": 5446 }, { "epoch": 0.43, "learning_rate": 0.0002851437979536652, "loss": 1.7695, "step": 5447 }, { "epoch": 0.43, "learning_rate": 0.0002851384345528742, "loss": 1.7631, "step": 5448 }, { "epoch": 0.43, "learning_rate": 0.0002851330702345678, "loss": 1.7434, "step": 5449 }, { "epoch": 0.43, "learning_rate": 0.0002851277049987825, "loss": 1.7635, "step": 5450 }, { "epoch": 0.43, "learning_rate": 0.0002851223388455546, "loss": 1.7425, "step": 5451 }, { "epoch": 0.43, "learning_rate": 0.00028511697177492054, "loss": 1.8299, "step": 5452 }, { "epoch": 0.43, "learning_rate": 0.00028511160378691684, "loss": 1.7585, "step": 5453 }, { "epoch": 0.43, "learning_rate": 0.00028510623488157993, "loss": 1.775, "step": 5454 }, { "epoch": 0.43, "learning_rate": 0.00028510086505894623, "loss": 1.727, "step": 5455 }, { "epoch": 0.43, "learning_rate": 0.0002850954943190522, "loss": 1.7398, "step": 5456 }, { "epoch": 0.43, "learning_rate": 0.00028509012266193437, "loss": 1.7321, "step": 5457 }, { "epoch": 0.43, "learning_rate": 0.0002850847500876291, "loss": 1.7883, "step": 5458 }, { "epoch": 0.43, "learning_rate": 0.0002850793765961729, "loss": 1.7911, "step": 5459 }, { "epoch": 0.43, "learning_rate": 0.00028507400218760233, "loss": 1.6898, "step": 5460 }, { "epoch": 0.43, "learning_rate": 0.0002850686268619538, "loss": 1.7579, "step": 5461 }, { "epoch": 0.43, "learning_rate": 0.0002850632506192639, "loss": 1.7504, "step": 5462 }, { "epoch": 0.43, "learning_rate": 0.00028505787345956896, "loss": 1.7991, "step": 5463 }, { "epoch": 0.43, "learning_rate": 0.00028505249538290564, "loss": 1.7785, "step": 5464 }, { "epoch": 0.43, "learning_rate": 0.0002850471163893104, "loss": 1.851, "step": 5465 }, { "epoch": 0.43, "learning_rate": 0.00028504173647881975, "loss": 1.7945, "step": 5466 }, { "epoch": 0.43, "learning_rate": 0.00028503635565147026, "loss": 1.8289, "step": 5467 }, { "epoch": 0.43, "learning_rate": 0.0002850309739072984, "loss": 1.7579, "step": 5468 }, { "epoch": 0.43, "learning_rate": 0.0002850255912463408, "loss": 1.7373, "step": 5469 }, { "epoch": 0.43, "learning_rate": 0.0002850202076686339, "loss": 1.8047, "step": 5470 }, { "epoch": 0.43, "learning_rate": 0.00028501482317421433, "loss": 1.7606, "step": 5471 }, { "epoch": 0.43, "learning_rate": 0.0002850094377631186, "loss": 1.7851, "step": 5472 }, { "epoch": 0.43, "learning_rate": 0.0002850040514353833, "loss": 1.8154, "step": 5473 }, { "epoch": 0.43, "learning_rate": 0.00028499866419104495, "loss": 1.8063, "step": 5474 }, { "epoch": 0.43, "learning_rate": 0.0002849932760301402, "loss": 1.7435, "step": 5475 }, { "epoch": 0.43, "learning_rate": 0.0002849878869527056, "loss": 1.6951, "step": 5476 }, { "epoch": 0.43, "learning_rate": 0.00028498249695877776, "loss": 1.7634, "step": 5477 }, { "epoch": 0.43, "learning_rate": 0.0002849771060483932, "loss": 1.7441, "step": 5478 }, { "epoch": 0.43, "learning_rate": 0.00028497171422158863, "loss": 1.812, "step": 5479 }, { "epoch": 0.43, "learning_rate": 0.0002849663214784006, "loss": 1.7733, "step": 5480 }, { "epoch": 0.43, "learning_rate": 0.0002849609278188657, "loss": 1.7971, "step": 5481 }, { "epoch": 0.43, "learning_rate": 0.0002849555332430206, "loss": 1.7654, "step": 5482 }, { "epoch": 0.43, "learning_rate": 0.0002849501377509019, "loss": 1.7983, "step": 5483 }, { "epoch": 0.43, "learning_rate": 0.00028494474134254624, "loss": 1.7674, "step": 5484 }, { "epoch": 0.43, "learning_rate": 0.00028493934401799026, "loss": 1.7621, "step": 5485 }, { "epoch": 0.43, "learning_rate": 0.0002849339457772706, "loss": 1.7941, "step": 5486 }, { "epoch": 0.43, "learning_rate": 0.0002849285466204239, "loss": 1.7642, "step": 5487 }, { "epoch": 0.43, "learning_rate": 0.0002849231465474868, "loss": 1.7631, "step": 5488 }, { "epoch": 0.43, "learning_rate": 0.000284917745558496, "loss": 1.7804, "step": 5489 }, { "epoch": 0.43, "learning_rate": 0.00028491234365348817, "loss": 1.7204, "step": 5490 }, { "epoch": 0.43, "learning_rate": 0.00028490694083250004, "loss": 1.7214, "step": 5491 }, { "epoch": 0.43, "learning_rate": 0.00028490153709556816, "loss": 1.8211, "step": 5492 }, { "epoch": 0.43, "learning_rate": 0.00028489613244272934, "loss": 1.7949, "step": 5493 }, { "epoch": 0.43, "learning_rate": 0.00028489072687402017, "loss": 1.7205, "step": 5494 }, { "epoch": 0.43, "learning_rate": 0.00028488532038947745, "loss": 1.7198, "step": 5495 }, { "epoch": 0.43, "learning_rate": 0.0002848799129891378, "loss": 1.7365, "step": 5496 }, { "epoch": 0.43, "learning_rate": 0.00028487450467303796, "loss": 1.7533, "step": 5497 }, { "epoch": 0.43, "learning_rate": 0.0002848690954412147, "loss": 1.7726, "step": 5498 }, { "epoch": 0.43, "learning_rate": 0.0002848636852937047, "loss": 1.7724, "step": 5499 }, { "epoch": 0.43, "learning_rate": 0.0002848582742305447, "loss": 1.75, "step": 5500 }, { "epoch": 0.43, "learning_rate": 0.00028485286225177144, "loss": 1.7832, "step": 5501 }, { "epoch": 0.43, "learning_rate": 0.0002848474493574216, "loss": 1.7258, "step": 5502 }, { "epoch": 0.43, "learning_rate": 0.0002848420355475321, "loss": 1.8306, "step": 5503 }, { "epoch": 0.43, "learning_rate": 0.00028483662082213953, "loss": 1.7778, "step": 5504 }, { "epoch": 0.43, "learning_rate": 0.00028483120518128075, "loss": 1.7619, "step": 5505 }, { "epoch": 0.43, "learning_rate": 0.00028482578862499246, "loss": 1.786, "step": 5506 }, { "epoch": 0.43, "learning_rate": 0.00028482037115331145, "loss": 1.8107, "step": 5507 }, { "epoch": 0.43, "learning_rate": 0.0002848149527662746, "loss": 1.787, "step": 5508 }, { "epoch": 0.43, "learning_rate": 0.00028480953346391856, "loss": 1.7587, "step": 5509 }, { "epoch": 0.43, "learning_rate": 0.0002848041132462802, "loss": 1.7506, "step": 5510 }, { "epoch": 0.43, "learning_rate": 0.0002847986921133963, "loss": 1.787, "step": 5511 }, { "epoch": 0.43, "learning_rate": 0.00028479327006530365, "loss": 1.7577, "step": 5512 }, { "epoch": 0.43, "learning_rate": 0.00028478784710203906, "loss": 1.7206, "step": 5513 }, { "epoch": 0.43, "learning_rate": 0.0002847824232236394, "loss": 1.7409, "step": 5514 }, { "epoch": 0.43, "learning_rate": 0.0002847769984301415, "loss": 1.7694, "step": 5515 }, { "epoch": 0.43, "learning_rate": 0.0002847715727215821, "loss": 1.7837, "step": 5516 }, { "epoch": 0.43, "learning_rate": 0.0002847661460979981, "loss": 1.7812, "step": 5517 }, { "epoch": 0.43, "learning_rate": 0.0002847607185594264, "loss": 1.7703, "step": 5518 }, { "epoch": 0.43, "learning_rate": 0.00028475529010590374, "loss": 1.8262, "step": 5519 }, { "epoch": 0.43, "learning_rate": 0.000284749860737467, "loss": 1.7697, "step": 5520 }, { "epoch": 0.43, "learning_rate": 0.00028474443045415314, "loss": 1.794, "step": 5521 }, { "epoch": 0.43, "learning_rate": 0.0002847389992559989, "loss": 1.8139, "step": 5522 }, { "epoch": 0.43, "learning_rate": 0.0002847335671430412, "loss": 1.7517, "step": 5523 }, { "epoch": 0.43, "learning_rate": 0.000284728134115317, "loss": 1.7891, "step": 5524 }, { "epoch": 0.43, "learning_rate": 0.00028472270017286305, "loss": 1.7384, "step": 5525 }, { "epoch": 0.43, "learning_rate": 0.0002847172653157163, "loss": 1.7808, "step": 5526 }, { "epoch": 0.43, "learning_rate": 0.0002847118295439137, "loss": 1.7894, "step": 5527 }, { "epoch": 0.43, "learning_rate": 0.0002847063928574921, "loss": 1.7938, "step": 5528 }, { "epoch": 0.44, "learning_rate": 0.0002847009552564884, "loss": 1.7854, "step": 5529 }, { "epoch": 0.44, "learning_rate": 0.00028469551674093965, "loss": 1.748, "step": 5530 }, { "epoch": 0.44, "learning_rate": 0.0002846900773108826, "loss": 1.7661, "step": 5531 }, { "epoch": 0.44, "learning_rate": 0.0002846846369663543, "loss": 1.8261, "step": 5532 }, { "epoch": 0.44, "learning_rate": 0.00028467919570739157, "loss": 1.7546, "step": 5533 }, { "epoch": 0.44, "learning_rate": 0.00028467375353403144, "loss": 1.7267, "step": 5534 }, { "epoch": 0.44, "learning_rate": 0.00028466831044631093, "loss": 1.8035, "step": 5535 }, { "epoch": 0.44, "learning_rate": 0.0002846628664442668, "loss": 1.7166, "step": 5536 }, { "epoch": 0.44, "learning_rate": 0.00028465742152793615, "loss": 1.7348, "step": 5537 }, { "epoch": 0.44, "learning_rate": 0.00028465197569735594, "loss": 1.6903, "step": 5538 }, { "epoch": 0.44, "learning_rate": 0.0002846465289525631, "loss": 1.8084, "step": 5539 }, { "epoch": 0.44, "learning_rate": 0.00028464108129359466, "loss": 1.785, "step": 5540 }, { "epoch": 0.44, "learning_rate": 0.0002846356327204876, "loss": 1.7668, "step": 5541 }, { "epoch": 0.44, "learning_rate": 0.00028463018323327883, "loss": 1.722, "step": 5542 }, { "epoch": 0.44, "learning_rate": 0.0002846247328320054, "loss": 1.7894, "step": 5543 }, { "epoch": 0.44, "learning_rate": 0.0002846192815167044, "loss": 1.7357, "step": 5544 }, { "epoch": 0.44, "learning_rate": 0.0002846138292874127, "loss": 1.7978, "step": 5545 }, { "epoch": 0.44, "learning_rate": 0.0002846083761441674, "loss": 1.767, "step": 5546 }, { "epoch": 0.44, "learning_rate": 0.00028460292208700556, "loss": 1.7703, "step": 5547 }, { "epoch": 0.44, "learning_rate": 0.0002845974671159641, "loss": 1.7564, "step": 5548 }, { "epoch": 0.44, "learning_rate": 0.00028459201123108015, "loss": 1.7464, "step": 5549 }, { "epoch": 0.44, "learning_rate": 0.00028458655443239065, "loss": 1.7376, "step": 5550 }, { "epoch": 0.44, "learning_rate": 0.0002845810967199328, "loss": 1.6681, "step": 5551 }, { "epoch": 0.44, "learning_rate": 0.00028457563809374355, "loss": 1.7194, "step": 5552 }, { "epoch": 0.44, "learning_rate": 0.00028457017855385995, "loss": 1.6932, "step": 5553 }, { "epoch": 0.44, "learning_rate": 0.0002845647181003191, "loss": 1.8475, "step": 5554 }, { "epoch": 0.44, "learning_rate": 0.00028455925673315815, "loss": 1.7013, "step": 5555 }, { "epoch": 0.44, "learning_rate": 0.000284553794452414, "loss": 1.7472, "step": 5556 }, { "epoch": 0.44, "learning_rate": 0.00028454833125812393, "loss": 1.7513, "step": 5557 }, { "epoch": 0.44, "learning_rate": 0.0002845428671503249, "loss": 1.7009, "step": 5558 }, { "epoch": 0.44, "learning_rate": 0.00028453740212905403, "loss": 1.7531, "step": 5559 }, { "epoch": 0.44, "learning_rate": 0.0002845319361943485, "loss": 1.7463, "step": 5560 }, { "epoch": 0.44, "learning_rate": 0.0002845264693462453, "loss": 1.7527, "step": 5561 }, { "epoch": 0.44, "learning_rate": 0.00028452100158478166, "loss": 1.75, "step": 5562 }, { "epoch": 0.44, "learning_rate": 0.0002845155329099946, "loss": 1.7319, "step": 5563 }, { "epoch": 0.44, "learning_rate": 0.0002845100633219213, "loss": 1.7536, "step": 5564 }, { "epoch": 0.44, "learning_rate": 0.00028450459282059896, "loss": 1.7094, "step": 5565 }, { "epoch": 0.44, "learning_rate": 0.00028449912140606463, "loss": 1.791, "step": 5566 }, { "epoch": 0.44, "learning_rate": 0.0002844936490783555, "loss": 1.7285, "step": 5567 }, { "epoch": 0.44, "learning_rate": 0.0002844881758375087, "loss": 1.7461, "step": 5568 }, { "epoch": 0.44, "learning_rate": 0.0002844827016835614, "loss": 1.7533, "step": 5569 }, { "epoch": 0.44, "learning_rate": 0.00028447722661655077, "loss": 1.7665, "step": 5570 }, { "epoch": 0.44, "learning_rate": 0.000284471750636514, "loss": 1.8111, "step": 5571 }, { "epoch": 0.44, "learning_rate": 0.00028446627374348826, "loss": 1.7533, "step": 5572 }, { "epoch": 0.44, "learning_rate": 0.0002844607959375107, "loss": 1.7661, "step": 5573 }, { "epoch": 0.44, "learning_rate": 0.0002844553172186186, "loss": 1.8473, "step": 5574 }, { "epoch": 0.44, "learning_rate": 0.000284449837586849, "loss": 1.7877, "step": 5575 }, { "epoch": 0.44, "learning_rate": 0.0002844443570422392, "loss": 1.8129, "step": 5576 }, { "epoch": 0.44, "learning_rate": 0.00028443887558482646, "loss": 1.7782, "step": 5577 }, { "epoch": 0.44, "learning_rate": 0.0002844333932146479, "loss": 1.7673, "step": 5578 }, { "epoch": 0.44, "learning_rate": 0.0002844279099317408, "loss": 1.7422, "step": 5579 }, { "epoch": 0.44, "learning_rate": 0.00028442242573614246, "loss": 1.7842, "step": 5580 }, { "epoch": 0.44, "learning_rate": 0.00028441694062788993, "loss": 1.7385, "step": 5581 }, { "epoch": 0.44, "learning_rate": 0.0002844114546070206, "loss": 1.7277, "step": 5582 }, { "epoch": 0.44, "learning_rate": 0.0002844059676735716, "loss": 1.7883, "step": 5583 }, { "epoch": 0.44, "learning_rate": 0.0002844004798275803, "loss": 1.7101, "step": 5584 }, { "epoch": 0.44, "learning_rate": 0.00028439499106908394, "loss": 1.7103, "step": 5585 }, { "epoch": 0.44, "learning_rate": 0.0002843895013981197, "loss": 1.8038, "step": 5586 }, { "epoch": 0.44, "learning_rate": 0.0002843840108147249, "loss": 1.7531, "step": 5587 }, { "epoch": 0.44, "learning_rate": 0.0002843785193189369, "loss": 1.7961, "step": 5588 }, { "epoch": 0.44, "learning_rate": 0.00028437302691079286, "loss": 1.7089, "step": 5589 }, { "epoch": 0.44, "learning_rate": 0.0002843675335903301, "loss": 1.7704, "step": 5590 }, { "epoch": 0.44, "learning_rate": 0.00028436203935758596, "loss": 1.7399, "step": 5591 }, { "epoch": 0.44, "learning_rate": 0.00028435654421259777, "loss": 1.7981, "step": 5592 }, { "epoch": 0.44, "learning_rate": 0.0002843510481554027, "loss": 1.7534, "step": 5593 }, { "epoch": 0.44, "learning_rate": 0.0002843455511860382, "loss": 1.7652, "step": 5594 }, { "epoch": 0.44, "learning_rate": 0.00028434005330454156, "loss": 1.6997, "step": 5595 }, { "epoch": 0.44, "learning_rate": 0.0002843345545109501, "loss": 1.7387, "step": 5596 }, { "epoch": 0.44, "learning_rate": 0.00028432905480530113, "loss": 1.7178, "step": 5597 }, { "epoch": 0.44, "learning_rate": 0.000284323554187632, "loss": 1.7162, "step": 5598 }, { "epoch": 0.44, "learning_rate": 0.00028431805265798007, "loss": 1.7747, "step": 5599 }, { "epoch": 0.44, "learning_rate": 0.00028431255021638265, "loss": 1.7294, "step": 5600 }, { "epoch": 0.44, "learning_rate": 0.00028430704686287716, "loss": 1.7239, "step": 5601 }, { "epoch": 0.44, "learning_rate": 0.00028430154259750093, "loss": 1.7379, "step": 5602 }, { "epoch": 0.44, "learning_rate": 0.00028429603742029133, "loss": 1.7418, "step": 5603 }, { "epoch": 0.44, "learning_rate": 0.0002842905313312858, "loss": 1.7781, "step": 5604 }, { "epoch": 0.44, "learning_rate": 0.00028428502433052165, "loss": 1.7584, "step": 5605 }, { "epoch": 0.44, "learning_rate": 0.00028427951641803623, "loss": 1.7401, "step": 5606 }, { "epoch": 0.44, "learning_rate": 0.00028427400759386705, "loss": 1.7219, "step": 5607 }, { "epoch": 0.44, "learning_rate": 0.0002842684978580515, "loss": 1.7553, "step": 5608 }, { "epoch": 0.44, "learning_rate": 0.00028426298721062685, "loss": 1.7212, "step": 5609 }, { "epoch": 0.44, "learning_rate": 0.00028425747565163066, "loss": 1.7838, "step": 5610 }, { "epoch": 0.44, "learning_rate": 0.0002842519631811003, "loss": 1.7903, "step": 5611 }, { "epoch": 0.44, "learning_rate": 0.0002842464497990732, "loss": 1.796, "step": 5612 }, { "epoch": 0.44, "learning_rate": 0.0002842409355055868, "loss": 1.7426, "step": 5613 }, { "epoch": 0.44, "learning_rate": 0.00028423542030067846, "loss": 1.7612, "step": 5614 }, { "epoch": 0.44, "learning_rate": 0.0002842299041843857, "loss": 1.7338, "step": 5615 }, { "epoch": 0.44, "learning_rate": 0.0002842243871567461, "loss": 1.7703, "step": 5616 }, { "epoch": 0.44, "learning_rate": 0.00028421886921779684, "loss": 1.7707, "step": 5617 }, { "epoch": 0.44, "learning_rate": 0.00028421335036757557, "loss": 1.6947, "step": 5618 }, { "epoch": 0.44, "learning_rate": 0.0002842078306061197, "loss": 1.7164, "step": 5619 }, { "epoch": 0.44, "learning_rate": 0.00028420230993346675, "loss": 1.7273, "step": 5620 }, { "epoch": 0.44, "learning_rate": 0.0002841967883496542, "loss": 1.768, "step": 5621 }, { "epoch": 0.44, "learning_rate": 0.0002841912658547194, "loss": 1.7268, "step": 5622 }, { "epoch": 0.44, "learning_rate": 0.00028418574244870007, "loss": 1.7282, "step": 5623 }, { "epoch": 0.44, "learning_rate": 0.00028418021813163356, "loss": 1.7357, "step": 5624 }, { "epoch": 0.44, "learning_rate": 0.0002841746929035574, "loss": 1.7542, "step": 5625 }, { "epoch": 0.44, "learning_rate": 0.0002841691667645092, "loss": 1.7145, "step": 5626 }, { "epoch": 0.44, "learning_rate": 0.0002841636397145263, "loss": 1.7535, "step": 5627 }, { "epoch": 0.44, "learning_rate": 0.0002841581117536464, "loss": 1.7263, "step": 5628 }, { "epoch": 0.44, "learning_rate": 0.0002841525828819069, "loss": 1.8061, "step": 5629 }, { "epoch": 0.44, "learning_rate": 0.0002841470530993454, "loss": 1.7372, "step": 5630 }, { "epoch": 0.44, "learning_rate": 0.00028414152240599944, "loss": 1.7583, "step": 5631 }, { "epoch": 0.44, "learning_rate": 0.0002841359908019066, "loss": 1.7421, "step": 5632 }, { "epoch": 0.44, "learning_rate": 0.00028413045828710434, "loss": 1.7744, "step": 5633 }, { "epoch": 0.44, "learning_rate": 0.0002841249248616304, "loss": 1.7501, "step": 5634 }, { "epoch": 0.44, "learning_rate": 0.0002841193905255221, "loss": 1.7295, "step": 5635 }, { "epoch": 0.44, "learning_rate": 0.00028411385527881723, "loss": 1.7487, "step": 5636 }, { "epoch": 0.44, "learning_rate": 0.0002841083191215533, "loss": 1.7862, "step": 5637 }, { "epoch": 0.44, "learning_rate": 0.0002841027820537678, "loss": 1.7278, "step": 5638 }, { "epoch": 0.44, "learning_rate": 0.0002840972440754985, "loss": 1.7418, "step": 5639 }, { "epoch": 0.44, "learning_rate": 0.0002840917051867829, "loss": 1.7718, "step": 5640 }, { "epoch": 0.44, "learning_rate": 0.00028408616538765866, "loss": 1.7874, "step": 5641 }, { "epoch": 0.44, "learning_rate": 0.00028408062467816334, "loss": 1.7958, "step": 5642 }, { "epoch": 0.44, "learning_rate": 0.0002840750830583345, "loss": 1.7427, "step": 5643 }, { "epoch": 0.44, "learning_rate": 0.0002840695405282099, "loss": 1.8179, "step": 5644 }, { "epoch": 0.44, "learning_rate": 0.00028406399708782705, "loss": 1.7859, "step": 5645 }, { "epoch": 0.44, "learning_rate": 0.0002840584527372237, "loss": 1.7789, "step": 5646 }, { "epoch": 0.44, "learning_rate": 0.0002840529074764374, "loss": 1.7767, "step": 5647 }, { "epoch": 0.44, "learning_rate": 0.0002840473613055058, "loss": 1.8074, "step": 5648 }, { "epoch": 0.44, "learning_rate": 0.00028404181422446667, "loss": 1.7618, "step": 5649 }, { "epoch": 0.44, "learning_rate": 0.00028403626623335756, "loss": 1.7828, "step": 5650 }, { "epoch": 0.44, "learning_rate": 0.00028403071733221615, "loss": 1.7641, "step": 5651 }, { "epoch": 0.44, "learning_rate": 0.00028402516752108016, "loss": 1.7566, "step": 5652 }, { "epoch": 0.44, "learning_rate": 0.0002840196167999872, "loss": 1.7505, "step": 5653 }, { "epoch": 0.44, "learning_rate": 0.00028401406516897506, "loss": 1.7285, "step": 5654 }, { "epoch": 0.44, "learning_rate": 0.00028400851262808135, "loss": 1.8047, "step": 5655 }, { "epoch": 0.45, "learning_rate": 0.0002840029591773438, "loss": 1.746, "step": 5656 }, { "epoch": 0.45, "learning_rate": 0.00028399740481680006, "loss": 1.7788, "step": 5657 }, { "epoch": 0.45, "learning_rate": 0.0002839918495464879, "loss": 1.7521, "step": 5658 }, { "epoch": 0.45, "learning_rate": 0.00028398629336644503, "loss": 1.6955, "step": 5659 }, { "epoch": 0.45, "learning_rate": 0.0002839807362767092, "loss": 1.7568, "step": 5660 }, { "epoch": 0.45, "learning_rate": 0.0002839751782773181, "loss": 1.6827, "step": 5661 }, { "epoch": 0.45, "learning_rate": 0.0002839696193683094, "loss": 1.7588, "step": 5662 }, { "epoch": 0.45, "learning_rate": 0.00028396405954972105, "loss": 1.7498, "step": 5663 }, { "epoch": 0.45, "learning_rate": 0.00028395849882159054, "loss": 1.7852, "step": 5664 }, { "epoch": 0.45, "learning_rate": 0.00028395293718395584, "loss": 1.7424, "step": 5665 }, { "epoch": 0.45, "learning_rate": 0.0002839473746368546, "loss": 1.747, "step": 5666 }, { "epoch": 0.45, "learning_rate": 0.00028394181118032453, "loss": 1.7713, "step": 5667 }, { "epoch": 0.45, "learning_rate": 0.00028393624681440354, "loss": 1.7662, "step": 5668 }, { "epoch": 0.45, "learning_rate": 0.00028393068153912933, "loss": 1.7482, "step": 5669 }, { "epoch": 0.45, "learning_rate": 0.0002839251153545397, "loss": 1.7983, "step": 5670 }, { "epoch": 0.45, "learning_rate": 0.0002839195482606725, "loss": 1.7277, "step": 5671 }, { "epoch": 0.45, "learning_rate": 0.00028391398025756534, "loss": 1.7389, "step": 5672 }, { "epoch": 0.45, "learning_rate": 0.0002839084113452563, "loss": 1.6993, "step": 5673 }, { "epoch": 0.45, "learning_rate": 0.00028390284152378294, "loss": 1.7232, "step": 5674 }, { "epoch": 0.45, "learning_rate": 0.0002838972707931832, "loss": 1.7244, "step": 5675 }, { "epoch": 0.45, "learning_rate": 0.0002838916991534949, "loss": 1.6969, "step": 5676 }, { "epoch": 0.45, "learning_rate": 0.0002838861266047559, "loss": 1.7743, "step": 5677 }, { "epoch": 0.45, "learning_rate": 0.00028388055314700387, "loss": 1.7841, "step": 5678 }, { "epoch": 0.45, "learning_rate": 0.00028387497878027687, "loss": 1.7378, "step": 5679 }, { "epoch": 0.45, "learning_rate": 0.00028386940350461255, "loss": 1.7664, "step": 5680 }, { "epoch": 0.45, "learning_rate": 0.0002838638273200489, "loss": 1.7751, "step": 5681 }, { "epoch": 0.45, "learning_rate": 0.00028385825022662377, "loss": 1.7228, "step": 5682 }, { "epoch": 0.45, "learning_rate": 0.000283852672224375, "loss": 1.7516, "step": 5683 }, { "epoch": 0.45, "learning_rate": 0.0002838470933133404, "loss": 1.7363, "step": 5684 }, { "epoch": 0.45, "learning_rate": 0.0002838415134935579, "loss": 1.6928, "step": 5685 }, { "epoch": 0.45, "learning_rate": 0.00028383593276506535, "loss": 1.6959, "step": 5686 }, { "epoch": 0.45, "learning_rate": 0.00028383035112790073, "loss": 1.7759, "step": 5687 }, { "epoch": 0.45, "learning_rate": 0.0002838247685821019, "loss": 1.7249, "step": 5688 }, { "epoch": 0.45, "learning_rate": 0.00028381918512770666, "loss": 1.741, "step": 5689 }, { "epoch": 0.45, "learning_rate": 0.00028381360076475305, "loss": 1.7614, "step": 5690 }, { "epoch": 0.45, "learning_rate": 0.00028380801549327895, "loss": 1.7305, "step": 5691 }, { "epoch": 0.45, "learning_rate": 0.00028380242931332224, "loss": 1.7761, "step": 5692 }, { "epoch": 0.45, "learning_rate": 0.0002837968422249209, "loss": 1.8307, "step": 5693 }, { "epoch": 0.45, "learning_rate": 0.0002837912542281128, "loss": 1.7658, "step": 5694 }, { "epoch": 0.45, "learning_rate": 0.00028378566532293595, "loss": 1.7519, "step": 5695 }, { "epoch": 0.45, "learning_rate": 0.00028378007550942827, "loss": 1.7479, "step": 5696 }, { "epoch": 0.45, "learning_rate": 0.00028377448478762767, "loss": 1.732, "step": 5697 }, { "epoch": 0.45, "learning_rate": 0.00028376889315757215, "loss": 1.7833, "step": 5698 }, { "epoch": 0.45, "learning_rate": 0.00028376330061929966, "loss": 1.804, "step": 5699 }, { "epoch": 0.45, "learning_rate": 0.0002837577071728482, "loss": 1.7489, "step": 5700 }, { "epoch": 0.45, "learning_rate": 0.00028375211281825573, "loss": 1.7838, "step": 5701 }, { "epoch": 0.45, "learning_rate": 0.0002837465175555601, "loss": 1.7723, "step": 5702 }, { "epoch": 0.45, "learning_rate": 0.0002837409213847996, "loss": 1.7778, "step": 5703 }, { "epoch": 0.45, "learning_rate": 0.00028373532430601197, "loss": 1.7513, "step": 5704 }, { "epoch": 0.45, "learning_rate": 0.00028372972631923526, "loss": 1.7986, "step": 5705 }, { "epoch": 0.45, "learning_rate": 0.00028372412742450753, "loss": 1.7059, "step": 5706 }, { "epoch": 0.45, "learning_rate": 0.0002837185276218668, "loss": 1.7452, "step": 5707 }, { "epoch": 0.45, "learning_rate": 0.00028371292691135104, "loss": 1.7699, "step": 5708 }, { "epoch": 0.45, "learning_rate": 0.0002837073252929983, "loss": 1.7875, "step": 5709 }, { "epoch": 0.45, "learning_rate": 0.00028370172276684656, "loss": 1.7451, "step": 5710 }, { "epoch": 0.45, "learning_rate": 0.00028369611933293394, "loss": 1.7751, "step": 5711 }, { "epoch": 0.45, "learning_rate": 0.0002836905149912985, "loss": 1.6999, "step": 5712 }, { "epoch": 0.45, "learning_rate": 0.0002836849097419781, "loss": 1.766, "step": 5713 }, { "epoch": 0.45, "learning_rate": 0.0002836793035850111, "loss": 1.7244, "step": 5714 }, { "epoch": 0.45, "learning_rate": 0.0002836736965204353, "loss": 1.7591, "step": 5715 }, { "epoch": 0.45, "learning_rate": 0.0002836680885482889, "loss": 1.7189, "step": 5716 }, { "epoch": 0.45, "learning_rate": 0.00028366247966860996, "loss": 1.7841, "step": 5717 }, { "epoch": 0.45, "learning_rate": 0.0002836568698814365, "loss": 1.7912, "step": 5718 }, { "epoch": 0.45, "learning_rate": 0.00028365125918680667, "loss": 1.7726, "step": 5719 }, { "epoch": 0.45, "learning_rate": 0.00028364564758475856, "loss": 1.7983, "step": 5720 }, { "epoch": 0.45, "learning_rate": 0.00028364003507533027, "loss": 1.7505, "step": 5721 }, { "epoch": 0.45, "learning_rate": 0.00028363442165855985, "loss": 1.7568, "step": 5722 }, { "epoch": 0.45, "learning_rate": 0.00028362880733448547, "loss": 1.7721, "step": 5723 }, { "epoch": 0.45, "learning_rate": 0.00028362319210314523, "loss": 1.7586, "step": 5724 }, { "epoch": 0.45, "learning_rate": 0.00028361757596457725, "loss": 1.7901, "step": 5725 }, { "epoch": 0.45, "learning_rate": 0.0002836119589188197, "loss": 1.7695, "step": 5726 }, { "epoch": 0.45, "learning_rate": 0.0002836063409659106, "loss": 1.7329, "step": 5727 }, { "epoch": 0.45, "learning_rate": 0.0002836007221058882, "loss": 1.7158, "step": 5728 }, { "epoch": 0.45, "learning_rate": 0.00028359510233879064, "loss": 1.6727, "step": 5729 }, { "epoch": 0.45, "learning_rate": 0.00028358948166465613, "loss": 1.6923, "step": 5730 }, { "epoch": 0.45, "learning_rate": 0.0002835838600835227, "loss": 1.8064, "step": 5731 }, { "epoch": 0.45, "learning_rate": 0.00028357823759542856, "loss": 1.7706, "step": 5732 }, { "epoch": 0.45, "learning_rate": 0.00028357261420041194, "loss": 1.7537, "step": 5733 }, { "epoch": 0.45, "learning_rate": 0.00028356698989851094, "loss": 1.7257, "step": 5734 }, { "epoch": 0.45, "learning_rate": 0.0002835613646897638, "loss": 1.7715, "step": 5735 }, { "epoch": 0.45, "learning_rate": 0.0002835557385742087, "loss": 1.724, "step": 5736 }, { "epoch": 0.45, "learning_rate": 0.00028355011155188387, "loss": 1.7564, "step": 5737 }, { "epoch": 0.45, "learning_rate": 0.0002835444836228274, "loss": 1.7195, "step": 5738 }, { "epoch": 0.45, "learning_rate": 0.0002835388547870776, "loss": 1.8489, "step": 5739 }, { "epoch": 0.45, "learning_rate": 0.00028353322504467277, "loss": 1.7512, "step": 5740 }, { "epoch": 0.45, "learning_rate": 0.0002835275943956509, "loss": 1.7488, "step": 5741 }, { "epoch": 0.45, "learning_rate": 0.0002835219628400505, "loss": 1.7738, "step": 5742 }, { "epoch": 0.45, "learning_rate": 0.00028351633037790953, "loss": 1.7144, "step": 5743 }, { "epoch": 0.45, "learning_rate": 0.00028351069700926644, "loss": 1.7711, "step": 5744 }, { "epoch": 0.45, "learning_rate": 0.0002835050627341593, "loss": 1.7423, "step": 5745 }, { "epoch": 0.45, "learning_rate": 0.00028349942755262654, "loss": 1.7522, "step": 5746 }, { "epoch": 0.45, "learning_rate": 0.00028349379146470633, "loss": 1.7726, "step": 5747 }, { "epoch": 0.45, "learning_rate": 0.0002834881544704369, "loss": 1.7595, "step": 5748 }, { "epoch": 0.45, "learning_rate": 0.00028348251656985655, "loss": 1.7061, "step": 5749 }, { "epoch": 0.45, "learning_rate": 0.0002834768777630037, "loss": 1.7545, "step": 5750 }, { "epoch": 0.45, "learning_rate": 0.0002834712380499164, "loss": 1.7419, "step": 5751 }, { "epoch": 0.45, "learning_rate": 0.00028346559743063307, "loss": 1.786, "step": 5752 }, { "epoch": 0.45, "learning_rate": 0.000283459955905192, "loss": 1.8005, "step": 5753 }, { "epoch": 0.45, "learning_rate": 0.0002834543134736314, "loss": 1.7811, "step": 5754 }, { "epoch": 0.45, "learning_rate": 0.0002834486701359898, "loss": 1.7368, "step": 5755 }, { "epoch": 0.45, "learning_rate": 0.00028344302589230526, "loss": 1.7161, "step": 5756 }, { "epoch": 0.45, "learning_rate": 0.0002834373807426162, "loss": 1.6974, "step": 5757 }, { "epoch": 0.45, "learning_rate": 0.00028343173468696107, "loss": 1.7741, "step": 5758 }, { "epoch": 0.45, "learning_rate": 0.000283426087725378, "loss": 1.7655, "step": 5759 }, { "epoch": 0.45, "learning_rate": 0.00028342043985790546, "loss": 1.7166, "step": 5760 }, { "epoch": 0.45, "learning_rate": 0.0002834147910845818, "loss": 1.7039, "step": 5761 }, { "epoch": 0.45, "learning_rate": 0.0002834091414054453, "loss": 1.7741, "step": 5762 }, { "epoch": 0.45, "learning_rate": 0.00028340349082053433, "loss": 1.8258, "step": 5763 }, { "epoch": 0.45, "learning_rate": 0.0002833978393298873, "loss": 1.8011, "step": 5764 }, { "epoch": 0.45, "learning_rate": 0.0002833921869335425, "loss": 1.7801, "step": 5765 }, { "epoch": 0.45, "learning_rate": 0.0002833865336315384, "loss": 1.7179, "step": 5766 }, { "epoch": 0.45, "learning_rate": 0.00028338087942391337, "loss": 1.7158, "step": 5767 }, { "epoch": 0.45, "learning_rate": 0.0002833752243107058, "loss": 1.7789, "step": 5768 }, { "epoch": 0.45, "learning_rate": 0.000283369568291954, "loss": 1.7765, "step": 5769 }, { "epoch": 0.45, "learning_rate": 0.0002833639113676965, "loss": 1.778, "step": 5770 }, { "epoch": 0.45, "learning_rate": 0.00028335825353797153, "loss": 1.7731, "step": 5771 }, { "epoch": 0.45, "learning_rate": 0.0002833525948028177, "loss": 1.807, "step": 5772 }, { "epoch": 0.45, "learning_rate": 0.0002833469351622733, "loss": 1.8399, "step": 5773 }, { "epoch": 0.45, "learning_rate": 0.00028334127461637684, "loss": 1.7909, "step": 5774 }, { "epoch": 0.45, "learning_rate": 0.00028333561316516665, "loss": 1.7203, "step": 5775 }, { "epoch": 0.45, "learning_rate": 0.00028332995080868127, "loss": 1.7137, "step": 5776 }, { "epoch": 0.45, "learning_rate": 0.00028332428754695906, "loss": 1.8245, "step": 5777 }, { "epoch": 0.45, "learning_rate": 0.0002833186233800386, "loss": 1.7043, "step": 5778 }, { "epoch": 0.45, "learning_rate": 0.00028331295830795813, "loss": 1.7199, "step": 5779 }, { "epoch": 0.45, "learning_rate": 0.00028330729233075634, "loss": 1.7488, "step": 5780 }, { "epoch": 0.45, "learning_rate": 0.00028330162544847157, "loss": 1.7223, "step": 5781 }, { "epoch": 0.45, "learning_rate": 0.0002832959576611423, "loss": 1.7393, "step": 5782 }, { "epoch": 0.46, "learning_rate": 0.0002832902889688071, "loss": 1.7445, "step": 5783 }, { "epoch": 0.46, "learning_rate": 0.00028328461937150435, "loss": 1.7209, "step": 5784 }, { "epoch": 0.46, "learning_rate": 0.0002832789488692726, "loss": 1.786, "step": 5785 }, { "epoch": 0.46, "learning_rate": 0.00028327327746215027, "loss": 1.7588, "step": 5786 }, { "epoch": 0.46, "learning_rate": 0.00028326760515017603, "loss": 1.7391, "step": 5787 }, { "epoch": 0.46, "learning_rate": 0.00028326193193338824, "loss": 1.7547, "step": 5788 }, { "epoch": 0.46, "learning_rate": 0.0002832562578118255, "loss": 1.7407, "step": 5789 }, { "epoch": 0.46, "learning_rate": 0.0002832505827855263, "loss": 1.7628, "step": 5790 }, { "epoch": 0.46, "learning_rate": 0.0002832449068545292, "loss": 1.7346, "step": 5791 }, { "epoch": 0.46, "learning_rate": 0.0002832392300188726, "loss": 1.7203, "step": 5792 }, { "epoch": 0.46, "learning_rate": 0.0002832335522785953, "loss": 1.7586, "step": 5793 }, { "epoch": 0.46, "learning_rate": 0.0002832278736337356, "loss": 1.7596, "step": 5794 }, { "epoch": 0.46, "learning_rate": 0.00028322219408433223, "loss": 1.756, "step": 5795 }, { "epoch": 0.46, "learning_rate": 0.00028321651363042365, "loss": 1.7617, "step": 5796 }, { "epoch": 0.46, "learning_rate": 0.0002832108322720484, "loss": 1.8447, "step": 5797 }, { "epoch": 0.46, "learning_rate": 0.00028320515000924523, "loss": 1.8204, "step": 5798 }, { "epoch": 0.46, "learning_rate": 0.0002831994668420525, "loss": 1.7361, "step": 5799 }, { "epoch": 0.46, "learning_rate": 0.000283193782770509, "loss": 1.7862, "step": 5800 }, { "epoch": 0.46, "learning_rate": 0.0002831880977946531, "loss": 1.797, "step": 5801 }, { "epoch": 0.46, "learning_rate": 0.0002831824119145236, "loss": 1.72, "step": 5802 }, { "epoch": 0.46, "learning_rate": 0.000283176725130159, "loss": 1.747, "step": 5803 }, { "epoch": 0.46, "learning_rate": 0.0002831710374415979, "loss": 1.752, "step": 5804 }, { "epoch": 0.46, "learning_rate": 0.000283165348848879, "loss": 1.8023, "step": 5805 }, { "epoch": 0.46, "learning_rate": 0.0002831596593520408, "loss": 1.7759, "step": 5806 }, { "epoch": 0.46, "learning_rate": 0.00028315396895112205, "loss": 1.7615, "step": 5807 }, { "epoch": 0.46, "learning_rate": 0.00028314827764616126, "loss": 1.7967, "step": 5808 }, { "epoch": 0.46, "learning_rate": 0.0002831425854371972, "loss": 1.7357, "step": 5809 }, { "epoch": 0.46, "learning_rate": 0.0002831368923242685, "loss": 1.7686, "step": 5810 }, { "epoch": 0.46, "learning_rate": 0.00028313119830741367, "loss": 1.7653, "step": 5811 }, { "epoch": 0.46, "learning_rate": 0.00028312550338667155, "loss": 1.7987, "step": 5812 }, { "epoch": 0.46, "learning_rate": 0.0002831198075620807, "loss": 1.7577, "step": 5813 }, { "epoch": 0.46, "learning_rate": 0.0002831141108336798, "loss": 1.738, "step": 5814 }, { "epoch": 0.46, "learning_rate": 0.0002831084132015076, "loss": 1.755, "step": 5815 }, { "epoch": 0.46, "learning_rate": 0.00028310271466560266, "loss": 1.7782, "step": 5816 }, { "epoch": 0.46, "learning_rate": 0.0002830970152260038, "loss": 1.7861, "step": 5817 }, { "epoch": 0.46, "learning_rate": 0.0002830913148827496, "loss": 1.7542, "step": 5818 }, { "epoch": 0.46, "learning_rate": 0.00028308561363587885, "loss": 1.8072, "step": 5819 }, { "epoch": 0.46, "learning_rate": 0.00028307991148543026, "loss": 1.7424, "step": 5820 }, { "epoch": 0.46, "learning_rate": 0.00028307420843144243, "loss": 1.7708, "step": 5821 }, { "epoch": 0.46, "learning_rate": 0.0002830685044739542, "loss": 1.7454, "step": 5822 }, { "epoch": 0.46, "learning_rate": 0.0002830627996130043, "loss": 1.7777, "step": 5823 }, { "epoch": 0.46, "learning_rate": 0.00028305709384863136, "loss": 1.7144, "step": 5824 }, { "epoch": 0.46, "learning_rate": 0.0002830513871808742, "loss": 1.7414, "step": 5825 }, { "epoch": 0.46, "learning_rate": 0.00028304567960977156, "loss": 1.7461, "step": 5826 }, { "epoch": 0.46, "learning_rate": 0.0002830399711353622, "loss": 1.7013, "step": 5827 }, { "epoch": 0.46, "learning_rate": 0.0002830342617576848, "loss": 1.7324, "step": 5828 }, { "epoch": 0.46, "learning_rate": 0.00028302855147677814, "loss": 1.7198, "step": 5829 }, { "epoch": 0.46, "learning_rate": 0.0002830228402926811, "loss": 1.7489, "step": 5830 }, { "epoch": 0.46, "learning_rate": 0.00028301712820543237, "loss": 1.6915, "step": 5831 }, { "epoch": 0.46, "learning_rate": 0.00028301141521507077, "loss": 1.7466, "step": 5832 }, { "epoch": 0.46, "learning_rate": 0.000283005701321635, "loss": 1.7427, "step": 5833 }, { "epoch": 0.46, "learning_rate": 0.00028299998652516395, "loss": 1.7652, "step": 5834 }, { "epoch": 0.46, "learning_rate": 0.0002829942708256964, "loss": 1.7718, "step": 5835 }, { "epoch": 0.46, "learning_rate": 0.00028298855422327114, "loss": 1.7657, "step": 5836 }, { "epoch": 0.46, "learning_rate": 0.00028298283671792697, "loss": 1.7428, "step": 5837 }, { "epoch": 0.46, "learning_rate": 0.0002829771183097027, "loss": 1.7426, "step": 5838 }, { "epoch": 0.46, "learning_rate": 0.0002829713989986372, "loss": 1.812, "step": 5839 }, { "epoch": 0.46, "learning_rate": 0.0002829656787847693, "loss": 1.7145, "step": 5840 }, { "epoch": 0.46, "learning_rate": 0.0002829599576681378, "loss": 1.7772, "step": 5841 }, { "epoch": 0.46, "learning_rate": 0.00028295423564878155, "loss": 1.7236, "step": 5842 }, { "epoch": 0.46, "learning_rate": 0.0002829485127267394, "loss": 1.7365, "step": 5843 }, { "epoch": 0.46, "learning_rate": 0.0002829427889020503, "loss": 1.7083, "step": 5844 }, { "epoch": 0.46, "learning_rate": 0.00028293706417475295, "loss": 1.7294, "step": 5845 }, { "epoch": 0.46, "learning_rate": 0.00028293133854488634, "loss": 1.7473, "step": 5846 }, { "epoch": 0.46, "learning_rate": 0.00028292561201248925, "loss": 1.7058, "step": 5847 }, { "epoch": 0.46, "learning_rate": 0.00028291988457760064, "loss": 1.7552, "step": 5848 }, { "epoch": 0.46, "learning_rate": 0.00028291415624025933, "loss": 1.7927, "step": 5849 }, { "epoch": 0.46, "learning_rate": 0.0002829084270005043, "loss": 1.7293, "step": 5850 }, { "epoch": 0.46, "learning_rate": 0.00028290269685837436, "loss": 1.7065, "step": 5851 }, { "epoch": 0.46, "learning_rate": 0.0002828969658139085, "loss": 1.7332, "step": 5852 }, { "epoch": 0.46, "learning_rate": 0.0002828912338671455, "loss": 1.7918, "step": 5853 }, { "epoch": 0.46, "learning_rate": 0.0002828855010181244, "loss": 1.809, "step": 5854 }, { "epoch": 0.46, "learning_rate": 0.0002828797672668841, "loss": 1.7228, "step": 5855 }, { "epoch": 0.46, "learning_rate": 0.0002828740326134635, "loss": 1.7241, "step": 5856 }, { "epoch": 0.46, "learning_rate": 0.00028286829705790153, "loss": 1.6957, "step": 5857 }, { "epoch": 0.46, "learning_rate": 0.0002828625606002371, "loss": 1.7006, "step": 5858 }, { "epoch": 0.46, "learning_rate": 0.00028285682324050924, "loss": 1.6802, "step": 5859 }, { "epoch": 0.46, "learning_rate": 0.0002828510849787569, "loss": 1.7942, "step": 5860 }, { "epoch": 0.46, "learning_rate": 0.00028284534581501903, "loss": 1.7433, "step": 5861 }, { "epoch": 0.46, "learning_rate": 0.0002828396057493345, "loss": 1.7092, "step": 5862 }, { "epoch": 0.46, "learning_rate": 0.0002828338647817424, "loss": 1.6962, "step": 5863 }, { "epoch": 0.46, "learning_rate": 0.00028282812291228164, "loss": 1.734, "step": 5864 }, { "epoch": 0.46, "learning_rate": 0.00028282238014099123, "loss": 1.7522, "step": 5865 }, { "epoch": 0.46, "learning_rate": 0.00028281663646791014, "loss": 1.7451, "step": 5866 }, { "epoch": 0.46, "learning_rate": 0.0002828108918930774, "loss": 1.8301, "step": 5867 }, { "epoch": 0.46, "learning_rate": 0.000282805146416532, "loss": 1.7581, "step": 5868 }, { "epoch": 0.46, "learning_rate": 0.00028279940003831294, "loss": 1.7312, "step": 5869 }, { "epoch": 0.46, "learning_rate": 0.00028279365275845925, "loss": 1.7344, "step": 5870 }, { "epoch": 0.46, "learning_rate": 0.00028278790457700987, "loss": 1.7213, "step": 5871 }, { "epoch": 0.46, "learning_rate": 0.00028278215549400393, "loss": 1.7604, "step": 5872 }, { "epoch": 0.46, "learning_rate": 0.00028277640550948053, "loss": 1.7778, "step": 5873 }, { "epoch": 0.46, "learning_rate": 0.0002827706546234785, "loss": 1.8177, "step": 5874 }, { "epoch": 0.46, "learning_rate": 0.000282764902836037, "loss": 1.7496, "step": 5875 }, { "epoch": 0.46, "learning_rate": 0.0002827591501471951, "loss": 1.7593, "step": 5876 }, { "epoch": 0.46, "learning_rate": 0.0002827533965569919, "loss": 1.7531, "step": 5877 }, { "epoch": 0.46, "learning_rate": 0.0002827476420654663, "loss": 1.7603, "step": 5878 }, { "epoch": 0.46, "learning_rate": 0.0002827418866726575, "loss": 1.7327, "step": 5879 }, { "epoch": 0.46, "learning_rate": 0.0002827361303786045, "loss": 1.7316, "step": 5880 }, { "epoch": 0.46, "learning_rate": 0.00028273037318334645, "loss": 1.7118, "step": 5881 }, { "epoch": 0.46, "learning_rate": 0.00028272461508692246, "loss": 1.7085, "step": 5882 }, { "epoch": 0.46, "learning_rate": 0.00028271885608937154, "loss": 1.7868, "step": 5883 }, { "epoch": 0.46, "learning_rate": 0.0002827130961907328, "loss": 1.7373, "step": 5884 }, { "epoch": 0.46, "learning_rate": 0.00028270733539104544, "loss": 1.783, "step": 5885 }, { "epoch": 0.46, "learning_rate": 0.00028270157369034843, "loss": 1.7772, "step": 5886 }, { "epoch": 0.46, "learning_rate": 0.00028269581108868104, "loss": 1.7721, "step": 5887 }, { "epoch": 0.46, "learning_rate": 0.0002826900475860823, "loss": 1.7806, "step": 5888 }, { "epoch": 0.46, "learning_rate": 0.00028268428318259137, "loss": 1.7484, "step": 5889 }, { "epoch": 0.46, "learning_rate": 0.0002826785178782473, "loss": 1.7267, "step": 5890 }, { "epoch": 0.46, "learning_rate": 0.0002826727516730894, "loss": 1.7253, "step": 5891 }, { "epoch": 0.46, "learning_rate": 0.00028266698456715664, "loss": 1.7475, "step": 5892 }, { "epoch": 0.46, "learning_rate": 0.00028266121656048837, "loss": 1.7583, "step": 5893 }, { "epoch": 0.46, "learning_rate": 0.0002826554476531236, "loss": 1.7744, "step": 5894 }, { "epoch": 0.46, "learning_rate": 0.00028264967784510155, "loss": 1.7089, "step": 5895 }, { "epoch": 0.46, "learning_rate": 0.0002826439071364614, "loss": 1.7784, "step": 5896 }, { "epoch": 0.46, "learning_rate": 0.0002826381355272423, "loss": 1.8067, "step": 5897 }, { "epoch": 0.46, "learning_rate": 0.0002826323630174834, "loss": 1.749, "step": 5898 }, { "epoch": 0.46, "learning_rate": 0.00028262658960722406, "loss": 1.7851, "step": 5899 }, { "epoch": 0.46, "learning_rate": 0.00028262081529650335, "loss": 1.7517, "step": 5900 }, { "epoch": 0.46, "learning_rate": 0.00028261504008536044, "loss": 1.761, "step": 5901 }, { "epoch": 0.46, "learning_rate": 0.0002826092639738346, "loss": 1.6759, "step": 5902 }, { "epoch": 0.46, "learning_rate": 0.0002826034869619651, "loss": 1.7585, "step": 5903 }, { "epoch": 0.46, "learning_rate": 0.000282597709049791, "loss": 1.8012, "step": 5904 }, { "epoch": 0.46, "learning_rate": 0.00028259193023735167, "loss": 1.7643, "step": 5905 }, { "epoch": 0.46, "learning_rate": 0.00028258615052468634, "loss": 1.693, "step": 5906 }, { "epoch": 0.46, "learning_rate": 0.0002825803699118341, "loss": 1.7844, "step": 5907 }, { "epoch": 0.46, "learning_rate": 0.00028257458839883444, "loss": 1.7447, "step": 5908 }, { "epoch": 0.46, "learning_rate": 0.0002825688059857264, "loss": 1.7118, "step": 5909 }, { "epoch": 0.47, "learning_rate": 0.00028256302267254944, "loss": 1.7281, "step": 5910 }, { "epoch": 0.47, "learning_rate": 0.0002825572384593426, "loss": 1.7033, "step": 5911 }, { "epoch": 0.47, "learning_rate": 0.0002825514533461453, "loss": 1.7728, "step": 5912 }, { "epoch": 0.47, "learning_rate": 0.0002825456673329968, "loss": 1.7453, "step": 5913 }, { "epoch": 0.47, "learning_rate": 0.00028253988041993634, "loss": 1.758, "step": 5914 }, { "epoch": 0.47, "learning_rate": 0.0002825340926070032, "loss": 1.7223, "step": 5915 }, { "epoch": 0.47, "learning_rate": 0.00028252830389423675, "loss": 1.7399, "step": 5916 }, { "epoch": 0.47, "learning_rate": 0.0002825225142816763, "loss": 1.7667, "step": 5917 }, { "epoch": 0.47, "learning_rate": 0.00028251672376936103, "loss": 1.6907, "step": 5918 }, { "epoch": 0.47, "learning_rate": 0.00028251093235733037, "loss": 1.7817, "step": 5919 }, { "epoch": 0.47, "learning_rate": 0.00028250514004562354, "loss": 1.7041, "step": 5920 }, { "epoch": 0.47, "learning_rate": 0.00028249934683428, "loss": 1.7445, "step": 5921 }, { "epoch": 0.47, "learning_rate": 0.00028249355272333903, "loss": 1.7472, "step": 5922 }, { "epoch": 0.47, "learning_rate": 0.0002824877577128399, "loss": 1.7564, "step": 5923 }, { "epoch": 0.47, "learning_rate": 0.000282481961802822, "loss": 1.7069, "step": 5924 }, { "epoch": 0.47, "learning_rate": 0.00028247616499332476, "loss": 1.7561, "step": 5925 }, { "epoch": 0.47, "learning_rate": 0.0002824703672843874, "loss": 1.7708, "step": 5926 }, { "epoch": 0.47, "learning_rate": 0.0002824645686760494, "loss": 1.7869, "step": 5927 }, { "epoch": 0.47, "learning_rate": 0.0002824587691683501, "loss": 1.7465, "step": 5928 }, { "epoch": 0.47, "learning_rate": 0.0002824529687613288, "loss": 1.8167, "step": 5929 }, { "epoch": 0.47, "learning_rate": 0.00028244716745502496, "loss": 1.7559, "step": 5930 }, { "epoch": 0.47, "learning_rate": 0.00028244136524947794, "loss": 1.815, "step": 5931 }, { "epoch": 0.47, "learning_rate": 0.0002824355621447271, "loss": 1.7111, "step": 5932 }, { "epoch": 0.47, "learning_rate": 0.0002824297581408119, "loss": 1.7495, "step": 5933 }, { "epoch": 0.47, "learning_rate": 0.0002824239532377717, "loss": 1.7243, "step": 5934 }, { "epoch": 0.47, "learning_rate": 0.00028241814743564593, "loss": 1.7171, "step": 5935 }, { "epoch": 0.47, "learning_rate": 0.0002824123407344741, "loss": 1.7218, "step": 5936 }, { "epoch": 0.47, "learning_rate": 0.00028240653313429547, "loss": 1.8036, "step": 5937 }, { "epoch": 0.47, "learning_rate": 0.00028240072463514955, "loss": 1.7522, "step": 5938 }, { "epoch": 0.47, "learning_rate": 0.0002823949152370758, "loss": 1.7295, "step": 5939 }, { "epoch": 0.47, "learning_rate": 0.00028238910494011364, "loss": 1.6867, "step": 5940 }, { "epoch": 0.47, "learning_rate": 0.0002823832937443025, "loss": 1.7602, "step": 5941 }, { "epoch": 0.47, "learning_rate": 0.0002823774816496819, "loss": 1.74, "step": 5942 }, { "epoch": 0.47, "learning_rate": 0.0002823716686562912, "loss": 1.7181, "step": 5943 }, { "epoch": 0.47, "learning_rate": 0.00028236585476416995, "loss": 1.7738, "step": 5944 }, { "epoch": 0.47, "learning_rate": 0.0002823600399733575, "loss": 1.7303, "step": 5945 }, { "epoch": 0.47, "learning_rate": 0.00028235422428389355, "loss": 1.7125, "step": 5946 }, { "epoch": 0.47, "learning_rate": 0.00028234840769581735, "loss": 1.7598, "step": 5947 }, { "epoch": 0.47, "learning_rate": 0.00028234259020916853, "loss": 1.7187, "step": 5948 }, { "epoch": 0.47, "learning_rate": 0.0002823367718239866, "loss": 1.7014, "step": 5949 }, { "epoch": 0.47, "learning_rate": 0.00028233095254031097, "loss": 1.7412, "step": 5950 }, { "epoch": 0.47, "learning_rate": 0.00028232513235818126, "loss": 1.7449, "step": 5951 }, { "epoch": 0.47, "learning_rate": 0.00028231931127763686, "loss": 1.7449, "step": 5952 }, { "epoch": 0.47, "learning_rate": 0.00028231348929871734, "loss": 1.8149, "step": 5953 }, { "epoch": 0.47, "learning_rate": 0.0002823076664214623, "loss": 1.7204, "step": 5954 }, { "epoch": 0.47, "learning_rate": 0.0002823018426459112, "loss": 1.7082, "step": 5955 }, { "epoch": 0.47, "learning_rate": 0.00028229601797210365, "loss": 1.7224, "step": 5956 }, { "epoch": 0.47, "learning_rate": 0.0002822901924000791, "loss": 1.7829, "step": 5957 }, { "epoch": 0.47, "learning_rate": 0.0002822843659298771, "loss": 1.688, "step": 5958 }, { "epoch": 0.47, "learning_rate": 0.0002822785385615373, "loss": 1.7462, "step": 5959 }, { "epoch": 0.47, "learning_rate": 0.00028227271029509924, "loss": 1.7409, "step": 5960 }, { "epoch": 0.47, "learning_rate": 0.00028226688113060244, "loss": 1.7247, "step": 5961 }, { "epoch": 0.47, "learning_rate": 0.0002822610510680865, "loss": 1.757, "step": 5962 }, { "epoch": 0.47, "learning_rate": 0.00028225522010759104, "loss": 1.695, "step": 5963 }, { "epoch": 0.47, "learning_rate": 0.00028224938824915563, "loss": 1.7502, "step": 5964 }, { "epoch": 0.47, "learning_rate": 0.0002822435554928198, "loss": 1.7504, "step": 5965 }, { "epoch": 0.47, "learning_rate": 0.00028223772183862323, "loss": 1.7479, "step": 5966 }, { "epoch": 0.47, "learning_rate": 0.00028223188728660555, "loss": 1.7924, "step": 5967 }, { "epoch": 0.47, "learning_rate": 0.0002822260518368063, "loss": 1.8104, "step": 5968 }, { "epoch": 0.47, "learning_rate": 0.00028222021548926507, "loss": 1.7742, "step": 5969 }, { "epoch": 0.47, "learning_rate": 0.0002822143782440216, "loss": 1.7279, "step": 5970 }, { "epoch": 0.47, "learning_rate": 0.0002822085401011154, "loss": 1.6748, "step": 5971 }, { "epoch": 0.47, "learning_rate": 0.00028220270106058627, "loss": 1.7378, "step": 5972 }, { "epoch": 0.47, "learning_rate": 0.0002821968611224737, "loss": 1.7403, "step": 5973 }, { "epoch": 0.47, "learning_rate": 0.0002821910202868174, "loss": 1.7597, "step": 5974 }, { "epoch": 0.47, "learning_rate": 0.00028218517855365706, "loss": 1.7459, "step": 5975 }, { "epoch": 0.47, "learning_rate": 0.00028217933592303225, "loss": 1.6828, "step": 5976 }, { "epoch": 0.47, "learning_rate": 0.0002821734923949827, "loss": 1.709, "step": 5977 }, { "epoch": 0.47, "learning_rate": 0.0002821676479695481, "loss": 1.7441, "step": 5978 }, { "epoch": 0.47, "learning_rate": 0.00028216180264676807, "loss": 1.7052, "step": 5979 }, { "epoch": 0.47, "learning_rate": 0.00028215595642668234, "loss": 1.7512, "step": 5980 }, { "epoch": 0.47, "learning_rate": 0.00028215010930933063, "loss": 1.6881, "step": 5981 }, { "epoch": 0.47, "learning_rate": 0.0002821442612947526, "loss": 1.7449, "step": 5982 }, { "epoch": 0.47, "learning_rate": 0.0002821384123829879, "loss": 1.7585, "step": 5983 }, { "epoch": 0.47, "learning_rate": 0.00028213256257407634, "loss": 1.7852, "step": 5984 }, { "epoch": 0.47, "learning_rate": 0.0002821267118680576, "loss": 1.7157, "step": 5985 }, { "epoch": 0.47, "learning_rate": 0.0002821208602649714, "loss": 1.7362, "step": 5986 }, { "epoch": 0.47, "learning_rate": 0.0002821150077648575, "loss": 1.6737, "step": 5987 }, { "epoch": 0.47, "learning_rate": 0.00028210915436775556, "loss": 1.7969, "step": 5988 }, { "epoch": 0.47, "learning_rate": 0.0002821033000737054, "loss": 1.7283, "step": 5989 }, { "epoch": 0.47, "learning_rate": 0.0002820974448827467, "loss": 1.7579, "step": 5990 }, { "epoch": 0.47, "learning_rate": 0.0002820915887949192, "loss": 1.7856, "step": 5991 }, { "epoch": 0.47, "learning_rate": 0.00028208573181026284, "loss": 1.7261, "step": 5992 }, { "epoch": 0.47, "learning_rate": 0.0002820798739288172, "loss": 1.7512, "step": 5993 }, { "epoch": 0.47, "learning_rate": 0.0002820740151506221, "loss": 1.7857, "step": 5994 }, { "epoch": 0.47, "learning_rate": 0.0002820681554757172, "loss": 1.7364, "step": 5995 }, { "epoch": 0.47, "learning_rate": 0.0002820622949041425, "loss": 1.7692, "step": 5996 }, { "epoch": 0.47, "learning_rate": 0.0002820564334359378, "loss": 1.7385, "step": 5997 }, { "epoch": 0.47, "learning_rate": 0.0002820505710711427, "loss": 1.7543, "step": 5998 }, { "epoch": 0.47, "learning_rate": 0.00028204470780979706, "loss": 1.7145, "step": 5999 }, { "epoch": 0.47, "learning_rate": 0.00028203884365194076, "loss": 1.7802, "step": 6000 }, { "epoch": 0.47, "learning_rate": 0.0002820329785976136, "loss": 1.7078, "step": 6001 }, { "epoch": 0.47, "learning_rate": 0.0002820271126468553, "loss": 1.7503, "step": 6002 }, { "epoch": 0.47, "learning_rate": 0.0002820212457997058, "loss": 1.6863, "step": 6003 }, { "epoch": 0.47, "learning_rate": 0.00028201537805620493, "loss": 1.7566, "step": 6004 }, { "epoch": 0.47, "learning_rate": 0.00028200950941639243, "loss": 1.7958, "step": 6005 }, { "epoch": 0.47, "learning_rate": 0.00028200363988030826, "loss": 1.7451, "step": 6006 }, { "epoch": 0.47, "learning_rate": 0.0002819977694479922, "loss": 1.7641, "step": 6007 }, { "epoch": 0.47, "learning_rate": 0.00028199189811948416, "loss": 1.7198, "step": 6008 }, { "epoch": 0.47, "learning_rate": 0.00028198602589482396, "loss": 1.7844, "step": 6009 }, { "epoch": 0.47, "learning_rate": 0.0002819801527740515, "loss": 1.7489, "step": 6010 }, { "epoch": 0.47, "learning_rate": 0.00028197427875720655, "loss": 1.7228, "step": 6011 }, { "epoch": 0.47, "learning_rate": 0.00028196840384432913, "loss": 1.7081, "step": 6012 }, { "epoch": 0.47, "learning_rate": 0.0002819625280354591, "loss": 1.7148, "step": 6013 }, { "epoch": 0.47, "learning_rate": 0.00028195665133063627, "loss": 1.7223, "step": 6014 }, { "epoch": 0.47, "learning_rate": 0.0002819507737299006, "loss": 1.7607, "step": 6015 }, { "epoch": 0.47, "learning_rate": 0.0002819448952332921, "loss": 1.7018, "step": 6016 }, { "epoch": 0.47, "learning_rate": 0.0002819390158408505, "loss": 1.7631, "step": 6017 }, { "epoch": 0.47, "learning_rate": 0.0002819331355526158, "loss": 1.7815, "step": 6018 }, { "epoch": 0.47, "learning_rate": 0.0002819272543686279, "loss": 1.7034, "step": 6019 }, { "epoch": 0.47, "learning_rate": 0.0002819213722889267, "loss": 1.7529, "step": 6020 }, { "epoch": 0.47, "learning_rate": 0.0002819154893135523, "loss": 1.74, "step": 6021 }, { "epoch": 0.47, "learning_rate": 0.00028190960544254446, "loss": 1.7343, "step": 6022 }, { "epoch": 0.47, "learning_rate": 0.0002819037206759432, "loss": 1.7279, "step": 6023 }, { "epoch": 0.47, "learning_rate": 0.00028189783501378845, "loss": 1.7349, "step": 6024 }, { "epoch": 0.47, "learning_rate": 0.00028189194845612016, "loss": 1.7588, "step": 6025 }, { "epoch": 0.47, "learning_rate": 0.0002818860610029784, "loss": 1.7529, "step": 6026 }, { "epoch": 0.47, "learning_rate": 0.000281880172654403, "loss": 1.7834, "step": 6027 }, { "epoch": 0.47, "learning_rate": 0.00028187428341043406, "loss": 1.7683, "step": 6028 }, { "epoch": 0.47, "learning_rate": 0.0002818683932711115, "loss": 1.8212, "step": 6029 }, { "epoch": 0.47, "learning_rate": 0.00028186250223647525, "loss": 1.7206, "step": 6030 }, { "epoch": 0.47, "learning_rate": 0.00028185661030656546, "loss": 1.7137, "step": 6031 }, { "epoch": 0.47, "learning_rate": 0.00028185071748142203, "loss": 1.7347, "step": 6032 }, { "epoch": 0.47, "learning_rate": 0.00028184482376108496, "loss": 1.7052, "step": 6033 }, { "epoch": 0.47, "learning_rate": 0.0002818389291455943, "loss": 1.739, "step": 6034 }, { "epoch": 0.47, "learning_rate": 0.00028183303363499013, "loss": 1.7502, "step": 6035 }, { "epoch": 0.47, "learning_rate": 0.00028182713722931234, "loss": 1.7279, "step": 6036 }, { "epoch": 0.47, "learning_rate": 0.00028182123992860105, "loss": 1.7379, "step": 6037 }, { "epoch": 0.48, "learning_rate": 0.0002818153417328963, "loss": 1.7222, "step": 6038 }, { "epoch": 0.48, "learning_rate": 0.00028180944264223813, "loss": 1.7478, "step": 6039 }, { "epoch": 0.48, "learning_rate": 0.0002818035426566666, "loss": 1.7194, "step": 6040 }, { "epoch": 0.48, "learning_rate": 0.0002817976417762217, "loss": 1.7428, "step": 6041 }, { "epoch": 0.48, "learning_rate": 0.0002817917400009436, "loss": 1.7971, "step": 6042 }, { "epoch": 0.48, "learning_rate": 0.0002817858373308723, "loss": 1.7293, "step": 6043 }, { "epoch": 0.48, "learning_rate": 0.00028177993376604784, "loss": 1.7019, "step": 6044 }, { "epoch": 0.48, "learning_rate": 0.0002817740293065104, "loss": 1.7469, "step": 6045 }, { "epoch": 0.48, "learning_rate": 0.0002817681239523, "loss": 1.7403, "step": 6046 }, { "epoch": 0.48, "learning_rate": 0.00028176221770345673, "loss": 1.7446, "step": 6047 }, { "epoch": 0.48, "learning_rate": 0.0002817563105600207, "loss": 1.7682, "step": 6048 }, { "epoch": 0.48, "learning_rate": 0.0002817504025220321, "loss": 1.7888, "step": 6049 }, { "epoch": 0.48, "learning_rate": 0.00028174449358953096, "loss": 1.712, "step": 6050 }, { "epoch": 0.48, "learning_rate": 0.0002817385837625574, "loss": 1.7811, "step": 6051 }, { "epoch": 0.48, "learning_rate": 0.00028173267304115154, "loss": 1.7094, "step": 6052 }, { "epoch": 0.48, "learning_rate": 0.00028172676142535353, "loss": 1.7465, "step": 6053 }, { "epoch": 0.48, "learning_rate": 0.00028172084891520355, "loss": 1.765, "step": 6054 }, { "epoch": 0.48, "learning_rate": 0.00028171493551074165, "loss": 1.7443, "step": 6055 }, { "epoch": 0.48, "learning_rate": 0.000281709021212008, "loss": 1.7379, "step": 6056 }, { "epoch": 0.48, "learning_rate": 0.00028170310601904284, "loss": 1.6928, "step": 6057 }, { "epoch": 0.48, "learning_rate": 0.0002816971899318862, "loss": 1.7364, "step": 6058 }, { "epoch": 0.48, "learning_rate": 0.00028169127295057836, "loss": 1.7368, "step": 6059 }, { "epoch": 0.48, "learning_rate": 0.0002816853550751595, "loss": 1.7039, "step": 6060 }, { "epoch": 0.48, "learning_rate": 0.00028167943630566966, "loss": 1.7439, "step": 6061 }, { "epoch": 0.48, "learning_rate": 0.0002816735166421491, "loss": 1.7575, "step": 6062 }, { "epoch": 0.48, "learning_rate": 0.0002816675960846381, "loss": 1.7966, "step": 6063 }, { "epoch": 0.48, "learning_rate": 0.0002816616746331768, "loss": 1.7449, "step": 6064 }, { "epoch": 0.48, "learning_rate": 0.0002816557522878053, "loss": 1.6841, "step": 6065 }, { "epoch": 0.48, "learning_rate": 0.000281649829048564, "loss": 1.7261, "step": 6066 }, { "epoch": 0.48, "learning_rate": 0.0002816439049154929, "loss": 1.7703, "step": 6067 }, { "epoch": 0.48, "learning_rate": 0.0002816379798886324, "loss": 1.7271, "step": 6068 }, { "epoch": 0.48, "learning_rate": 0.0002816320539680226, "loss": 1.7275, "step": 6069 }, { "epoch": 0.48, "learning_rate": 0.0002816261271537039, "loss": 1.8034, "step": 6070 }, { "epoch": 0.48, "learning_rate": 0.00028162019944571635, "loss": 1.7319, "step": 6071 }, { "epoch": 0.48, "learning_rate": 0.0002816142708441003, "loss": 1.6624, "step": 6072 }, { "epoch": 0.48, "learning_rate": 0.00028160834134889596, "loss": 1.7423, "step": 6073 }, { "epoch": 0.48, "learning_rate": 0.0002816024109601437, "loss": 1.7165, "step": 6074 }, { "epoch": 0.48, "learning_rate": 0.0002815964796778836, "loss": 1.7225, "step": 6075 }, { "epoch": 0.48, "learning_rate": 0.000281590547502156, "loss": 1.7804, "step": 6076 }, { "epoch": 0.48, "learning_rate": 0.00028158461443300126, "loss": 1.7656, "step": 6077 }, { "epoch": 0.48, "learning_rate": 0.0002815786804704596, "loss": 1.7634, "step": 6078 }, { "epoch": 0.48, "learning_rate": 0.0002815727456145713, "loss": 1.7508, "step": 6079 }, { "epoch": 0.48, "learning_rate": 0.00028156680986537666, "loss": 1.7425, "step": 6080 }, { "epoch": 0.48, "learning_rate": 0.000281560873222916, "loss": 1.7223, "step": 6081 }, { "epoch": 0.48, "learning_rate": 0.0002815549356872296, "loss": 1.7071, "step": 6082 }, { "epoch": 0.48, "learning_rate": 0.0002815489972583578, "loss": 1.7575, "step": 6083 }, { "epoch": 0.48, "learning_rate": 0.0002815430579363409, "loss": 1.6968, "step": 6084 }, { "epoch": 0.48, "learning_rate": 0.0002815371177212192, "loss": 1.7515, "step": 6085 }, { "epoch": 0.48, "learning_rate": 0.0002815311766130331, "loss": 1.7067, "step": 6086 }, { "epoch": 0.48, "learning_rate": 0.0002815252346118229, "loss": 1.7349, "step": 6087 }, { "epoch": 0.48, "learning_rate": 0.0002815192917176289, "loss": 1.6768, "step": 6088 }, { "epoch": 0.48, "learning_rate": 0.0002815133479304915, "loss": 1.7331, "step": 6089 }, { "epoch": 0.48, "learning_rate": 0.00028150740325045106, "loss": 1.7947, "step": 6090 }, { "epoch": 0.48, "learning_rate": 0.0002815014576775479, "loss": 1.6965, "step": 6091 }, { "epoch": 0.48, "learning_rate": 0.0002814955112118224, "loss": 1.6943, "step": 6092 }, { "epoch": 0.48, "learning_rate": 0.000281489563853315, "loss": 1.7619, "step": 6093 }, { "epoch": 0.48, "learning_rate": 0.000281483615602066, "loss": 1.7339, "step": 6094 }, { "epoch": 0.48, "learning_rate": 0.0002814776664581158, "loss": 1.7435, "step": 6095 }, { "epoch": 0.48, "learning_rate": 0.00028147171642150474, "loss": 1.6698, "step": 6096 }, { "epoch": 0.48, "learning_rate": 0.00028146576549227336, "loss": 1.6833, "step": 6097 }, { "epoch": 0.48, "learning_rate": 0.00028145981367046197, "loss": 1.7384, "step": 6098 }, { "epoch": 0.48, "learning_rate": 0.00028145386095611096, "loss": 1.7458, "step": 6099 }, { "epoch": 0.48, "learning_rate": 0.00028144790734926077, "loss": 1.793, "step": 6100 }, { "epoch": 0.48, "learning_rate": 0.0002814419528499519, "loss": 1.6815, "step": 6101 }, { "epoch": 0.48, "learning_rate": 0.0002814359974582246, "loss": 1.7132, "step": 6102 }, { "epoch": 0.48, "learning_rate": 0.0002814300411741195, "loss": 1.6975, "step": 6103 }, { "epoch": 0.48, "learning_rate": 0.00028142408399767693, "loss": 1.7, "step": 6104 }, { "epoch": 0.48, "learning_rate": 0.00028141812592893733, "loss": 1.7282, "step": 6105 }, { "epoch": 0.48, "learning_rate": 0.0002814121669679412, "loss": 1.7541, "step": 6106 }, { "epoch": 0.48, "learning_rate": 0.00028140620711472895, "loss": 1.7665, "step": 6107 }, { "epoch": 0.48, "learning_rate": 0.00028140024636934106, "loss": 1.7076, "step": 6108 }, { "epoch": 0.48, "learning_rate": 0.00028139428473181806, "loss": 1.7058, "step": 6109 }, { "epoch": 0.48, "learning_rate": 0.00028138832220220034, "loss": 1.7582, "step": 6110 }, { "epoch": 0.48, "learning_rate": 0.00028138235878052845, "loss": 1.7524, "step": 6111 }, { "epoch": 0.48, "learning_rate": 0.0002813763944668428, "loss": 1.7315, "step": 6112 }, { "epoch": 0.48, "learning_rate": 0.00028137042926118397, "loss": 1.7164, "step": 6113 }, { "epoch": 0.48, "learning_rate": 0.0002813644631635924, "loss": 1.7359, "step": 6114 }, { "epoch": 0.48, "learning_rate": 0.00028135849617410863, "loss": 1.7564, "step": 6115 }, { "epoch": 0.48, "learning_rate": 0.00028135252829277315, "loss": 1.685, "step": 6116 }, { "epoch": 0.48, "learning_rate": 0.0002813465595196265, "loss": 1.7915, "step": 6117 }, { "epoch": 0.48, "learning_rate": 0.00028134058985470917, "loss": 1.7385, "step": 6118 }, { "epoch": 0.48, "learning_rate": 0.0002813346192980618, "loss": 1.7581, "step": 6119 }, { "epoch": 0.48, "learning_rate": 0.00028132864784972467, "loss": 1.7604, "step": 6120 }, { "epoch": 0.48, "learning_rate": 0.00028132267550973867, "loss": 1.7564, "step": 6121 }, { "epoch": 0.48, "learning_rate": 0.0002813167022781441, "loss": 1.6957, "step": 6122 }, { "epoch": 0.48, "learning_rate": 0.00028131072815498157, "loss": 1.7351, "step": 6123 }, { "epoch": 0.48, "learning_rate": 0.0002813047531402917, "loss": 1.7092, "step": 6124 }, { "epoch": 0.48, "learning_rate": 0.00028129877723411493, "loss": 1.7522, "step": 6125 }, { "epoch": 0.48, "learning_rate": 0.000281292800436492, "loss": 1.7533, "step": 6126 }, { "epoch": 0.48, "learning_rate": 0.0002812868227474634, "loss": 1.7893, "step": 6127 }, { "epoch": 0.48, "learning_rate": 0.00028128084416706976, "loss": 1.7232, "step": 6128 }, { "epoch": 0.48, "learning_rate": 0.0002812748646953516, "loss": 1.7314, "step": 6129 }, { "epoch": 0.48, "learning_rate": 0.00028126888433234953, "loss": 1.7247, "step": 6130 }, { "epoch": 0.48, "learning_rate": 0.00028126290307810416, "loss": 1.688, "step": 6131 }, { "epoch": 0.48, "learning_rate": 0.00028125692093265616, "loss": 1.7822, "step": 6132 }, { "epoch": 0.48, "learning_rate": 0.00028125093789604607, "loss": 1.7528, "step": 6133 }, { "epoch": 0.48, "learning_rate": 0.00028124495396831455, "loss": 1.7363, "step": 6134 }, { "epoch": 0.48, "learning_rate": 0.00028123896914950225, "loss": 1.6881, "step": 6135 }, { "epoch": 0.48, "learning_rate": 0.0002812329834396497, "loss": 1.773, "step": 6136 }, { "epoch": 0.48, "learning_rate": 0.0002812269968387977, "loss": 1.7654, "step": 6137 }, { "epoch": 0.48, "learning_rate": 0.0002812210093469868, "loss": 1.6834, "step": 6138 }, { "epoch": 0.48, "learning_rate": 0.0002812150209642576, "loss": 1.7041, "step": 6139 }, { "epoch": 0.48, "learning_rate": 0.00028120903169065085, "loss": 1.7341, "step": 6140 }, { "epoch": 0.48, "learning_rate": 0.00028120304152620717, "loss": 1.6551, "step": 6141 }, { "epoch": 0.48, "learning_rate": 0.00028119705047096726, "loss": 1.701, "step": 6142 }, { "epoch": 0.48, "learning_rate": 0.0002811910585249718, "loss": 1.6974, "step": 6143 }, { "epoch": 0.48, "learning_rate": 0.0002811850656882614, "loss": 1.7449, "step": 6144 }, { "epoch": 0.48, "learning_rate": 0.0002811790719608768, "loss": 1.7485, "step": 6145 }, { "epoch": 0.48, "learning_rate": 0.00028117307734285875, "loss": 1.683, "step": 6146 }, { "epoch": 0.48, "learning_rate": 0.0002811670818342478, "loss": 1.6956, "step": 6147 }, { "epoch": 0.48, "learning_rate": 0.0002811610854350848, "loss": 1.7484, "step": 6148 }, { "epoch": 0.48, "learning_rate": 0.00028115508814541046, "loss": 1.7748, "step": 6149 }, { "epoch": 0.48, "learning_rate": 0.0002811490899652654, "loss": 1.743, "step": 6150 }, { "epoch": 0.48, "learning_rate": 0.0002811430908946904, "loss": 1.7348, "step": 6151 }, { "epoch": 0.48, "learning_rate": 0.00028113709093372614, "loss": 1.6675, "step": 6152 }, { "epoch": 0.48, "learning_rate": 0.0002811310900824135, "loss": 1.7234, "step": 6153 }, { "epoch": 0.48, "learning_rate": 0.000281125088340793, "loss": 1.767, "step": 6154 }, { "epoch": 0.48, "learning_rate": 0.00028111908570890555, "loss": 1.6916, "step": 6155 }, { "epoch": 0.48, "learning_rate": 0.0002811130821867919, "loss": 1.7496, "step": 6156 }, { "epoch": 0.48, "learning_rate": 0.00028110707777449274, "loss": 1.7454, "step": 6157 }, { "epoch": 0.48, "learning_rate": 0.00028110107247204894, "loss": 1.7291, "step": 6158 }, { "epoch": 0.48, "learning_rate": 0.0002810950662795011, "loss": 1.7677, "step": 6159 }, { "epoch": 0.48, "learning_rate": 0.0002810890591968902, "loss": 1.746, "step": 6160 }, { "epoch": 0.48, "learning_rate": 0.00028108305122425694, "loss": 1.6873, "step": 6161 }, { "epoch": 0.48, "learning_rate": 0.00028107704236164205, "loss": 1.7179, "step": 6162 }, { "epoch": 0.48, "learning_rate": 0.00028107103260908636, "loss": 1.7373, "step": 6163 }, { "epoch": 0.48, "learning_rate": 0.00028106502196663066, "loss": 1.7913, "step": 6164 }, { "epoch": 0.49, "learning_rate": 0.00028105901043431585, "loss": 1.6983, "step": 6165 }, { "epoch": 0.49, "learning_rate": 0.0002810529980121827, "loss": 1.7446, "step": 6166 }, { "epoch": 0.49, "learning_rate": 0.00028104698470027197, "loss": 1.7262, "step": 6167 }, { "epoch": 0.49, "learning_rate": 0.0002810409704986246, "loss": 1.7148, "step": 6168 }, { "epoch": 0.49, "learning_rate": 0.0002810349554072812, "loss": 1.7531, "step": 6169 }, { "epoch": 0.49, "learning_rate": 0.0002810289394262829, "loss": 1.7398, "step": 6170 }, { "epoch": 0.49, "learning_rate": 0.0002810229225556704, "loss": 1.7371, "step": 6171 }, { "epoch": 0.49, "learning_rate": 0.0002810169047954845, "loss": 1.7498, "step": 6172 }, { "epoch": 0.49, "learning_rate": 0.0002810108861457662, "loss": 1.7428, "step": 6173 }, { "epoch": 0.49, "learning_rate": 0.0002810048666065562, "loss": 1.7016, "step": 6174 }, { "epoch": 0.49, "learning_rate": 0.00028099884617789546, "loss": 1.7825, "step": 6175 }, { "epoch": 0.49, "learning_rate": 0.0002809928248598249, "loss": 1.7414, "step": 6176 }, { "epoch": 0.49, "learning_rate": 0.0002809868026523853, "loss": 1.8137, "step": 6177 }, { "epoch": 0.49, "learning_rate": 0.00028098077955561766, "loss": 1.775, "step": 6178 }, { "epoch": 0.49, "learning_rate": 0.0002809747555695627, "loss": 1.7211, "step": 6179 }, { "epoch": 0.49, "learning_rate": 0.00028096873069426154, "loss": 1.8102, "step": 6180 }, { "epoch": 0.49, "learning_rate": 0.0002809627049297549, "loss": 1.7098, "step": 6181 }, { "epoch": 0.49, "learning_rate": 0.0002809566782760838, "loss": 1.7974, "step": 6182 }, { "epoch": 0.49, "learning_rate": 0.0002809506507332891, "loss": 1.7155, "step": 6183 }, { "epoch": 0.49, "learning_rate": 0.0002809446223014118, "loss": 1.7136, "step": 6184 }, { "epoch": 0.49, "learning_rate": 0.0002809385929804927, "loss": 1.7356, "step": 6185 }, { "epoch": 0.49, "learning_rate": 0.00028093256277057283, "loss": 1.7836, "step": 6186 }, { "epoch": 0.49, "learning_rate": 0.00028092653167169314, "loss": 1.719, "step": 6187 }, { "epoch": 0.49, "learning_rate": 0.0002809204996838945, "loss": 1.7578, "step": 6188 }, { "epoch": 0.49, "learning_rate": 0.00028091446680721794, "loss": 1.7333, "step": 6189 }, { "epoch": 0.49, "learning_rate": 0.00028090843304170445, "loss": 1.7255, "step": 6190 }, { "epoch": 0.49, "learning_rate": 0.0002809023983873949, "loss": 1.7043, "step": 6191 }, { "epoch": 0.49, "learning_rate": 0.00028089636284433025, "loss": 1.7229, "step": 6192 }, { "epoch": 0.49, "learning_rate": 0.0002808903264125516, "loss": 1.7692, "step": 6193 }, { "epoch": 0.49, "learning_rate": 0.00028088428909209983, "loss": 1.8104, "step": 6194 }, { "epoch": 0.49, "learning_rate": 0.00028087825088301594, "loss": 1.7348, "step": 6195 }, { "epoch": 0.49, "learning_rate": 0.00028087221178534104, "loss": 1.7982, "step": 6196 }, { "epoch": 0.49, "learning_rate": 0.000280866171799116, "loss": 1.73, "step": 6197 }, { "epoch": 0.49, "learning_rate": 0.00028086013092438187, "loss": 1.7639, "step": 6198 }, { "epoch": 0.49, "learning_rate": 0.0002808540891611796, "loss": 1.7554, "step": 6199 }, { "epoch": 0.49, "learning_rate": 0.0002808480465095504, "loss": 1.7697, "step": 6200 }, { "epoch": 0.49, "learning_rate": 0.0002808420029695351, "loss": 1.6884, "step": 6201 }, { "epoch": 0.49, "learning_rate": 0.0002808359585411748, "loss": 1.7261, "step": 6202 }, { "epoch": 0.49, "learning_rate": 0.00028082991322451057, "loss": 1.7619, "step": 6203 }, { "epoch": 0.49, "learning_rate": 0.0002808238670195834, "loss": 1.7615, "step": 6204 }, { "epoch": 0.49, "learning_rate": 0.0002808178199264344, "loss": 1.7188, "step": 6205 }, { "epoch": 0.49, "learning_rate": 0.0002808117719451045, "loss": 1.747, "step": 6206 }, { "epoch": 0.49, "learning_rate": 0.000280805723075635, "loss": 1.7393, "step": 6207 }, { "epoch": 0.49, "learning_rate": 0.00028079967331806675, "loss": 1.7482, "step": 6208 }, { "epoch": 0.49, "learning_rate": 0.0002807936226724409, "loss": 1.7509, "step": 6209 }, { "epoch": 0.49, "learning_rate": 0.00028078757113879853, "loss": 1.7088, "step": 6210 }, { "epoch": 0.49, "learning_rate": 0.0002807815187171807, "loss": 1.7358, "step": 6211 }, { "epoch": 0.49, "learning_rate": 0.0002807754654076286, "loss": 1.7239, "step": 6212 }, { "epoch": 0.49, "learning_rate": 0.0002807694112101832, "loss": 1.7528, "step": 6213 }, { "epoch": 0.49, "learning_rate": 0.0002807633561248857, "loss": 1.689, "step": 6214 }, { "epoch": 0.49, "learning_rate": 0.00028075730015177715, "loss": 1.7306, "step": 6215 }, { "epoch": 0.49, "learning_rate": 0.00028075124329089864, "loss": 1.732, "step": 6216 }, { "epoch": 0.49, "learning_rate": 0.0002807451855422915, "loss": 1.701, "step": 6217 }, { "epoch": 0.49, "learning_rate": 0.0002807391269059965, "loss": 1.7309, "step": 6218 }, { "epoch": 0.49, "learning_rate": 0.00028073306738205515, "loss": 1.7088, "step": 6219 }, { "epoch": 0.49, "learning_rate": 0.0002807270069705083, "loss": 1.692, "step": 6220 }, { "epoch": 0.49, "learning_rate": 0.00028072094567139724, "loss": 1.6638, "step": 6221 }, { "epoch": 0.49, "learning_rate": 0.00028071488348476315, "loss": 1.7203, "step": 6222 }, { "epoch": 0.49, "learning_rate": 0.0002807088204106471, "loss": 1.7302, "step": 6223 }, { "epoch": 0.49, "learning_rate": 0.0002807027564490903, "loss": 1.6807, "step": 6224 }, { "epoch": 0.49, "learning_rate": 0.00028069669160013386, "loss": 1.7711, "step": 6225 }, { "epoch": 0.49, "learning_rate": 0.00028069062586381905, "loss": 1.7591, "step": 6226 }, { "epoch": 0.49, "learning_rate": 0.00028068455924018705, "loss": 1.7772, "step": 6227 }, { "epoch": 0.49, "learning_rate": 0.0002806784917292789, "loss": 1.7381, "step": 6228 }, { "epoch": 0.49, "learning_rate": 0.000280672423331136, "loss": 1.6998, "step": 6229 }, { "epoch": 0.49, "learning_rate": 0.0002806663540457994, "loss": 1.7914, "step": 6230 }, { "epoch": 0.49, "learning_rate": 0.00028066028387331045, "loss": 1.7664, "step": 6231 }, { "epoch": 0.49, "learning_rate": 0.0002806542128137102, "loss": 1.7424, "step": 6232 }, { "epoch": 0.49, "learning_rate": 0.00028064814086703997, "loss": 1.6753, "step": 6233 }, { "epoch": 0.49, "learning_rate": 0.00028064206803334095, "loss": 1.6829, "step": 6234 }, { "epoch": 0.49, "learning_rate": 0.0002806359943126544, "loss": 1.7317, "step": 6235 }, { "epoch": 0.49, "learning_rate": 0.0002806299197050215, "loss": 1.7572, "step": 6236 }, { "epoch": 0.49, "learning_rate": 0.0002806238442104836, "loss": 1.8075, "step": 6237 }, { "epoch": 0.49, "learning_rate": 0.0002806177678290818, "loss": 1.7425, "step": 6238 }, { "epoch": 0.49, "learning_rate": 0.0002806116905608575, "loss": 1.7287, "step": 6239 }, { "epoch": 0.49, "learning_rate": 0.0002806056124058519, "loss": 1.7177, "step": 6240 }, { "epoch": 0.49, "learning_rate": 0.0002805995333641063, "loss": 1.7469, "step": 6241 }, { "epoch": 0.49, "learning_rate": 0.00028059345343566184, "loss": 1.7101, "step": 6242 }, { "epoch": 0.49, "learning_rate": 0.00028058737262055995, "loss": 1.7482, "step": 6243 }, { "epoch": 0.49, "learning_rate": 0.0002805812909188418, "loss": 1.6973, "step": 6244 }, { "epoch": 0.49, "learning_rate": 0.0002805752083305488, "loss": 1.6837, "step": 6245 }, { "epoch": 0.49, "learning_rate": 0.0002805691248557222, "loss": 1.7621, "step": 6246 }, { "epoch": 0.49, "learning_rate": 0.00028056304049440335, "loss": 1.6998, "step": 6247 }, { "epoch": 0.49, "learning_rate": 0.0002805569552466334, "loss": 1.7209, "step": 6248 }, { "epoch": 0.49, "learning_rate": 0.00028055086911245384, "loss": 1.7213, "step": 6249 }, { "epoch": 0.49, "learning_rate": 0.0002805447820919059, "loss": 1.731, "step": 6250 }, { "epoch": 0.49, "learning_rate": 0.00028053869418503095, "loss": 1.7525, "step": 6251 }, { "epoch": 0.49, "learning_rate": 0.0002805326053918703, "loss": 1.7279, "step": 6252 }, { "epoch": 0.49, "learning_rate": 0.00028052651571246526, "loss": 1.6719, "step": 6253 }, { "epoch": 0.49, "learning_rate": 0.00028052042514685726, "loss": 1.7389, "step": 6254 }, { "epoch": 0.49, "learning_rate": 0.00028051433369508756, "loss": 1.7217, "step": 6255 }, { "epoch": 0.49, "learning_rate": 0.0002805082413571975, "loss": 1.7081, "step": 6256 }, { "epoch": 0.49, "learning_rate": 0.00028050214813322863, "loss": 1.6749, "step": 6257 }, { "epoch": 0.49, "learning_rate": 0.0002804960540232221, "loss": 1.772, "step": 6258 }, { "epoch": 0.49, "learning_rate": 0.00028048995902721943, "loss": 1.7273, "step": 6259 }, { "epoch": 0.49, "learning_rate": 0.00028048386314526196, "loss": 1.7053, "step": 6260 }, { "epoch": 0.49, "learning_rate": 0.00028047776637739097, "loss": 1.7285, "step": 6261 }, { "epoch": 0.49, "learning_rate": 0.00028047166872364804, "loss": 1.7409, "step": 6262 }, { "epoch": 0.49, "learning_rate": 0.00028046557018407447, "loss": 1.7133, "step": 6263 }, { "epoch": 0.49, "learning_rate": 0.00028045947075871163, "loss": 1.7332, "step": 6264 }, { "epoch": 0.49, "learning_rate": 0.000280453370447601, "loss": 1.7776, "step": 6265 }, { "epoch": 0.49, "learning_rate": 0.00028044726925078396, "loss": 1.7339, "step": 6266 }, { "epoch": 0.49, "learning_rate": 0.000280441167168302, "loss": 1.7182, "step": 6267 }, { "epoch": 0.49, "learning_rate": 0.0002804350642001965, "loss": 1.654, "step": 6268 }, { "epoch": 0.49, "learning_rate": 0.00028042896034650885, "loss": 1.7025, "step": 6269 }, { "epoch": 0.49, "learning_rate": 0.0002804228556072805, "loss": 1.7331, "step": 6270 }, { "epoch": 0.49, "learning_rate": 0.00028041674998255297, "loss": 1.721, "step": 6271 }, { "epoch": 0.49, "learning_rate": 0.0002804106434723677, "loss": 1.7909, "step": 6272 }, { "epoch": 0.49, "learning_rate": 0.0002804045360767661, "loss": 1.7442, "step": 6273 }, { "epoch": 0.49, "learning_rate": 0.00028039842779578974, "loss": 1.7249, "step": 6274 }, { "epoch": 0.49, "learning_rate": 0.00028039231862947986, "loss": 1.6706, "step": 6275 }, { "epoch": 0.49, "learning_rate": 0.0002803862085778782, "loss": 1.7599, "step": 6276 }, { "epoch": 0.49, "learning_rate": 0.0002803800976410261, "loss": 1.7306, "step": 6277 }, { "epoch": 0.49, "learning_rate": 0.00028037398581896514, "loss": 1.7468, "step": 6278 }, { "epoch": 0.49, "learning_rate": 0.0002803678731117368, "loss": 1.7281, "step": 6279 }, { "epoch": 0.49, "learning_rate": 0.0002803617595193824, "loss": 1.7935, "step": 6280 }, { "epoch": 0.49, "learning_rate": 0.0002803556450419437, "loss": 1.7549, "step": 6281 }, { "epoch": 0.49, "learning_rate": 0.00028034952967946207, "loss": 1.7556, "step": 6282 }, { "epoch": 0.49, "learning_rate": 0.0002803434134319791, "loss": 1.7802, "step": 6283 }, { "epoch": 0.49, "learning_rate": 0.00028033729629953625, "loss": 1.7577, "step": 6284 }, { "epoch": 0.49, "learning_rate": 0.00028033117828217503, "loss": 1.7551, "step": 6285 }, { "epoch": 0.49, "learning_rate": 0.0002803250593799371, "loss": 1.6604, "step": 6286 }, { "epoch": 0.49, "learning_rate": 0.0002803189395928639, "loss": 1.7723, "step": 6287 }, { "epoch": 0.49, "learning_rate": 0.00028031281892099705, "loss": 1.7216, "step": 6288 }, { "epoch": 0.49, "learning_rate": 0.00028030669736437807, "loss": 1.7348, "step": 6289 }, { "epoch": 0.49, "learning_rate": 0.0002803005749230485, "loss": 1.7448, "step": 6290 }, { "epoch": 0.49, "learning_rate": 0.00028029445159705, "loss": 1.7529, "step": 6291 }, { "epoch": 0.5, "learning_rate": 0.000280288327386424, "loss": 1.6949, "step": 6292 }, { "epoch": 0.5, "learning_rate": 0.00028028220229121223, "loss": 1.7185, "step": 6293 }, { "epoch": 0.5, "learning_rate": 0.0002802760763114561, "loss": 1.7771, "step": 6294 }, { "epoch": 0.5, "learning_rate": 0.0002802699494471974, "loss": 1.7277, "step": 6295 }, { "epoch": 0.5, "learning_rate": 0.00028026382169847754, "loss": 1.7292, "step": 6296 }, { "epoch": 0.5, "learning_rate": 0.0002802576930653383, "loss": 1.7001, "step": 6297 }, { "epoch": 0.5, "learning_rate": 0.00028025156354782117, "loss": 1.7637, "step": 6298 }, { "epoch": 0.5, "learning_rate": 0.0002802454331459678, "loss": 1.7713, "step": 6299 }, { "epoch": 0.5, "learning_rate": 0.0002802393018598198, "loss": 1.7067, "step": 6300 }, { "epoch": 0.5, "learning_rate": 0.00028023316968941883, "loss": 1.7554, "step": 6301 }, { "epoch": 0.5, "learning_rate": 0.00028022703663480654, "loss": 1.7438, "step": 6302 }, { "epoch": 0.5, "learning_rate": 0.0002802209026960245, "loss": 1.725, "step": 6303 }, { "epoch": 0.5, "learning_rate": 0.0002802147678731144, "loss": 1.7597, "step": 6304 }, { "epoch": 0.5, "learning_rate": 0.00028020863216611785, "loss": 1.7168, "step": 6305 }, { "epoch": 0.5, "learning_rate": 0.0002802024955750766, "loss": 1.734, "step": 6306 }, { "epoch": 0.5, "learning_rate": 0.00028019635810003224, "loss": 1.7382, "step": 6307 }, { "epoch": 0.5, "learning_rate": 0.0002801902197410264, "loss": 1.7324, "step": 6308 }, { "epoch": 0.5, "learning_rate": 0.0002801840804981009, "loss": 1.7409, "step": 6309 }, { "epoch": 0.5, "learning_rate": 0.0002801779403712973, "loss": 1.6836, "step": 6310 }, { "epoch": 0.5, "learning_rate": 0.0002801717993606573, "loss": 1.7021, "step": 6311 }, { "epoch": 0.5, "learning_rate": 0.0002801656574662226, "loss": 1.7473, "step": 6312 }, { "epoch": 0.5, "learning_rate": 0.00028015951468803496, "loss": 1.7324, "step": 6313 }, { "epoch": 0.5, "learning_rate": 0.0002801533710261361, "loss": 1.7486, "step": 6314 }, { "epoch": 0.5, "learning_rate": 0.0002801472264805676, "loss": 1.7344, "step": 6315 }, { "epoch": 0.5, "learning_rate": 0.00028014108105137126, "loss": 1.6802, "step": 6316 }, { "epoch": 0.5, "learning_rate": 0.0002801349347385888, "loss": 1.7148, "step": 6317 }, { "epoch": 0.5, "learning_rate": 0.0002801287875422619, "loss": 1.7526, "step": 6318 }, { "epoch": 0.5, "learning_rate": 0.00028012263946243244, "loss": 1.7327, "step": 6319 }, { "epoch": 0.5, "learning_rate": 0.00028011649049914197, "loss": 1.7071, "step": 6320 }, { "epoch": 0.5, "learning_rate": 0.00028011034065243245, "loss": 1.7458, "step": 6321 }, { "epoch": 0.5, "learning_rate": 0.0002801041899223454, "loss": 1.7569, "step": 6322 }, { "epoch": 0.5, "learning_rate": 0.00028009803830892277, "loss": 1.813, "step": 6323 }, { "epoch": 0.5, "learning_rate": 0.00028009188581220625, "loss": 1.7048, "step": 6324 }, { "epoch": 0.5, "learning_rate": 0.0002800857324322376, "loss": 1.818, "step": 6325 }, { "epoch": 0.5, "learning_rate": 0.0002800795781690586, "loss": 1.7902, "step": 6326 }, { "epoch": 0.5, "learning_rate": 0.00028007342302271103, "loss": 1.7313, "step": 6327 }, { "epoch": 0.5, "learning_rate": 0.00028006726699323676, "loss": 1.6926, "step": 6328 }, { "epoch": 0.5, "learning_rate": 0.0002800611100806775, "loss": 1.7295, "step": 6329 }, { "epoch": 0.5, "learning_rate": 0.0002800549522850751, "loss": 1.7065, "step": 6330 }, { "epoch": 0.5, "learning_rate": 0.00028004879360647126, "loss": 1.7145, "step": 6331 }, { "epoch": 0.5, "learning_rate": 0.0002800426340449079, "loss": 1.6929, "step": 6332 }, { "epoch": 0.5, "learning_rate": 0.0002800364736004269, "loss": 1.7912, "step": 6333 }, { "epoch": 0.5, "learning_rate": 0.00028003031227306994, "loss": 1.717, "step": 6334 }, { "epoch": 0.5, "learning_rate": 0.0002800241500628789, "loss": 1.717, "step": 6335 }, { "epoch": 0.5, "learning_rate": 0.0002800179869698957, "loss": 1.7337, "step": 6336 }, { "epoch": 0.5, "learning_rate": 0.00028001182299416206, "loss": 1.7268, "step": 6337 }, { "epoch": 0.5, "learning_rate": 0.0002800056581357199, "loss": 1.7323, "step": 6338 }, { "epoch": 0.5, "learning_rate": 0.0002799994923946111, "loss": 1.7303, "step": 6339 }, { "epoch": 0.5, "learning_rate": 0.0002799933257708774, "loss": 1.7364, "step": 6340 }, { "epoch": 0.5, "learning_rate": 0.0002799871582645609, "loss": 1.7077, "step": 6341 }, { "epoch": 0.5, "learning_rate": 0.0002799809898757032, "loss": 1.7403, "step": 6342 }, { "epoch": 0.5, "learning_rate": 0.00027997482060434636, "loss": 1.7504, "step": 6343 }, { "epoch": 0.5, "learning_rate": 0.0002799686504505322, "loss": 1.7716, "step": 6344 }, { "epoch": 0.5, "learning_rate": 0.00027996247941430266, "loss": 1.7628, "step": 6345 }, { "epoch": 0.5, "learning_rate": 0.00027995630749569957, "loss": 1.7, "step": 6346 }, { "epoch": 0.5, "learning_rate": 0.00027995013469476484, "loss": 1.6764, "step": 6347 }, { "epoch": 0.5, "learning_rate": 0.0002799439610115405, "loss": 1.7131, "step": 6348 }, { "epoch": 0.5, "learning_rate": 0.0002799377864460683, "loss": 1.7505, "step": 6349 }, { "epoch": 0.5, "learning_rate": 0.0002799316109983902, "loss": 1.7455, "step": 6350 }, { "epoch": 0.5, "learning_rate": 0.00027992543466854827, "loss": 1.7098, "step": 6351 }, { "epoch": 0.5, "learning_rate": 0.0002799192574565842, "loss": 1.7231, "step": 6352 }, { "epoch": 0.5, "learning_rate": 0.0002799130793625402, "loss": 1.7053, "step": 6353 }, { "epoch": 0.5, "learning_rate": 0.00027990690038645806, "loss": 1.7165, "step": 6354 }, { "epoch": 0.5, "learning_rate": 0.00027990072052837966, "loss": 1.776, "step": 6355 }, { "epoch": 0.5, "learning_rate": 0.00027989453978834715, "loss": 1.7236, "step": 6356 }, { "epoch": 0.5, "learning_rate": 0.0002798883581664024, "loss": 1.6895, "step": 6357 }, { "epoch": 0.5, "learning_rate": 0.00027988217566258736, "loss": 1.6676, "step": 6358 }, { "epoch": 0.5, "learning_rate": 0.00027987599227694395, "loss": 1.7377, "step": 6359 }, { "epoch": 0.5, "learning_rate": 0.0002798698080095143, "loss": 1.7201, "step": 6360 }, { "epoch": 0.5, "learning_rate": 0.00027986362286034033, "loss": 1.7368, "step": 6361 }, { "epoch": 0.5, "learning_rate": 0.000279857436829464, "loss": 1.7611, "step": 6362 }, { "epoch": 0.5, "learning_rate": 0.0002798512499169273, "loss": 1.721, "step": 6363 }, { "epoch": 0.5, "learning_rate": 0.0002798450621227723, "loss": 1.7011, "step": 6364 }, { "epoch": 0.5, "learning_rate": 0.000279838873447041, "loss": 1.7073, "step": 6365 }, { "epoch": 0.5, "learning_rate": 0.00027983268388977536, "loss": 1.7653, "step": 6366 }, { "epoch": 0.5, "learning_rate": 0.00027982649345101746, "loss": 1.6634, "step": 6367 }, { "epoch": 0.5, "learning_rate": 0.00027982030213080937, "loss": 1.7163, "step": 6368 }, { "epoch": 0.5, "learning_rate": 0.000279814109929193, "loss": 1.7438, "step": 6369 }, { "epoch": 0.5, "learning_rate": 0.00027980791684621047, "loss": 1.6752, "step": 6370 }, { "epoch": 0.5, "learning_rate": 0.00027980172288190385, "loss": 1.6947, "step": 6371 }, { "epoch": 0.5, "learning_rate": 0.00027979552803631514, "loss": 1.7305, "step": 6372 }, { "epoch": 0.5, "learning_rate": 0.0002797893323094864, "loss": 1.7077, "step": 6373 }, { "epoch": 0.5, "learning_rate": 0.00027978313570145975, "loss": 1.7576, "step": 6374 }, { "epoch": 0.5, "learning_rate": 0.00027977693821227726, "loss": 1.7551, "step": 6375 }, { "epoch": 0.5, "learning_rate": 0.0002797707398419809, "loss": 1.7285, "step": 6376 }, { "epoch": 0.5, "learning_rate": 0.0002797645405906129, "loss": 1.7573, "step": 6377 }, { "epoch": 0.5, "learning_rate": 0.00027975834045821524, "loss": 1.7459, "step": 6378 }, { "epoch": 0.5, "learning_rate": 0.00027975213944483006, "loss": 1.7425, "step": 6379 }, { "epoch": 0.5, "learning_rate": 0.0002797459375504995, "loss": 1.7546, "step": 6380 }, { "epoch": 0.5, "learning_rate": 0.0002797397347752656, "loss": 1.7541, "step": 6381 }, { "epoch": 0.5, "learning_rate": 0.0002797335311191704, "loss": 1.7514, "step": 6382 }, { "epoch": 0.5, "learning_rate": 0.0002797273265822562, "loss": 1.7805, "step": 6383 }, { "epoch": 0.5, "learning_rate": 0.00027972112116456506, "loss": 1.7244, "step": 6384 }, { "epoch": 0.5, "learning_rate": 0.0002797149148661391, "loss": 1.6954, "step": 6385 }, { "epoch": 0.5, "learning_rate": 0.0002797087076870204, "loss": 1.7489, "step": 6386 }, { "epoch": 0.5, "learning_rate": 0.00027970249962725114, "loss": 1.7813, "step": 6387 }, { "epoch": 0.5, "learning_rate": 0.00027969629068687357, "loss": 1.7301, "step": 6388 }, { "epoch": 0.5, "learning_rate": 0.0002796900808659297, "loss": 1.7295, "step": 6389 }, { "epoch": 0.5, "learning_rate": 0.0002796838701644617, "loss": 1.7665, "step": 6390 }, { "epoch": 0.5, "learning_rate": 0.00027967765858251186, "loss": 1.7328, "step": 6391 }, { "epoch": 0.5, "learning_rate": 0.0002796714461201223, "loss": 1.7264, "step": 6392 }, { "epoch": 0.5, "learning_rate": 0.0002796652327773351, "loss": 1.6307, "step": 6393 }, { "epoch": 0.5, "learning_rate": 0.0002796590185541926, "loss": 1.7393, "step": 6394 }, { "epoch": 0.5, "learning_rate": 0.0002796528034507369, "loss": 1.6998, "step": 6395 }, { "epoch": 0.5, "learning_rate": 0.0002796465874670102, "loss": 1.6921, "step": 6396 }, { "epoch": 0.5, "learning_rate": 0.00027964037060305475, "loss": 1.7419, "step": 6397 }, { "epoch": 0.5, "learning_rate": 0.00027963415285891266, "loss": 1.6931, "step": 6398 }, { "epoch": 0.5, "learning_rate": 0.00027962793423462625, "loss": 1.7914, "step": 6399 }, { "epoch": 0.5, "learning_rate": 0.00027962171473023764, "loss": 1.6819, "step": 6400 }, { "epoch": 0.5, "learning_rate": 0.00027961549434578917, "loss": 1.723, "step": 6401 }, { "epoch": 0.5, "learning_rate": 0.000279609273081323, "loss": 1.6826, "step": 6402 }, { "epoch": 0.5, "learning_rate": 0.00027960305093688146, "loss": 1.7493, "step": 6403 }, { "epoch": 0.5, "learning_rate": 0.0002795968279125067, "loss": 1.7227, "step": 6404 }, { "epoch": 0.5, "learning_rate": 0.0002795906040082409, "loss": 1.7463, "step": 6405 }, { "epoch": 0.5, "learning_rate": 0.00027958437922412653, "loss": 1.748, "step": 6406 }, { "epoch": 0.5, "learning_rate": 0.0002795781535602057, "loss": 1.7243, "step": 6407 }, { "epoch": 0.5, "learning_rate": 0.00027957192701652067, "loss": 1.6791, "step": 6408 }, { "epoch": 0.5, "learning_rate": 0.0002795656995931138, "loss": 1.7301, "step": 6409 }, { "epoch": 0.5, "learning_rate": 0.0002795594712900274, "loss": 1.6999, "step": 6410 }, { "epoch": 0.5, "learning_rate": 0.00027955324210730354, "loss": 1.6761, "step": 6411 }, { "epoch": 0.5, "learning_rate": 0.00027954701204498475, "loss": 1.6959, "step": 6412 }, { "epoch": 0.5, "learning_rate": 0.00027954078110311323, "loss": 1.651, "step": 6413 }, { "epoch": 0.5, "learning_rate": 0.0002795345492817313, "loss": 1.7039, "step": 6414 }, { "epoch": 0.5, "learning_rate": 0.0002795283165808812, "loss": 1.6764, "step": 6415 }, { "epoch": 0.5, "learning_rate": 0.00027952208300060534, "loss": 1.6986, "step": 6416 }, { "epoch": 0.5, "learning_rate": 0.00027951584854094604, "loss": 1.7201, "step": 6417 }, { "epoch": 0.5, "learning_rate": 0.0002795096132019456, "loss": 1.7204, "step": 6418 }, { "epoch": 0.51, "learning_rate": 0.0002795033769836463, "loss": 1.7246, "step": 6419 }, { "epoch": 0.51, "learning_rate": 0.0002794971398860906, "loss": 1.7147, "step": 6420 }, { "epoch": 0.51, "learning_rate": 0.00027949090190932074, "loss": 1.7625, "step": 6421 }, { "epoch": 0.51, "learning_rate": 0.00027948466305337917, "loss": 1.8001, "step": 6422 }, { "epoch": 0.51, "learning_rate": 0.00027947842331830814, "loss": 1.7558, "step": 6423 }, { "epoch": 0.51, "learning_rate": 0.0002794721827041501, "loss": 1.6814, "step": 6424 }, { "epoch": 0.51, "learning_rate": 0.0002794659412109474, "loss": 1.7182, "step": 6425 }, { "epoch": 0.51, "learning_rate": 0.0002794596988387424, "loss": 1.7447, "step": 6426 }, { "epoch": 0.51, "learning_rate": 0.0002794534555875774, "loss": 1.7521, "step": 6427 }, { "epoch": 0.51, "learning_rate": 0.00027944721145749496, "loss": 1.746, "step": 6428 }, { "epoch": 0.51, "learning_rate": 0.00027944096644853735, "loss": 1.778, "step": 6429 }, { "epoch": 0.51, "learning_rate": 0.0002794347205607471, "loss": 1.7368, "step": 6430 }, { "epoch": 0.51, "learning_rate": 0.0002794284737941664, "loss": 1.7175, "step": 6431 }, { "epoch": 0.51, "learning_rate": 0.00027942222614883787, "loss": 1.6786, "step": 6432 }, { "epoch": 0.51, "learning_rate": 0.0002794159776248038, "loss": 1.6717, "step": 6433 }, { "epoch": 0.51, "learning_rate": 0.00027940972822210663, "loss": 1.7345, "step": 6434 }, { "epoch": 0.51, "learning_rate": 0.0002794034779407889, "loss": 1.7289, "step": 6435 }, { "epoch": 0.51, "learning_rate": 0.00027939722678089297, "loss": 1.6706, "step": 6436 }, { "epoch": 0.51, "learning_rate": 0.00027939097474246125, "loss": 1.7483, "step": 6437 }, { "epoch": 0.51, "learning_rate": 0.00027938472182553617, "loss": 1.7264, "step": 6438 }, { "epoch": 0.51, "learning_rate": 0.00027937846803016025, "loss": 1.723, "step": 6439 }, { "epoch": 0.51, "learning_rate": 0.000279372213356376, "loss": 1.7328, "step": 6440 }, { "epoch": 0.51, "learning_rate": 0.00027936595780422575, "loss": 1.6919, "step": 6441 }, { "epoch": 0.51, "learning_rate": 0.000279359701373752, "loss": 1.7078, "step": 6442 }, { "epoch": 0.51, "learning_rate": 0.0002793534440649973, "loss": 1.7308, "step": 6443 }, { "epoch": 0.51, "learning_rate": 0.00027934718587800417, "loss": 1.749, "step": 6444 }, { "epoch": 0.51, "learning_rate": 0.00027934092681281496, "loss": 1.7148, "step": 6445 }, { "epoch": 0.51, "learning_rate": 0.0002793346668694722, "loss": 1.738, "step": 6446 }, { "epoch": 0.51, "learning_rate": 0.00027932840604801847, "loss": 1.7988, "step": 6447 }, { "epoch": 0.51, "learning_rate": 0.00027932214434849624, "loss": 1.7712, "step": 6448 }, { "epoch": 0.51, "learning_rate": 0.000279315881770948, "loss": 1.6733, "step": 6449 }, { "epoch": 0.51, "learning_rate": 0.0002793096183154163, "loss": 1.7283, "step": 6450 }, { "epoch": 0.51, "learning_rate": 0.00027930335398194364, "loss": 1.73, "step": 6451 }, { "epoch": 0.51, "learning_rate": 0.0002792970887705725, "loss": 1.6999, "step": 6452 }, { "epoch": 0.51, "learning_rate": 0.0002792908226813456, "loss": 1.7126, "step": 6453 }, { "epoch": 0.51, "learning_rate": 0.0002792845557143053, "loss": 1.6731, "step": 6454 }, { "epoch": 0.51, "learning_rate": 0.00027927828786949424, "loss": 1.7258, "step": 6455 }, { "epoch": 0.51, "learning_rate": 0.0002792720191469549, "loss": 1.698, "step": 6456 }, { "epoch": 0.51, "learning_rate": 0.00027926574954672986, "loss": 1.6815, "step": 6457 }, { "epoch": 0.51, "learning_rate": 0.00027925947906886175, "loss": 1.7246, "step": 6458 }, { "epoch": 0.51, "learning_rate": 0.0002792532077133932, "loss": 1.7025, "step": 6459 }, { "epoch": 0.51, "learning_rate": 0.0002792469354803666, "loss": 1.7481, "step": 6460 }, { "epoch": 0.51, "learning_rate": 0.00027924066236982467, "loss": 1.7517, "step": 6461 }, { "epoch": 0.51, "learning_rate": 0.0002792343883818099, "loss": 1.7243, "step": 6462 }, { "epoch": 0.51, "learning_rate": 0.000279228113516365, "loss": 1.702, "step": 6463 }, { "epoch": 0.51, "learning_rate": 0.00027922183777353253, "loss": 1.7976, "step": 6464 }, { "epoch": 0.51, "learning_rate": 0.0002792155611533551, "loss": 1.6861, "step": 6465 }, { "epoch": 0.51, "learning_rate": 0.00027920928365587525, "loss": 1.6724, "step": 6466 }, { "epoch": 0.51, "learning_rate": 0.0002792030052811358, "loss": 1.7223, "step": 6467 }, { "epoch": 0.51, "learning_rate": 0.0002791967260291791, "loss": 1.7722, "step": 6468 }, { "epoch": 0.51, "learning_rate": 0.00027919044590004797, "loss": 1.7211, "step": 6469 }, { "epoch": 0.51, "learning_rate": 0.000279184164893785, "loss": 1.6966, "step": 6470 }, { "epoch": 0.51, "learning_rate": 0.00027917788301043287, "loss": 1.7232, "step": 6471 }, { "epoch": 0.51, "learning_rate": 0.00027917160025003423, "loss": 1.7423, "step": 6472 }, { "epoch": 0.51, "learning_rate": 0.0002791653166126317, "loss": 1.7043, "step": 6473 }, { "epoch": 0.51, "learning_rate": 0.00027915903209826785, "loss": 1.7739, "step": 6474 }, { "epoch": 0.51, "learning_rate": 0.00027915274670698554, "loss": 1.6869, "step": 6475 }, { "epoch": 0.51, "learning_rate": 0.00027914646043882734, "loss": 1.7173, "step": 6476 }, { "epoch": 0.51, "learning_rate": 0.0002791401732938359, "loss": 1.705, "step": 6477 }, { "epoch": 0.51, "learning_rate": 0.000279133885272054, "loss": 1.7384, "step": 6478 }, { "epoch": 0.51, "learning_rate": 0.00027912759637352424, "loss": 1.767, "step": 6479 }, { "epoch": 0.51, "learning_rate": 0.0002791213065982894, "loss": 1.7043, "step": 6480 }, { "epoch": 0.51, "learning_rate": 0.00027911501594639213, "loss": 1.7626, "step": 6481 }, { "epoch": 0.51, "learning_rate": 0.00027910872441787516, "loss": 1.6991, "step": 6482 }, { "epoch": 0.51, "learning_rate": 0.00027910243201278117, "loss": 1.6855, "step": 6483 }, { "epoch": 0.51, "learning_rate": 0.0002790961387311529, "loss": 1.7112, "step": 6484 }, { "epoch": 0.51, "learning_rate": 0.00027908984457303314, "loss": 1.7663, "step": 6485 }, { "epoch": 0.51, "learning_rate": 0.00027908354953846455, "loss": 1.6907, "step": 6486 }, { "epoch": 0.51, "learning_rate": 0.0002790772536274899, "loss": 1.7255, "step": 6487 }, { "epoch": 0.51, "learning_rate": 0.00027907095684015195, "loss": 1.7331, "step": 6488 }, { "epoch": 0.51, "learning_rate": 0.0002790646591764934, "loss": 1.7509, "step": 6489 }, { "epoch": 0.51, "learning_rate": 0.000279058360636557, "loss": 1.7532, "step": 6490 }, { "epoch": 0.51, "learning_rate": 0.0002790520612203856, "loss": 1.6756, "step": 6491 }, { "epoch": 0.51, "learning_rate": 0.00027904576092802194, "loss": 1.7715, "step": 6492 }, { "epoch": 0.51, "learning_rate": 0.00027903945975950875, "loss": 1.7358, "step": 6493 }, { "epoch": 0.51, "learning_rate": 0.00027903315771488877, "loss": 1.794, "step": 6494 }, { "epoch": 0.51, "learning_rate": 0.00027902685479420496, "loss": 1.7656, "step": 6495 }, { "epoch": 0.51, "learning_rate": 0.00027902055099749995, "loss": 1.6967, "step": 6496 }, { "epoch": 0.51, "learning_rate": 0.00027901424632481667, "loss": 1.7021, "step": 6497 }, { "epoch": 0.51, "learning_rate": 0.0002790079407761978, "loss": 1.6688, "step": 6498 }, { "epoch": 0.51, "learning_rate": 0.00027900163435168616, "loss": 1.7222, "step": 6499 }, { "epoch": 0.51, "learning_rate": 0.0002789953270513247, "loss": 1.6959, "step": 6500 }, { "epoch": 0.51, "learning_rate": 0.0002789890188751561, "loss": 1.6891, "step": 6501 }, { "epoch": 0.51, "learning_rate": 0.00027898270982322325, "loss": 1.7416, "step": 6502 }, { "epoch": 0.51, "learning_rate": 0.000278976399895569, "loss": 1.6971, "step": 6503 }, { "epoch": 0.51, "learning_rate": 0.00027897008909223616, "loss": 1.6435, "step": 6504 }, { "epoch": 0.51, "learning_rate": 0.00027896377741326757, "loss": 1.7754, "step": 6505 }, { "epoch": 0.51, "learning_rate": 0.00027895746485870614, "loss": 1.7301, "step": 6506 }, { "epoch": 0.51, "learning_rate": 0.00027895115142859465, "loss": 1.6806, "step": 6507 }, { "epoch": 0.51, "learning_rate": 0.000278944837122976, "loss": 1.7272, "step": 6508 }, { "epoch": 0.51, "learning_rate": 0.00027893852194189303, "loss": 1.7342, "step": 6509 }, { "epoch": 0.51, "learning_rate": 0.0002789322058853887, "loss": 1.7646, "step": 6510 }, { "epoch": 0.51, "learning_rate": 0.0002789258889535059, "loss": 1.7782, "step": 6511 }, { "epoch": 0.51, "learning_rate": 0.00027891957114628736, "loss": 1.7032, "step": 6512 }, { "epoch": 0.51, "learning_rate": 0.0002789132524637761, "loss": 1.7216, "step": 6513 }, { "epoch": 0.51, "learning_rate": 0.00027890693290601507, "loss": 1.7721, "step": 6514 }, { "epoch": 0.51, "learning_rate": 0.00027890061247304705, "loss": 1.7192, "step": 6515 }, { "epoch": 0.51, "learning_rate": 0.00027889429116491495, "loss": 1.7449, "step": 6516 }, { "epoch": 0.51, "learning_rate": 0.00027888796898166185, "loss": 1.7559, "step": 6517 }, { "epoch": 0.51, "learning_rate": 0.0002788816459233305, "loss": 1.669, "step": 6518 }, { "epoch": 0.51, "learning_rate": 0.00027887532198996387, "loss": 1.7113, "step": 6519 }, { "epoch": 0.51, "learning_rate": 0.00027886899718160496, "loss": 1.7367, "step": 6520 }, { "epoch": 0.51, "learning_rate": 0.0002788626714982967, "loss": 1.7003, "step": 6521 }, { "epoch": 0.51, "learning_rate": 0.000278856344940082, "loss": 1.7205, "step": 6522 }, { "epoch": 0.51, "learning_rate": 0.0002788500175070038, "loss": 1.736, "step": 6523 }, { "epoch": 0.51, "learning_rate": 0.0002788436891991051, "loss": 1.74, "step": 6524 }, { "epoch": 0.51, "learning_rate": 0.0002788373600164288, "loss": 1.6851, "step": 6525 }, { "epoch": 0.51, "learning_rate": 0.000278831029959018, "loss": 1.7153, "step": 6526 }, { "epoch": 0.51, "learning_rate": 0.0002788246990269156, "loss": 1.6971, "step": 6527 }, { "epoch": 0.51, "learning_rate": 0.00027881836722016455, "loss": 1.7596, "step": 6528 }, { "epoch": 0.51, "learning_rate": 0.00027881203453880793, "loss": 1.7591, "step": 6529 }, { "epoch": 0.51, "learning_rate": 0.0002788057009828886, "loss": 1.7202, "step": 6530 }, { "epoch": 0.51, "learning_rate": 0.0002787993665524497, "loss": 1.7645, "step": 6531 }, { "epoch": 0.51, "learning_rate": 0.0002787930312475341, "loss": 1.7292, "step": 6532 }, { "epoch": 0.51, "learning_rate": 0.00027878669506818497, "loss": 1.7523, "step": 6533 }, { "epoch": 0.51, "learning_rate": 0.00027878035801444525, "loss": 1.6762, "step": 6534 }, { "epoch": 0.51, "learning_rate": 0.0002787740200863579, "loss": 1.7102, "step": 6535 }, { "epoch": 0.51, "learning_rate": 0.0002787676812839661, "loss": 1.7355, "step": 6536 }, { "epoch": 0.51, "learning_rate": 0.0002787613416073128, "loss": 1.742, "step": 6537 }, { "epoch": 0.51, "learning_rate": 0.000278755001056441, "loss": 1.6556, "step": 6538 }, { "epoch": 0.51, "learning_rate": 0.0002787486596313938, "loss": 1.6981, "step": 6539 }, { "epoch": 0.51, "learning_rate": 0.0002787423173322142, "loss": 1.7037, "step": 6540 }, { "epoch": 0.51, "learning_rate": 0.0002787359741589454, "loss": 1.7417, "step": 6541 }, { "epoch": 0.51, "learning_rate": 0.0002787296301116304, "loss": 1.7035, "step": 6542 }, { "epoch": 0.51, "learning_rate": 0.00027872328519031216, "loss": 1.777, "step": 6543 }, { "epoch": 0.51, "learning_rate": 0.0002787169393950339, "loss": 1.73, "step": 6544 }, { "epoch": 0.51, "learning_rate": 0.0002787105927258386, "loss": 1.7654, "step": 6545 }, { "epoch": 0.52, "learning_rate": 0.0002787042451827695, "loss": 1.6976, "step": 6546 }, { "epoch": 0.52, "learning_rate": 0.0002786978967658695, "loss": 1.7034, "step": 6547 }, { "epoch": 0.52, "learning_rate": 0.00027869154747518185, "loss": 1.7517, "step": 6548 }, { "epoch": 0.52, "learning_rate": 0.00027868519731074964, "loss": 1.7139, "step": 6549 }, { "epoch": 0.52, "learning_rate": 0.00027867884627261587, "loss": 1.7455, "step": 6550 }, { "epoch": 0.52, "learning_rate": 0.0002786724943608238, "loss": 1.7106, "step": 6551 }, { "epoch": 0.52, "learning_rate": 0.00027866614157541654, "loss": 1.7166, "step": 6552 }, { "epoch": 0.52, "learning_rate": 0.0002786597879164372, "loss": 1.6647, "step": 6553 }, { "epoch": 0.52, "learning_rate": 0.00027865343338392875, "loss": 1.7183, "step": 6554 }, { "epoch": 0.52, "learning_rate": 0.00027864707797793463, "loss": 1.7466, "step": 6555 }, { "epoch": 0.52, "learning_rate": 0.00027864072169849776, "loss": 1.6588, "step": 6556 }, { "epoch": 0.52, "learning_rate": 0.00027863436454566144, "loss": 1.7044, "step": 6557 }, { "epoch": 0.52, "learning_rate": 0.00027862800651946867, "loss": 1.6899, "step": 6558 }, { "epoch": 0.52, "learning_rate": 0.0002786216476199628, "loss": 1.7101, "step": 6559 }, { "epoch": 0.52, "learning_rate": 0.0002786152878471869, "loss": 1.7285, "step": 6560 }, { "epoch": 0.52, "learning_rate": 0.0002786089272011842, "loss": 1.7483, "step": 6561 }, { "epoch": 0.52, "learning_rate": 0.00027860256568199785, "loss": 1.6971, "step": 6562 }, { "epoch": 0.52, "learning_rate": 0.00027859620328967105, "loss": 1.7548, "step": 6563 }, { "epoch": 0.52, "learning_rate": 0.000278589840024247, "loss": 1.6768, "step": 6564 }, { "epoch": 0.52, "learning_rate": 0.00027858347588576883, "loss": 1.7085, "step": 6565 }, { "epoch": 0.52, "learning_rate": 0.0002785771108742799, "loss": 1.7269, "step": 6566 }, { "epoch": 0.52, "learning_rate": 0.0002785707449898233, "loss": 1.7005, "step": 6567 }, { "epoch": 0.52, "learning_rate": 0.00027856437823244224, "loss": 1.7143, "step": 6568 }, { "epoch": 0.52, "learning_rate": 0.00027855801060218014, "loss": 1.733, "step": 6569 }, { "epoch": 0.52, "learning_rate": 0.00027855164209908, "loss": 1.7112, "step": 6570 }, { "epoch": 0.52, "learning_rate": 0.0002785452727231851, "loss": 1.6473, "step": 6571 }, { "epoch": 0.52, "learning_rate": 0.00027853890247453883, "loss": 1.693, "step": 6572 }, { "epoch": 0.52, "learning_rate": 0.00027853253135318433, "loss": 1.7095, "step": 6573 }, { "epoch": 0.52, "learning_rate": 0.00027852615935916483, "loss": 1.7471, "step": 6574 }, { "epoch": 0.52, "learning_rate": 0.0002785197864925237, "loss": 1.7225, "step": 6575 }, { "epoch": 0.52, "learning_rate": 0.00027851341275330406, "loss": 1.6914, "step": 6576 }, { "epoch": 0.52, "learning_rate": 0.0002785070381415493, "loss": 1.7763, "step": 6577 }, { "epoch": 0.52, "learning_rate": 0.0002785006626573027, "loss": 1.6899, "step": 6578 }, { "epoch": 0.52, "learning_rate": 0.00027849428630060747, "loss": 1.6986, "step": 6579 }, { "epoch": 0.52, "learning_rate": 0.000278487909071507, "loss": 1.7473, "step": 6580 }, { "epoch": 0.52, "learning_rate": 0.0002784815309700445, "loss": 1.7203, "step": 6581 }, { "epoch": 0.52, "learning_rate": 0.00027847515199626327, "loss": 1.6784, "step": 6582 }, { "epoch": 0.52, "learning_rate": 0.0002784687721502067, "loss": 1.6678, "step": 6583 }, { "epoch": 0.52, "learning_rate": 0.00027846239143191807, "loss": 1.7429, "step": 6584 }, { "epoch": 0.52, "learning_rate": 0.00027845600984144066, "loss": 1.6504, "step": 6585 }, { "epoch": 0.52, "learning_rate": 0.00027844962737881785, "loss": 1.7155, "step": 6586 }, { "epoch": 0.52, "learning_rate": 0.00027844324404409295, "loss": 1.6812, "step": 6587 }, { "epoch": 0.52, "learning_rate": 0.00027843685983730933, "loss": 1.714, "step": 6588 }, { "epoch": 0.52, "learning_rate": 0.00027843047475851026, "loss": 1.7454, "step": 6589 }, { "epoch": 0.52, "learning_rate": 0.0002784240888077392, "loss": 1.7672, "step": 6590 }, { "epoch": 0.52, "learning_rate": 0.0002784177019850394, "loss": 1.7039, "step": 6591 }, { "epoch": 0.52, "learning_rate": 0.0002784113142904543, "loss": 1.6814, "step": 6592 }, { "epoch": 0.52, "learning_rate": 0.0002784049257240272, "loss": 1.7421, "step": 6593 }, { "epoch": 0.52, "learning_rate": 0.00027839853628580153, "loss": 1.7038, "step": 6594 }, { "epoch": 0.52, "learning_rate": 0.00027839214597582065, "loss": 1.6524, "step": 6595 }, { "epoch": 0.52, "learning_rate": 0.000278385754794128, "loss": 1.7291, "step": 6596 }, { "epoch": 0.52, "learning_rate": 0.0002783793627407668, "loss": 1.7463, "step": 6597 }, { "epoch": 0.52, "learning_rate": 0.0002783729698157807, "loss": 1.7277, "step": 6598 }, { "epoch": 0.52, "learning_rate": 0.0002783665760192129, "loss": 1.7246, "step": 6599 }, { "epoch": 0.52, "learning_rate": 0.00027836018135110694, "loss": 1.7199, "step": 6600 }, { "epoch": 0.52, "learning_rate": 0.0002783537858115062, "loss": 1.7504, "step": 6601 }, { "epoch": 0.52, "learning_rate": 0.00027834738940045407, "loss": 1.6706, "step": 6602 }, { "epoch": 0.52, "learning_rate": 0.00027834099211799395, "loss": 1.7471, "step": 6603 }, { "epoch": 0.52, "learning_rate": 0.0002783345939641694, "loss": 1.7631, "step": 6604 }, { "epoch": 0.52, "learning_rate": 0.0002783281949390237, "loss": 1.7094, "step": 6605 }, { "epoch": 0.52, "learning_rate": 0.0002783217950426004, "loss": 1.7173, "step": 6606 }, { "epoch": 0.52, "learning_rate": 0.0002783153942749429, "loss": 1.7045, "step": 6607 }, { "epoch": 0.52, "learning_rate": 0.0002783089926360947, "loss": 1.6935, "step": 6608 }, { "epoch": 0.52, "learning_rate": 0.0002783025901260992, "loss": 1.6977, "step": 6609 }, { "epoch": 0.52, "learning_rate": 0.00027829618674500003, "loss": 1.7072, "step": 6610 }, { "epoch": 0.52, "learning_rate": 0.00027828978249284047, "loss": 1.7201, "step": 6611 }, { "epoch": 0.52, "learning_rate": 0.0002782833773696641, "loss": 1.7124, "step": 6612 }, { "epoch": 0.52, "learning_rate": 0.0002782769713755144, "loss": 1.7481, "step": 6613 }, { "epoch": 0.52, "learning_rate": 0.0002782705645104348, "loss": 1.7306, "step": 6614 }, { "epoch": 0.52, "learning_rate": 0.0002782641567744689, "loss": 1.7558, "step": 6615 }, { "epoch": 0.52, "learning_rate": 0.0002782577481676602, "loss": 1.7206, "step": 6616 }, { "epoch": 0.52, "learning_rate": 0.0002782513386900521, "loss": 1.7527, "step": 6617 }, { "epoch": 0.52, "learning_rate": 0.00027824492834168827, "loss": 1.6809, "step": 6618 }, { "epoch": 0.52, "learning_rate": 0.0002782385171226121, "loss": 1.7148, "step": 6619 }, { "epoch": 0.52, "learning_rate": 0.0002782321050328671, "loss": 1.7761, "step": 6620 }, { "epoch": 0.52, "learning_rate": 0.0002782256920724969, "loss": 1.7334, "step": 6621 }, { "epoch": 0.52, "learning_rate": 0.0002782192782415451, "loss": 1.7266, "step": 6622 }, { "epoch": 0.52, "learning_rate": 0.00027821286354005507, "loss": 1.7076, "step": 6623 }, { "epoch": 0.52, "learning_rate": 0.0002782064479680705, "loss": 1.692, "step": 6624 }, { "epoch": 0.52, "learning_rate": 0.00027820003152563484, "loss": 1.7214, "step": 6625 }, { "epoch": 0.52, "learning_rate": 0.0002781936142127918, "loss": 1.7074, "step": 6626 }, { "epoch": 0.52, "learning_rate": 0.00027818719602958476, "loss": 1.7009, "step": 6627 }, { "epoch": 0.52, "learning_rate": 0.0002781807769760575, "loss": 1.7311, "step": 6628 }, { "epoch": 0.52, "learning_rate": 0.0002781743570522534, "loss": 1.7322, "step": 6629 }, { "epoch": 0.52, "learning_rate": 0.0002781679362582162, "loss": 1.6982, "step": 6630 }, { "epoch": 0.52, "learning_rate": 0.0002781615145939894, "loss": 1.656, "step": 6631 }, { "epoch": 0.52, "learning_rate": 0.0002781550920596167, "loss": 1.7172, "step": 6632 }, { "epoch": 0.52, "learning_rate": 0.00027814866865514165, "loss": 1.6937, "step": 6633 }, { "epoch": 0.52, "learning_rate": 0.0002781422443806078, "loss": 1.73, "step": 6634 }, { "epoch": 0.52, "learning_rate": 0.00027813581923605887, "loss": 1.783, "step": 6635 }, { "epoch": 0.52, "learning_rate": 0.00027812939322153845, "loss": 1.7431, "step": 6636 }, { "epoch": 0.52, "learning_rate": 0.00027812296633709016, "loss": 1.7204, "step": 6637 }, { "epoch": 0.52, "learning_rate": 0.00027811653858275757, "loss": 1.7376, "step": 6638 }, { "epoch": 0.52, "learning_rate": 0.0002781101099585844, "loss": 1.7162, "step": 6639 }, { "epoch": 0.52, "learning_rate": 0.0002781036804646143, "loss": 1.7299, "step": 6640 }, { "epoch": 0.52, "learning_rate": 0.00027809725010089094, "loss": 1.6732, "step": 6641 }, { "epoch": 0.52, "learning_rate": 0.0002780908188674579, "loss": 1.7362, "step": 6642 }, { "epoch": 0.52, "learning_rate": 0.0002780843867643589, "loss": 1.6963, "step": 6643 }, { "epoch": 0.52, "learning_rate": 0.0002780779537916376, "loss": 1.764, "step": 6644 }, { "epoch": 0.52, "learning_rate": 0.00027807151994933767, "loss": 1.7137, "step": 6645 }, { "epoch": 0.52, "learning_rate": 0.00027806508523750274, "loss": 1.7017, "step": 6646 }, { "epoch": 0.52, "learning_rate": 0.00027805864965617665, "loss": 1.7497, "step": 6647 }, { "epoch": 0.52, "learning_rate": 0.0002780522132054029, "loss": 1.756, "step": 6648 }, { "epoch": 0.52, "learning_rate": 0.00027804577588522536, "loss": 1.6898, "step": 6649 }, { "epoch": 0.52, "learning_rate": 0.00027803933769568766, "loss": 1.7316, "step": 6650 }, { "epoch": 0.52, "learning_rate": 0.0002780328986368335, "loss": 1.652, "step": 6651 }, { "epoch": 0.52, "learning_rate": 0.0002780264587087066, "loss": 1.8018, "step": 6652 }, { "epoch": 0.52, "learning_rate": 0.00027802001791135065, "loss": 1.7478, "step": 6653 }, { "epoch": 0.52, "learning_rate": 0.0002780135762448095, "loss": 1.7146, "step": 6654 }, { "epoch": 0.52, "learning_rate": 0.0002780071337091268, "loss": 1.7546, "step": 6655 }, { "epoch": 0.52, "learning_rate": 0.00027800069030434627, "loss": 1.7529, "step": 6656 }, { "epoch": 0.52, "learning_rate": 0.0002779942460305117, "loss": 1.748, "step": 6657 }, { "epoch": 0.52, "learning_rate": 0.0002779878008876669, "loss": 1.752, "step": 6658 }, { "epoch": 0.52, "learning_rate": 0.0002779813548758555, "loss": 1.8219, "step": 6659 }, { "epoch": 0.52, "learning_rate": 0.0002779749079951213, "loss": 1.7758, "step": 6660 }, { "epoch": 0.52, "learning_rate": 0.0002779684602455082, "loss": 1.7223, "step": 6661 }, { "epoch": 0.52, "learning_rate": 0.00027796201162705975, "loss": 1.7127, "step": 6662 }, { "epoch": 0.52, "learning_rate": 0.0002779555621398199, "loss": 1.6688, "step": 6663 }, { "epoch": 0.52, "learning_rate": 0.0002779491117838324, "loss": 1.7415, "step": 6664 }, { "epoch": 0.52, "learning_rate": 0.00027794266055914107, "loss": 1.7453, "step": 6665 }, { "epoch": 0.52, "learning_rate": 0.00027793620846578966, "loss": 1.7489, "step": 6666 }, { "epoch": 0.52, "learning_rate": 0.000277929755503822, "loss": 1.6325, "step": 6667 }, { "epoch": 0.52, "learning_rate": 0.00027792330167328186, "loss": 1.7024, "step": 6668 }, { "epoch": 0.52, "learning_rate": 0.00027791684697421316, "loss": 1.6875, "step": 6669 }, { "epoch": 0.52, "learning_rate": 0.00027791039140665955, "loss": 1.7483, "step": 6670 }, { "epoch": 0.52, "learning_rate": 0.00027790393497066504, "loss": 1.7, "step": 6671 }, { "epoch": 0.52, "learning_rate": 0.00027789747766627344, "loss": 1.7463, "step": 6672 }, { "epoch": 0.53, "learning_rate": 0.0002778910194935285, "loss": 1.6924, "step": 6673 }, { "epoch": 0.53, "learning_rate": 0.0002778845604524741, "loss": 1.7316, "step": 6674 }, { "epoch": 0.53, "learning_rate": 0.0002778781005431541, "loss": 1.7188, "step": 6675 }, { "epoch": 0.53, "learning_rate": 0.0002778716397656124, "loss": 1.7501, "step": 6676 }, { "epoch": 0.53, "learning_rate": 0.00027786517811989283, "loss": 1.7406, "step": 6677 }, { "epoch": 0.53, "learning_rate": 0.00027785871560603924, "loss": 1.7205, "step": 6678 }, { "epoch": 0.53, "learning_rate": 0.0002778522522240956, "loss": 1.7061, "step": 6679 }, { "epoch": 0.53, "learning_rate": 0.0002778457879741056, "loss": 1.6583, "step": 6680 }, { "epoch": 0.53, "learning_rate": 0.0002778393228561133, "loss": 1.7453, "step": 6681 }, { "epoch": 0.53, "learning_rate": 0.0002778328568701626, "loss": 1.7636, "step": 6682 }, { "epoch": 0.53, "learning_rate": 0.0002778263900162973, "loss": 1.7326, "step": 6683 }, { "epoch": 0.53, "learning_rate": 0.00027781992229456137, "loss": 1.7128, "step": 6684 }, { "epoch": 0.53, "learning_rate": 0.00027781345370499867, "loss": 1.7173, "step": 6685 }, { "epoch": 0.53, "learning_rate": 0.0002778069842476532, "loss": 1.7456, "step": 6686 }, { "epoch": 0.53, "learning_rate": 0.0002778005139225688, "loss": 1.7166, "step": 6687 }, { "epoch": 0.53, "learning_rate": 0.0002777940427297894, "loss": 1.7527, "step": 6688 }, { "epoch": 0.53, "learning_rate": 0.0002777875706693591, "loss": 1.7323, "step": 6689 }, { "epoch": 0.53, "learning_rate": 0.0002777810977413216, "loss": 1.7366, "step": 6690 }, { "epoch": 0.53, "learning_rate": 0.000277774623945721, "loss": 1.7354, "step": 6691 }, { "epoch": 0.53, "learning_rate": 0.0002777681492826012, "loss": 1.6613, "step": 6692 }, { "epoch": 0.53, "learning_rate": 0.00027776167375200624, "loss": 1.71, "step": 6693 }, { "epoch": 0.53, "learning_rate": 0.0002777551973539799, "loss": 1.7264, "step": 6694 }, { "epoch": 0.53, "learning_rate": 0.0002777487200885664, "loss": 1.7381, "step": 6695 }, { "epoch": 0.53, "learning_rate": 0.0002777422419558095, "loss": 1.7231, "step": 6696 }, { "epoch": 0.53, "learning_rate": 0.0002777357629557533, "loss": 1.706, "step": 6697 }, { "epoch": 0.53, "learning_rate": 0.00027772928308844174, "loss": 1.7122, "step": 6698 }, { "epoch": 0.53, "learning_rate": 0.00027772280235391887, "loss": 1.7186, "step": 6699 }, { "epoch": 0.53, "learning_rate": 0.0002777163207522286, "loss": 1.746, "step": 6700 }, { "epoch": 0.53, "learning_rate": 0.000277709838283415, "loss": 1.7045, "step": 6701 }, { "epoch": 0.53, "learning_rate": 0.0002777033549475222, "loss": 1.7281, "step": 6702 }, { "epoch": 0.53, "learning_rate": 0.00027769687074459396, "loss": 1.7153, "step": 6703 }, { "epoch": 0.53, "learning_rate": 0.0002776903856746744, "loss": 1.701, "step": 6704 }, { "epoch": 0.53, "learning_rate": 0.0002776838997378077, "loss": 1.7078, "step": 6705 }, { "epoch": 0.53, "learning_rate": 0.00027767741293403776, "loss": 1.6796, "step": 6706 }, { "epoch": 0.53, "learning_rate": 0.00027767092526340863, "loss": 1.7053, "step": 6707 }, { "epoch": 0.53, "learning_rate": 0.00027766443672596437, "loss": 1.7652, "step": 6708 }, { "epoch": 0.53, "learning_rate": 0.00027765794732174904, "loss": 1.7206, "step": 6709 }, { "epoch": 0.53, "learning_rate": 0.00027765145705080667, "loss": 1.7203, "step": 6710 }, { "epoch": 0.53, "learning_rate": 0.0002776449659131814, "loss": 1.6887, "step": 6711 }, { "epoch": 0.53, "learning_rate": 0.0002776384739089172, "loss": 1.656, "step": 6712 }, { "epoch": 0.53, "learning_rate": 0.0002776319810380582, "loss": 1.7712, "step": 6713 }, { "epoch": 0.53, "learning_rate": 0.0002776254873006485, "loss": 1.7178, "step": 6714 }, { "epoch": 0.53, "learning_rate": 0.0002776189926967322, "loss": 1.7181, "step": 6715 }, { "epoch": 0.53, "learning_rate": 0.0002776124972263533, "loss": 1.7096, "step": 6716 }, { "epoch": 0.53, "learning_rate": 0.000277606000889556, "loss": 1.7278, "step": 6717 }, { "epoch": 0.53, "learning_rate": 0.0002775995036863844, "loss": 1.7281, "step": 6718 }, { "epoch": 0.53, "learning_rate": 0.0002775930056168826, "loss": 1.7324, "step": 6719 }, { "epoch": 0.53, "learning_rate": 0.0002775865066810946, "loss": 1.6555, "step": 6720 }, { "epoch": 0.53, "learning_rate": 0.0002775800068790647, "loss": 1.7297, "step": 6721 }, { "epoch": 0.53, "learning_rate": 0.000277573506210837, "loss": 1.7173, "step": 6722 }, { "epoch": 0.53, "learning_rate": 0.0002775670046764555, "loss": 1.7076, "step": 6723 }, { "epoch": 0.53, "learning_rate": 0.0002775605022759645, "loss": 1.7064, "step": 6724 }, { "epoch": 0.53, "learning_rate": 0.00027755399900940807, "loss": 1.7229, "step": 6725 }, { "epoch": 0.53, "learning_rate": 0.00027754749487683033, "loss": 1.7288, "step": 6726 }, { "epoch": 0.53, "learning_rate": 0.00027754098987827554, "loss": 1.7743, "step": 6727 }, { "epoch": 0.53, "learning_rate": 0.0002775344840137878, "loss": 1.6536, "step": 6728 }, { "epoch": 0.53, "learning_rate": 0.0002775279772834113, "loss": 1.7238, "step": 6729 }, { "epoch": 0.53, "learning_rate": 0.0002775214696871902, "loss": 1.706, "step": 6730 }, { "epoch": 0.53, "learning_rate": 0.0002775149612251687, "loss": 1.6528, "step": 6731 }, { "epoch": 0.53, "learning_rate": 0.00027750845189739097, "loss": 1.7394, "step": 6732 }, { "epoch": 0.53, "learning_rate": 0.0002775019417039012, "loss": 1.7231, "step": 6733 }, { "epoch": 0.53, "learning_rate": 0.00027749543064474366, "loss": 1.7642, "step": 6734 }, { "epoch": 0.53, "learning_rate": 0.00027748891871996246, "loss": 1.6535, "step": 6735 }, { "epoch": 0.53, "learning_rate": 0.00027748240592960185, "loss": 1.7214, "step": 6736 }, { "epoch": 0.53, "learning_rate": 0.0002774758922737061, "loss": 1.73, "step": 6737 }, { "epoch": 0.53, "learning_rate": 0.00027746937775231936, "loss": 1.7467, "step": 6738 }, { "epoch": 0.53, "learning_rate": 0.0002774628623654859, "loss": 1.7334, "step": 6739 }, { "epoch": 0.53, "learning_rate": 0.00027745634611324997, "loss": 1.7138, "step": 6740 }, { "epoch": 0.53, "learning_rate": 0.0002774498289956557, "loss": 1.7306, "step": 6741 }, { "epoch": 0.53, "learning_rate": 0.0002774433110127475, "loss": 1.6839, "step": 6742 }, { "epoch": 0.53, "learning_rate": 0.0002774367921645695, "loss": 1.7248, "step": 6743 }, { "epoch": 0.53, "learning_rate": 0.000277430272451166, "loss": 1.6768, "step": 6744 }, { "epoch": 0.53, "learning_rate": 0.00027742375187258134, "loss": 1.7145, "step": 6745 }, { "epoch": 0.53, "learning_rate": 0.0002774172304288597, "loss": 1.685, "step": 6746 }, { "epoch": 0.53, "learning_rate": 0.00027741070812004536, "loss": 1.755, "step": 6747 }, { "epoch": 0.53, "learning_rate": 0.00027740418494618264, "loss": 1.6851, "step": 6748 }, { "epoch": 0.53, "learning_rate": 0.0002773976609073158, "loss": 1.6851, "step": 6749 }, { "epoch": 0.53, "learning_rate": 0.00027739113600348917, "loss": 1.7623, "step": 6750 }, { "epoch": 0.53, "learning_rate": 0.00027738461023474694, "loss": 1.7391, "step": 6751 }, { "epoch": 0.53, "learning_rate": 0.00027737808360113356, "loss": 1.7152, "step": 6752 }, { "epoch": 0.53, "learning_rate": 0.0002773715561026933, "loss": 1.7103, "step": 6753 }, { "epoch": 0.53, "learning_rate": 0.00027736502773947045, "loss": 1.69, "step": 6754 }, { "epoch": 0.53, "learning_rate": 0.00027735849851150937, "loss": 1.6602, "step": 6755 }, { "epoch": 0.53, "learning_rate": 0.00027735196841885434, "loss": 1.7107, "step": 6756 }, { "epoch": 0.53, "learning_rate": 0.00027734543746154975, "loss": 1.7041, "step": 6757 }, { "epoch": 0.53, "learning_rate": 0.00027733890563963985, "loss": 1.7574, "step": 6758 }, { "epoch": 0.53, "learning_rate": 0.00027733237295316914, "loss": 1.722, "step": 6759 }, { "epoch": 0.53, "learning_rate": 0.00027732583940218186, "loss": 1.7084, "step": 6760 }, { "epoch": 0.53, "learning_rate": 0.00027731930498672234, "loss": 1.7444, "step": 6761 }, { "epoch": 0.53, "learning_rate": 0.00027731276970683504, "loss": 1.734, "step": 6762 }, { "epoch": 0.53, "learning_rate": 0.0002773062335625643, "loss": 1.7522, "step": 6763 }, { "epoch": 0.53, "learning_rate": 0.00027729969655395444, "loss": 1.728, "step": 6764 }, { "epoch": 0.53, "learning_rate": 0.00027729315868105, "loss": 1.7487, "step": 6765 }, { "epoch": 0.53, "learning_rate": 0.0002772866199438951, "loss": 1.7091, "step": 6766 }, { "epoch": 0.53, "learning_rate": 0.0002772800803425344, "loss": 1.7565, "step": 6767 }, { "epoch": 0.53, "learning_rate": 0.0002772735398770122, "loss": 1.7214, "step": 6768 }, { "epoch": 0.53, "learning_rate": 0.00027726699854737285, "loss": 1.7308, "step": 6769 }, { "epoch": 0.53, "learning_rate": 0.0002772604563536609, "loss": 1.7541, "step": 6770 }, { "epoch": 0.53, "learning_rate": 0.00027725391329592054, "loss": 1.7079, "step": 6771 }, { "epoch": 0.53, "learning_rate": 0.00027724736937419643, "loss": 1.7237, "step": 6772 }, { "epoch": 0.53, "learning_rate": 0.00027724082458853287, "loss": 1.7549, "step": 6773 }, { "epoch": 0.53, "learning_rate": 0.00027723427893897436, "loss": 1.7365, "step": 6774 }, { "epoch": 0.53, "learning_rate": 0.00027722773242556525, "loss": 1.7366, "step": 6775 }, { "epoch": 0.53, "learning_rate": 0.0002772211850483501, "loss": 1.703, "step": 6776 }, { "epoch": 0.53, "learning_rate": 0.0002772146368073733, "loss": 1.7129, "step": 6777 }, { "epoch": 0.53, "learning_rate": 0.00027720808770267935, "loss": 1.6492, "step": 6778 }, { "epoch": 0.53, "learning_rate": 0.0002772015377343126, "loss": 1.7078, "step": 6779 }, { "epoch": 0.53, "learning_rate": 0.00027719498690231766, "loss": 1.7007, "step": 6780 }, { "epoch": 0.53, "learning_rate": 0.0002771884352067389, "loss": 1.7191, "step": 6781 }, { "epoch": 0.53, "learning_rate": 0.00027718188264762094, "loss": 1.6973, "step": 6782 }, { "epoch": 0.53, "learning_rate": 0.0002771753292250081, "loss": 1.7514, "step": 6783 }, { "epoch": 0.53, "learning_rate": 0.00027716877493894505, "loss": 1.7366, "step": 6784 }, { "epoch": 0.53, "learning_rate": 0.00027716221978947613, "loss": 1.6782, "step": 6785 }, { "epoch": 0.53, "learning_rate": 0.0002771556637766459, "loss": 1.7314, "step": 6786 }, { "epoch": 0.53, "learning_rate": 0.0002771491069004989, "loss": 1.7407, "step": 6787 }, { "epoch": 0.53, "learning_rate": 0.00027714254916107964, "loss": 1.6886, "step": 6788 }, { "epoch": 0.53, "learning_rate": 0.0002771359905584326, "loss": 1.7309, "step": 6789 }, { "epoch": 0.53, "learning_rate": 0.0002771294310926024, "loss": 1.6684, "step": 6790 }, { "epoch": 0.53, "learning_rate": 0.0002771228707636335, "loss": 1.7344, "step": 6791 }, { "epoch": 0.53, "learning_rate": 0.00027711630957157047, "loss": 1.7083, "step": 6792 }, { "epoch": 0.53, "learning_rate": 0.0002771097475164578, "loss": 1.6901, "step": 6793 }, { "epoch": 0.53, "learning_rate": 0.0002771031845983401, "loss": 1.6888, "step": 6794 }, { "epoch": 0.53, "learning_rate": 0.0002770966208172619, "loss": 1.7514, "step": 6795 }, { "epoch": 0.53, "learning_rate": 0.0002770900561732679, "loss": 1.725, "step": 6796 }, { "epoch": 0.53, "learning_rate": 0.00027708349066640244, "loss": 1.7335, "step": 6797 }, { "epoch": 0.53, "learning_rate": 0.00027707692429671026, "loss": 1.7109, "step": 6798 }, { "epoch": 0.53, "learning_rate": 0.0002770703570642358, "loss": 1.7157, "step": 6799 }, { "epoch": 0.54, "learning_rate": 0.0002770637889690238, "loss": 1.7145, "step": 6800 }, { "epoch": 0.54, "learning_rate": 0.00027705722001111885, "loss": 1.7318, "step": 6801 }, { "epoch": 0.54, "learning_rate": 0.00027705065019056544, "loss": 1.6894, "step": 6802 }, { "epoch": 0.54, "learning_rate": 0.0002770440795074082, "loss": 1.6756, "step": 6803 }, { "epoch": 0.54, "learning_rate": 0.0002770375079616918, "loss": 1.7443, "step": 6804 }, { "epoch": 0.54, "learning_rate": 0.00027703093555346087, "loss": 1.672, "step": 6805 }, { "epoch": 0.54, "learning_rate": 0.00027702436228275995, "loss": 1.6296, "step": 6806 }, { "epoch": 0.54, "learning_rate": 0.00027701778814963367, "loss": 1.7238, "step": 6807 }, { "epoch": 0.54, "learning_rate": 0.00027701121315412675, "loss": 1.7108, "step": 6808 }, { "epoch": 0.54, "learning_rate": 0.00027700463729628374, "loss": 1.7094, "step": 6809 }, { "epoch": 0.54, "learning_rate": 0.0002769980605761494, "loss": 1.6888, "step": 6810 }, { "epoch": 0.54, "learning_rate": 0.0002769914829937682, "loss": 1.7023, "step": 6811 }, { "epoch": 0.54, "learning_rate": 0.00027698490454918504, "loss": 1.7126, "step": 6812 }, { "epoch": 0.54, "learning_rate": 0.00027697832524244435, "loss": 1.7322, "step": 6813 }, { "epoch": 0.54, "learning_rate": 0.0002769717450735909, "loss": 1.6808, "step": 6814 }, { "epoch": 0.54, "learning_rate": 0.0002769651640426695, "loss": 1.7052, "step": 6815 }, { "epoch": 0.54, "learning_rate": 0.0002769585821497246, "loss": 1.7243, "step": 6816 }, { "epoch": 0.54, "learning_rate": 0.000276951999394801, "loss": 1.686, "step": 6817 }, { "epoch": 0.54, "learning_rate": 0.0002769454157779434, "loss": 1.7047, "step": 6818 }, { "epoch": 0.54, "learning_rate": 0.00027693883129919643, "loss": 1.7124, "step": 6819 }, { "epoch": 0.54, "learning_rate": 0.0002769322459586049, "loss": 1.6934, "step": 6820 }, { "epoch": 0.54, "learning_rate": 0.0002769256597562135, "loss": 1.6955, "step": 6821 }, { "epoch": 0.54, "learning_rate": 0.00027691907269206687, "loss": 1.7141, "step": 6822 }, { "epoch": 0.54, "learning_rate": 0.00027691248476620974, "loss": 1.7337, "step": 6823 }, { "epoch": 0.54, "learning_rate": 0.00027690589597868695, "loss": 1.6953, "step": 6824 }, { "epoch": 0.54, "learning_rate": 0.0002768993063295431, "loss": 1.7385, "step": 6825 }, { "epoch": 0.54, "learning_rate": 0.000276892715818823, "loss": 1.7263, "step": 6826 }, { "epoch": 0.54, "learning_rate": 0.0002768861244465714, "loss": 1.7028, "step": 6827 }, { "epoch": 0.54, "learning_rate": 0.000276879532212833, "loss": 1.7515, "step": 6828 }, { "epoch": 0.54, "learning_rate": 0.0002768729391176526, "loss": 1.7491, "step": 6829 }, { "epoch": 0.54, "learning_rate": 0.00027686634516107503, "loss": 1.7145, "step": 6830 }, { "epoch": 0.54, "learning_rate": 0.0002768597503431449, "loss": 1.6598, "step": 6831 }, { "epoch": 0.54, "learning_rate": 0.0002768531546639071, "loss": 1.7571, "step": 6832 }, { "epoch": 0.54, "learning_rate": 0.0002768465581234064, "loss": 1.6584, "step": 6833 }, { "epoch": 0.54, "learning_rate": 0.00027683996072168756, "loss": 1.7214, "step": 6834 }, { "epoch": 0.54, "learning_rate": 0.0002768333624587954, "loss": 1.7112, "step": 6835 }, { "epoch": 0.54, "learning_rate": 0.0002768267633347747, "loss": 1.7303, "step": 6836 }, { "epoch": 0.54, "learning_rate": 0.0002768201633496702, "loss": 1.7411, "step": 6837 }, { "epoch": 0.54, "learning_rate": 0.0002768135625035268, "loss": 1.6945, "step": 6838 }, { "epoch": 0.54, "learning_rate": 0.0002768069607963894, "loss": 1.6894, "step": 6839 }, { "epoch": 0.54, "learning_rate": 0.0002768003582283026, "loss": 1.7243, "step": 6840 }, { "epoch": 0.54, "learning_rate": 0.0002767937547993114, "loss": 1.7614, "step": 6841 }, { "epoch": 0.54, "learning_rate": 0.00027678715050946054, "loss": 1.7279, "step": 6842 }, { "epoch": 0.54, "learning_rate": 0.00027678054535879487, "loss": 1.7034, "step": 6843 }, { "epoch": 0.54, "learning_rate": 0.0002767739393473593, "loss": 1.6552, "step": 6844 }, { "epoch": 0.54, "learning_rate": 0.00027676733247519866, "loss": 1.7339, "step": 6845 }, { "epoch": 0.54, "learning_rate": 0.0002767607247423578, "loss": 1.7431, "step": 6846 }, { "epoch": 0.54, "learning_rate": 0.00027675411614888146, "loss": 1.7431, "step": 6847 }, { "epoch": 0.54, "learning_rate": 0.0002767475066948147, "loss": 1.7251, "step": 6848 }, { "epoch": 0.54, "learning_rate": 0.00027674089638020236, "loss": 1.7313, "step": 6849 }, { "epoch": 0.54, "learning_rate": 0.0002767342852050892, "loss": 1.7774, "step": 6850 }, { "epoch": 0.54, "learning_rate": 0.00027672767316952023, "loss": 1.7315, "step": 6851 }, { "epoch": 0.54, "learning_rate": 0.00027672106027354024, "loss": 1.7438, "step": 6852 }, { "epoch": 0.54, "learning_rate": 0.00027671444651719427, "loss": 1.7128, "step": 6853 }, { "epoch": 0.54, "learning_rate": 0.00027670783190052704, "loss": 1.7129, "step": 6854 }, { "epoch": 0.54, "learning_rate": 0.0002767012164235836, "loss": 1.7589, "step": 6855 }, { "epoch": 0.54, "learning_rate": 0.0002766946000864088, "loss": 1.6906, "step": 6856 }, { "epoch": 0.54, "learning_rate": 0.0002766879828890476, "loss": 1.741, "step": 6857 }, { "epoch": 0.54, "learning_rate": 0.0002766813648315449, "loss": 1.7747, "step": 6858 }, { "epoch": 0.54, "learning_rate": 0.00027667474591394566, "loss": 1.6846, "step": 6859 }, { "epoch": 0.54, "learning_rate": 0.00027666812613629476, "loss": 1.7204, "step": 6860 }, { "epoch": 0.54, "learning_rate": 0.0002766615054986372, "loss": 1.7305, "step": 6861 }, { "epoch": 0.54, "learning_rate": 0.0002766548840010179, "loss": 1.712, "step": 6862 }, { "epoch": 0.54, "learning_rate": 0.0002766482616434819, "loss": 1.6962, "step": 6863 }, { "epoch": 0.54, "learning_rate": 0.00027664163842607405, "loss": 1.78, "step": 6864 }, { "epoch": 0.54, "learning_rate": 0.00027663501434883935, "loss": 1.7327, "step": 6865 }, { "epoch": 0.54, "learning_rate": 0.0002766283894118228, "loss": 1.7601, "step": 6866 }, { "epoch": 0.54, "learning_rate": 0.00027662176361506935, "loss": 1.7068, "step": 6867 }, { "epoch": 0.54, "learning_rate": 0.00027661513695862404, "loss": 1.6565, "step": 6868 }, { "epoch": 0.54, "learning_rate": 0.00027660850944253174, "loss": 1.7151, "step": 6869 }, { "epoch": 0.54, "learning_rate": 0.00027660188106683756, "loss": 1.6957, "step": 6870 }, { "epoch": 0.54, "learning_rate": 0.00027659525183158654, "loss": 1.675, "step": 6871 }, { "epoch": 0.54, "learning_rate": 0.00027658862173682357, "loss": 1.7233, "step": 6872 }, { "epoch": 0.54, "learning_rate": 0.00027658199078259375, "loss": 1.681, "step": 6873 }, { "epoch": 0.54, "learning_rate": 0.000276575358968942, "loss": 1.719, "step": 6874 }, { "epoch": 0.54, "learning_rate": 0.0002765687262959135, "loss": 1.7199, "step": 6875 }, { "epoch": 0.54, "learning_rate": 0.00027656209276355313, "loss": 1.7243, "step": 6876 }, { "epoch": 0.54, "learning_rate": 0.00027655545837190597, "loss": 1.7342, "step": 6877 }, { "epoch": 0.54, "learning_rate": 0.00027654882312101714, "loss": 1.7169, "step": 6878 }, { "epoch": 0.54, "learning_rate": 0.0002765421870109316, "loss": 1.6998, "step": 6879 }, { "epoch": 0.54, "learning_rate": 0.0002765355500416945, "loss": 1.6621, "step": 6880 }, { "epoch": 0.54, "learning_rate": 0.0002765289122133508, "loss": 1.7408, "step": 6881 }, { "epoch": 0.54, "learning_rate": 0.0002765222735259456, "loss": 1.6668, "step": 6882 }, { "epoch": 0.54, "learning_rate": 0.000276515633979524, "loss": 1.6829, "step": 6883 }, { "epoch": 0.54, "learning_rate": 0.0002765089935741311, "loss": 1.7657, "step": 6884 }, { "epoch": 0.54, "learning_rate": 0.0002765023523098119, "loss": 1.7352, "step": 6885 }, { "epoch": 0.54, "learning_rate": 0.00027649571018661153, "loss": 1.6866, "step": 6886 }, { "epoch": 0.54, "learning_rate": 0.0002764890672045751, "loss": 1.6866, "step": 6887 }, { "epoch": 0.54, "learning_rate": 0.00027648242336374775, "loss": 1.7646, "step": 6888 }, { "epoch": 0.54, "learning_rate": 0.00027647577866417446, "loss": 1.7021, "step": 6889 }, { "epoch": 0.54, "learning_rate": 0.00027646913310590054, "loss": 1.7139, "step": 6890 }, { "epoch": 0.54, "learning_rate": 0.0002764624866889709, "loss": 1.6926, "step": 6891 }, { "epoch": 0.54, "learning_rate": 0.00027645583941343085, "loss": 1.6871, "step": 6892 }, { "epoch": 0.54, "learning_rate": 0.00027644919127932534, "loss": 1.7267, "step": 6893 }, { "epoch": 0.54, "learning_rate": 0.00027644254228669966, "loss": 1.7336, "step": 6894 }, { "epoch": 0.54, "learning_rate": 0.0002764358924355989, "loss": 1.7091, "step": 6895 }, { "epoch": 0.54, "learning_rate": 0.00027642924172606816, "loss": 1.7114, "step": 6896 }, { "epoch": 0.54, "learning_rate": 0.00027642259015815267, "loss": 1.6996, "step": 6897 }, { "epoch": 0.54, "learning_rate": 0.0002764159377318975, "loss": 1.6798, "step": 6898 }, { "epoch": 0.54, "learning_rate": 0.000276409284447348, "loss": 1.7236, "step": 6899 }, { "epoch": 0.54, "learning_rate": 0.00027640263030454914, "loss": 1.7044, "step": 6900 }, { "epoch": 0.54, "learning_rate": 0.0002763959753035461, "loss": 1.7595, "step": 6901 }, { "epoch": 0.54, "learning_rate": 0.00027638931944438423, "loss": 1.679, "step": 6902 }, { "epoch": 0.54, "learning_rate": 0.00027638266272710864, "loss": 1.6613, "step": 6903 }, { "epoch": 0.54, "learning_rate": 0.0002763760051517645, "loss": 1.655, "step": 6904 }, { "epoch": 0.54, "learning_rate": 0.00027636934671839704, "loss": 1.6844, "step": 6905 }, { "epoch": 0.54, "learning_rate": 0.0002763626874270514, "loss": 1.7382, "step": 6906 }, { "epoch": 0.54, "learning_rate": 0.0002763560272777729, "loss": 1.7226, "step": 6907 }, { "epoch": 0.54, "learning_rate": 0.0002763493662706067, "loss": 1.6828, "step": 6908 }, { "epoch": 0.54, "learning_rate": 0.000276342704405598, "loss": 1.7463, "step": 6909 }, { "epoch": 0.54, "learning_rate": 0.00027633604168279206, "loss": 1.7174, "step": 6910 }, { "epoch": 0.54, "learning_rate": 0.0002763293781022341, "loss": 1.7264, "step": 6911 }, { "epoch": 0.54, "learning_rate": 0.0002763227136639694, "loss": 1.6589, "step": 6912 }, { "epoch": 0.54, "learning_rate": 0.00027631604836804316, "loss": 1.6813, "step": 6913 }, { "epoch": 0.54, "learning_rate": 0.0002763093822145007, "loss": 1.7818, "step": 6914 }, { "epoch": 0.54, "learning_rate": 0.0002763027152033872, "loss": 1.7151, "step": 6915 }, { "epoch": 0.54, "learning_rate": 0.000276296047334748, "loss": 1.7381, "step": 6916 }, { "epoch": 0.54, "learning_rate": 0.0002762893786086283, "loss": 1.7218, "step": 6917 }, { "epoch": 0.54, "learning_rate": 0.0002762827090250734, "loss": 1.6786, "step": 6918 }, { "epoch": 0.54, "learning_rate": 0.00027627603858412867, "loss": 1.6569, "step": 6919 }, { "epoch": 0.54, "learning_rate": 0.00027626936728583927, "loss": 1.6893, "step": 6920 }, { "epoch": 0.54, "learning_rate": 0.0002762626951302505, "loss": 1.6849, "step": 6921 }, { "epoch": 0.54, "learning_rate": 0.0002762560221174078, "loss": 1.6641, "step": 6922 }, { "epoch": 0.54, "learning_rate": 0.0002762493482473563, "loss": 1.7621, "step": 6923 }, { "epoch": 0.54, "learning_rate": 0.00027624267352014146, "loss": 1.6572, "step": 6924 }, { "epoch": 0.54, "learning_rate": 0.0002762359979358085, "loss": 1.682, "step": 6925 }, { "epoch": 0.54, "learning_rate": 0.0002762293214944028, "loss": 1.6615, "step": 6926 }, { "epoch": 0.55, "learning_rate": 0.00027622264419596964, "loss": 1.73, "step": 6927 }, { "epoch": 0.55, "learning_rate": 0.00027621596604055437, "loss": 1.7212, "step": 6928 }, { "epoch": 0.55, "learning_rate": 0.0002762092870282024, "loss": 1.6969, "step": 6929 }, { "epoch": 0.55, "learning_rate": 0.000276202607158959, "loss": 1.6757, "step": 6930 }, { "epoch": 0.55, "learning_rate": 0.0002761959264328695, "loss": 1.7498, "step": 6931 }, { "epoch": 0.55, "learning_rate": 0.00027618924484997936, "loss": 1.7078, "step": 6932 }, { "epoch": 0.55, "learning_rate": 0.00027618256241033383, "loss": 1.6907, "step": 6933 }, { "epoch": 0.55, "learning_rate": 0.00027617587911397837, "loss": 1.6965, "step": 6934 }, { "epoch": 0.55, "learning_rate": 0.0002761691949609583, "loss": 1.7275, "step": 6935 }, { "epoch": 0.55, "learning_rate": 0.000276162509951319, "loss": 1.6994, "step": 6936 }, { "epoch": 0.55, "learning_rate": 0.0002761558240851059, "loss": 1.7246, "step": 6937 }, { "epoch": 0.55, "learning_rate": 0.00027614913736236443, "loss": 1.6536, "step": 6938 }, { "epoch": 0.55, "learning_rate": 0.0002761424497831399, "loss": 1.7332, "step": 6939 }, { "epoch": 0.55, "learning_rate": 0.0002761357613474777, "loss": 1.7046, "step": 6940 }, { "epoch": 0.55, "learning_rate": 0.00027612907205542327, "loss": 1.6753, "step": 6941 }, { "epoch": 0.55, "learning_rate": 0.0002761223819070222, "loss": 1.7171, "step": 6942 }, { "epoch": 0.55, "learning_rate": 0.0002761156909023196, "loss": 1.6956, "step": 6943 }, { "epoch": 0.55, "learning_rate": 0.0002761089990413611, "loss": 1.653, "step": 6944 }, { "epoch": 0.55, "learning_rate": 0.0002761023063241921, "loss": 1.6632, "step": 6945 }, { "epoch": 0.55, "learning_rate": 0.00027609561275085805, "loss": 1.7819, "step": 6946 }, { "epoch": 0.55, "learning_rate": 0.00027608891832140434, "loss": 1.714, "step": 6947 }, { "epoch": 0.55, "learning_rate": 0.0002760822230358765, "loss": 1.7401, "step": 6948 }, { "epoch": 0.55, "learning_rate": 0.00027607552689431987, "loss": 1.7146, "step": 6949 }, { "epoch": 0.55, "learning_rate": 0.00027606882989678, "loss": 1.7226, "step": 6950 }, { "epoch": 0.55, "learning_rate": 0.0002760621320433024, "loss": 1.6873, "step": 6951 }, { "epoch": 0.55, "learning_rate": 0.00027605543333393247, "loss": 1.7237, "step": 6952 }, { "epoch": 0.55, "learning_rate": 0.00027604873376871564, "loss": 1.6683, "step": 6953 }, { "epoch": 0.55, "learning_rate": 0.0002760420333476976, "loss": 1.7443, "step": 6954 }, { "epoch": 0.55, "learning_rate": 0.0002760353320709236, "loss": 1.6814, "step": 6955 }, { "epoch": 0.55, "learning_rate": 0.0002760286299384393, "loss": 1.6943, "step": 6956 }, { "epoch": 0.55, "learning_rate": 0.0002760219269502901, "loss": 1.701, "step": 6957 }, { "epoch": 0.55, "learning_rate": 0.0002760152231065216, "loss": 1.7409, "step": 6958 }, { "epoch": 0.55, "learning_rate": 0.0002760085184071793, "loss": 1.7155, "step": 6959 }, { "epoch": 0.55, "learning_rate": 0.00027600181285230863, "loss": 1.7862, "step": 6960 }, { "epoch": 0.55, "learning_rate": 0.00027599510644195526, "loss": 1.6773, "step": 6961 }, { "epoch": 0.55, "learning_rate": 0.0002759883991761646, "loss": 1.6984, "step": 6962 }, { "epoch": 0.55, "learning_rate": 0.0002759816910549823, "loss": 1.692, "step": 6963 }, { "epoch": 0.55, "learning_rate": 0.0002759749820784537, "loss": 1.702, "step": 6964 }, { "epoch": 0.55, "learning_rate": 0.00027596827224662463, "loss": 1.7238, "step": 6965 }, { "epoch": 0.55, "learning_rate": 0.00027596156155954043, "loss": 1.697, "step": 6966 }, { "epoch": 0.55, "learning_rate": 0.00027595485001724677, "loss": 1.7191, "step": 6967 }, { "epoch": 0.55, "learning_rate": 0.0002759481376197892, "loss": 1.7045, "step": 6968 }, { "epoch": 0.55, "learning_rate": 0.0002759414243672132, "loss": 1.7422, "step": 6969 }, { "epoch": 0.55, "learning_rate": 0.0002759347102595646, "loss": 1.6836, "step": 6970 }, { "epoch": 0.55, "learning_rate": 0.00027592799529688866, "loss": 1.6986, "step": 6971 }, { "epoch": 0.55, "learning_rate": 0.00027592127947923114, "loss": 1.7466, "step": 6972 }, { "epoch": 0.55, "learning_rate": 0.00027591456280663765, "loss": 1.7445, "step": 6973 }, { "epoch": 0.55, "learning_rate": 0.00027590784527915373, "loss": 1.784, "step": 6974 }, { "epoch": 0.55, "learning_rate": 0.0002759011268968251, "loss": 1.7018, "step": 6975 }, { "epoch": 0.55, "learning_rate": 0.00027589440765969723, "loss": 1.6726, "step": 6976 }, { "epoch": 0.55, "learning_rate": 0.00027588768756781583, "loss": 1.7061, "step": 6977 }, { "epoch": 0.55, "learning_rate": 0.00027588096662122647, "loss": 1.7027, "step": 6978 }, { "epoch": 0.55, "learning_rate": 0.0002758742448199749, "loss": 1.7087, "step": 6979 }, { "epoch": 0.55, "learning_rate": 0.00027586752216410656, "loss": 1.7004, "step": 6980 }, { "epoch": 0.55, "learning_rate": 0.0002758607986536673, "loss": 1.7196, "step": 6981 }, { "epoch": 0.55, "learning_rate": 0.0002758540742887026, "loss": 1.7186, "step": 6982 }, { "epoch": 0.55, "learning_rate": 0.00027584734906925827, "loss": 1.7389, "step": 6983 }, { "epoch": 0.55, "learning_rate": 0.0002758406229953798, "loss": 1.7082, "step": 6984 }, { "epoch": 0.55, "learning_rate": 0.000275833896067113, "loss": 1.7484, "step": 6985 }, { "epoch": 0.55, "learning_rate": 0.00027582716828450344, "loss": 1.6895, "step": 6986 }, { "epoch": 0.55, "learning_rate": 0.0002758204396475969, "loss": 1.738, "step": 6987 }, { "epoch": 0.55, "learning_rate": 0.00027581371015643894, "loss": 1.69, "step": 6988 }, { "epoch": 0.55, "learning_rate": 0.00027580697981107534, "loss": 1.5823, "step": 6989 }, { "epoch": 0.55, "learning_rate": 0.00027580024861155185, "loss": 1.7508, "step": 6990 }, { "epoch": 0.55, "learning_rate": 0.000275793516557914, "loss": 1.6626, "step": 6991 }, { "epoch": 0.55, "learning_rate": 0.0002757867836502076, "loss": 1.7423, "step": 6992 }, { "epoch": 0.55, "learning_rate": 0.0002757800498884784, "loss": 1.6746, "step": 6993 }, { "epoch": 0.55, "learning_rate": 0.00027577331527277207, "loss": 1.7043, "step": 6994 }, { "epoch": 0.55, "learning_rate": 0.0002757665798031343, "loss": 1.6954, "step": 6995 }, { "epoch": 0.55, "learning_rate": 0.00027575984347961085, "loss": 1.6967, "step": 6996 }, { "epoch": 0.55, "learning_rate": 0.0002757531063022475, "loss": 1.6704, "step": 6997 }, { "epoch": 0.55, "learning_rate": 0.00027574636827109, "loss": 1.7194, "step": 6998 }, { "epoch": 0.55, "learning_rate": 0.00027573962938618396, "loss": 1.6873, "step": 6999 }, { "epoch": 0.55, "learning_rate": 0.0002757328896475753, "loss": 1.6182, "step": 7000 }, { "epoch": 0.55, "learning_rate": 0.0002757261490553096, "loss": 1.6519, "step": 7001 }, { "epoch": 0.55, "learning_rate": 0.00027571940760943276, "loss": 1.7633, "step": 7002 }, { "epoch": 0.55, "learning_rate": 0.0002757126653099906, "loss": 1.7525, "step": 7003 }, { "epoch": 0.55, "learning_rate": 0.00027570592215702875, "loss": 1.7154, "step": 7004 }, { "epoch": 0.55, "learning_rate": 0.00027569917815059315, "loss": 1.7136, "step": 7005 }, { "epoch": 0.55, "learning_rate": 0.0002756924332907294, "loss": 1.7437, "step": 7006 }, { "epoch": 0.55, "learning_rate": 0.00027568568757748335, "loss": 1.6922, "step": 7007 }, { "epoch": 0.55, "learning_rate": 0.00027567894101090094, "loss": 1.719, "step": 7008 }, { "epoch": 0.55, "learning_rate": 0.00027567219359102784, "loss": 1.7282, "step": 7009 }, { "epoch": 0.55, "learning_rate": 0.0002756654453179099, "loss": 1.7205, "step": 7010 }, { "epoch": 0.55, "learning_rate": 0.00027565869619159295, "loss": 1.6503, "step": 7011 }, { "epoch": 0.55, "learning_rate": 0.0002756519462121228, "loss": 1.6643, "step": 7012 }, { "epoch": 0.55, "learning_rate": 0.00027564519537954526, "loss": 1.6904, "step": 7013 }, { "epoch": 0.55, "learning_rate": 0.00027563844369390614, "loss": 1.6951, "step": 7014 }, { "epoch": 0.55, "learning_rate": 0.0002756316911552514, "loss": 1.7011, "step": 7015 }, { "epoch": 0.55, "learning_rate": 0.00027562493776362676, "loss": 1.736, "step": 7016 }, { "epoch": 0.55, "learning_rate": 0.0002756181835190781, "loss": 1.6697, "step": 7017 }, { "epoch": 0.55, "learning_rate": 0.00027561142842165133, "loss": 1.7037, "step": 7018 }, { "epoch": 0.55, "learning_rate": 0.00027560467247139225, "loss": 1.6921, "step": 7019 }, { "epoch": 0.55, "learning_rate": 0.0002755979156683468, "loss": 1.6691, "step": 7020 }, { "epoch": 0.55, "learning_rate": 0.00027559115801256077, "loss": 1.7762, "step": 7021 }, { "epoch": 0.55, "learning_rate": 0.0002755843995040801, "loss": 1.7451, "step": 7022 }, { "epoch": 0.55, "learning_rate": 0.0002755776401429507, "loss": 1.7366, "step": 7023 }, { "epoch": 0.55, "learning_rate": 0.00027557087992921835, "loss": 1.7962, "step": 7024 }, { "epoch": 0.55, "learning_rate": 0.00027556411886292905, "loss": 1.6746, "step": 7025 }, { "epoch": 0.55, "learning_rate": 0.0002755573569441287, "loss": 1.7363, "step": 7026 }, { "epoch": 0.55, "learning_rate": 0.0002755505941728632, "loss": 1.6771, "step": 7027 }, { "epoch": 0.55, "learning_rate": 0.00027554383054917837, "loss": 1.738, "step": 7028 }, { "epoch": 0.55, "learning_rate": 0.00027553706607312024, "loss": 1.6795, "step": 7029 }, { "epoch": 0.55, "learning_rate": 0.00027553030074473474, "loss": 1.7375, "step": 7030 }, { "epoch": 0.55, "learning_rate": 0.0002755235345640678, "loss": 1.7046, "step": 7031 }, { "epoch": 0.55, "learning_rate": 0.00027551676753116526, "loss": 1.6994, "step": 7032 }, { "epoch": 0.55, "learning_rate": 0.0002755099996460732, "loss": 1.7188, "step": 7033 }, { "epoch": 0.55, "learning_rate": 0.00027550323090883743, "loss": 1.7179, "step": 7034 }, { "epoch": 0.55, "learning_rate": 0.000275496461319504, "loss": 1.7295, "step": 7035 }, { "epoch": 0.55, "learning_rate": 0.00027548969087811884, "loss": 1.701, "step": 7036 }, { "epoch": 0.55, "learning_rate": 0.000275482919584728, "loss": 1.6783, "step": 7037 }, { "epoch": 0.55, "learning_rate": 0.00027547614743937736, "loss": 1.7533, "step": 7038 }, { "epoch": 0.55, "learning_rate": 0.00027546937444211287, "loss": 1.6904, "step": 7039 }, { "epoch": 0.55, "learning_rate": 0.00027546260059298065, "loss": 1.7126, "step": 7040 }, { "epoch": 0.55, "learning_rate": 0.00027545582589202656, "loss": 1.6889, "step": 7041 }, { "epoch": 0.55, "learning_rate": 0.0002754490503392966, "loss": 1.7107, "step": 7042 }, { "epoch": 0.55, "learning_rate": 0.0002754422739348369, "loss": 1.6761, "step": 7043 }, { "epoch": 0.55, "learning_rate": 0.0002754354966786933, "loss": 1.6811, "step": 7044 }, { "epoch": 0.55, "learning_rate": 0.00027542871857091195, "loss": 1.7036, "step": 7045 }, { "epoch": 0.55, "learning_rate": 0.00027542193961153883, "loss": 1.7097, "step": 7046 }, { "epoch": 0.55, "learning_rate": 0.00027541515980061994, "loss": 1.6582, "step": 7047 }, { "epoch": 0.55, "learning_rate": 0.0002754083791382013, "loss": 1.6621, "step": 7048 }, { "epoch": 0.55, "learning_rate": 0.000275401597624329, "loss": 1.655, "step": 7049 }, { "epoch": 0.55, "learning_rate": 0.00027539481525904906, "loss": 1.6941, "step": 7050 }, { "epoch": 0.55, "learning_rate": 0.0002753880320424075, "loss": 1.7182, "step": 7051 }, { "epoch": 0.55, "learning_rate": 0.0002753812479744504, "loss": 1.68, "step": 7052 }, { "epoch": 0.55, "learning_rate": 0.00027537446305522383, "loss": 1.7235, "step": 7053 }, { "epoch": 0.56, "learning_rate": 0.0002753676772847739, "loss": 1.7324, "step": 7054 }, { "epoch": 0.56, "learning_rate": 0.0002753608906631465, "loss": 1.74, "step": 7055 }, { "epoch": 0.56, "learning_rate": 0.00027535410319038794, "loss": 1.7361, "step": 7056 }, { "epoch": 0.56, "learning_rate": 0.0002753473148665441, "loss": 1.7285, "step": 7057 }, { "epoch": 0.56, "learning_rate": 0.0002753405256916612, "loss": 1.7201, "step": 7058 }, { "epoch": 0.56, "learning_rate": 0.00027533373566578534, "loss": 1.7012, "step": 7059 }, { "epoch": 0.56, "learning_rate": 0.00027532694478896256, "loss": 1.732, "step": 7060 }, { "epoch": 0.56, "learning_rate": 0.000275320153061239, "loss": 1.726, "step": 7061 }, { "epoch": 0.56, "learning_rate": 0.0002753133604826607, "loss": 1.7224, "step": 7062 }, { "epoch": 0.56, "learning_rate": 0.0002753065670532739, "loss": 1.7337, "step": 7063 }, { "epoch": 0.56, "learning_rate": 0.00027529977277312463, "loss": 1.7393, "step": 7064 }, { "epoch": 0.56, "learning_rate": 0.00027529297764225904, "loss": 1.7359, "step": 7065 }, { "epoch": 0.56, "learning_rate": 0.0002752861816607233, "loss": 1.7072, "step": 7066 }, { "epoch": 0.56, "learning_rate": 0.0002752793848285635, "loss": 1.6722, "step": 7067 }, { "epoch": 0.56, "learning_rate": 0.00027527258714582584, "loss": 1.725, "step": 7068 }, { "epoch": 0.56, "learning_rate": 0.0002752657886125564, "loss": 1.6411, "step": 7069 }, { "epoch": 0.56, "learning_rate": 0.0002752589892288014, "loss": 1.7263, "step": 7070 }, { "epoch": 0.56, "learning_rate": 0.000275252188994607, "loss": 1.7484, "step": 7071 }, { "epoch": 0.56, "learning_rate": 0.0002752453879100194, "loss": 1.6115, "step": 7072 }, { "epoch": 0.56, "learning_rate": 0.00027523858597508467, "loss": 1.6346, "step": 7073 }, { "epoch": 0.56, "learning_rate": 0.0002752317831898491, "loss": 1.714, "step": 7074 }, { "epoch": 0.56, "learning_rate": 0.00027522497955435876, "loss": 1.7235, "step": 7075 }, { "epoch": 0.56, "learning_rate": 0.00027521817506866, "loss": 1.7166, "step": 7076 }, { "epoch": 0.56, "learning_rate": 0.0002752113697327989, "loss": 1.6951, "step": 7077 }, { "epoch": 0.56, "learning_rate": 0.00027520456354682165, "loss": 1.7324, "step": 7078 }, { "epoch": 0.56, "learning_rate": 0.0002751977565107745, "loss": 1.7113, "step": 7079 }, { "epoch": 0.56, "learning_rate": 0.00027519094862470377, "loss": 1.724, "step": 7080 }, { "epoch": 0.56, "learning_rate": 0.00027518413988865555, "loss": 1.7077, "step": 7081 }, { "epoch": 0.56, "learning_rate": 0.00027517733030267604, "loss": 1.7046, "step": 7082 }, { "epoch": 0.56, "learning_rate": 0.0002751705198668116, "loss": 1.7046, "step": 7083 }, { "epoch": 0.56, "learning_rate": 0.0002751637085811084, "loss": 1.7354, "step": 7084 }, { "epoch": 0.56, "learning_rate": 0.00027515689644561265, "loss": 1.6923, "step": 7085 }, { "epoch": 0.56, "learning_rate": 0.00027515008346037066, "loss": 1.6874, "step": 7086 }, { "epoch": 0.56, "learning_rate": 0.00027514326962542864, "loss": 1.6773, "step": 7087 }, { "epoch": 0.56, "learning_rate": 0.00027513645494083293, "loss": 1.6428, "step": 7088 }, { "epoch": 0.56, "learning_rate": 0.00027512963940662974, "loss": 1.6665, "step": 7089 }, { "epoch": 0.56, "learning_rate": 0.00027512282302286534, "loss": 1.7623, "step": 7090 }, { "epoch": 0.56, "learning_rate": 0.000275116005789586, "loss": 1.7122, "step": 7091 }, { "epoch": 0.56, "learning_rate": 0.000275109187706838, "loss": 1.7169, "step": 7092 }, { "epoch": 0.56, "learning_rate": 0.00027510236877466775, "loss": 1.6866, "step": 7093 }, { "epoch": 0.56, "learning_rate": 0.0002750955489931214, "loss": 1.6789, "step": 7094 }, { "epoch": 0.56, "learning_rate": 0.0002750887283622453, "loss": 1.7291, "step": 7095 }, { "epoch": 0.56, "learning_rate": 0.00027508190688208575, "loss": 1.6356, "step": 7096 }, { "epoch": 0.56, "learning_rate": 0.00027507508455268913, "loss": 1.6606, "step": 7097 }, { "epoch": 0.56, "learning_rate": 0.0002750682613741017, "loss": 1.7075, "step": 7098 }, { "epoch": 0.56, "learning_rate": 0.00027506143734636973, "loss": 1.7456, "step": 7099 }, { "epoch": 0.56, "learning_rate": 0.00027505461246953966, "loss": 1.7374, "step": 7100 }, { "epoch": 0.56, "learning_rate": 0.0002750477867436578, "loss": 1.7225, "step": 7101 }, { "epoch": 0.56, "learning_rate": 0.00027504096016877044, "loss": 1.7296, "step": 7102 }, { "epoch": 0.56, "learning_rate": 0.00027503413274492395, "loss": 1.7073, "step": 7103 }, { "epoch": 0.56, "learning_rate": 0.0002750273044721647, "loss": 1.727, "step": 7104 }, { "epoch": 0.56, "learning_rate": 0.0002750204753505391, "loss": 1.6974, "step": 7105 }, { "epoch": 0.56, "learning_rate": 0.00027501364538009345, "loss": 1.6792, "step": 7106 }, { "epoch": 0.56, "learning_rate": 0.0002750068145608741, "loss": 1.6584, "step": 7107 }, { "epoch": 0.56, "learning_rate": 0.00027499998289292753, "loss": 1.7238, "step": 7108 }, { "epoch": 0.56, "learning_rate": 0.0002749931503763, "loss": 1.696, "step": 7109 }, { "epoch": 0.56, "learning_rate": 0.000274986317011038, "loss": 1.7342, "step": 7110 }, { "epoch": 0.56, "learning_rate": 0.0002749794827971878, "loss": 1.6997, "step": 7111 }, { "epoch": 0.56, "learning_rate": 0.00027497264773479593, "loss": 1.7, "step": 7112 }, { "epoch": 0.56, "learning_rate": 0.0002749658118239088, "loss": 1.688, "step": 7113 }, { "epoch": 0.56, "learning_rate": 0.00027495897506457265, "loss": 1.7038, "step": 7114 }, { "epoch": 0.56, "learning_rate": 0.00027495213745683413, "loss": 1.7227, "step": 7115 }, { "epoch": 0.56, "learning_rate": 0.0002749452990007395, "loss": 1.7272, "step": 7116 }, { "epoch": 0.56, "learning_rate": 0.00027493845969633527, "loss": 1.6635, "step": 7117 }, { "epoch": 0.56, "learning_rate": 0.0002749316195436678, "loss": 1.6852, "step": 7118 }, { "epoch": 0.56, "learning_rate": 0.0002749247785427836, "loss": 1.7519, "step": 7119 }, { "epoch": 0.56, "learning_rate": 0.0002749179366937291, "loss": 1.6978, "step": 7120 }, { "epoch": 0.56, "learning_rate": 0.00027491109399655075, "loss": 1.7611, "step": 7121 }, { "epoch": 0.56, "learning_rate": 0.000274904250451295, "loss": 1.667, "step": 7122 }, { "epoch": 0.56, "learning_rate": 0.00027489740605800826, "loss": 1.7406, "step": 7123 }, { "epoch": 0.56, "learning_rate": 0.00027489056081673714, "loss": 1.7218, "step": 7124 }, { "epoch": 0.56, "learning_rate": 0.000274883714727528, "loss": 1.7536, "step": 7125 }, { "epoch": 0.56, "learning_rate": 0.0002748768677904273, "loss": 1.7492, "step": 7126 }, { "epoch": 0.56, "learning_rate": 0.0002748700200054817, "loss": 1.7163, "step": 7127 }, { "epoch": 0.56, "learning_rate": 0.0002748631713727375, "loss": 1.725, "step": 7128 }, { "epoch": 0.56, "learning_rate": 0.00027485632189224124, "loss": 1.6479, "step": 7129 }, { "epoch": 0.56, "learning_rate": 0.00027484947156403947, "loss": 1.6916, "step": 7130 }, { "epoch": 0.56, "learning_rate": 0.00027484262038817873, "loss": 1.7334, "step": 7131 }, { "epoch": 0.56, "learning_rate": 0.0002748357683647055, "loss": 1.6743, "step": 7132 }, { "epoch": 0.56, "learning_rate": 0.00027482891549366625, "loss": 1.7078, "step": 7133 }, { "epoch": 0.56, "learning_rate": 0.0002748220617751076, "loss": 1.6987, "step": 7134 }, { "epoch": 0.56, "learning_rate": 0.00027481520720907594, "loss": 1.7193, "step": 7135 }, { "epoch": 0.56, "learning_rate": 0.000274808351795618, "loss": 1.6678, "step": 7136 }, { "epoch": 0.56, "learning_rate": 0.0002748014955347802, "loss": 1.7213, "step": 7137 }, { "epoch": 0.56, "learning_rate": 0.000274794638426609, "loss": 1.6856, "step": 7138 }, { "epoch": 0.56, "learning_rate": 0.0002747877804711512, "loss": 1.7042, "step": 7139 }, { "epoch": 0.56, "learning_rate": 0.0002747809216684532, "loss": 1.6896, "step": 7140 }, { "epoch": 0.56, "learning_rate": 0.00027477406201856165, "loss": 1.6152, "step": 7141 }, { "epoch": 0.56, "learning_rate": 0.00027476720152152303, "loss": 1.7573, "step": 7142 }, { "epoch": 0.56, "learning_rate": 0.00027476034017738396, "loss": 1.6789, "step": 7143 }, { "epoch": 0.56, "learning_rate": 0.000274753477986191, "loss": 1.7242, "step": 7144 }, { "epoch": 0.56, "learning_rate": 0.0002747466149479909, "loss": 1.7252, "step": 7145 }, { "epoch": 0.56, "learning_rate": 0.00027473975106282996, "loss": 1.6718, "step": 7146 }, { "epoch": 0.56, "learning_rate": 0.000274732886330755, "loss": 1.6937, "step": 7147 }, { "epoch": 0.56, "learning_rate": 0.0002747260207518126, "loss": 1.7351, "step": 7148 }, { "epoch": 0.56, "learning_rate": 0.0002747191543260494, "loss": 1.7141, "step": 7149 }, { "epoch": 0.56, "learning_rate": 0.00027471228705351186, "loss": 1.7058, "step": 7150 }, { "epoch": 0.56, "learning_rate": 0.00027470541893424676, "loss": 1.746, "step": 7151 }, { "epoch": 0.56, "learning_rate": 0.0002746985499683007, "loss": 1.7033, "step": 7152 }, { "epoch": 0.56, "learning_rate": 0.0002746916801557203, "loss": 1.7098, "step": 7153 }, { "epoch": 0.56, "learning_rate": 0.0002746848094965522, "loss": 1.7052, "step": 7154 }, { "epoch": 0.56, "learning_rate": 0.000274677937990843, "loss": 1.7307, "step": 7155 }, { "epoch": 0.56, "learning_rate": 0.0002746710656386395, "loss": 1.7294, "step": 7156 }, { "epoch": 0.56, "learning_rate": 0.00027466419243998814, "loss": 1.7069, "step": 7157 }, { "epoch": 0.56, "learning_rate": 0.0002746573183949358, "loss": 1.7524, "step": 7158 }, { "epoch": 0.56, "learning_rate": 0.000274650443503529, "loss": 1.7312, "step": 7159 }, { "epoch": 0.56, "learning_rate": 0.00027464356776581454, "loss": 1.7324, "step": 7160 }, { "epoch": 0.56, "learning_rate": 0.000274636691181839, "loss": 1.6611, "step": 7161 }, { "epoch": 0.56, "learning_rate": 0.00027462981375164916, "loss": 1.662, "step": 7162 }, { "epoch": 0.56, "learning_rate": 0.0002746229354752916, "loss": 1.7474, "step": 7163 }, { "epoch": 0.56, "learning_rate": 0.0002746160563528131, "loss": 1.7362, "step": 7164 }, { "epoch": 0.56, "learning_rate": 0.0002746091763842603, "loss": 1.6331, "step": 7165 }, { "epoch": 0.56, "learning_rate": 0.00027460229556968004, "loss": 1.7027, "step": 7166 }, { "epoch": 0.56, "learning_rate": 0.00027459541390911893, "loss": 1.7335, "step": 7167 }, { "epoch": 0.56, "learning_rate": 0.00027458853140262365, "loss": 1.6725, "step": 7168 }, { "epoch": 0.56, "learning_rate": 0.00027458164805024105, "loss": 1.702, "step": 7169 }, { "epoch": 0.56, "learning_rate": 0.00027457476385201786, "loss": 1.7045, "step": 7170 }, { "epoch": 0.56, "learning_rate": 0.0002745678788080007, "loss": 1.6392, "step": 7171 }, { "epoch": 0.56, "learning_rate": 0.00027456099291823643, "loss": 1.716, "step": 7172 }, { "epoch": 0.56, "learning_rate": 0.0002745541061827717, "loss": 1.6506, "step": 7173 }, { "epoch": 0.56, "learning_rate": 0.00027454721860165337, "loss": 1.6424, "step": 7174 }, { "epoch": 0.56, "learning_rate": 0.0002745403301749281, "loss": 1.6725, "step": 7175 }, { "epoch": 0.56, "learning_rate": 0.0002745334409026428, "loss": 1.691, "step": 7176 }, { "epoch": 0.56, "learning_rate": 0.0002745265507848441, "loss": 1.6637, "step": 7177 }, { "epoch": 0.56, "learning_rate": 0.0002745196598215788, "loss": 1.6703, "step": 7178 }, { "epoch": 0.56, "learning_rate": 0.0002745127680128938, "loss": 1.7103, "step": 7179 }, { "epoch": 0.56, "learning_rate": 0.00027450587535883585, "loss": 1.7012, "step": 7180 }, { "epoch": 0.57, "learning_rate": 0.0002744989818594516, "loss": 1.7088, "step": 7181 }, { "epoch": 0.57, "learning_rate": 0.00027449208751478805, "loss": 1.7116, "step": 7182 }, { "epoch": 0.57, "learning_rate": 0.0002744851923248919, "loss": 1.751, "step": 7183 }, { "epoch": 0.57, "learning_rate": 0.00027447829628981, "loss": 1.7358, "step": 7184 }, { "epoch": 0.57, "learning_rate": 0.00027447139940958915, "loss": 1.688, "step": 7185 }, { "epoch": 0.57, "learning_rate": 0.0002744645016842762, "loss": 1.6977, "step": 7186 }, { "epoch": 0.57, "learning_rate": 0.000274457603113918, "loss": 1.7358, "step": 7187 }, { "epoch": 0.57, "learning_rate": 0.00027445070369856126, "loss": 1.6731, "step": 7188 }, { "epoch": 0.57, "learning_rate": 0.000274443803438253, "loss": 1.7612, "step": 7189 }, { "epoch": 0.57, "learning_rate": 0.00027443690233303997, "loss": 1.7282, "step": 7190 }, { "epoch": 0.57, "learning_rate": 0.00027443000038296903, "loss": 1.7321, "step": 7191 }, { "epoch": 0.57, "learning_rate": 0.0002744230975880871, "loss": 1.6646, "step": 7192 }, { "epoch": 0.57, "learning_rate": 0.00027441619394844095, "loss": 1.7344, "step": 7193 }, { "epoch": 0.57, "learning_rate": 0.00027440928946407747, "loss": 1.7433, "step": 7194 }, { "epoch": 0.57, "learning_rate": 0.00027440238413504363, "loss": 1.6871, "step": 7195 }, { "epoch": 0.57, "learning_rate": 0.0002743954779613862, "loss": 1.7465, "step": 7196 }, { "epoch": 0.57, "learning_rate": 0.0002743885709431522, "loss": 1.7622, "step": 7197 }, { "epoch": 0.57, "learning_rate": 0.0002743816630803884, "loss": 1.7202, "step": 7198 }, { "epoch": 0.57, "learning_rate": 0.0002743747543731417, "loss": 1.706, "step": 7199 }, { "epoch": 0.57, "learning_rate": 0.0002743678448214592, "loss": 1.6755, "step": 7200 }, { "epoch": 0.57, "learning_rate": 0.0002743609344253875, "loss": 1.743, "step": 7201 }, { "epoch": 0.57, "learning_rate": 0.0002743540231849738, "loss": 1.6447, "step": 7202 }, { "epoch": 0.57, "learning_rate": 0.0002743471111002648, "loss": 1.7041, "step": 7203 }, { "epoch": 0.57, "learning_rate": 0.00027434019817130763, "loss": 1.6975, "step": 7204 }, { "epoch": 0.57, "learning_rate": 0.0002743332843981491, "loss": 1.6761, "step": 7205 }, { "epoch": 0.57, "learning_rate": 0.0002743263697808362, "loss": 1.6906, "step": 7206 }, { "epoch": 0.57, "learning_rate": 0.00027431945431941583, "loss": 1.7098, "step": 7207 }, { "epoch": 0.57, "learning_rate": 0.00027431253801393497, "loss": 1.7379, "step": 7208 }, { "epoch": 0.57, "learning_rate": 0.00027430562086444056, "loss": 1.7465, "step": 7209 }, { "epoch": 0.57, "learning_rate": 0.0002742987028709796, "loss": 1.7137, "step": 7210 }, { "epoch": 0.57, "learning_rate": 0.0002742917840335991, "loss": 1.6391, "step": 7211 }, { "epoch": 0.57, "learning_rate": 0.0002742848643523459, "loss": 1.6919, "step": 7212 }, { "epoch": 0.57, "learning_rate": 0.00027427794382726706, "loss": 1.7165, "step": 7213 }, { "epoch": 0.57, "learning_rate": 0.0002742710224584096, "loss": 1.6913, "step": 7214 }, { "epoch": 0.57, "learning_rate": 0.00027426410024582046, "loss": 1.7072, "step": 7215 }, { "epoch": 0.57, "learning_rate": 0.00027425717718954665, "loss": 1.7079, "step": 7216 }, { "epoch": 0.57, "learning_rate": 0.0002742502532896352, "loss": 1.7005, "step": 7217 }, { "epoch": 0.57, "learning_rate": 0.0002742433285461331, "loss": 1.7091, "step": 7218 }, { "epoch": 0.57, "learning_rate": 0.00027423640295908734, "loss": 1.6715, "step": 7219 }, { "epoch": 0.57, "learning_rate": 0.00027422947652854494, "loss": 1.6733, "step": 7220 }, { "epoch": 0.57, "learning_rate": 0.000274222549254553, "loss": 1.6844, "step": 7221 }, { "epoch": 0.57, "learning_rate": 0.0002742156211371585, "loss": 1.6926, "step": 7222 }, { "epoch": 0.57, "learning_rate": 0.00027420869217640844, "loss": 1.7072, "step": 7223 }, { "epoch": 0.57, "learning_rate": 0.0002742017623723499, "loss": 1.6361, "step": 7224 }, { "epoch": 0.57, "learning_rate": 0.00027419483172502995, "loss": 1.6924, "step": 7225 }, { "epoch": 0.57, "learning_rate": 0.0002741879002344957, "loss": 1.737, "step": 7226 }, { "epoch": 0.57, "learning_rate": 0.000274180967900794, "loss": 1.6845, "step": 7227 }, { "epoch": 0.57, "learning_rate": 0.00027417403472397215, "loss": 1.7363, "step": 7228 }, { "epoch": 0.57, "learning_rate": 0.0002741671007040771, "loss": 1.649, "step": 7229 }, { "epoch": 0.57, "learning_rate": 0.000274160165841156, "loss": 1.7558, "step": 7230 }, { "epoch": 0.57, "learning_rate": 0.00027415323013525587, "loss": 1.7086, "step": 7231 }, { "epoch": 0.57, "learning_rate": 0.0002741462935864238, "loss": 1.7699, "step": 7232 }, { "epoch": 0.57, "learning_rate": 0.0002741393561947069, "loss": 1.681, "step": 7233 }, { "epoch": 0.57, "learning_rate": 0.0002741324179601523, "loss": 1.6729, "step": 7234 }, { "epoch": 0.57, "learning_rate": 0.00027412547888280706, "loss": 1.6764, "step": 7235 }, { "epoch": 0.57, "learning_rate": 0.0002741185389627183, "loss": 1.6911, "step": 7236 }, { "epoch": 0.57, "learning_rate": 0.0002741115981999332, "loss": 1.7415, "step": 7237 }, { "epoch": 0.57, "learning_rate": 0.0002741046565944989, "loss": 1.694, "step": 7238 }, { "epoch": 0.57, "learning_rate": 0.0002740977141464624, "loss": 1.6839, "step": 7239 }, { "epoch": 0.57, "learning_rate": 0.0002740907708558709, "loss": 1.694, "step": 7240 }, { "epoch": 0.57, "learning_rate": 0.0002740838267227715, "loss": 1.6872, "step": 7241 }, { "epoch": 0.57, "learning_rate": 0.00027407688174721143, "loss": 1.6714, "step": 7242 }, { "epoch": 0.57, "learning_rate": 0.0002740699359292378, "loss": 1.7636, "step": 7243 }, { "epoch": 0.57, "learning_rate": 0.0002740629892688978, "loss": 1.7375, "step": 7244 }, { "epoch": 0.57, "learning_rate": 0.00027405604176623853, "loss": 1.7212, "step": 7245 }, { "epoch": 0.57, "learning_rate": 0.00027404909342130726, "loss": 1.6814, "step": 7246 }, { "epoch": 0.57, "learning_rate": 0.00027404214423415105, "loss": 1.7453, "step": 7247 }, { "epoch": 0.57, "learning_rate": 0.0002740351942048171, "loss": 1.6563, "step": 7248 }, { "epoch": 0.57, "learning_rate": 0.0002740282433333527, "loss": 1.7289, "step": 7249 }, { "epoch": 0.57, "learning_rate": 0.00027402129161980496, "loss": 1.6788, "step": 7250 }, { "epoch": 0.57, "learning_rate": 0.00027401433906422103, "loss": 1.6721, "step": 7251 }, { "epoch": 0.57, "learning_rate": 0.00027400738566664824, "loss": 1.6991, "step": 7252 }, { "epoch": 0.57, "learning_rate": 0.0002740004314271337, "loss": 1.7167, "step": 7253 }, { "epoch": 0.57, "learning_rate": 0.0002739934763457247, "loss": 1.708, "step": 7254 }, { "epoch": 0.57, "learning_rate": 0.00027398652042246835, "loss": 1.6674, "step": 7255 }, { "epoch": 0.57, "learning_rate": 0.00027397956365741196, "loss": 1.6944, "step": 7256 }, { "epoch": 0.57, "learning_rate": 0.0002739726060506028, "loss": 1.6932, "step": 7257 }, { "epoch": 0.57, "learning_rate": 0.00027396564760208804, "loss": 1.6736, "step": 7258 }, { "epoch": 0.57, "learning_rate": 0.000273958688311915, "loss": 1.692, "step": 7259 }, { "epoch": 0.57, "learning_rate": 0.00027395172818013076, "loss": 1.6457, "step": 7260 }, { "epoch": 0.57, "learning_rate": 0.0002739447672067828, "loss": 1.6636, "step": 7261 }, { "epoch": 0.57, "learning_rate": 0.00027393780539191817, "loss": 1.6826, "step": 7262 }, { "epoch": 0.57, "learning_rate": 0.0002739308427355843, "loss": 1.7193, "step": 7263 }, { "epoch": 0.57, "learning_rate": 0.00027392387923782835, "loss": 1.6984, "step": 7264 }, { "epoch": 0.57, "learning_rate": 0.0002739169148986977, "loss": 1.6863, "step": 7265 }, { "epoch": 0.57, "learning_rate": 0.0002739099497182395, "loss": 1.7484, "step": 7266 }, { "epoch": 0.57, "learning_rate": 0.0002739029836965012, "loss": 1.7186, "step": 7267 }, { "epoch": 0.57, "learning_rate": 0.00027389601683353, "loss": 1.7261, "step": 7268 }, { "epoch": 0.57, "learning_rate": 0.00027388904912937324, "loss": 1.7251, "step": 7269 }, { "epoch": 0.57, "learning_rate": 0.0002738820805840781, "loss": 1.6625, "step": 7270 }, { "epoch": 0.57, "learning_rate": 0.0002738751111976921, "loss": 1.645, "step": 7271 }, { "epoch": 0.57, "learning_rate": 0.0002738681409702624, "loss": 1.6945, "step": 7272 }, { "epoch": 0.57, "learning_rate": 0.0002738611699018364, "loss": 1.6807, "step": 7273 }, { "epoch": 0.57, "learning_rate": 0.0002738541979924614, "loss": 1.7028, "step": 7274 }, { "epoch": 0.57, "learning_rate": 0.0002738472252421848, "loss": 1.7183, "step": 7275 }, { "epoch": 0.57, "learning_rate": 0.0002738402516510538, "loss": 1.6715, "step": 7276 }, { "epoch": 0.57, "learning_rate": 0.0002738332772191159, "loss": 1.6736, "step": 7277 }, { "epoch": 0.57, "learning_rate": 0.00027382630194641835, "loss": 1.6983, "step": 7278 }, { "epoch": 0.57, "learning_rate": 0.00027381932583300854, "loss": 1.7309, "step": 7279 }, { "epoch": 0.57, "learning_rate": 0.00027381234887893384, "loss": 1.6717, "step": 7280 }, { "epoch": 0.57, "learning_rate": 0.00027380537108424163, "loss": 1.6581, "step": 7281 }, { "epoch": 0.57, "learning_rate": 0.00027379839244897925, "loss": 1.6988, "step": 7282 }, { "epoch": 0.57, "learning_rate": 0.0002737914129731941, "loss": 1.7154, "step": 7283 }, { "epoch": 0.57, "learning_rate": 0.0002737844326569336, "loss": 1.656, "step": 7284 }, { "epoch": 0.57, "learning_rate": 0.00027377745150024513, "loss": 1.6587, "step": 7285 }, { "epoch": 0.57, "learning_rate": 0.000273770469503176, "loss": 1.7215, "step": 7286 }, { "epoch": 0.57, "learning_rate": 0.0002737634866657737, "loss": 1.7035, "step": 7287 }, { "epoch": 0.57, "learning_rate": 0.0002737565029880857, "loss": 1.7507, "step": 7288 }, { "epoch": 0.57, "learning_rate": 0.00027374951847015927, "loss": 1.6739, "step": 7289 }, { "epoch": 0.57, "learning_rate": 0.0002737425331120419, "loss": 1.7164, "step": 7290 }, { "epoch": 0.57, "learning_rate": 0.000273735546913781, "loss": 1.7387, "step": 7291 }, { "epoch": 0.57, "learning_rate": 0.00027372855987542406, "loss": 1.6993, "step": 7292 }, { "epoch": 0.57, "learning_rate": 0.0002737215719970185, "loss": 1.6979, "step": 7293 }, { "epoch": 0.57, "learning_rate": 0.0002737145832786117, "loss": 1.6798, "step": 7294 }, { "epoch": 0.57, "learning_rate": 0.00027370759372025117, "loss": 1.6757, "step": 7295 }, { "epoch": 0.57, "learning_rate": 0.00027370060332198437, "loss": 1.6954, "step": 7296 }, { "epoch": 0.57, "learning_rate": 0.0002736936120838587, "loss": 1.7194, "step": 7297 }, { "epoch": 0.57, "learning_rate": 0.00027368662000592164, "loss": 1.7211, "step": 7298 }, { "epoch": 0.57, "learning_rate": 0.00027367962708822074, "loss": 1.6754, "step": 7299 }, { "epoch": 0.57, "learning_rate": 0.00027367263333080336, "loss": 1.6892, "step": 7300 }, { "epoch": 0.57, "learning_rate": 0.0002736656387337171, "loss": 1.7016, "step": 7301 }, { "epoch": 0.57, "learning_rate": 0.0002736586432970094, "loss": 1.7017, "step": 7302 }, { "epoch": 0.57, "learning_rate": 0.00027365164702072777, "loss": 1.6597, "step": 7303 }, { "epoch": 0.57, "learning_rate": 0.0002736446499049196, "loss": 1.7208, "step": 7304 }, { "epoch": 0.57, "learning_rate": 0.00027363765194963254, "loss": 1.7203, "step": 7305 }, { "epoch": 0.57, "learning_rate": 0.00027363065315491413, "loss": 1.6773, "step": 7306 }, { "epoch": 0.57, "learning_rate": 0.0002736236535208117, "loss": 1.756, "step": 7307 }, { "epoch": 0.58, "learning_rate": 0.0002736166530473729, "loss": 1.7135, "step": 7308 }, { "epoch": 0.58, "learning_rate": 0.00027360965173464527, "loss": 1.7484, "step": 7309 }, { "epoch": 0.58, "learning_rate": 0.00027360264958267635, "loss": 1.7042, "step": 7310 }, { "epoch": 0.58, "learning_rate": 0.00027359564659151363, "loss": 1.6986, "step": 7311 }, { "epoch": 0.58, "learning_rate": 0.0002735886427612046, "loss": 1.6595, "step": 7312 }, { "epoch": 0.58, "learning_rate": 0.000273581638091797, "loss": 1.6817, "step": 7313 }, { "epoch": 0.58, "learning_rate": 0.0002735746325833382, "loss": 1.6621, "step": 7314 }, { "epoch": 0.58, "learning_rate": 0.0002735676262358759, "loss": 1.7131, "step": 7315 }, { "epoch": 0.58, "learning_rate": 0.00027356061904945753, "loss": 1.6775, "step": 7316 }, { "epoch": 0.58, "learning_rate": 0.0002735536110241308, "loss": 1.633, "step": 7317 }, { "epoch": 0.58, "learning_rate": 0.0002735466021599432, "loss": 1.6893, "step": 7318 }, { "epoch": 0.58, "learning_rate": 0.0002735395924569424, "loss": 1.6531, "step": 7319 }, { "epoch": 0.58, "learning_rate": 0.00027353258191517587, "loss": 1.7092, "step": 7320 }, { "epoch": 0.58, "learning_rate": 0.00027352557053469137, "loss": 1.7188, "step": 7321 }, { "epoch": 0.58, "learning_rate": 0.0002735185583155364, "loss": 1.6959, "step": 7322 }, { "epoch": 0.58, "learning_rate": 0.0002735115452577585, "loss": 1.7081, "step": 7323 }, { "epoch": 0.58, "learning_rate": 0.0002735045313614054, "loss": 1.7294, "step": 7324 }, { "epoch": 0.58, "learning_rate": 0.0002734975166265247, "loss": 1.6498, "step": 7325 }, { "epoch": 0.58, "learning_rate": 0.000273490501053164, "loss": 1.7136, "step": 7326 }, { "epoch": 0.58, "learning_rate": 0.00027348348464137096, "loss": 1.6797, "step": 7327 }, { "epoch": 0.58, "learning_rate": 0.0002734764673911932, "loss": 1.6597, "step": 7328 }, { "epoch": 0.58, "learning_rate": 0.0002734694493026784, "loss": 1.6858, "step": 7329 }, { "epoch": 0.58, "learning_rate": 0.00027346243037587413, "loss": 1.6957, "step": 7330 }, { "epoch": 0.58, "learning_rate": 0.0002734554106108281, "loss": 1.707, "step": 7331 }, { "epoch": 0.58, "learning_rate": 0.000273448390007588, "loss": 1.6612, "step": 7332 }, { "epoch": 0.58, "learning_rate": 0.00027344136856620135, "loss": 1.6894, "step": 7333 }, { "epoch": 0.58, "learning_rate": 0.000273434346286716, "loss": 1.7276, "step": 7334 }, { "epoch": 0.58, "learning_rate": 0.0002734273231691796, "loss": 1.7069, "step": 7335 }, { "epoch": 0.58, "learning_rate": 0.0002734202992136397, "loss": 1.6988, "step": 7336 }, { "epoch": 0.58, "learning_rate": 0.0002734132744201441, "loss": 1.7179, "step": 7337 }, { "epoch": 0.58, "learning_rate": 0.00027340624878874055, "loss": 1.6774, "step": 7338 }, { "epoch": 0.58, "learning_rate": 0.0002733992223194766, "loss": 1.7101, "step": 7339 }, { "epoch": 0.58, "learning_rate": 0.0002733921950124, "loss": 1.6655, "step": 7340 }, { "epoch": 0.58, "learning_rate": 0.0002733851668675586, "loss": 1.7331, "step": 7341 }, { "epoch": 0.58, "learning_rate": 0.0002733781378849999, "loss": 1.6466, "step": 7342 }, { "epoch": 0.58, "learning_rate": 0.00027337110806477177, "loss": 1.6617, "step": 7343 }, { "epoch": 0.58, "learning_rate": 0.00027336407740692186, "loss": 1.7116, "step": 7344 }, { "epoch": 0.58, "learning_rate": 0.00027335704591149797, "loss": 1.6811, "step": 7345 }, { "epoch": 0.58, "learning_rate": 0.00027335001357854785, "loss": 1.6613, "step": 7346 }, { "epoch": 0.58, "learning_rate": 0.00027334298040811915, "loss": 1.7293, "step": 7347 }, { "epoch": 0.58, "learning_rate": 0.0002733359464002597, "loss": 1.706, "step": 7348 }, { "epoch": 0.58, "learning_rate": 0.00027332891155501727, "loss": 1.7406, "step": 7349 }, { "epoch": 0.58, "learning_rate": 0.00027332187587243955, "loss": 1.6606, "step": 7350 }, { "epoch": 0.58, "learning_rate": 0.0002733148393525744, "loss": 1.6678, "step": 7351 }, { "epoch": 0.58, "learning_rate": 0.00027330780199546947, "loss": 1.6643, "step": 7352 }, { "epoch": 0.58, "learning_rate": 0.0002733007638011726, "loss": 1.6802, "step": 7353 }, { "epoch": 0.58, "learning_rate": 0.00027329372476973167, "loss": 1.7152, "step": 7354 }, { "epoch": 0.58, "learning_rate": 0.0002732866849011944, "loss": 1.6373, "step": 7355 }, { "epoch": 0.58, "learning_rate": 0.00027327964419560845, "loss": 1.7166, "step": 7356 }, { "epoch": 0.58, "learning_rate": 0.0002732726026530218, "loss": 1.7315, "step": 7357 }, { "epoch": 0.58, "learning_rate": 0.00027326556027348225, "loss": 1.6591, "step": 7358 }, { "epoch": 0.58, "learning_rate": 0.00027325851705703756, "loss": 1.7136, "step": 7359 }, { "epoch": 0.58, "learning_rate": 0.00027325147300373553, "loss": 1.7133, "step": 7360 }, { "epoch": 0.58, "learning_rate": 0.00027324442811362405, "loss": 1.6686, "step": 7361 }, { "epoch": 0.58, "learning_rate": 0.00027323738238675086, "loss": 1.6545, "step": 7362 }, { "epoch": 0.58, "learning_rate": 0.0002732303358231639, "loss": 1.668, "step": 7363 }, { "epoch": 0.58, "learning_rate": 0.00027322328842291094, "loss": 1.7098, "step": 7364 }, { "epoch": 0.58, "learning_rate": 0.00027321624018603985, "loss": 1.678, "step": 7365 }, { "epoch": 0.58, "learning_rate": 0.0002732091911125985, "loss": 1.7293, "step": 7366 }, { "epoch": 0.58, "learning_rate": 0.0002732021412026347, "loss": 1.6602, "step": 7367 }, { "epoch": 0.58, "learning_rate": 0.0002731950904561964, "loss": 1.6711, "step": 7368 }, { "epoch": 0.58, "learning_rate": 0.0002731880388733314, "loss": 1.6574, "step": 7369 }, { "epoch": 0.58, "learning_rate": 0.0002731809864540876, "loss": 1.667, "step": 7370 }, { "epoch": 0.58, "learning_rate": 0.00027317393319851286, "loss": 1.6663, "step": 7371 }, { "epoch": 0.58, "learning_rate": 0.0002731668791066551, "loss": 1.7467, "step": 7372 }, { "epoch": 0.58, "learning_rate": 0.00027315982417856224, "loss": 1.7269, "step": 7373 }, { "epoch": 0.58, "learning_rate": 0.0002731527684142821, "loss": 1.7135, "step": 7374 }, { "epoch": 0.58, "learning_rate": 0.0002731457118138626, "loss": 1.7304, "step": 7375 }, { "epoch": 0.58, "learning_rate": 0.0002731386543773517, "loss": 1.6677, "step": 7376 }, { "epoch": 0.58, "learning_rate": 0.0002731315961047973, "loss": 1.6231, "step": 7377 }, { "epoch": 0.58, "learning_rate": 0.0002731245369962473, "loss": 1.6929, "step": 7378 }, { "epoch": 0.58, "learning_rate": 0.00027311747705174963, "loss": 1.7472, "step": 7379 }, { "epoch": 0.58, "learning_rate": 0.00027311041627135226, "loss": 1.7249, "step": 7380 }, { "epoch": 0.58, "learning_rate": 0.00027310335465510305, "loss": 1.6644, "step": 7381 }, { "epoch": 0.58, "learning_rate": 0.00027309629220305, "loss": 1.6636, "step": 7382 }, { "epoch": 0.58, "learning_rate": 0.0002730892289152411, "loss": 1.6641, "step": 7383 }, { "epoch": 0.58, "learning_rate": 0.0002730821647917243, "loss": 1.6093, "step": 7384 }, { "epoch": 0.58, "learning_rate": 0.00027307509983254746, "loss": 1.6596, "step": 7385 }, { "epoch": 0.58, "learning_rate": 0.0002730680340377586, "loss": 1.6534, "step": 7386 }, { "epoch": 0.58, "learning_rate": 0.00027306096740740575, "loss": 1.6771, "step": 7387 }, { "epoch": 0.58, "learning_rate": 0.0002730538999415368, "loss": 1.7429, "step": 7388 }, { "epoch": 0.58, "learning_rate": 0.0002730468316401998, "loss": 1.6808, "step": 7389 }, { "epoch": 0.58, "learning_rate": 0.00027303976250344275, "loss": 1.7538, "step": 7390 }, { "epoch": 0.58, "learning_rate": 0.00027303269253131353, "loss": 1.73, "step": 7391 }, { "epoch": 0.58, "learning_rate": 0.00027302562172386026, "loss": 1.7462, "step": 7392 }, { "epoch": 0.58, "learning_rate": 0.0002730185500811309, "loss": 1.7653, "step": 7393 }, { "epoch": 0.58, "learning_rate": 0.0002730114776031735, "loss": 1.697, "step": 7394 }, { "epoch": 0.58, "learning_rate": 0.00027300440429003605, "loss": 1.7309, "step": 7395 }, { "epoch": 0.58, "learning_rate": 0.00027299733014176655, "loss": 1.7191, "step": 7396 }, { "epoch": 0.58, "learning_rate": 0.00027299025515841303, "loss": 1.7404, "step": 7397 }, { "epoch": 0.58, "learning_rate": 0.0002729831793400236, "loss": 1.7365, "step": 7398 }, { "epoch": 0.58, "learning_rate": 0.00027297610268664627, "loss": 1.648, "step": 7399 }, { "epoch": 0.58, "learning_rate": 0.000272969025198329, "loss": 1.6472, "step": 7400 }, { "epoch": 0.58, "learning_rate": 0.00027296194687511993, "loss": 1.7005, "step": 7401 }, { "epoch": 0.58, "learning_rate": 0.0002729548677170671, "loss": 1.7607, "step": 7402 }, { "epoch": 0.58, "learning_rate": 0.0002729477877242186, "loss": 1.6589, "step": 7403 }, { "epoch": 0.58, "learning_rate": 0.00027294070689662245, "loss": 1.7632, "step": 7404 }, { "epoch": 0.58, "learning_rate": 0.00027293362523432677, "loss": 1.6916, "step": 7405 }, { "epoch": 0.58, "learning_rate": 0.00027292654273737956, "loss": 1.7092, "step": 7406 }, { "epoch": 0.58, "learning_rate": 0.000272919459405829, "loss": 1.7189, "step": 7407 }, { "epoch": 0.58, "learning_rate": 0.00027291237523972313, "loss": 1.6406, "step": 7408 }, { "epoch": 0.58, "learning_rate": 0.00027290529023911, "loss": 1.6986, "step": 7409 }, { "epoch": 0.58, "learning_rate": 0.0002728982044040379, "loss": 1.6349, "step": 7410 }, { "epoch": 0.58, "learning_rate": 0.00027289111773455473, "loss": 1.6958, "step": 7411 }, { "epoch": 0.58, "learning_rate": 0.0002728840302307087, "loss": 1.7451, "step": 7412 }, { "epoch": 0.58, "learning_rate": 0.0002728769418925479, "loss": 1.7363, "step": 7413 }, { "epoch": 0.58, "learning_rate": 0.0002728698527201205, "loss": 1.7257, "step": 7414 }, { "epoch": 0.58, "learning_rate": 0.00027286276271347464, "loss": 1.6821, "step": 7415 }, { "epoch": 0.58, "learning_rate": 0.0002728556718726584, "loss": 1.7299, "step": 7416 }, { "epoch": 0.58, "learning_rate": 0.0002728485801977199, "loss": 1.6805, "step": 7417 }, { "epoch": 0.58, "learning_rate": 0.0002728414876887073, "loss": 1.7392, "step": 7418 }, { "epoch": 0.58, "learning_rate": 0.0002728343943456689, "loss": 1.7125, "step": 7419 }, { "epoch": 0.58, "learning_rate": 0.0002728273001686527, "loss": 1.693, "step": 7420 }, { "epoch": 0.58, "learning_rate": 0.0002728202051577069, "loss": 1.7288, "step": 7421 }, { "epoch": 0.58, "learning_rate": 0.0002728131093128797, "loss": 1.7333, "step": 7422 }, { "epoch": 0.58, "learning_rate": 0.0002728060126342193, "loss": 1.659, "step": 7423 }, { "epoch": 0.58, "learning_rate": 0.0002727989151217738, "loss": 1.6812, "step": 7424 }, { "epoch": 0.58, "learning_rate": 0.0002727918167755914, "loss": 1.6266, "step": 7425 }, { "epoch": 0.58, "learning_rate": 0.0002727847175957204, "loss": 1.7365, "step": 7426 }, { "epoch": 0.58, "learning_rate": 0.0002727776175822089, "loss": 1.6815, "step": 7427 }, { "epoch": 0.58, "learning_rate": 0.0002727705167351051, "loss": 1.6792, "step": 7428 }, { "epoch": 0.58, "learning_rate": 0.00027276341505445725, "loss": 1.6886, "step": 7429 }, { "epoch": 0.58, "learning_rate": 0.00027275631254031354, "loss": 1.6489, "step": 7430 }, { "epoch": 0.58, "learning_rate": 0.00027274920919272225, "loss": 1.6632, "step": 7431 }, { "epoch": 0.58, "learning_rate": 0.0002727421050117316, "loss": 1.6688, "step": 7432 }, { "epoch": 0.58, "learning_rate": 0.0002727349999973897, "loss": 1.726, "step": 7433 }, { "epoch": 0.58, "learning_rate": 0.0002727278941497449, "loss": 1.6739, "step": 7434 }, { "epoch": 0.58, "learning_rate": 0.0002727207874688455, "loss": 1.7166, "step": 7435 }, { "epoch": 0.59, "learning_rate": 0.0002727136799547396, "loss": 1.6968, "step": 7436 }, { "epoch": 0.59, "learning_rate": 0.0002727065716074756, "loss": 1.7008, "step": 7437 }, { "epoch": 0.59, "learning_rate": 0.00027269946242710166, "loss": 1.7715, "step": 7438 }, { "epoch": 0.59, "learning_rate": 0.00027269235241366606, "loss": 1.7009, "step": 7439 }, { "epoch": 0.59, "learning_rate": 0.0002726852415672171, "loss": 1.6875, "step": 7440 }, { "epoch": 0.59, "learning_rate": 0.0002726781298878031, "loss": 1.6621, "step": 7441 }, { "epoch": 0.59, "learning_rate": 0.00027267101737547226, "loss": 1.747, "step": 7442 }, { "epoch": 0.59, "learning_rate": 0.0002726639040302729, "loss": 1.6621, "step": 7443 }, { "epoch": 0.59, "learning_rate": 0.00027265678985225334, "loss": 1.6542, "step": 7444 }, { "epoch": 0.59, "learning_rate": 0.0002726496748414618, "loss": 1.6746, "step": 7445 }, { "epoch": 0.59, "learning_rate": 0.00027264255899794675, "loss": 1.72, "step": 7446 }, { "epoch": 0.59, "learning_rate": 0.0002726354423217564, "loss": 1.6879, "step": 7447 }, { "epoch": 0.59, "learning_rate": 0.000272628324812939, "loss": 1.6036, "step": 7448 }, { "epoch": 0.59, "learning_rate": 0.000272621206471543, "loss": 1.6652, "step": 7449 }, { "epoch": 0.59, "learning_rate": 0.00027261408729761663, "loss": 1.6986, "step": 7450 }, { "epoch": 0.59, "learning_rate": 0.00027260696729120834, "loss": 1.6844, "step": 7451 }, { "epoch": 0.59, "learning_rate": 0.0002725998464523663, "loss": 1.6611, "step": 7452 }, { "epoch": 0.59, "learning_rate": 0.00027259272478113907, "loss": 1.689, "step": 7453 }, { "epoch": 0.59, "learning_rate": 0.00027258560227757487, "loss": 1.709, "step": 7454 }, { "epoch": 0.59, "learning_rate": 0.00027257847894172205, "loss": 1.7184, "step": 7455 }, { "epoch": 0.59, "learning_rate": 0.000272571354773629, "loss": 1.677, "step": 7456 }, { "epoch": 0.59, "learning_rate": 0.00027256422977334406, "loss": 1.7562, "step": 7457 }, { "epoch": 0.59, "learning_rate": 0.0002725571039409157, "loss": 1.7093, "step": 7458 }, { "epoch": 0.59, "learning_rate": 0.0002725499772763922, "loss": 1.7101, "step": 7459 }, { "epoch": 0.59, "learning_rate": 0.000272542849779822, "loss": 1.7496, "step": 7460 }, { "epoch": 0.59, "learning_rate": 0.00027253572145125347, "loss": 1.6623, "step": 7461 }, { "epoch": 0.59, "learning_rate": 0.000272528592290735, "loss": 1.6913, "step": 7462 }, { "epoch": 0.59, "learning_rate": 0.000272521462298315, "loss": 1.6682, "step": 7463 }, { "epoch": 0.59, "learning_rate": 0.0002725143314740419, "loss": 1.6638, "step": 7464 }, { "epoch": 0.59, "learning_rate": 0.0002725071998179641, "loss": 1.6805, "step": 7465 }, { "epoch": 0.59, "learning_rate": 0.00027250006733013003, "loss": 1.7034, "step": 7466 }, { "epoch": 0.59, "learning_rate": 0.0002724929340105881, "loss": 1.6365, "step": 7467 }, { "epoch": 0.59, "learning_rate": 0.0002724857998593867, "loss": 1.7336, "step": 7468 }, { "epoch": 0.59, "learning_rate": 0.0002724786648765743, "loss": 1.758, "step": 7469 }, { "epoch": 0.59, "learning_rate": 0.0002724715290621995, "loss": 1.7362, "step": 7470 }, { "epoch": 0.59, "learning_rate": 0.0002724643924163104, "loss": 1.7271, "step": 7471 }, { "epoch": 0.59, "learning_rate": 0.0002724572549389558, "loss": 1.6865, "step": 7472 }, { "epoch": 0.59, "learning_rate": 0.000272450116630184, "loss": 1.6176, "step": 7473 }, { "epoch": 0.59, "learning_rate": 0.00027244297749004346, "loss": 1.642, "step": 7474 }, { "epoch": 0.59, "learning_rate": 0.00027243583751858266, "loss": 1.6027, "step": 7475 }, { "epoch": 0.59, "learning_rate": 0.00027242869671585007, "loss": 1.7254, "step": 7476 }, { "epoch": 0.59, "learning_rate": 0.00027242155508189425, "loss": 1.6935, "step": 7477 }, { "epoch": 0.59, "learning_rate": 0.0002724144126167636, "loss": 1.6866, "step": 7478 }, { "epoch": 0.59, "learning_rate": 0.0002724072693205066, "loss": 1.6449, "step": 7479 }, { "epoch": 0.59, "learning_rate": 0.00027240012519317186, "loss": 1.6805, "step": 7480 }, { "epoch": 0.59, "learning_rate": 0.0002723929802348078, "loss": 1.7547, "step": 7481 }, { "epoch": 0.59, "learning_rate": 0.0002723858344454629, "loss": 1.7058, "step": 7482 }, { "epoch": 0.59, "learning_rate": 0.0002723786878251858, "loss": 1.6961, "step": 7483 }, { "epoch": 0.59, "learning_rate": 0.00027237154037402486, "loss": 1.7095, "step": 7484 }, { "epoch": 0.59, "learning_rate": 0.00027236439209202875, "loss": 1.7127, "step": 7485 }, { "epoch": 0.59, "learning_rate": 0.0002723572429792459, "loss": 1.673, "step": 7486 }, { "epoch": 0.59, "learning_rate": 0.00027235009303572494, "loss": 1.705, "step": 7487 }, { "epoch": 0.59, "learning_rate": 0.0002723429422615143, "loss": 1.7004, "step": 7488 }, { "epoch": 0.59, "learning_rate": 0.0002723357906566627, "loss": 1.6681, "step": 7489 }, { "epoch": 0.59, "learning_rate": 0.00027232863822121856, "loss": 1.6708, "step": 7490 }, { "epoch": 0.59, "learning_rate": 0.0002723214849552304, "loss": 1.6854, "step": 7491 }, { "epoch": 0.59, "learning_rate": 0.00027231433085874693, "loss": 1.6313, "step": 7492 }, { "epoch": 0.59, "learning_rate": 0.00027230717593181665, "loss": 1.6786, "step": 7493 }, { "epoch": 0.59, "learning_rate": 0.0002723000201744881, "loss": 1.7119, "step": 7494 }, { "epoch": 0.59, "learning_rate": 0.0002722928635868099, "loss": 1.6515, "step": 7495 }, { "epoch": 0.59, "learning_rate": 0.0002722857061688307, "loss": 1.7052, "step": 7496 }, { "epoch": 0.59, "learning_rate": 0.00027227854792059896, "loss": 1.6641, "step": 7497 }, { "epoch": 0.59, "learning_rate": 0.0002722713888421634, "loss": 1.714, "step": 7498 }, { "epoch": 0.59, "learning_rate": 0.0002722642289335726, "loss": 1.6976, "step": 7499 }, { "epoch": 0.59, "learning_rate": 0.0002722570681948752, "loss": 1.6988, "step": 7500 }, { "epoch": 0.59, "learning_rate": 0.0002722499066261197, "loss": 1.6927, "step": 7501 }, { "epoch": 0.59, "learning_rate": 0.0002722427442273548, "loss": 1.6721, "step": 7502 }, { "epoch": 0.59, "learning_rate": 0.00027223558099862916, "loss": 1.6471, "step": 7503 }, { "epoch": 0.59, "learning_rate": 0.00027222841693999133, "loss": 1.6269, "step": 7504 }, { "epoch": 0.59, "learning_rate": 0.00027222125205149004, "loss": 1.704, "step": 7505 }, { "epoch": 0.59, "learning_rate": 0.00027221408633317385, "loss": 1.6941, "step": 7506 }, { "epoch": 0.59, "learning_rate": 0.0002722069197850915, "loss": 1.7167, "step": 7507 }, { "epoch": 0.59, "learning_rate": 0.0002721997524072916, "loss": 1.7624, "step": 7508 }, { "epoch": 0.59, "learning_rate": 0.00027219258419982283, "loss": 1.6585, "step": 7509 }, { "epoch": 0.59, "learning_rate": 0.0002721854151627338, "loss": 1.6781, "step": 7510 }, { "epoch": 0.59, "learning_rate": 0.00027217824529607326, "loss": 1.6971, "step": 7511 }, { "epoch": 0.59, "learning_rate": 0.0002721710745998899, "loss": 1.7003, "step": 7512 }, { "epoch": 0.59, "learning_rate": 0.00027216390307423233, "loss": 1.7285, "step": 7513 }, { "epoch": 0.59, "learning_rate": 0.0002721567307191492, "loss": 1.6951, "step": 7514 }, { "epoch": 0.59, "learning_rate": 0.0002721495575346894, "loss": 1.7496, "step": 7515 }, { "epoch": 0.59, "learning_rate": 0.0002721423835209014, "loss": 1.6229, "step": 7516 }, { "epoch": 0.59, "learning_rate": 0.0002721352086778341, "loss": 1.6905, "step": 7517 }, { "epoch": 0.59, "learning_rate": 0.00027212803300553614, "loss": 1.6032, "step": 7518 }, { "epoch": 0.59, "learning_rate": 0.00027212085650405615, "loss": 1.71, "step": 7519 }, { "epoch": 0.59, "learning_rate": 0.000272113679173443, "loss": 1.7566, "step": 7520 }, { "epoch": 0.59, "learning_rate": 0.00027210650101374534, "loss": 1.7173, "step": 7521 }, { "epoch": 0.59, "learning_rate": 0.00027209932202501195, "loss": 1.6939, "step": 7522 }, { "epoch": 0.59, "learning_rate": 0.0002720921422072915, "loss": 1.7184, "step": 7523 }, { "epoch": 0.59, "learning_rate": 0.0002720849615606328, "loss": 1.7055, "step": 7524 }, { "epoch": 0.59, "learning_rate": 0.00027207778008508455, "loss": 1.7349, "step": 7525 }, { "epoch": 0.59, "learning_rate": 0.0002720705977806956, "loss": 1.6973, "step": 7526 }, { "epoch": 0.59, "learning_rate": 0.0002720634146475146, "loss": 1.7144, "step": 7527 }, { "epoch": 0.59, "learning_rate": 0.0002720562306855904, "loss": 1.7277, "step": 7528 }, { "epoch": 0.59, "learning_rate": 0.00027204904589497175, "loss": 1.7266, "step": 7529 }, { "epoch": 0.59, "learning_rate": 0.0002720418602757075, "loss": 1.7176, "step": 7530 }, { "epoch": 0.59, "learning_rate": 0.0002720346738278462, "loss": 1.6831, "step": 7531 }, { "epoch": 0.59, "learning_rate": 0.00027202748655143693, "loss": 1.6788, "step": 7532 }, { "epoch": 0.59, "learning_rate": 0.00027202029844652833, "loss": 1.6641, "step": 7533 }, { "epoch": 0.59, "learning_rate": 0.0002720131095131693, "loss": 1.6553, "step": 7534 }, { "epoch": 0.59, "learning_rate": 0.0002720059197514085, "loss": 1.7215, "step": 7535 }, { "epoch": 0.59, "learning_rate": 0.00027199872916129495, "loss": 1.6752, "step": 7536 }, { "epoch": 0.59, "learning_rate": 0.0002719915377428772, "loss": 1.7179, "step": 7537 }, { "epoch": 0.59, "learning_rate": 0.00027198434549620436, "loss": 1.6815, "step": 7538 }, { "epoch": 0.59, "learning_rate": 0.0002719771524213251, "loss": 1.7041, "step": 7539 }, { "epoch": 0.59, "learning_rate": 0.00027196995851828823, "loss": 1.7207, "step": 7540 }, { "epoch": 0.59, "learning_rate": 0.0002719627637871427, "loss": 1.6795, "step": 7541 }, { "epoch": 0.59, "learning_rate": 0.00027195556822793724, "loss": 1.6931, "step": 7542 }, { "epoch": 0.59, "learning_rate": 0.00027194837184072086, "loss": 1.6665, "step": 7543 }, { "epoch": 0.59, "learning_rate": 0.0002719411746255423, "loss": 1.7126, "step": 7544 }, { "epoch": 0.59, "learning_rate": 0.00027193397658245046, "loss": 1.671, "step": 7545 }, { "epoch": 0.59, "learning_rate": 0.0002719267777114942, "loss": 1.6831, "step": 7546 }, { "epoch": 0.59, "learning_rate": 0.0002719195780127224, "loss": 1.678, "step": 7547 }, { "epoch": 0.59, "learning_rate": 0.000271912377486184, "loss": 1.6946, "step": 7548 }, { "epoch": 0.59, "learning_rate": 0.00027190517613192775, "loss": 1.7116, "step": 7549 }, { "epoch": 0.59, "learning_rate": 0.0002718979739500027, "loss": 1.6463, "step": 7550 }, { "epoch": 0.59, "learning_rate": 0.00027189077094045763, "loss": 1.6066, "step": 7551 }, { "epoch": 0.59, "learning_rate": 0.0002718835671033415, "loss": 1.6624, "step": 7552 }, { "epoch": 0.59, "learning_rate": 0.0002718763624387032, "loss": 1.7158, "step": 7553 }, { "epoch": 0.59, "learning_rate": 0.0002718691569465917, "loss": 1.6491, "step": 7554 }, { "epoch": 0.59, "learning_rate": 0.00027186195062705584, "loss": 1.7374, "step": 7555 }, { "epoch": 0.59, "learning_rate": 0.00027185474348014456, "loss": 1.743, "step": 7556 }, { "epoch": 0.59, "learning_rate": 0.0002718475355059069, "loss": 1.6777, "step": 7557 }, { "epoch": 0.59, "learning_rate": 0.0002718403267043916, "loss": 1.6868, "step": 7558 }, { "epoch": 0.59, "learning_rate": 0.0002718331170756478, "loss": 1.6627, "step": 7559 }, { "epoch": 0.59, "learning_rate": 0.00027182590661972434, "loss": 1.6575, "step": 7560 }, { "epoch": 0.59, "learning_rate": 0.0002718186953366702, "loss": 1.6577, "step": 7561 }, { "epoch": 0.59, "learning_rate": 0.00027181148322653437, "loss": 1.7298, "step": 7562 }, { "epoch": 0.6, "learning_rate": 0.00027180427028936576, "loss": 1.6644, "step": 7563 }, { "epoch": 0.6, "learning_rate": 0.0002717970565252134, "loss": 1.6828, "step": 7564 }, { "epoch": 0.6, "learning_rate": 0.00027178984193412624, "loss": 1.6782, "step": 7565 }, { "epoch": 0.6, "learning_rate": 0.00027178262651615323, "loss": 1.7056, "step": 7566 }, { "epoch": 0.6, "learning_rate": 0.0002717754102713434, "loss": 1.7003, "step": 7567 }, { "epoch": 0.6, "learning_rate": 0.00027176819319974573, "loss": 1.6483, "step": 7568 }, { "epoch": 0.6, "learning_rate": 0.00027176097530140925, "loss": 1.6868, "step": 7569 }, { "epoch": 0.6, "learning_rate": 0.00027175375657638294, "loss": 1.7036, "step": 7570 }, { "epoch": 0.6, "learning_rate": 0.00027174653702471583, "loss": 1.6919, "step": 7571 }, { "epoch": 0.6, "learning_rate": 0.0002717393166464569, "loss": 1.6507, "step": 7572 }, { "epoch": 0.6, "learning_rate": 0.00027173209544165513, "loss": 1.6637, "step": 7573 }, { "epoch": 0.6, "learning_rate": 0.0002717248734103597, "loss": 1.7043, "step": 7574 }, { "epoch": 0.6, "learning_rate": 0.0002717176505526195, "loss": 1.7313, "step": 7575 }, { "epoch": 0.6, "learning_rate": 0.00027171042686848363, "loss": 1.6536, "step": 7576 }, { "epoch": 0.6, "learning_rate": 0.00027170320235800116, "loss": 1.6796, "step": 7577 }, { "epoch": 0.6, "learning_rate": 0.00027169597702122105, "loss": 1.7097, "step": 7578 }, { "epoch": 0.6, "learning_rate": 0.0002716887508581925, "loss": 1.6431, "step": 7579 }, { "epoch": 0.6, "learning_rate": 0.0002716815238689644, "loss": 1.6832, "step": 7580 }, { "epoch": 0.6, "learning_rate": 0.0002716742960535859, "loss": 1.6959, "step": 7581 }, { "epoch": 0.6, "learning_rate": 0.00027166706741210613, "loss": 1.6647, "step": 7582 }, { "epoch": 0.6, "learning_rate": 0.0002716598379445741, "loss": 1.7074, "step": 7583 }, { "epoch": 0.6, "learning_rate": 0.0002716526076510389, "loss": 1.7063, "step": 7584 }, { "epoch": 0.6, "learning_rate": 0.0002716453765315496, "loss": 1.6459, "step": 7585 }, { "epoch": 0.6, "learning_rate": 0.0002716381445861554, "loss": 1.6759, "step": 7586 }, { "epoch": 0.6, "learning_rate": 0.00027163091181490524, "loss": 1.6879, "step": 7587 }, { "epoch": 0.6, "learning_rate": 0.00027162367821784834, "loss": 1.6841, "step": 7588 }, { "epoch": 0.6, "learning_rate": 0.0002716164437950338, "loss": 1.729, "step": 7589 }, { "epoch": 0.6, "learning_rate": 0.0002716092085465107, "loss": 1.6496, "step": 7590 }, { "epoch": 0.6, "learning_rate": 0.0002716019724723282, "loss": 1.7051, "step": 7591 }, { "epoch": 0.6, "learning_rate": 0.0002715947355725354, "loss": 1.6829, "step": 7592 }, { "epoch": 0.6, "learning_rate": 0.00027158749784718145, "loss": 1.7166, "step": 7593 }, { "epoch": 0.6, "learning_rate": 0.0002715802592963155, "loss": 1.6905, "step": 7594 }, { "epoch": 0.6, "learning_rate": 0.00027157301991998666, "loss": 1.6995, "step": 7595 }, { "epoch": 0.6, "learning_rate": 0.0002715657797182441, "loss": 1.7148, "step": 7596 }, { "epoch": 0.6, "learning_rate": 0.000271558538691137, "loss": 1.6967, "step": 7597 }, { "epoch": 0.6, "learning_rate": 0.00027155129683871455, "loss": 1.6451, "step": 7598 }, { "epoch": 0.6, "learning_rate": 0.0002715440541610258, "loss": 1.6819, "step": 7599 }, { "epoch": 0.6, "learning_rate": 0.00027153681065811996, "loss": 1.6892, "step": 7600 }, { "epoch": 0.6, "learning_rate": 0.00027152956633004634, "loss": 1.716, "step": 7601 }, { "epoch": 0.6, "learning_rate": 0.000271522321176854, "loss": 1.6712, "step": 7602 }, { "epoch": 0.6, "learning_rate": 0.00027151507519859215, "loss": 1.6829, "step": 7603 }, { "epoch": 0.6, "learning_rate": 0.00027150782839530996, "loss": 1.6926, "step": 7604 }, { "epoch": 0.6, "learning_rate": 0.0002715005807670567, "loss": 1.6415, "step": 7605 }, { "epoch": 0.6, "learning_rate": 0.0002714933323138816, "loss": 1.7427, "step": 7606 }, { "epoch": 0.6, "learning_rate": 0.0002714860830358338, "loss": 1.7141, "step": 7607 }, { "epoch": 0.6, "learning_rate": 0.00027147883293296253, "loss": 1.7217, "step": 7608 }, { "epoch": 0.6, "learning_rate": 0.00027147158200531695, "loss": 1.6666, "step": 7609 }, { "epoch": 0.6, "learning_rate": 0.0002714643302529464, "loss": 1.6895, "step": 7610 }, { "epoch": 0.6, "learning_rate": 0.0002714570776759001, "loss": 1.7176, "step": 7611 }, { "epoch": 0.6, "learning_rate": 0.00027144982427422727, "loss": 1.651, "step": 7612 }, { "epoch": 0.6, "learning_rate": 0.0002714425700479772, "loss": 1.6567, "step": 7613 }, { "epoch": 0.6, "learning_rate": 0.000271435314997199, "loss": 1.6357, "step": 7614 }, { "epoch": 0.6, "learning_rate": 0.00027142805912194203, "loss": 1.7244, "step": 7615 }, { "epoch": 0.6, "learning_rate": 0.0002714208024222556, "loss": 1.6917, "step": 7616 }, { "epoch": 0.6, "learning_rate": 0.00027141354489818893, "loss": 1.6865, "step": 7617 }, { "epoch": 0.6, "learning_rate": 0.00027140628654979124, "loss": 1.664, "step": 7618 }, { "epoch": 0.6, "learning_rate": 0.00027139902737711194, "loss": 1.6724, "step": 7619 }, { "epoch": 0.6, "learning_rate": 0.0002713917673802002, "loss": 1.6994, "step": 7620 }, { "epoch": 0.6, "learning_rate": 0.0002713845065591053, "loss": 1.7345, "step": 7621 }, { "epoch": 0.6, "learning_rate": 0.0002713772449138766, "loss": 1.7213, "step": 7622 }, { "epoch": 0.6, "learning_rate": 0.00027136998244456346, "loss": 1.6804, "step": 7623 }, { "epoch": 0.6, "learning_rate": 0.00027136271915121507, "loss": 1.6839, "step": 7624 }, { "epoch": 0.6, "learning_rate": 0.00027135545503388083, "loss": 1.6774, "step": 7625 }, { "epoch": 0.6, "learning_rate": 0.00027134819009261, "loss": 1.7246, "step": 7626 }, { "epoch": 0.6, "learning_rate": 0.00027134092432745183, "loss": 1.7027, "step": 7627 }, { "epoch": 0.6, "learning_rate": 0.00027133365773845584, "loss": 1.6628, "step": 7628 }, { "epoch": 0.6, "learning_rate": 0.0002713263903256713, "loss": 1.6895, "step": 7629 }, { "epoch": 0.6, "learning_rate": 0.00027131912208914745, "loss": 1.7026, "step": 7630 }, { "epoch": 0.6, "learning_rate": 0.0002713118530289338, "loss": 1.6778, "step": 7631 }, { "epoch": 0.6, "learning_rate": 0.00027130458314507947, "loss": 1.6521, "step": 7632 }, { "epoch": 0.6, "learning_rate": 0.0002712973124376341, "loss": 1.7371, "step": 7633 }, { "epoch": 0.6, "learning_rate": 0.0002712900409066468, "loss": 1.7016, "step": 7634 }, { "epoch": 0.6, "learning_rate": 0.00027128276855216713, "loss": 1.6897, "step": 7635 }, { "epoch": 0.6, "learning_rate": 0.0002712754953742444, "loss": 1.7815, "step": 7636 }, { "epoch": 0.6, "learning_rate": 0.00027126822137292793, "loss": 1.7339, "step": 7637 }, { "epoch": 0.6, "learning_rate": 0.00027126094654826723, "loss": 1.7283, "step": 7638 }, { "epoch": 0.6, "learning_rate": 0.00027125367090031154, "loss": 1.6899, "step": 7639 }, { "epoch": 0.6, "learning_rate": 0.0002712463944291104, "loss": 1.7126, "step": 7640 }, { "epoch": 0.6, "learning_rate": 0.0002712391171347131, "loss": 1.66, "step": 7641 }, { "epoch": 0.6, "learning_rate": 0.00027123183901716914, "loss": 1.6935, "step": 7642 }, { "epoch": 0.6, "learning_rate": 0.0002712245600765279, "loss": 1.6505, "step": 7643 }, { "epoch": 0.6, "learning_rate": 0.0002712172803128387, "loss": 1.7, "step": 7644 }, { "epoch": 0.6, "learning_rate": 0.0002712099997261512, "loss": 1.6673, "step": 7645 }, { "epoch": 0.6, "learning_rate": 0.0002712027183165146, "loss": 1.726, "step": 7646 }, { "epoch": 0.6, "learning_rate": 0.00027119543608397845, "loss": 1.6576, "step": 7647 }, { "epoch": 0.6, "learning_rate": 0.0002711881530285922, "loss": 1.6803, "step": 7648 }, { "epoch": 0.6, "learning_rate": 0.00027118086915040523, "loss": 1.6988, "step": 7649 }, { "epoch": 0.6, "learning_rate": 0.00027117358444946705, "loss": 1.7356, "step": 7650 }, { "epoch": 0.6, "learning_rate": 0.0002711662989258271, "loss": 1.6083, "step": 7651 }, { "epoch": 0.6, "learning_rate": 0.00027115901257953484, "loss": 1.6747, "step": 7652 }, { "epoch": 0.6, "learning_rate": 0.0002711517254106397, "loss": 1.6436, "step": 7653 }, { "epoch": 0.6, "learning_rate": 0.00027114443741919127, "loss": 1.6734, "step": 7654 }, { "epoch": 0.6, "learning_rate": 0.00027113714860523897, "loss": 1.6759, "step": 7655 }, { "epoch": 0.6, "learning_rate": 0.0002711298589688322, "loss": 1.6685, "step": 7656 }, { "epoch": 0.6, "learning_rate": 0.00027112256851002063, "loss": 1.6957, "step": 7657 }, { "epoch": 0.6, "learning_rate": 0.0002711152772288536, "loss": 1.6581, "step": 7658 }, { "epoch": 0.6, "learning_rate": 0.00027110798512538066, "loss": 1.6624, "step": 7659 }, { "epoch": 0.6, "learning_rate": 0.00027110069219965136, "loss": 1.6734, "step": 7660 }, { "epoch": 0.6, "learning_rate": 0.0002710933984517152, "loss": 1.6636, "step": 7661 }, { "epoch": 0.6, "learning_rate": 0.0002710861038816217, "loss": 1.657, "step": 7662 }, { "epoch": 0.6, "learning_rate": 0.0002710788084894204, "loss": 1.6635, "step": 7663 }, { "epoch": 0.6, "learning_rate": 0.0002710715122751607, "loss": 1.6743, "step": 7664 }, { "epoch": 0.6, "learning_rate": 0.0002710642152388923, "loss": 1.648, "step": 7665 }, { "epoch": 0.6, "learning_rate": 0.0002710569173806647, "loss": 1.6809, "step": 7666 }, { "epoch": 0.6, "learning_rate": 0.00027104961870052743, "loss": 1.6991, "step": 7667 }, { "epoch": 0.6, "learning_rate": 0.00027104231919853006, "loss": 1.6813, "step": 7668 }, { "epoch": 0.6, "learning_rate": 0.00027103501887472213, "loss": 1.6652, "step": 7669 }, { "epoch": 0.6, "learning_rate": 0.0002710277177291532, "loss": 1.6722, "step": 7670 }, { "epoch": 0.6, "learning_rate": 0.00027102041576187286, "loss": 1.671, "step": 7671 }, { "epoch": 0.6, "learning_rate": 0.0002710131129729307, "loss": 1.6618, "step": 7672 }, { "epoch": 0.6, "learning_rate": 0.00027100580936237627, "loss": 1.7084, "step": 7673 }, { "epoch": 0.6, "learning_rate": 0.00027099850493025917, "loss": 1.6027, "step": 7674 }, { "epoch": 0.6, "learning_rate": 0.000270991199676629, "loss": 1.7443, "step": 7675 }, { "epoch": 0.6, "learning_rate": 0.00027098389360153536, "loss": 1.7147, "step": 7676 }, { "epoch": 0.6, "learning_rate": 0.00027097658670502785, "loss": 1.6694, "step": 7677 }, { "epoch": 0.6, "learning_rate": 0.00027096927898715605, "loss": 1.6139, "step": 7678 }, { "epoch": 0.6, "learning_rate": 0.00027096197044796966, "loss": 1.6711, "step": 7679 }, { "epoch": 0.6, "learning_rate": 0.0002709546610875182, "loss": 1.6158, "step": 7680 }, { "epoch": 0.6, "learning_rate": 0.0002709473509058513, "loss": 1.6948, "step": 7681 }, { "epoch": 0.6, "learning_rate": 0.00027094003990301867, "loss": 1.7084, "step": 7682 }, { "epoch": 0.6, "learning_rate": 0.0002709327280790699, "loss": 1.6321, "step": 7683 }, { "epoch": 0.6, "learning_rate": 0.00027092541543405466, "loss": 1.6759, "step": 7684 }, { "epoch": 0.6, "learning_rate": 0.0002709181019680226, "loss": 1.6781, "step": 7685 }, { "epoch": 0.6, "learning_rate": 0.00027091078768102335, "loss": 1.7327, "step": 7686 }, { "epoch": 0.6, "learning_rate": 0.00027090347257310653, "loss": 1.6678, "step": 7687 }, { "epoch": 0.6, "learning_rate": 0.0002708961566443219, "loss": 1.6637, "step": 7688 }, { "epoch": 0.6, "learning_rate": 0.000270888839894719, "loss": 1.666, "step": 7689 }, { "epoch": 0.61, "learning_rate": 0.00027088152232434767, "loss": 1.6964, "step": 7690 }, { "epoch": 0.61, "learning_rate": 0.0002708742039332575, "loss": 1.6335, "step": 7691 }, { "epoch": 0.61, "learning_rate": 0.00027086688472149813, "loss": 1.7199, "step": 7692 }, { "epoch": 0.61, "learning_rate": 0.0002708595646891194, "loss": 1.7476, "step": 7693 }, { "epoch": 0.61, "learning_rate": 0.00027085224383617085, "loss": 1.6736, "step": 7694 }, { "epoch": 0.61, "learning_rate": 0.0002708449221627023, "loss": 1.6997, "step": 7695 }, { "epoch": 0.61, "learning_rate": 0.00027083759966876344, "loss": 1.7053, "step": 7696 }, { "epoch": 0.61, "learning_rate": 0.0002708302763544039, "loss": 1.6823, "step": 7697 }, { "epoch": 0.61, "learning_rate": 0.00027082295221967354, "loss": 1.6817, "step": 7698 }, { "epoch": 0.61, "learning_rate": 0.00027081562726462196, "loss": 1.6933, "step": 7699 }, { "epoch": 0.61, "learning_rate": 0.0002708083014892989, "loss": 1.7048, "step": 7700 }, { "epoch": 0.61, "learning_rate": 0.0002708009748937542, "loss": 1.6492, "step": 7701 }, { "epoch": 0.61, "learning_rate": 0.0002707936474780375, "loss": 1.683, "step": 7702 }, { "epoch": 0.61, "learning_rate": 0.00027078631924219867, "loss": 1.7572, "step": 7703 }, { "epoch": 0.61, "learning_rate": 0.0002707789901862873, "loss": 1.6935, "step": 7704 }, { "epoch": 0.61, "learning_rate": 0.00027077166031035327, "loss": 1.6798, "step": 7705 }, { "epoch": 0.61, "learning_rate": 0.0002707643296144463, "loss": 1.6856, "step": 7706 }, { "epoch": 0.61, "learning_rate": 0.0002707569980986162, "loss": 1.7108, "step": 7707 }, { "epoch": 0.61, "learning_rate": 0.0002707496657629127, "loss": 1.6775, "step": 7708 }, { "epoch": 0.61, "learning_rate": 0.0002707423326073856, "loss": 1.6686, "step": 7709 }, { "epoch": 0.61, "learning_rate": 0.0002707349986320848, "loss": 1.713, "step": 7710 }, { "epoch": 0.61, "learning_rate": 0.0002707276638370599, "loss": 1.7308, "step": 7711 }, { "epoch": 0.61, "learning_rate": 0.00027072032822236076, "loss": 1.645, "step": 7712 }, { "epoch": 0.61, "learning_rate": 0.00027071299178803727, "loss": 1.5611, "step": 7713 }, { "epoch": 0.61, "learning_rate": 0.0002707056545341391, "loss": 1.6941, "step": 7714 }, { "epoch": 0.61, "learning_rate": 0.00027069831646071624, "loss": 1.7899, "step": 7715 }, { "epoch": 0.61, "learning_rate": 0.0002706909775678184, "loss": 1.6771, "step": 7716 }, { "epoch": 0.61, "learning_rate": 0.00027068363785549533, "loss": 1.7044, "step": 7717 }, { "epoch": 0.61, "learning_rate": 0.000270676297323797, "loss": 1.7449, "step": 7718 }, { "epoch": 0.61, "learning_rate": 0.0002706689559727733, "loss": 1.689, "step": 7719 }, { "epoch": 0.61, "learning_rate": 0.00027066161380247386, "loss": 1.6919, "step": 7720 }, { "epoch": 0.61, "learning_rate": 0.00027065427081294873, "loss": 1.6797, "step": 7721 }, { "epoch": 0.61, "learning_rate": 0.0002706469270042476, "loss": 1.6803, "step": 7722 }, { "epoch": 0.61, "learning_rate": 0.0002706395823764205, "loss": 1.7253, "step": 7723 }, { "epoch": 0.61, "learning_rate": 0.00027063223692951716, "loss": 1.6653, "step": 7724 }, { "epoch": 0.61, "learning_rate": 0.00027062489066358755, "loss": 1.7012, "step": 7725 }, { "epoch": 0.61, "learning_rate": 0.0002706175435786815, "loss": 1.7188, "step": 7726 }, { "epoch": 0.61, "learning_rate": 0.0002706101956748488, "loss": 1.7028, "step": 7727 }, { "epoch": 0.61, "learning_rate": 0.0002706028469521395, "loss": 1.7062, "step": 7728 }, { "epoch": 0.61, "learning_rate": 0.0002705954974106034, "loss": 1.6785, "step": 7729 }, { "epoch": 0.61, "learning_rate": 0.00027058814705029045, "loss": 1.6871, "step": 7730 }, { "epoch": 0.61, "learning_rate": 0.0002705807958712505, "loss": 1.6439, "step": 7731 }, { "epoch": 0.61, "learning_rate": 0.0002705734438735335, "loss": 1.689, "step": 7732 }, { "epoch": 0.61, "learning_rate": 0.0002705660910571894, "loss": 1.6852, "step": 7733 }, { "epoch": 0.61, "learning_rate": 0.000270558737422268, "loss": 1.5901, "step": 7734 }, { "epoch": 0.61, "learning_rate": 0.0002705513829688193, "loss": 1.7427, "step": 7735 }, { "epoch": 0.61, "learning_rate": 0.0002705440276968933, "loss": 1.7023, "step": 7736 }, { "epoch": 0.61, "learning_rate": 0.00027053667160653984, "loss": 1.6657, "step": 7737 }, { "epoch": 0.61, "learning_rate": 0.0002705293146978089, "loss": 1.7394, "step": 7738 }, { "epoch": 0.61, "learning_rate": 0.0002705219569707504, "loss": 1.6606, "step": 7739 }, { "epoch": 0.61, "learning_rate": 0.0002705145984254144, "loss": 1.6896, "step": 7740 }, { "epoch": 0.61, "learning_rate": 0.00027050723906185074, "loss": 1.7368, "step": 7741 }, { "epoch": 0.61, "learning_rate": 0.00027049987888010937, "loss": 1.7081, "step": 7742 }, { "epoch": 0.61, "learning_rate": 0.0002704925178802404, "loss": 1.7303, "step": 7743 }, { "epoch": 0.61, "learning_rate": 0.00027048515606229367, "loss": 1.6666, "step": 7744 }, { "epoch": 0.61, "learning_rate": 0.00027047779342631925, "loss": 1.7523, "step": 7745 }, { "epoch": 0.61, "learning_rate": 0.0002704704299723671, "loss": 1.696, "step": 7746 }, { "epoch": 0.61, "learning_rate": 0.0002704630657004872, "loss": 1.6861, "step": 7747 }, { "epoch": 0.61, "learning_rate": 0.00027045570061072955, "loss": 1.6846, "step": 7748 }, { "epoch": 0.61, "learning_rate": 0.00027044833470314417, "loss": 1.6473, "step": 7749 }, { "epoch": 0.61, "learning_rate": 0.0002704409679777811, "loss": 1.6845, "step": 7750 }, { "epoch": 0.61, "learning_rate": 0.0002704336004346903, "loss": 1.7137, "step": 7751 }, { "epoch": 0.61, "learning_rate": 0.0002704262320739218, "loss": 1.7047, "step": 7752 }, { "epoch": 0.61, "learning_rate": 0.0002704188628955257, "loss": 1.6997, "step": 7753 }, { "epoch": 0.61, "learning_rate": 0.00027041149289955187, "loss": 1.7023, "step": 7754 }, { "epoch": 0.61, "learning_rate": 0.00027040412208605055, "loss": 1.73, "step": 7755 }, { "epoch": 0.61, "learning_rate": 0.0002703967504550716, "loss": 1.6937, "step": 7756 }, { "epoch": 0.61, "learning_rate": 0.0002703893780066652, "loss": 1.6907, "step": 7757 }, { "epoch": 0.61, "learning_rate": 0.00027038200474088135, "loss": 1.7197, "step": 7758 }, { "epoch": 0.61, "learning_rate": 0.00027037463065777013, "loss": 1.6411, "step": 7759 }, { "epoch": 0.61, "learning_rate": 0.0002703672557573816, "loss": 1.6598, "step": 7760 }, { "epoch": 0.61, "learning_rate": 0.00027035988003976585, "loss": 1.7087, "step": 7761 }, { "epoch": 0.61, "learning_rate": 0.0002703525035049729, "loss": 1.6556, "step": 7762 }, { "epoch": 0.61, "learning_rate": 0.00027034512615305286, "loss": 1.5966, "step": 7763 }, { "epoch": 0.61, "learning_rate": 0.0002703377479840559, "loss": 1.6523, "step": 7764 }, { "epoch": 0.61, "learning_rate": 0.0002703303689980319, "loss": 1.6382, "step": 7765 }, { "epoch": 0.61, "learning_rate": 0.0002703229891950312, "loss": 1.6864, "step": 7766 }, { "epoch": 0.61, "learning_rate": 0.0002703156085751038, "loss": 1.6932, "step": 7767 }, { "epoch": 0.61, "learning_rate": 0.0002703082271382998, "loss": 1.7289, "step": 7768 }, { "epoch": 0.61, "learning_rate": 0.0002703008448846693, "loss": 1.6609, "step": 7769 }, { "epoch": 0.61, "learning_rate": 0.00027029346181426246, "loss": 1.6464, "step": 7770 }, { "epoch": 0.61, "learning_rate": 0.00027028607792712944, "loss": 1.658, "step": 7771 }, { "epoch": 0.61, "learning_rate": 0.00027027869322332026, "loss": 1.7308, "step": 7772 }, { "epoch": 0.61, "learning_rate": 0.0002702713077028852, "loss": 1.687, "step": 7773 }, { "epoch": 0.61, "learning_rate": 0.00027026392136587425, "loss": 1.6734, "step": 7774 }, { "epoch": 0.61, "learning_rate": 0.00027025653421233775, "loss": 1.6608, "step": 7775 }, { "epoch": 0.61, "learning_rate": 0.0002702491462423257, "loss": 1.7244, "step": 7776 }, { "epoch": 0.61, "learning_rate": 0.00027024175745588827, "loss": 1.6772, "step": 7777 }, { "epoch": 0.61, "learning_rate": 0.0002702343678530757, "loss": 1.7196, "step": 7778 }, { "epoch": 0.61, "learning_rate": 0.0002702269774339381, "loss": 1.6846, "step": 7779 }, { "epoch": 0.61, "learning_rate": 0.0002702195861985257, "loss": 1.6852, "step": 7780 }, { "epoch": 0.61, "learning_rate": 0.0002702121941468886, "loss": 1.662, "step": 7781 }, { "epoch": 0.61, "learning_rate": 0.00027020480127907707, "loss": 1.6846, "step": 7782 }, { "epoch": 0.61, "learning_rate": 0.0002701974075951413, "loss": 1.682, "step": 7783 }, { "epoch": 0.61, "learning_rate": 0.0002701900130951314, "loss": 1.7145, "step": 7784 }, { "epoch": 0.61, "learning_rate": 0.0002701826177790977, "loss": 1.6503, "step": 7785 }, { "epoch": 0.61, "learning_rate": 0.0002701752216470903, "loss": 1.6752, "step": 7786 }, { "epoch": 0.61, "learning_rate": 0.0002701678246991595, "loss": 1.6866, "step": 7787 }, { "epoch": 0.61, "learning_rate": 0.0002701604269353555, "loss": 1.6393, "step": 7788 }, { "epoch": 0.61, "learning_rate": 0.00027015302835572844, "loss": 1.7086, "step": 7789 }, { "epoch": 0.61, "learning_rate": 0.00027014562896032865, "loss": 1.7065, "step": 7790 }, { "epoch": 0.61, "learning_rate": 0.0002701382287492064, "loss": 1.6913, "step": 7791 }, { "epoch": 0.61, "learning_rate": 0.0002701308277224118, "loss": 1.7747, "step": 7792 }, { "epoch": 0.61, "learning_rate": 0.0002701234258799952, "loss": 1.6597, "step": 7793 }, { "epoch": 0.61, "learning_rate": 0.0002701160232220068, "loss": 1.699, "step": 7794 }, { "epoch": 0.61, "learning_rate": 0.00027010861974849696, "loss": 1.683, "step": 7795 }, { "epoch": 0.61, "learning_rate": 0.00027010121545951586, "loss": 1.7259, "step": 7796 }, { "epoch": 0.61, "learning_rate": 0.00027009381035511374, "loss": 1.6702, "step": 7797 }, { "epoch": 0.61, "learning_rate": 0.0002700864044353409, "loss": 1.7118, "step": 7798 }, { "epoch": 0.61, "learning_rate": 0.00027007899770024776, "loss": 1.6849, "step": 7799 }, { "epoch": 0.61, "learning_rate": 0.0002700715901498844, "loss": 1.6357, "step": 7800 }, { "epoch": 0.61, "learning_rate": 0.0002700641817843012, "loss": 1.6534, "step": 7801 }, { "epoch": 0.61, "learning_rate": 0.00027005677260354843, "loss": 1.6837, "step": 7802 }, { "epoch": 0.61, "learning_rate": 0.00027004936260767654, "loss": 1.6363, "step": 7803 }, { "epoch": 0.61, "learning_rate": 0.00027004195179673566, "loss": 1.6498, "step": 7804 }, { "epoch": 0.61, "learning_rate": 0.00027003454017077616, "loss": 1.7204, "step": 7805 }, { "epoch": 0.61, "learning_rate": 0.00027002712772984834, "loss": 1.6746, "step": 7806 }, { "epoch": 0.61, "learning_rate": 0.0002700197144740026, "loss": 1.673, "step": 7807 }, { "epoch": 0.61, "learning_rate": 0.0002700123004032893, "loss": 1.6588, "step": 7808 }, { "epoch": 0.61, "learning_rate": 0.00027000488551775863, "loss": 1.6707, "step": 7809 }, { "epoch": 0.61, "learning_rate": 0.00026999746981746104, "loss": 1.6246, "step": 7810 }, { "epoch": 0.61, "learning_rate": 0.00026999005330244683, "loss": 1.6991, "step": 7811 }, { "epoch": 0.61, "learning_rate": 0.00026998263597276636, "loss": 1.6535, "step": 7812 }, { "epoch": 0.61, "learning_rate": 0.00026997521782847004, "loss": 1.6328, "step": 7813 }, { "epoch": 0.61, "learning_rate": 0.0002699677988696082, "loss": 1.672, "step": 7814 }, { "epoch": 0.61, "learning_rate": 0.00026996037909623116, "loss": 1.6721, "step": 7815 }, { "epoch": 0.61, "learning_rate": 0.0002699529585083894, "loss": 1.6931, "step": 7816 }, { "epoch": 0.62, "learning_rate": 0.00026994553710613323, "loss": 1.6709, "step": 7817 }, { "epoch": 0.62, "learning_rate": 0.00026993811488951305, "loss": 1.7594, "step": 7818 }, { "epoch": 0.62, "learning_rate": 0.00026993069185857926, "loss": 1.6703, "step": 7819 }, { "epoch": 0.62, "learning_rate": 0.00026992326801338225, "loss": 1.659, "step": 7820 }, { "epoch": 0.62, "learning_rate": 0.0002699158433539724, "loss": 1.6641, "step": 7821 }, { "epoch": 0.62, "learning_rate": 0.0002699084178804002, "loss": 1.7007, "step": 7822 }, { "epoch": 0.62, "learning_rate": 0.000269900991592716, "loss": 1.6525, "step": 7823 }, { "epoch": 0.62, "learning_rate": 0.0002698935644909702, "loss": 1.6699, "step": 7824 }, { "epoch": 0.62, "learning_rate": 0.0002698861365752133, "loss": 1.715, "step": 7825 }, { "epoch": 0.62, "learning_rate": 0.0002698787078454957, "loss": 1.6312, "step": 7826 }, { "epoch": 0.62, "learning_rate": 0.0002698712783018678, "loss": 1.705, "step": 7827 }, { "epoch": 0.62, "learning_rate": 0.0002698638479443801, "loss": 1.6992, "step": 7828 }, { "epoch": 0.62, "learning_rate": 0.00026985641677308296, "loss": 1.6437, "step": 7829 }, { "epoch": 0.62, "learning_rate": 0.00026984898478802695, "loss": 1.6819, "step": 7830 }, { "epoch": 0.62, "learning_rate": 0.00026984155198926245, "loss": 1.6611, "step": 7831 }, { "epoch": 0.62, "learning_rate": 0.00026983411837683995, "loss": 1.6746, "step": 7832 }, { "epoch": 0.62, "learning_rate": 0.0002698266839508099, "loss": 1.7234, "step": 7833 }, { "epoch": 0.62, "learning_rate": 0.00026981924871122287, "loss": 1.7195, "step": 7834 }, { "epoch": 0.62, "learning_rate": 0.00026981181265812917, "loss": 1.6817, "step": 7835 }, { "epoch": 0.62, "learning_rate": 0.0002698043757915794, "loss": 1.6272, "step": 7836 }, { "epoch": 0.62, "learning_rate": 0.000269796938111624, "loss": 1.692, "step": 7837 }, { "epoch": 0.62, "learning_rate": 0.00026978949961831356, "loss": 1.6702, "step": 7838 }, { "epoch": 0.62, "learning_rate": 0.0002697820603116985, "loss": 1.6806, "step": 7839 }, { "epoch": 0.62, "learning_rate": 0.00026977462019182934, "loss": 1.6646, "step": 7840 }, { "epoch": 0.62, "learning_rate": 0.0002697671792587567, "loss": 1.655, "step": 7841 }, { "epoch": 0.62, "learning_rate": 0.00026975973751253087, "loss": 1.7019, "step": 7842 }, { "epoch": 0.62, "learning_rate": 0.0002697522949532026, "loss": 1.6034, "step": 7843 }, { "epoch": 0.62, "learning_rate": 0.0002697448515808223, "loss": 1.6622, "step": 7844 }, { "epoch": 0.62, "learning_rate": 0.0002697374073954405, "loss": 1.7003, "step": 7845 }, { "epoch": 0.62, "learning_rate": 0.0002697299623971078, "loss": 1.7274, "step": 7846 }, { "epoch": 0.62, "learning_rate": 0.0002697225165858748, "loss": 1.6939, "step": 7847 }, { "epoch": 0.62, "learning_rate": 0.0002697150699617919, "loss": 1.6633, "step": 7848 }, { "epoch": 0.62, "learning_rate": 0.00026970762252490977, "loss": 1.6455, "step": 7849 }, { "epoch": 0.62, "learning_rate": 0.00026970017427527894, "loss": 1.7162, "step": 7850 }, { "epoch": 0.62, "learning_rate": 0.00026969272521294995, "loss": 1.7257, "step": 7851 }, { "epoch": 0.62, "learning_rate": 0.0002696852753379734, "loss": 1.7001, "step": 7852 }, { "epoch": 0.62, "learning_rate": 0.00026967782465039995, "loss": 1.6862, "step": 7853 }, { "epoch": 0.62, "learning_rate": 0.0002696703731502801, "loss": 1.6244, "step": 7854 }, { "epoch": 0.62, "learning_rate": 0.00026966292083766447, "loss": 1.652, "step": 7855 }, { "epoch": 0.62, "learning_rate": 0.0002696554677126036, "loss": 1.6518, "step": 7856 }, { "epoch": 0.62, "learning_rate": 0.0002696480137751481, "loss": 1.6362, "step": 7857 }, { "epoch": 0.62, "learning_rate": 0.00026964055902534866, "loss": 1.688, "step": 7858 }, { "epoch": 0.62, "learning_rate": 0.0002696331034632559, "loss": 1.6737, "step": 7859 }, { "epoch": 0.62, "learning_rate": 0.0002696256470889203, "loss": 1.6757, "step": 7860 }, { "epoch": 0.62, "learning_rate": 0.00026961818990239265, "loss": 1.7131, "step": 7861 }, { "epoch": 0.62, "learning_rate": 0.00026961073190372343, "loss": 1.6642, "step": 7862 }, { "epoch": 0.62, "learning_rate": 0.0002696032730929634, "loss": 1.6989, "step": 7863 }, { "epoch": 0.62, "learning_rate": 0.00026959581347016305, "loss": 1.6412, "step": 7864 }, { "epoch": 0.62, "learning_rate": 0.00026958835303537325, "loss": 1.6775, "step": 7865 }, { "epoch": 0.62, "learning_rate": 0.00026958089178864445, "loss": 1.658, "step": 7866 }, { "epoch": 0.62, "learning_rate": 0.00026957342973002744, "loss": 1.6525, "step": 7867 }, { "epoch": 0.62, "learning_rate": 0.00026956596685957275, "loss": 1.6795, "step": 7868 }, { "epoch": 0.62, "learning_rate": 0.00026955850317733116, "loss": 1.6942, "step": 7869 }, { "epoch": 0.62, "learning_rate": 0.0002695510386833534, "loss": 1.655, "step": 7870 }, { "epoch": 0.62, "learning_rate": 0.00026954357337768996, "loss": 1.6853, "step": 7871 }, { "epoch": 0.62, "learning_rate": 0.00026953610726039167, "loss": 1.6029, "step": 7872 }, { "epoch": 0.62, "learning_rate": 0.0002695286403315091, "loss": 1.6674, "step": 7873 }, { "epoch": 0.62, "learning_rate": 0.0002695211725910931, "loss": 1.6964, "step": 7874 }, { "epoch": 0.62, "learning_rate": 0.00026951370403919433, "loss": 1.7697, "step": 7875 }, { "epoch": 0.62, "learning_rate": 0.0002695062346758634, "loss": 1.6439, "step": 7876 }, { "epoch": 0.62, "learning_rate": 0.0002694987645011511, "loss": 1.6776, "step": 7877 }, { "epoch": 0.62, "learning_rate": 0.0002694912935151081, "loss": 1.6482, "step": 7878 }, { "epoch": 0.62, "learning_rate": 0.0002694838217177852, "loss": 1.7287, "step": 7879 }, { "epoch": 0.62, "learning_rate": 0.00026947634910923305, "loss": 1.6736, "step": 7880 }, { "epoch": 0.62, "learning_rate": 0.00026946887568950244, "loss": 1.7489, "step": 7881 }, { "epoch": 0.62, "learning_rate": 0.00026946140145864413, "loss": 1.6102, "step": 7882 }, { "epoch": 0.62, "learning_rate": 0.00026945392641670876, "loss": 1.6736, "step": 7883 }, { "epoch": 0.62, "learning_rate": 0.00026944645056374724, "loss": 1.6409, "step": 7884 }, { "epoch": 0.62, "learning_rate": 0.0002694389738998102, "loss": 1.6954, "step": 7885 }, { "epoch": 0.62, "learning_rate": 0.0002694314964249484, "loss": 1.6533, "step": 7886 }, { "epoch": 0.62, "learning_rate": 0.0002694240181392126, "loss": 1.674, "step": 7887 }, { "epoch": 0.62, "learning_rate": 0.00026941653904265374, "loss": 1.6555, "step": 7888 }, { "epoch": 0.62, "learning_rate": 0.0002694090591353224, "loss": 1.6473, "step": 7889 }, { "epoch": 0.62, "learning_rate": 0.0002694015784172695, "loss": 1.6539, "step": 7890 }, { "epoch": 0.62, "learning_rate": 0.00026939409688854575, "loss": 1.6771, "step": 7891 }, { "epoch": 0.62, "learning_rate": 0.000269386614549202, "loss": 1.6686, "step": 7892 }, { "epoch": 0.62, "learning_rate": 0.000269379131399289, "loss": 1.6812, "step": 7893 }, { "epoch": 0.62, "learning_rate": 0.00026937164743885754, "loss": 1.6667, "step": 7894 }, { "epoch": 0.62, "learning_rate": 0.0002693641626679585, "loss": 1.6442, "step": 7895 }, { "epoch": 0.62, "learning_rate": 0.00026935667708664267, "loss": 1.686, "step": 7896 }, { "epoch": 0.62, "learning_rate": 0.00026934919069496085, "loss": 1.7095, "step": 7897 }, { "epoch": 0.62, "learning_rate": 0.0002693417034929639, "loss": 1.6472, "step": 7898 }, { "epoch": 0.62, "learning_rate": 0.00026933421548070265, "loss": 1.6792, "step": 7899 }, { "epoch": 0.62, "learning_rate": 0.0002693267266582279, "loss": 1.7338, "step": 7900 }, { "epoch": 0.62, "learning_rate": 0.0002693192370255905, "loss": 1.8002, "step": 7901 }, { "epoch": 0.62, "learning_rate": 0.0002693117465828414, "loss": 1.6385, "step": 7902 }, { "epoch": 0.62, "learning_rate": 0.00026930425533003136, "loss": 1.6931, "step": 7903 }, { "epoch": 0.62, "learning_rate": 0.00026929676326721124, "loss": 1.6821, "step": 7904 }, { "epoch": 0.62, "learning_rate": 0.00026928927039443197, "loss": 1.6751, "step": 7905 }, { "epoch": 0.62, "learning_rate": 0.00026928177671174436, "loss": 1.6336, "step": 7906 }, { "epoch": 0.62, "learning_rate": 0.0002692742822191993, "loss": 1.6661, "step": 7907 }, { "epoch": 0.62, "learning_rate": 0.0002692667869168477, "loss": 1.6494, "step": 7908 }, { "epoch": 0.62, "learning_rate": 0.00026925929080474047, "loss": 1.6953, "step": 7909 }, { "epoch": 0.62, "learning_rate": 0.0002692517938829284, "loss": 1.6734, "step": 7910 }, { "epoch": 0.62, "learning_rate": 0.0002692442961514625, "loss": 1.7193, "step": 7911 }, { "epoch": 0.62, "learning_rate": 0.0002692367976103936, "loss": 1.6322, "step": 7912 }, { "epoch": 0.62, "learning_rate": 0.0002692292982597726, "loss": 1.5961, "step": 7913 }, { "epoch": 0.62, "learning_rate": 0.0002692217980996506, "loss": 1.6965, "step": 7914 }, { "epoch": 0.62, "learning_rate": 0.0002692142971300783, "loss": 1.6774, "step": 7915 }, { "epoch": 0.62, "learning_rate": 0.0002692067953511067, "loss": 1.6905, "step": 7916 }, { "epoch": 0.62, "learning_rate": 0.0002691992927627868, "loss": 1.7207, "step": 7917 }, { "epoch": 0.62, "learning_rate": 0.0002691917893651694, "loss": 1.7294, "step": 7918 }, { "epoch": 0.62, "learning_rate": 0.00026918428515830555, "loss": 1.7074, "step": 7919 }, { "epoch": 0.62, "learning_rate": 0.0002691767801422462, "loss": 1.7388, "step": 7920 }, { "epoch": 0.62, "learning_rate": 0.0002691692743170423, "loss": 1.7046, "step": 7921 }, { "epoch": 0.62, "learning_rate": 0.0002691617676827448, "loss": 1.6875, "step": 7922 }, { "epoch": 0.62, "learning_rate": 0.0002691542602394046, "loss": 1.705, "step": 7923 }, { "epoch": 0.62, "learning_rate": 0.00026914675198707276, "loss": 1.6737, "step": 7924 }, { "epoch": 0.62, "learning_rate": 0.0002691392429258002, "loss": 1.6599, "step": 7925 }, { "epoch": 0.62, "learning_rate": 0.00026913173305563793, "loss": 1.6479, "step": 7926 }, { "epoch": 0.62, "learning_rate": 0.000269124222376637, "loss": 1.7129, "step": 7927 }, { "epoch": 0.62, "learning_rate": 0.00026911671088884824, "loss": 1.6592, "step": 7928 }, { "epoch": 0.62, "learning_rate": 0.0002691091985923228, "loss": 1.646, "step": 7929 }, { "epoch": 0.62, "learning_rate": 0.00026910168548711157, "loss": 1.6659, "step": 7930 }, { "epoch": 0.62, "learning_rate": 0.00026909417157326574, "loss": 1.6579, "step": 7931 }, { "epoch": 0.62, "learning_rate": 0.0002690866568508361, "loss": 1.6447, "step": 7932 }, { "epoch": 0.62, "learning_rate": 0.00026907914131987386, "loss": 1.6983, "step": 7933 }, { "epoch": 0.62, "learning_rate": 0.00026907162498042994, "loss": 1.674, "step": 7934 }, { "epoch": 0.62, "learning_rate": 0.00026906410783255534, "loss": 1.7435, "step": 7935 }, { "epoch": 0.62, "learning_rate": 0.00026905658987630117, "loss": 1.6837, "step": 7936 }, { "epoch": 0.62, "learning_rate": 0.0002690490711117185, "loss": 1.6758, "step": 7937 }, { "epoch": 0.62, "learning_rate": 0.0002690415515388583, "loss": 1.6396, "step": 7938 }, { "epoch": 0.62, "learning_rate": 0.0002690340311577717, "loss": 1.7036, "step": 7939 }, { "epoch": 0.62, "learning_rate": 0.00026902650996850965, "loss": 1.6679, "step": 7940 }, { "epoch": 0.62, "learning_rate": 0.0002690189879711233, "loss": 1.7178, "step": 7941 }, { "epoch": 0.62, "learning_rate": 0.00026901146516566374, "loss": 1.7402, "step": 7942 }, { "epoch": 0.62, "learning_rate": 0.00026900394155218195, "loss": 1.6485, "step": 7943 }, { "epoch": 0.63, "learning_rate": 0.0002689964171307291, "loss": 1.6952, "step": 7944 }, { "epoch": 0.63, "learning_rate": 0.00026898889190135627, "loss": 1.6555, "step": 7945 }, { "epoch": 0.63, "learning_rate": 0.00026898136586411456, "loss": 1.6018, "step": 7946 }, { "epoch": 0.63, "learning_rate": 0.00026897383901905496, "loss": 1.7018, "step": 7947 }, { "epoch": 0.63, "learning_rate": 0.00026896631136622863, "loss": 1.6841, "step": 7948 }, { "epoch": 0.63, "learning_rate": 0.00026895878290568675, "loss": 1.6678, "step": 7949 }, { "epoch": 0.63, "learning_rate": 0.0002689512536374804, "loss": 1.6184, "step": 7950 }, { "epoch": 0.63, "learning_rate": 0.0002689437235616606, "loss": 1.7013, "step": 7951 }, { "epoch": 0.63, "learning_rate": 0.00026893619267827866, "loss": 1.7164, "step": 7952 }, { "epoch": 0.63, "learning_rate": 0.0002689286609873855, "loss": 1.7282, "step": 7953 }, { "epoch": 0.63, "learning_rate": 0.00026892112848903244, "loss": 1.6961, "step": 7954 }, { "epoch": 0.63, "learning_rate": 0.00026891359518327047, "loss": 1.6069, "step": 7955 }, { "epoch": 0.63, "learning_rate": 0.0002689060610701509, "loss": 1.7091, "step": 7956 }, { "epoch": 0.63, "learning_rate": 0.00026889852614972475, "loss": 1.6868, "step": 7957 }, { "epoch": 0.63, "learning_rate": 0.00026889099042204324, "loss": 1.6756, "step": 7958 }, { "epoch": 0.63, "learning_rate": 0.0002688834538871575, "loss": 1.7184, "step": 7959 }, { "epoch": 0.63, "learning_rate": 0.0002688759165451187, "loss": 1.6596, "step": 7960 }, { "epoch": 0.63, "learning_rate": 0.00026886837839597803, "loss": 1.6758, "step": 7961 }, { "epoch": 0.63, "learning_rate": 0.00026886083943978667, "loss": 1.6293, "step": 7962 }, { "epoch": 0.63, "learning_rate": 0.0002688532996765958, "loss": 1.6653, "step": 7963 }, { "epoch": 0.63, "learning_rate": 0.0002688457591064566, "loss": 1.6791, "step": 7964 }, { "epoch": 0.63, "learning_rate": 0.0002688382177294203, "loss": 1.6436, "step": 7965 }, { "epoch": 0.63, "learning_rate": 0.00026883067554553814, "loss": 1.6405, "step": 7966 }, { "epoch": 0.63, "learning_rate": 0.0002688231325548612, "loss": 1.6868, "step": 7967 }, { "epoch": 0.63, "learning_rate": 0.0002688155887574408, "loss": 1.6961, "step": 7968 }, { "epoch": 0.63, "learning_rate": 0.00026880804415332807, "loss": 1.6919, "step": 7969 }, { "epoch": 0.63, "learning_rate": 0.00026880049874257423, "loss": 1.647, "step": 7970 }, { "epoch": 0.63, "learning_rate": 0.0002687929525252307, "loss": 1.7107, "step": 7971 }, { "epoch": 0.63, "learning_rate": 0.0002687854055013485, "loss": 1.6925, "step": 7972 }, { "epoch": 0.63, "learning_rate": 0.000268777857670979, "loss": 1.6872, "step": 7973 }, { "epoch": 0.63, "learning_rate": 0.00026877030903417335, "loss": 1.7126, "step": 7974 }, { "epoch": 0.63, "learning_rate": 0.00026876275959098286, "loss": 1.6558, "step": 7975 }, { "epoch": 0.63, "learning_rate": 0.00026875520934145874, "loss": 1.7005, "step": 7976 }, { "epoch": 0.63, "learning_rate": 0.00026874765828565234, "loss": 1.6815, "step": 7977 }, { "epoch": 0.63, "learning_rate": 0.0002687401064236148, "loss": 1.6932, "step": 7978 }, { "epoch": 0.63, "learning_rate": 0.0002687325537553975, "loss": 1.6381, "step": 7979 }, { "epoch": 0.63, "learning_rate": 0.0002687250002810517, "loss": 1.6071, "step": 7980 }, { "epoch": 0.63, "learning_rate": 0.00026871744600062865, "loss": 1.6768, "step": 7981 }, { "epoch": 0.63, "learning_rate": 0.0002687098909141797, "loss": 1.6963, "step": 7982 }, { "epoch": 0.63, "learning_rate": 0.00026870233502175605, "loss": 1.6512, "step": 7983 }, { "epoch": 0.63, "learning_rate": 0.000268694778323409, "loss": 1.6491, "step": 7984 }, { "epoch": 0.63, "learning_rate": 0.00026868722081919, "loss": 1.6878, "step": 7985 }, { "epoch": 0.63, "learning_rate": 0.0002686796625091502, "loss": 1.673, "step": 7986 }, { "epoch": 0.63, "learning_rate": 0.00026867210339334105, "loss": 1.6792, "step": 7987 }, { "epoch": 0.63, "learning_rate": 0.0002686645434718138, "loss": 1.6862, "step": 7988 }, { "epoch": 0.63, "learning_rate": 0.00026865698274461977, "loss": 1.6718, "step": 7989 }, { "epoch": 0.63, "learning_rate": 0.00026864942121181026, "loss": 1.661, "step": 7990 }, { "epoch": 0.63, "learning_rate": 0.0002686418588734367, "loss": 1.6575, "step": 7991 }, { "epoch": 0.63, "learning_rate": 0.00026863429572955035, "loss": 1.7183, "step": 7992 }, { "epoch": 0.63, "learning_rate": 0.0002686267317802026, "loss": 1.7032, "step": 7993 }, { "epoch": 0.63, "learning_rate": 0.0002686191670254449, "loss": 1.6925, "step": 7994 }, { "epoch": 0.63, "learning_rate": 0.0002686116014653285, "loss": 1.6807, "step": 7995 }, { "epoch": 0.63, "learning_rate": 0.0002686040350999047, "loss": 1.689, "step": 7996 }, { "epoch": 0.63, "learning_rate": 0.00026859646792922495, "loss": 1.7119, "step": 7997 }, { "epoch": 0.63, "learning_rate": 0.0002685888999533407, "loss": 1.6868, "step": 7998 }, { "epoch": 0.63, "learning_rate": 0.00026858133117230317, "loss": 1.7426, "step": 7999 }, { "epoch": 0.63, "learning_rate": 0.0002685737615861639, "loss": 1.6945, "step": 8000 }, { "epoch": 0.63, "learning_rate": 0.00026856619119497427, "loss": 1.6439, "step": 8001 }, { "epoch": 0.63, "learning_rate": 0.00026855861999878556, "loss": 1.722, "step": 8002 }, { "epoch": 0.63, "learning_rate": 0.00026855104799764927, "loss": 1.7296, "step": 8003 }, { "epoch": 0.63, "learning_rate": 0.0002685434751916168, "loss": 1.6209, "step": 8004 }, { "epoch": 0.63, "learning_rate": 0.0002685359015807395, "loss": 1.6897, "step": 8005 }, { "epoch": 0.63, "learning_rate": 0.0002685283271650689, "loss": 1.7329, "step": 8006 }, { "epoch": 0.63, "learning_rate": 0.00026852075194465635, "loss": 1.6984, "step": 8007 }, { "epoch": 0.63, "learning_rate": 0.0002685131759195533, "loss": 1.6564, "step": 8008 }, { "epoch": 0.63, "learning_rate": 0.00026850559908981117, "loss": 1.7169, "step": 8009 }, { "epoch": 0.63, "learning_rate": 0.0002684980214554814, "loss": 1.6742, "step": 8010 }, { "epoch": 0.63, "learning_rate": 0.0002684904430166155, "loss": 1.6893, "step": 8011 }, { "epoch": 0.63, "learning_rate": 0.0002684828637732649, "loss": 1.6508, "step": 8012 }, { "epoch": 0.63, "learning_rate": 0.000268475283725481, "loss": 1.6691, "step": 8013 }, { "epoch": 0.63, "learning_rate": 0.0002684677028733153, "loss": 1.7192, "step": 8014 }, { "epoch": 0.63, "learning_rate": 0.0002684601212168193, "loss": 1.6655, "step": 8015 }, { "epoch": 0.63, "learning_rate": 0.0002684525387560444, "loss": 1.6709, "step": 8016 }, { "epoch": 0.63, "learning_rate": 0.00026844495549104214, "loss": 1.7078, "step": 8017 }, { "epoch": 0.63, "learning_rate": 0.00026843737142186403, "loss": 1.717, "step": 8018 }, { "epoch": 0.63, "learning_rate": 0.0002684297865485615, "loss": 1.6707, "step": 8019 }, { "epoch": 0.63, "learning_rate": 0.0002684222008711861, "loss": 1.6902, "step": 8020 }, { "epoch": 0.63, "learning_rate": 0.00026841461438978934, "loss": 1.6427, "step": 8021 }, { "epoch": 0.63, "learning_rate": 0.0002684070271044226, "loss": 1.6507, "step": 8022 }, { "epoch": 0.63, "learning_rate": 0.00026839943901513756, "loss": 1.6883, "step": 8023 }, { "epoch": 0.63, "learning_rate": 0.00026839185012198565, "loss": 1.6779, "step": 8024 }, { "epoch": 0.63, "learning_rate": 0.0002683842604250184, "loss": 1.6883, "step": 8025 }, { "epoch": 0.63, "learning_rate": 0.00026837666992428734, "loss": 1.709, "step": 8026 }, { "epoch": 0.63, "learning_rate": 0.00026836907861984405, "loss": 1.6425, "step": 8027 }, { "epoch": 0.63, "learning_rate": 0.00026836148651174, "loss": 1.6228, "step": 8028 }, { "epoch": 0.63, "learning_rate": 0.0002683538936000268, "loss": 1.6381, "step": 8029 }, { "epoch": 0.63, "learning_rate": 0.000268346299884756, "loss": 1.6916, "step": 8030 }, { "epoch": 0.63, "learning_rate": 0.00026833870536597913, "loss": 1.6401, "step": 8031 }, { "epoch": 0.63, "learning_rate": 0.00026833111004374773, "loss": 1.6433, "step": 8032 }, { "epoch": 0.63, "learning_rate": 0.00026832351391811336, "loss": 1.7554, "step": 8033 }, { "epoch": 0.63, "learning_rate": 0.0002683159169891277, "loss": 1.6828, "step": 8034 }, { "epoch": 0.63, "learning_rate": 0.00026830831925684224, "loss": 1.669, "step": 8035 }, { "epoch": 0.63, "learning_rate": 0.0002683007207213085, "loss": 1.6838, "step": 8036 }, { "epoch": 0.63, "learning_rate": 0.0002682931213825782, "loss": 1.6407, "step": 8037 }, { "epoch": 0.63, "learning_rate": 0.0002682855212407029, "loss": 1.6445, "step": 8038 }, { "epoch": 0.63, "learning_rate": 0.0002682779202957342, "loss": 1.7145, "step": 8039 }, { "epoch": 0.63, "learning_rate": 0.00026827031854772366, "loss": 1.6482, "step": 8040 }, { "epoch": 0.63, "learning_rate": 0.0002682627159967229, "loss": 1.6455, "step": 8041 }, { "epoch": 0.63, "learning_rate": 0.0002682551126427836, "loss": 1.6741, "step": 8042 }, { "epoch": 0.63, "learning_rate": 0.0002682475084859574, "loss": 1.7201, "step": 8043 }, { "epoch": 0.63, "learning_rate": 0.0002682399035262958, "loss": 1.688, "step": 8044 }, { "epoch": 0.63, "learning_rate": 0.0002682322977638505, "loss": 1.6639, "step": 8045 }, { "epoch": 0.63, "learning_rate": 0.0002682246911986732, "loss": 1.6863, "step": 8046 }, { "epoch": 0.63, "learning_rate": 0.0002682170838308154, "loss": 1.6544, "step": 8047 }, { "epoch": 0.63, "learning_rate": 0.0002682094756603289, "loss": 1.6814, "step": 8048 }, { "epoch": 0.63, "learning_rate": 0.0002682018666872653, "loss": 1.6869, "step": 8049 }, { "epoch": 0.63, "learning_rate": 0.00026819425691167626, "loss": 1.714, "step": 8050 }, { "epoch": 0.63, "learning_rate": 0.0002681866463336134, "loss": 1.6934, "step": 8051 }, { "epoch": 0.63, "learning_rate": 0.00026817903495312845, "loss": 1.632, "step": 8052 }, { "epoch": 0.63, "learning_rate": 0.00026817142277027305, "loss": 1.6972, "step": 8053 }, { "epoch": 0.63, "learning_rate": 0.0002681638097850989, "loss": 1.6909, "step": 8054 }, { "epoch": 0.63, "learning_rate": 0.00026815619599765775, "loss": 1.6625, "step": 8055 }, { "epoch": 0.63, "learning_rate": 0.0002681485814080011, "loss": 1.5984, "step": 8056 }, { "epoch": 0.63, "learning_rate": 0.00026814096601618094, "loss": 1.6554, "step": 8057 }, { "epoch": 0.63, "learning_rate": 0.00026813334982224874, "loss": 1.6908, "step": 8058 }, { "epoch": 0.63, "learning_rate": 0.0002681257328262563, "loss": 1.6707, "step": 8059 }, { "epoch": 0.63, "learning_rate": 0.00026811811502825534, "loss": 1.7074, "step": 8060 }, { "epoch": 0.63, "learning_rate": 0.0002681104964282975, "loss": 1.6452, "step": 8061 }, { "epoch": 0.63, "learning_rate": 0.00026810287702643465, "loss": 1.7012, "step": 8062 }, { "epoch": 0.63, "learning_rate": 0.0002680952568227184, "loss": 1.6252, "step": 8063 }, { "epoch": 0.63, "learning_rate": 0.0002680876358172005, "loss": 1.6627, "step": 8064 }, { "epoch": 0.63, "learning_rate": 0.0002680800140099328, "loss": 1.6289, "step": 8065 }, { "epoch": 0.63, "learning_rate": 0.00026807239140096687, "loss": 1.6608, "step": 8066 }, { "epoch": 0.63, "learning_rate": 0.00026806476799035457, "loss": 1.7209, "step": 8067 }, { "epoch": 0.63, "learning_rate": 0.0002680571437781477, "loss": 1.6477, "step": 8068 }, { "epoch": 0.63, "learning_rate": 0.00026804951876439794, "loss": 1.7136, "step": 8069 }, { "epoch": 0.63, "learning_rate": 0.0002680418929491571, "loss": 1.6526, "step": 8070 }, { "epoch": 0.64, "learning_rate": 0.00026803426633247696, "loss": 1.6023, "step": 8071 }, { "epoch": 0.64, "learning_rate": 0.00026802663891440927, "loss": 1.6697, "step": 8072 }, { "epoch": 0.64, "learning_rate": 0.00026801901069500584, "loss": 1.6448, "step": 8073 }, { "epoch": 0.64, "learning_rate": 0.00026801138167431847, "loss": 1.6497, "step": 8074 }, { "epoch": 0.64, "learning_rate": 0.00026800375185239897, "loss": 1.7163, "step": 8075 }, { "epoch": 0.64, "learning_rate": 0.00026799612122929906, "loss": 1.6562, "step": 8076 }, { "epoch": 0.64, "learning_rate": 0.0002679884898050706, "loss": 1.6522, "step": 8077 }, { "epoch": 0.64, "learning_rate": 0.00026798085757976547, "loss": 1.6682, "step": 8078 }, { "epoch": 0.64, "learning_rate": 0.0002679732245534354, "loss": 1.7205, "step": 8079 }, { "epoch": 0.64, "learning_rate": 0.00026796559072613213, "loss": 1.6988, "step": 8080 }, { "epoch": 0.64, "learning_rate": 0.00026795795609790775, "loss": 1.6689, "step": 8081 }, { "epoch": 0.64, "learning_rate": 0.00026795032066881386, "loss": 1.7073, "step": 8082 }, { "epoch": 0.64, "learning_rate": 0.00026794268443890244, "loss": 1.6581, "step": 8083 }, { "epoch": 0.64, "learning_rate": 0.0002679350474082252, "loss": 1.6882, "step": 8084 }, { "epoch": 0.64, "learning_rate": 0.0002679274095768341, "loss": 1.6925, "step": 8085 }, { "epoch": 0.64, "learning_rate": 0.000267919770944781, "loss": 1.7519, "step": 8086 }, { "epoch": 0.64, "learning_rate": 0.0002679121315121177, "loss": 1.6465, "step": 8087 }, { "epoch": 0.64, "learning_rate": 0.0002679044912788961, "loss": 1.6788, "step": 8088 }, { "epoch": 0.64, "learning_rate": 0.0002678968502451681, "loss": 1.6597, "step": 8089 }, { "epoch": 0.64, "learning_rate": 0.0002678892084109855, "loss": 1.6476, "step": 8090 }, { "epoch": 0.64, "learning_rate": 0.00026788156577640026, "loss": 1.6792, "step": 8091 }, { "epoch": 0.64, "learning_rate": 0.00026787392234146423, "loss": 1.631, "step": 8092 }, { "epoch": 0.64, "learning_rate": 0.0002678662781062293, "loss": 1.7074, "step": 8093 }, { "epoch": 0.64, "learning_rate": 0.0002678586330707474, "loss": 1.685, "step": 8094 }, { "epoch": 0.64, "learning_rate": 0.0002678509872350704, "loss": 1.6629, "step": 8095 }, { "epoch": 0.64, "learning_rate": 0.0002678433405992503, "loss": 1.644, "step": 8096 }, { "epoch": 0.64, "learning_rate": 0.00026783569316333886, "loss": 1.6092, "step": 8097 }, { "epoch": 0.64, "learning_rate": 0.0002678280449273882, "loss": 1.7022, "step": 8098 }, { "epoch": 0.64, "learning_rate": 0.00026782039589145004, "loss": 1.6751, "step": 8099 }, { "epoch": 0.64, "learning_rate": 0.00026781274605557645, "loss": 1.6853, "step": 8100 }, { "epoch": 0.64, "learning_rate": 0.0002678050954198193, "loss": 1.6191, "step": 8101 }, { "epoch": 0.64, "learning_rate": 0.00026779744398423063, "loss": 1.6612, "step": 8102 }, { "epoch": 0.64, "learning_rate": 0.00026778979174886227, "loss": 1.6861, "step": 8103 }, { "epoch": 0.64, "learning_rate": 0.0002677821387137662, "loss": 1.6706, "step": 8104 }, { "epoch": 0.64, "learning_rate": 0.00026777448487899446, "loss": 1.6572, "step": 8105 }, { "epoch": 0.64, "learning_rate": 0.00026776683024459894, "loss": 1.6829, "step": 8106 }, { "epoch": 0.64, "learning_rate": 0.00026775917481063164, "loss": 1.7045, "step": 8107 }, { "epoch": 0.64, "learning_rate": 0.0002677515185771445, "loss": 1.6156, "step": 8108 }, { "epoch": 0.64, "learning_rate": 0.00026774386154418953, "loss": 1.6785, "step": 8109 }, { "epoch": 0.64, "learning_rate": 0.00026773620371181876, "loss": 1.6452, "step": 8110 }, { "epoch": 0.64, "learning_rate": 0.0002677285450800841, "loss": 1.672, "step": 8111 }, { "epoch": 0.64, "learning_rate": 0.0002677208856490376, "loss": 1.624, "step": 8112 }, { "epoch": 0.64, "learning_rate": 0.00026771322541873125, "loss": 1.6388, "step": 8113 }, { "epoch": 0.64, "learning_rate": 0.0002677055643892171, "loss": 1.616, "step": 8114 }, { "epoch": 0.64, "learning_rate": 0.0002676979025605471, "loss": 1.6454, "step": 8115 }, { "epoch": 0.64, "learning_rate": 0.00026769023993277325, "loss": 1.7039, "step": 8116 }, { "epoch": 0.64, "learning_rate": 0.0002676825765059476, "loss": 1.7104, "step": 8117 }, { "epoch": 0.64, "learning_rate": 0.0002676749122801223, "loss": 1.6562, "step": 8118 }, { "epoch": 0.64, "learning_rate": 0.0002676672472553492, "loss": 1.6751, "step": 8119 }, { "epoch": 0.64, "learning_rate": 0.0002676595814316805, "loss": 1.711, "step": 8120 }, { "epoch": 0.64, "learning_rate": 0.0002676519148091681, "loss": 1.6443, "step": 8121 }, { "epoch": 0.64, "learning_rate": 0.0002676442473878641, "loss": 1.6957, "step": 8122 }, { "epoch": 0.64, "learning_rate": 0.00026763657916782066, "loss": 1.6643, "step": 8123 }, { "epoch": 0.64, "learning_rate": 0.00026762891014908973, "loss": 1.6219, "step": 8124 }, { "epoch": 0.64, "learning_rate": 0.0002676212403317234, "loss": 1.6676, "step": 8125 }, { "epoch": 0.64, "learning_rate": 0.0002676135697157738, "loss": 1.6797, "step": 8126 }, { "epoch": 0.64, "learning_rate": 0.0002676058983012929, "loss": 1.6985, "step": 8127 }, { "epoch": 0.64, "learning_rate": 0.0002675982260883329, "loss": 1.7225, "step": 8128 }, { "epoch": 0.64, "learning_rate": 0.00026759055307694585, "loss": 1.7174, "step": 8129 }, { "epoch": 0.64, "learning_rate": 0.00026758287926718384, "loss": 1.6862, "step": 8130 }, { "epoch": 0.64, "learning_rate": 0.0002675752046590989, "loss": 1.6954, "step": 8131 }, { "epoch": 0.64, "learning_rate": 0.00026756752925274327, "loss": 1.6927, "step": 8132 }, { "epoch": 0.64, "learning_rate": 0.000267559853048169, "loss": 1.6237, "step": 8133 }, { "epoch": 0.64, "learning_rate": 0.00026755217604542813, "loss": 1.6414, "step": 8134 }, { "epoch": 0.64, "learning_rate": 0.0002675444982445729, "loss": 1.6172, "step": 8135 }, { "epoch": 0.64, "learning_rate": 0.0002675368196456554, "loss": 1.7271, "step": 8136 }, { "epoch": 0.64, "learning_rate": 0.0002675291402487278, "loss": 1.6144, "step": 8137 }, { "epoch": 0.64, "learning_rate": 0.00026752146005384214, "loss": 1.666, "step": 8138 }, { "epoch": 0.64, "learning_rate": 0.0002675137790610506, "loss": 1.7447, "step": 8139 }, { "epoch": 0.64, "learning_rate": 0.0002675060972704054, "loss": 1.7418, "step": 8140 }, { "epoch": 0.64, "learning_rate": 0.0002674984146819586, "loss": 1.6182, "step": 8141 }, { "epoch": 0.64, "learning_rate": 0.00026749073129576245, "loss": 1.6027, "step": 8142 }, { "epoch": 0.64, "learning_rate": 0.00026748304711186904, "loss": 1.7185, "step": 8143 }, { "epoch": 0.64, "learning_rate": 0.0002674753621303306, "loss": 1.6619, "step": 8144 }, { "epoch": 0.64, "learning_rate": 0.00026746767635119924, "loss": 1.6, "step": 8145 }, { "epoch": 0.64, "learning_rate": 0.0002674599897745272, "loss": 1.686, "step": 8146 }, { "epoch": 0.64, "learning_rate": 0.0002674523024003667, "loss": 1.6941, "step": 8147 }, { "epoch": 0.64, "learning_rate": 0.00026744461422876977, "loss": 1.668, "step": 8148 }, { "epoch": 0.64, "learning_rate": 0.0002674369252597888, "loss": 1.6378, "step": 8149 }, { "epoch": 0.64, "learning_rate": 0.00026742923549347587, "loss": 1.6949, "step": 8150 }, { "epoch": 0.64, "learning_rate": 0.0002674215449298833, "loss": 1.6727, "step": 8151 }, { "epoch": 0.64, "learning_rate": 0.00026741385356906323, "loss": 1.6903, "step": 8152 }, { "epoch": 0.64, "learning_rate": 0.00026740616141106787, "loss": 1.6657, "step": 8153 }, { "epoch": 0.64, "learning_rate": 0.0002673984684559494, "loss": 1.6796, "step": 8154 }, { "epoch": 0.64, "learning_rate": 0.0002673907747037602, "loss": 1.6957, "step": 8155 }, { "epoch": 0.64, "learning_rate": 0.00026738308015455237, "loss": 1.7172, "step": 8156 }, { "epoch": 0.64, "learning_rate": 0.00026737538480837823, "loss": 1.7152, "step": 8157 }, { "epoch": 0.64, "learning_rate": 0.00026736768866529, "loss": 1.6797, "step": 8158 }, { "epoch": 0.64, "learning_rate": 0.0002673599917253399, "loss": 1.6594, "step": 8159 }, { "epoch": 0.64, "learning_rate": 0.0002673522939885803, "loss": 1.6776, "step": 8160 }, { "epoch": 0.64, "learning_rate": 0.0002673445954550633, "loss": 1.6824, "step": 8161 }, { "epoch": 0.64, "learning_rate": 0.0002673368961248413, "loss": 1.6764, "step": 8162 }, { "epoch": 0.64, "learning_rate": 0.0002673291959979665, "loss": 1.6308, "step": 8163 }, { "epoch": 0.64, "learning_rate": 0.0002673214950744912, "loss": 1.6248, "step": 8164 }, { "epoch": 0.64, "learning_rate": 0.0002673137933544677, "loss": 1.6441, "step": 8165 }, { "epoch": 0.64, "learning_rate": 0.0002673060908379483, "loss": 1.6479, "step": 8166 }, { "epoch": 0.64, "learning_rate": 0.00026729838752498526, "loss": 1.6779, "step": 8167 }, { "epoch": 0.64, "learning_rate": 0.00026729068341563094, "loss": 1.6383, "step": 8168 }, { "epoch": 0.64, "learning_rate": 0.00026728297850993755, "loss": 1.6761, "step": 8169 }, { "epoch": 0.64, "learning_rate": 0.0002672752728079575, "loss": 1.6413, "step": 8170 }, { "epoch": 0.64, "learning_rate": 0.00026726756630974304, "loss": 1.6993, "step": 8171 }, { "epoch": 0.64, "learning_rate": 0.0002672598590153466, "loss": 1.6767, "step": 8172 }, { "epoch": 0.64, "learning_rate": 0.0002672521509248203, "loss": 1.6667, "step": 8173 }, { "epoch": 0.64, "learning_rate": 0.00026724444203821666, "loss": 1.6784, "step": 8174 }, { "epoch": 0.64, "learning_rate": 0.0002672367323555879, "loss": 1.6656, "step": 8175 }, { "epoch": 0.64, "learning_rate": 0.00026722902187698656, "loss": 1.6756, "step": 8176 }, { "epoch": 0.64, "learning_rate": 0.00026722131060246475, "loss": 1.656, "step": 8177 }, { "epoch": 0.64, "learning_rate": 0.00026721359853207495, "loss": 1.6413, "step": 8178 }, { "epoch": 0.64, "learning_rate": 0.0002672058856658695, "loss": 1.7307, "step": 8179 }, { "epoch": 0.64, "learning_rate": 0.00026719817200390077, "loss": 1.6537, "step": 8180 }, { "epoch": 0.64, "learning_rate": 0.0002671904575462211, "loss": 1.6717, "step": 8181 }, { "epoch": 0.64, "learning_rate": 0.00026718274229288295, "loss": 1.6689, "step": 8182 }, { "epoch": 0.64, "learning_rate": 0.0002671750262439386, "loss": 1.6661, "step": 8183 }, { "epoch": 0.64, "learning_rate": 0.0002671673093994405, "loss": 1.6373, "step": 8184 }, { "epoch": 0.64, "learning_rate": 0.00026715959175944103, "loss": 1.6083, "step": 8185 }, { "epoch": 0.64, "learning_rate": 0.0002671518733239926, "loss": 1.6498, "step": 8186 }, { "epoch": 0.64, "learning_rate": 0.00026714415409314756, "loss": 1.6772, "step": 8187 }, { "epoch": 0.64, "learning_rate": 0.00026713643406695844, "loss": 1.6516, "step": 8188 }, { "epoch": 0.64, "learning_rate": 0.0002671287132454775, "loss": 1.6847, "step": 8189 }, { "epoch": 0.64, "learning_rate": 0.0002671209916287572, "loss": 1.6567, "step": 8190 }, { "epoch": 0.64, "learning_rate": 0.00026711326921685, "loss": 1.6398, "step": 8191 }, { "epoch": 0.64, "learning_rate": 0.00026710554600980845, "loss": 1.6094, "step": 8192 }, { "epoch": 0.64, "learning_rate": 0.0002670978220076848, "loss": 1.6579, "step": 8193 }, { "epoch": 0.64, "learning_rate": 0.00026709009721053155, "loss": 1.6467, "step": 8194 }, { "epoch": 0.64, "learning_rate": 0.0002670823716184011, "loss": 1.6801, "step": 8195 }, { "epoch": 0.64, "learning_rate": 0.00026707464523134607, "loss": 1.6925, "step": 8196 }, { "epoch": 0.64, "learning_rate": 0.00026706691804941876, "loss": 1.6015, "step": 8197 }, { "epoch": 0.65, "learning_rate": 0.0002670591900726717, "loss": 1.6707, "step": 8198 }, { "epoch": 0.65, "learning_rate": 0.0002670514613011573, "loss": 1.692, "step": 8199 }, { "epoch": 0.65, "learning_rate": 0.0002670437317349281, "loss": 1.6843, "step": 8200 }, { "epoch": 0.65, "learning_rate": 0.00026703600137403653, "loss": 1.6931, "step": 8201 }, { "epoch": 0.65, "learning_rate": 0.0002670282702185351, "loss": 1.6605, "step": 8202 }, { "epoch": 0.65, "learning_rate": 0.00026702053826847626, "loss": 1.7114, "step": 8203 }, { "epoch": 0.65, "learning_rate": 0.0002670128055239126, "loss": 1.738, "step": 8204 }, { "epoch": 0.65, "learning_rate": 0.00026700507198489657, "loss": 1.6886, "step": 8205 }, { "epoch": 0.65, "learning_rate": 0.0002669973376514806, "loss": 1.6997, "step": 8206 }, { "epoch": 0.65, "learning_rate": 0.0002669896025237173, "loss": 1.682, "step": 8207 }, { "epoch": 0.65, "learning_rate": 0.0002669818666016592, "loss": 1.6452, "step": 8208 }, { "epoch": 0.65, "learning_rate": 0.00026697412988535877, "loss": 1.6342, "step": 8209 }, { "epoch": 0.65, "learning_rate": 0.00026696639237486854, "loss": 1.6999, "step": 8210 }, { "epoch": 0.65, "learning_rate": 0.00026695865407024103, "loss": 1.6683, "step": 8211 }, { "epoch": 0.65, "learning_rate": 0.00026695091497152884, "loss": 1.6839, "step": 8212 }, { "epoch": 0.65, "learning_rate": 0.00026694317507878443, "loss": 1.6508, "step": 8213 }, { "epoch": 0.65, "learning_rate": 0.00026693543439206045, "loss": 1.7201, "step": 8214 }, { "epoch": 0.65, "learning_rate": 0.0002669276929114094, "loss": 1.5918, "step": 8215 }, { "epoch": 0.65, "learning_rate": 0.0002669199506368838, "loss": 1.6578, "step": 8216 }, { "epoch": 0.65, "learning_rate": 0.00026691220756853626, "loss": 1.7081, "step": 8217 }, { "epoch": 0.65, "learning_rate": 0.0002669044637064194, "loss": 1.6516, "step": 8218 }, { "epoch": 0.65, "learning_rate": 0.00026689671905058565, "loss": 1.659, "step": 8219 }, { "epoch": 0.65, "learning_rate": 0.0002668889736010878, "loss": 1.7127, "step": 8220 }, { "epoch": 0.65, "learning_rate": 0.00026688122735797826, "loss": 1.6691, "step": 8221 }, { "epoch": 0.65, "learning_rate": 0.0002668734803213097, "loss": 1.657, "step": 8222 }, { "epoch": 0.65, "learning_rate": 0.00026686573249113467, "loss": 1.6452, "step": 8223 }, { "epoch": 0.65, "learning_rate": 0.0002668579838675058, "loss": 1.6932, "step": 8224 }, { "epoch": 0.65, "learning_rate": 0.0002668502344504758, "loss": 1.6244, "step": 8225 }, { "epoch": 0.65, "learning_rate": 0.0002668424842400971, "loss": 1.6358, "step": 8226 }, { "epoch": 0.65, "learning_rate": 0.00026683473323642245, "loss": 1.7188, "step": 8227 }, { "epoch": 0.65, "learning_rate": 0.00026682698143950444, "loss": 1.6375, "step": 8228 }, { "epoch": 0.65, "learning_rate": 0.0002668192288493957, "loss": 1.6967, "step": 8229 }, { "epoch": 0.65, "learning_rate": 0.0002668114754661488, "loss": 1.619, "step": 8230 }, { "epoch": 0.65, "learning_rate": 0.00026680372128981653, "loss": 1.6935, "step": 8231 }, { "epoch": 0.65, "learning_rate": 0.0002667959663204514, "loss": 1.7059, "step": 8232 }, { "epoch": 0.65, "learning_rate": 0.00026678821055810617, "loss": 1.677, "step": 8233 }, { "epoch": 0.65, "learning_rate": 0.00026678045400283336, "loss": 1.6652, "step": 8234 }, { "epoch": 0.65, "learning_rate": 0.00026677269665468573, "loss": 1.7097, "step": 8235 }, { "epoch": 0.65, "learning_rate": 0.00026676493851371597, "loss": 1.6849, "step": 8236 }, { "epoch": 0.65, "learning_rate": 0.0002667571795799767, "loss": 1.7036, "step": 8237 }, { "epoch": 0.65, "learning_rate": 0.0002667494198535206, "loss": 1.7169, "step": 8238 }, { "epoch": 0.65, "learning_rate": 0.0002667416593344004, "loss": 1.6571, "step": 8239 }, { "epoch": 0.65, "learning_rate": 0.0002667338980226687, "loss": 1.6894, "step": 8240 }, { "epoch": 0.65, "learning_rate": 0.0002667261359183783, "loss": 1.724, "step": 8241 }, { "epoch": 0.65, "learning_rate": 0.00026671837302158177, "loss": 1.6543, "step": 8242 }, { "epoch": 0.65, "learning_rate": 0.000266710609332332, "loss": 1.6437, "step": 8243 }, { "epoch": 0.65, "learning_rate": 0.00026670284485068156, "loss": 1.6967, "step": 8244 }, { "epoch": 0.65, "learning_rate": 0.0002666950795766832, "loss": 1.6781, "step": 8245 }, { "epoch": 0.65, "learning_rate": 0.0002666873135103896, "loss": 1.6893, "step": 8246 }, { "epoch": 0.65, "learning_rate": 0.00026667954665185364, "loss": 1.6667, "step": 8247 }, { "epoch": 0.65, "learning_rate": 0.0002666717790011279, "loss": 1.6942, "step": 8248 }, { "epoch": 0.65, "learning_rate": 0.00026666401055826515, "loss": 1.7053, "step": 8249 }, { "epoch": 0.65, "learning_rate": 0.00026665624132331814, "loss": 1.6618, "step": 8250 }, { "epoch": 0.65, "learning_rate": 0.00026664847129633965, "loss": 1.6438, "step": 8251 }, { "epoch": 0.65, "learning_rate": 0.00026664070047738243, "loss": 1.6746, "step": 8252 }, { "epoch": 0.65, "learning_rate": 0.00026663292886649917, "loss": 1.6481, "step": 8253 }, { "epoch": 0.65, "learning_rate": 0.0002666251564637427, "loss": 1.6858, "step": 8254 }, { "epoch": 0.65, "learning_rate": 0.00026661738326916583, "loss": 1.6369, "step": 8255 }, { "epoch": 0.65, "learning_rate": 0.00026660960928282125, "loss": 1.6336, "step": 8256 }, { "epoch": 0.65, "learning_rate": 0.0002666018345047618, "loss": 1.6357, "step": 8257 }, { "epoch": 0.65, "learning_rate": 0.00026659405893504016, "loss": 1.6644, "step": 8258 }, { "epoch": 0.65, "learning_rate": 0.00026658628257370925, "loss": 1.7026, "step": 8259 }, { "epoch": 0.65, "learning_rate": 0.0002665785054208218, "loss": 1.662, "step": 8260 }, { "epoch": 0.65, "learning_rate": 0.00026657072747643065, "loss": 1.6901, "step": 8261 }, { "epoch": 0.65, "learning_rate": 0.00026656294874058856, "loss": 1.6461, "step": 8262 }, { "epoch": 0.65, "learning_rate": 0.00026655516921334844, "loss": 1.6739, "step": 8263 }, { "epoch": 0.65, "learning_rate": 0.000266547388894763, "loss": 1.6479, "step": 8264 }, { "epoch": 0.65, "learning_rate": 0.0002665396077848851, "loss": 1.6645, "step": 8265 }, { "epoch": 0.65, "learning_rate": 0.0002665318258837676, "loss": 1.6764, "step": 8266 }, { "epoch": 0.65, "learning_rate": 0.0002665240431914633, "loss": 1.6517, "step": 8267 }, { "epoch": 0.65, "learning_rate": 0.000266516259708025, "loss": 1.6346, "step": 8268 }, { "epoch": 0.65, "learning_rate": 0.00026650847543350565, "loss": 1.6931, "step": 8269 }, { "epoch": 0.65, "learning_rate": 0.00026650069036795803, "loss": 1.6566, "step": 8270 }, { "epoch": 0.65, "learning_rate": 0.00026649290451143505, "loss": 1.6929, "step": 8271 }, { "epoch": 0.65, "learning_rate": 0.00026648511786398946, "loss": 1.6607, "step": 8272 }, { "epoch": 0.65, "learning_rate": 0.0002664773304256743, "loss": 1.6984, "step": 8273 }, { "epoch": 0.65, "learning_rate": 0.00026646954219654225, "loss": 1.7191, "step": 8274 }, { "epoch": 0.65, "learning_rate": 0.00026646175317664633, "loss": 1.6542, "step": 8275 }, { "epoch": 0.65, "learning_rate": 0.0002664539633660394, "loss": 1.6725, "step": 8276 }, { "epoch": 0.65, "learning_rate": 0.00026644617276477426, "loss": 1.6721, "step": 8277 }, { "epoch": 0.65, "learning_rate": 0.0002664383813729039, "loss": 1.6389, "step": 8278 }, { "epoch": 0.65, "learning_rate": 0.00026643058919048113, "loss": 1.6802, "step": 8279 }, { "epoch": 0.65, "learning_rate": 0.000266422796217559, "loss": 1.6876, "step": 8280 }, { "epoch": 0.65, "learning_rate": 0.00026641500245419027, "loss": 1.6566, "step": 8281 }, { "epoch": 0.65, "learning_rate": 0.0002664072079004279, "loss": 1.6901, "step": 8282 }, { "epoch": 0.65, "learning_rate": 0.0002663994125563249, "loss": 1.6545, "step": 8283 }, { "epoch": 0.65, "learning_rate": 0.0002663916164219341, "loss": 1.7002, "step": 8284 }, { "epoch": 0.65, "learning_rate": 0.0002663838194973085, "loss": 1.6741, "step": 8285 }, { "epoch": 0.65, "learning_rate": 0.0002663760217825009, "loss": 1.6725, "step": 8286 }, { "epoch": 0.65, "learning_rate": 0.00026636822327756436, "loss": 1.6481, "step": 8287 }, { "epoch": 0.65, "learning_rate": 0.0002663604239825518, "loss": 1.662, "step": 8288 }, { "epoch": 0.65, "learning_rate": 0.0002663526238975162, "loss": 1.6934, "step": 8289 }, { "epoch": 0.65, "learning_rate": 0.00026634482302251045, "loss": 1.707, "step": 8290 }, { "epoch": 0.65, "learning_rate": 0.00026633702135758764, "loss": 1.6548, "step": 8291 }, { "epoch": 0.65, "learning_rate": 0.00026632921890280055, "loss": 1.6764, "step": 8292 }, { "epoch": 0.65, "learning_rate": 0.00026632141565820233, "loss": 1.7329, "step": 8293 }, { "epoch": 0.65, "learning_rate": 0.00026631361162384587, "loss": 1.6493, "step": 8294 }, { "epoch": 0.65, "learning_rate": 0.00026630580679978415, "loss": 1.6163, "step": 8295 }, { "epoch": 0.65, "learning_rate": 0.0002662980011860703, "loss": 1.6172, "step": 8296 }, { "epoch": 0.65, "learning_rate": 0.000266290194782757, "loss": 1.6617, "step": 8297 }, { "epoch": 0.65, "learning_rate": 0.00026628238758989763, "loss": 1.7009, "step": 8298 }, { "epoch": 0.65, "learning_rate": 0.0002662745796075449, "loss": 1.6803, "step": 8299 }, { "epoch": 0.65, "learning_rate": 0.00026626677083575203, "loss": 1.7159, "step": 8300 }, { "epoch": 0.65, "learning_rate": 0.0002662589612745719, "loss": 1.6922, "step": 8301 }, { "epoch": 0.65, "learning_rate": 0.00026625115092405755, "loss": 1.7139, "step": 8302 }, { "epoch": 0.65, "learning_rate": 0.0002662433397842621, "loss": 1.7275, "step": 8303 }, { "epoch": 0.65, "learning_rate": 0.00026623552785523844, "loss": 1.694, "step": 8304 }, { "epoch": 0.65, "learning_rate": 0.0002662277151370398, "loss": 1.6196, "step": 8305 }, { "epoch": 0.65, "learning_rate": 0.00026621990162971907, "loss": 1.6839, "step": 8306 }, { "epoch": 0.65, "learning_rate": 0.0002662120873333293, "loss": 1.634, "step": 8307 }, { "epoch": 0.65, "learning_rate": 0.0002662042722479236, "loss": 1.6394, "step": 8308 }, { "epoch": 0.65, "learning_rate": 0.000266196456373555, "loss": 1.6342, "step": 8309 }, { "epoch": 0.65, "learning_rate": 0.00026618863971027666, "loss": 1.6422, "step": 8310 }, { "epoch": 0.65, "learning_rate": 0.00026618082225814154, "loss": 1.6554, "step": 8311 }, { "epoch": 0.65, "learning_rate": 0.0002661730040172028, "loss": 1.6395, "step": 8312 }, { "epoch": 0.65, "learning_rate": 0.0002661651849875134, "loss": 1.6323, "step": 8313 }, { "epoch": 0.65, "learning_rate": 0.0002661573651691265, "loss": 1.6714, "step": 8314 }, { "epoch": 0.65, "learning_rate": 0.0002661495445620952, "loss": 1.6925, "step": 8315 }, { "epoch": 0.65, "learning_rate": 0.00026614172316647257, "loss": 1.6729, "step": 8316 }, { "epoch": 0.65, "learning_rate": 0.0002661339009823118, "loss": 1.6832, "step": 8317 }, { "epoch": 0.65, "learning_rate": 0.0002661260780096659, "loss": 1.7196, "step": 8318 }, { "epoch": 0.65, "learning_rate": 0.000266118254248588, "loss": 1.6565, "step": 8319 }, { "epoch": 0.65, "learning_rate": 0.0002661104296991312, "loss": 1.6616, "step": 8320 }, { "epoch": 0.65, "learning_rate": 0.00026610260436134867, "loss": 1.6832, "step": 8321 }, { "epoch": 0.65, "learning_rate": 0.0002660947782352936, "loss": 1.704, "step": 8322 }, { "epoch": 0.65, "learning_rate": 0.000266086951321019, "loss": 1.6945, "step": 8323 }, { "epoch": 0.65, "learning_rate": 0.00026607912361857806, "loss": 1.6688, "step": 8324 }, { "epoch": 0.66, "learning_rate": 0.00026607129512802396, "loss": 1.6707, "step": 8325 }, { "epoch": 0.66, "learning_rate": 0.0002660634658494098, "loss": 1.677, "step": 8326 }, { "epoch": 0.66, "learning_rate": 0.00026605563578278873, "loss": 1.6515, "step": 8327 }, { "epoch": 0.66, "learning_rate": 0.0002660478049282139, "loss": 1.7121, "step": 8328 }, { "epoch": 0.66, "learning_rate": 0.00026603997328573866, "loss": 1.6814, "step": 8329 }, { "epoch": 0.66, "learning_rate": 0.00026603214085541596, "loss": 1.6447, "step": 8330 }, { "epoch": 0.66, "learning_rate": 0.000266024307637299, "loss": 1.6488, "step": 8331 }, { "epoch": 0.66, "learning_rate": 0.0002660164736314411, "loss": 1.64, "step": 8332 }, { "epoch": 0.66, "learning_rate": 0.00026600863883789527, "loss": 1.6875, "step": 8333 }, { "epoch": 0.66, "learning_rate": 0.0002660008032567149, "loss": 1.644, "step": 8334 }, { "epoch": 0.66, "learning_rate": 0.00026599296688795305, "loss": 1.6525, "step": 8335 }, { "epoch": 0.66, "learning_rate": 0.00026598512973166296, "loss": 1.6783, "step": 8336 }, { "epoch": 0.66, "learning_rate": 0.00026597729178789786, "loss": 1.6297, "step": 8337 }, { "epoch": 0.66, "learning_rate": 0.0002659694530567109, "loss": 1.611, "step": 8338 }, { "epoch": 0.66, "learning_rate": 0.00026596161353815544, "loss": 1.6489, "step": 8339 }, { "epoch": 0.66, "learning_rate": 0.00026595377323228455, "loss": 1.6518, "step": 8340 }, { "epoch": 0.66, "learning_rate": 0.0002659459321391516, "loss": 1.6658, "step": 8341 }, { "epoch": 0.66, "learning_rate": 0.00026593809025880966, "loss": 1.6804, "step": 8342 }, { "epoch": 0.66, "learning_rate": 0.00026593024759131214, "loss": 1.6402, "step": 8343 }, { "epoch": 0.66, "learning_rate": 0.0002659224041367122, "loss": 1.6935, "step": 8344 }, { "epoch": 0.66, "learning_rate": 0.00026591455989506305, "loss": 1.6597, "step": 8345 }, { "epoch": 0.66, "learning_rate": 0.00026590671486641807, "loss": 1.6823, "step": 8346 }, { "epoch": 0.66, "learning_rate": 0.0002658988690508304, "loss": 1.6248, "step": 8347 }, { "epoch": 0.66, "learning_rate": 0.00026589102244835343, "loss": 1.7245, "step": 8348 }, { "epoch": 0.66, "learning_rate": 0.00026588317505904036, "loss": 1.705, "step": 8349 }, { "epoch": 0.66, "learning_rate": 0.0002658753268829445, "loss": 1.6995, "step": 8350 }, { "epoch": 0.66, "learning_rate": 0.00026586747792011904, "loss": 1.6596, "step": 8351 }, { "epoch": 0.66, "learning_rate": 0.0002658596281706174, "loss": 1.6667, "step": 8352 }, { "epoch": 0.66, "learning_rate": 0.0002658517776344928, "loss": 1.6669, "step": 8353 }, { "epoch": 0.66, "learning_rate": 0.00026584392631179857, "loss": 1.6361, "step": 8354 }, { "epoch": 0.66, "learning_rate": 0.00026583607420258806, "loss": 1.6692, "step": 8355 }, { "epoch": 0.66, "learning_rate": 0.00026582822130691443, "loss": 1.6462, "step": 8356 }, { "epoch": 0.66, "learning_rate": 0.0002658203676248312, "loss": 1.6447, "step": 8357 }, { "epoch": 0.66, "learning_rate": 0.0002658125131563915, "loss": 1.6897, "step": 8358 }, { "epoch": 0.66, "learning_rate": 0.0002658046579016488, "loss": 1.6642, "step": 8359 }, { "epoch": 0.66, "learning_rate": 0.0002657968018606563, "loss": 1.6773, "step": 8360 }, { "epoch": 0.66, "learning_rate": 0.00026578894503346753, "loss": 1.6764, "step": 8361 }, { "epoch": 0.66, "learning_rate": 0.0002657810874201357, "loss": 1.6803, "step": 8362 }, { "epoch": 0.66, "learning_rate": 0.00026577322902071414, "loss": 1.6672, "step": 8363 }, { "epoch": 0.66, "learning_rate": 0.0002657653698352562, "loss": 1.708, "step": 8364 }, { "epoch": 0.66, "learning_rate": 0.0002657575098638154, "loss": 1.601, "step": 8365 }, { "epoch": 0.66, "learning_rate": 0.0002657496491064449, "loss": 1.6324, "step": 8366 }, { "epoch": 0.66, "learning_rate": 0.0002657417875631982, "loss": 1.6419, "step": 8367 }, { "epoch": 0.66, "learning_rate": 0.0002657339252341286, "loss": 1.6322, "step": 8368 }, { "epoch": 0.66, "learning_rate": 0.0002657260621192895, "loss": 1.6176, "step": 8369 }, { "epoch": 0.66, "learning_rate": 0.00026571819821873436, "loss": 1.7038, "step": 8370 }, { "epoch": 0.66, "learning_rate": 0.0002657103335325165, "loss": 1.6628, "step": 8371 }, { "epoch": 0.66, "learning_rate": 0.0002657024680606893, "loss": 1.6557, "step": 8372 }, { "epoch": 0.66, "learning_rate": 0.00026569460180330627, "loss": 1.6243, "step": 8373 }, { "epoch": 0.66, "learning_rate": 0.00026568673476042064, "loss": 1.7109, "step": 8374 }, { "epoch": 0.66, "learning_rate": 0.00026567886693208595, "loss": 1.6681, "step": 8375 }, { "epoch": 0.66, "learning_rate": 0.00026567099831835563, "loss": 1.6751, "step": 8376 }, { "epoch": 0.66, "learning_rate": 0.000265663128919283, "loss": 1.6669, "step": 8377 }, { "epoch": 0.66, "learning_rate": 0.0002656552587349216, "loss": 1.6589, "step": 8378 }, { "epoch": 0.66, "learning_rate": 0.00026564738776532477, "loss": 1.6917, "step": 8379 }, { "epoch": 0.66, "learning_rate": 0.00026563951601054606, "loss": 1.6356, "step": 8380 }, { "epoch": 0.66, "learning_rate": 0.0002656316434706388, "loss": 1.6733, "step": 8381 }, { "epoch": 0.66, "learning_rate": 0.00026562377014565655, "loss": 1.6497, "step": 8382 }, { "epoch": 0.66, "learning_rate": 0.00026561589603565266, "loss": 1.7125, "step": 8383 }, { "epoch": 0.66, "learning_rate": 0.00026560802114068065, "loss": 1.6177, "step": 8384 }, { "epoch": 0.66, "learning_rate": 0.00026560014546079397, "loss": 1.7079, "step": 8385 }, { "epoch": 0.66, "learning_rate": 0.0002655922689960461, "loss": 1.6908, "step": 8386 }, { "epoch": 0.66, "learning_rate": 0.0002655843917464905, "loss": 1.6496, "step": 8387 }, { "epoch": 0.66, "learning_rate": 0.00026557651371218066, "loss": 1.6109, "step": 8388 }, { "epoch": 0.66, "learning_rate": 0.00026556863489317014, "loss": 1.6428, "step": 8389 }, { "epoch": 0.66, "learning_rate": 0.00026556075528951233, "loss": 1.7128, "step": 8390 }, { "epoch": 0.66, "learning_rate": 0.0002655528749012607, "loss": 1.6237, "step": 8391 }, { "epoch": 0.66, "learning_rate": 0.00026554499372846886, "loss": 1.6684, "step": 8392 }, { "epoch": 0.66, "learning_rate": 0.0002655371117711903, "loss": 1.6629, "step": 8393 }, { "epoch": 0.66, "learning_rate": 0.00026552922902947846, "loss": 1.6865, "step": 8394 }, { "epoch": 0.66, "learning_rate": 0.000265521345503387, "loss": 1.7029, "step": 8395 }, { "epoch": 0.66, "learning_rate": 0.0002655134611929692, "loss": 1.7273, "step": 8396 }, { "epoch": 0.66, "learning_rate": 0.0002655055760982789, "loss": 1.6498, "step": 8397 }, { "epoch": 0.66, "learning_rate": 0.0002654976902193694, "loss": 1.6741, "step": 8398 }, { "epoch": 0.66, "learning_rate": 0.00026548980355629436, "loss": 1.648, "step": 8399 }, { "epoch": 0.66, "learning_rate": 0.0002654819161091072, "loss": 1.6668, "step": 8400 }, { "epoch": 0.66, "learning_rate": 0.00026547402787786167, "loss": 1.7155, "step": 8401 }, { "epoch": 0.66, "learning_rate": 0.00026546613886261114, "loss": 1.669, "step": 8402 }, { "epoch": 0.66, "learning_rate": 0.00026545824906340927, "loss": 1.6135, "step": 8403 }, { "epoch": 0.66, "learning_rate": 0.00026545035848030965, "loss": 1.6831, "step": 8404 }, { "epoch": 0.66, "learning_rate": 0.00026544246711336574, "loss": 1.7165, "step": 8405 }, { "epoch": 0.66, "learning_rate": 0.0002654345749626312, "loss": 1.6393, "step": 8406 }, { "epoch": 0.66, "learning_rate": 0.0002654266820281596, "loss": 1.66, "step": 8407 }, { "epoch": 0.66, "learning_rate": 0.0002654187883100045, "loss": 1.7154, "step": 8408 }, { "epoch": 0.66, "learning_rate": 0.00026541089380821954, "loss": 1.6877, "step": 8409 }, { "epoch": 0.66, "learning_rate": 0.00026540299852285834, "loss": 1.6762, "step": 8410 }, { "epoch": 0.66, "learning_rate": 0.0002653951024539745, "loss": 1.6611, "step": 8411 }, { "epoch": 0.66, "learning_rate": 0.0002653872056016215, "loss": 1.6467, "step": 8412 }, { "epoch": 0.66, "learning_rate": 0.00026537930796585306, "loss": 1.614, "step": 8413 }, { "epoch": 0.66, "learning_rate": 0.0002653714095467228, "loss": 1.6536, "step": 8414 }, { "epoch": 0.66, "learning_rate": 0.00026536351034428437, "loss": 1.7031, "step": 8415 }, { "epoch": 0.66, "learning_rate": 0.00026535561035859136, "loss": 1.6674, "step": 8416 }, { "epoch": 0.66, "learning_rate": 0.00026534770958969736, "loss": 1.6948, "step": 8417 }, { "epoch": 0.66, "learning_rate": 0.0002653398080376561, "loss": 1.6325, "step": 8418 }, { "epoch": 0.66, "learning_rate": 0.0002653319057025212, "loss": 1.6826, "step": 8419 }, { "epoch": 0.66, "learning_rate": 0.0002653240025843463, "loss": 1.667, "step": 8420 }, { "epoch": 0.66, "learning_rate": 0.00026531609868318514, "loss": 1.6913, "step": 8421 }, { "epoch": 0.66, "learning_rate": 0.00026530819399909117, "loss": 1.7037, "step": 8422 }, { "epoch": 0.66, "learning_rate": 0.0002653002885321183, "loss": 1.6514, "step": 8423 }, { "epoch": 0.66, "learning_rate": 0.00026529238228232004, "loss": 1.664, "step": 8424 }, { "epoch": 0.66, "learning_rate": 0.00026528447524975016, "loss": 1.5901, "step": 8425 }, { "epoch": 0.66, "learning_rate": 0.0002652765674344623, "loss": 1.6372, "step": 8426 }, { "epoch": 0.66, "learning_rate": 0.0002652686588365101, "loss": 1.6541, "step": 8427 }, { "epoch": 0.66, "learning_rate": 0.00026526074945594746, "loss": 1.7356, "step": 8428 }, { "epoch": 0.66, "learning_rate": 0.00026525283929282784, "loss": 1.6413, "step": 8429 }, { "epoch": 0.66, "learning_rate": 0.0002652449283472051, "loss": 1.6368, "step": 8430 }, { "epoch": 0.66, "learning_rate": 0.0002652370166191328, "loss": 1.6625, "step": 8431 }, { "epoch": 0.66, "learning_rate": 0.00026522910410866485, "loss": 1.665, "step": 8432 }, { "epoch": 0.66, "learning_rate": 0.0002652211908158548, "loss": 1.6958, "step": 8433 }, { "epoch": 0.66, "learning_rate": 0.0002652132767407565, "loss": 1.6588, "step": 8434 }, { "epoch": 0.66, "learning_rate": 0.00026520536188342353, "loss": 1.6354, "step": 8435 }, { "epoch": 0.66, "learning_rate": 0.00026519744624390983, "loss": 1.6634, "step": 8436 }, { "epoch": 0.66, "learning_rate": 0.000265189529822269, "loss": 1.6731, "step": 8437 }, { "epoch": 0.66, "learning_rate": 0.00026518161261855486, "loss": 1.7163, "step": 8438 }, { "epoch": 0.66, "learning_rate": 0.0002651736946328211, "loss": 1.6209, "step": 8439 }, { "epoch": 0.66, "learning_rate": 0.00026516577586512154, "loss": 1.6977, "step": 8440 }, { "epoch": 0.66, "learning_rate": 0.0002651578563155099, "loss": 1.6857, "step": 8441 }, { "epoch": 0.66, "learning_rate": 0.00026514993598404, "loss": 1.6142, "step": 8442 }, { "epoch": 0.66, "learning_rate": 0.00026514201487076554, "loss": 1.6964, "step": 8443 }, { "epoch": 0.66, "learning_rate": 0.0002651340929757404, "loss": 1.6311, "step": 8444 }, { "epoch": 0.66, "learning_rate": 0.0002651261702990182, "loss": 1.6064, "step": 8445 }, { "epoch": 0.66, "learning_rate": 0.00026511824684065285, "loss": 1.6125, "step": 8446 }, { "epoch": 0.66, "learning_rate": 0.0002651103226006982, "loss": 1.6544, "step": 8447 }, { "epoch": 0.66, "learning_rate": 0.0002651023975792079, "loss": 1.6808, "step": 8448 }, { "epoch": 0.66, "learning_rate": 0.0002650944717762359, "loss": 1.6919, "step": 8449 }, { "epoch": 0.66, "learning_rate": 0.000265086545191836, "loss": 1.6304, "step": 8450 }, { "epoch": 0.66, "learning_rate": 0.0002650786178260619, "loss": 1.687, "step": 8451 }, { "epoch": 0.67, "learning_rate": 0.0002650706896789675, "loss": 1.6451, "step": 8452 }, { "epoch": 0.67, "learning_rate": 0.0002650627607506066, "loss": 1.7084, "step": 8453 }, { "epoch": 0.67, "learning_rate": 0.00026505483104103305, "loss": 1.6544, "step": 8454 }, { "epoch": 0.67, "learning_rate": 0.00026504690055030074, "loss": 1.6533, "step": 8455 }, { "epoch": 0.67, "learning_rate": 0.0002650389692784634, "loss": 1.7324, "step": 8456 }, { "epoch": 0.67, "learning_rate": 0.000265031037225575, "loss": 1.6456, "step": 8457 }, { "epoch": 0.67, "learning_rate": 0.00026502310439168933, "loss": 1.6474, "step": 8458 }, { "epoch": 0.67, "learning_rate": 0.0002650151707768602, "loss": 1.6866, "step": 8459 }, { "epoch": 0.67, "learning_rate": 0.0002650072363811416, "loss": 1.6879, "step": 8460 }, { "epoch": 0.67, "learning_rate": 0.0002649993012045873, "loss": 1.6496, "step": 8461 }, { "epoch": 0.67, "learning_rate": 0.00026499136524725124, "loss": 1.6901, "step": 8462 }, { "epoch": 0.67, "learning_rate": 0.00026498342850918717, "loss": 1.653, "step": 8463 }, { "epoch": 0.67, "learning_rate": 0.0002649754909904492, "loss": 1.6671, "step": 8464 }, { "epoch": 0.67, "learning_rate": 0.000264967552691091, "loss": 1.7339, "step": 8465 }, { "epoch": 0.67, "learning_rate": 0.0002649596136111666, "loss": 1.687, "step": 8466 }, { "epoch": 0.67, "learning_rate": 0.0002649516737507298, "loss": 1.6517, "step": 8467 }, { "epoch": 0.67, "learning_rate": 0.0002649437331098347, "loss": 1.6547, "step": 8468 }, { "epoch": 0.67, "learning_rate": 0.000264935791688535, "loss": 1.634, "step": 8469 }, { "epoch": 0.67, "learning_rate": 0.00026492784948688473, "loss": 1.641, "step": 8470 }, { "epoch": 0.67, "learning_rate": 0.00026491990650493775, "loss": 1.6909, "step": 8471 }, { "epoch": 0.67, "learning_rate": 0.00026491196274274804, "loss": 1.671, "step": 8472 }, { "epoch": 0.67, "learning_rate": 0.00026490401820036954, "loss": 1.7071, "step": 8473 }, { "epoch": 0.67, "learning_rate": 0.0002648960728778561, "loss": 1.616, "step": 8474 }, { "epoch": 0.67, "learning_rate": 0.0002648881267752618, "loss": 1.6281, "step": 8475 }, { "epoch": 0.67, "learning_rate": 0.0002648801798926405, "loss": 1.6565, "step": 8476 }, { "epoch": 0.67, "learning_rate": 0.00026487223223004615, "loss": 1.6198, "step": 8477 }, { "epoch": 0.67, "learning_rate": 0.00026486428378753277, "loss": 1.6405, "step": 8478 }, { "epoch": 0.67, "learning_rate": 0.0002648563345651543, "loss": 1.6636, "step": 8479 }, { "epoch": 0.67, "learning_rate": 0.0002648483845629646, "loss": 1.6774, "step": 8480 }, { "epoch": 0.67, "learning_rate": 0.0002648404337810179, "loss": 1.674, "step": 8481 }, { "epoch": 0.67, "learning_rate": 0.0002648324822193679, "loss": 1.6031, "step": 8482 }, { "epoch": 0.67, "learning_rate": 0.00026482452987806876, "loss": 1.7357, "step": 8483 }, { "epoch": 0.67, "learning_rate": 0.00026481657675717443, "loss": 1.7086, "step": 8484 }, { "epoch": 0.67, "learning_rate": 0.00026480862285673895, "loss": 1.638, "step": 8485 }, { "epoch": 0.67, "learning_rate": 0.0002648006681768162, "loss": 1.6472, "step": 8486 }, { "epoch": 0.67, "learning_rate": 0.0002647927127174603, "loss": 1.6448, "step": 8487 }, { "epoch": 0.67, "learning_rate": 0.00026478475647872526, "loss": 1.6778, "step": 8488 }, { "epoch": 0.67, "learning_rate": 0.00026477679946066503, "loss": 1.686, "step": 8489 }, { "epoch": 0.67, "learning_rate": 0.00026476884166333367, "loss": 1.6773, "step": 8490 }, { "epoch": 0.67, "learning_rate": 0.00026476088308678524, "loss": 1.6357, "step": 8491 }, { "epoch": 0.67, "learning_rate": 0.0002647529237310737, "loss": 1.6686, "step": 8492 }, { "epoch": 0.67, "learning_rate": 0.00026474496359625316, "loss": 1.7053, "step": 8493 }, { "epoch": 0.67, "learning_rate": 0.0002647370026823776, "loss": 1.7029, "step": 8494 }, { "epoch": 0.67, "learning_rate": 0.0002647290409895012, "loss": 1.687, "step": 8495 }, { "epoch": 0.67, "learning_rate": 0.00026472107851767786, "loss": 1.6612, "step": 8496 }, { "epoch": 0.67, "learning_rate": 0.00026471311526696174, "loss": 1.6718, "step": 8497 }, { "epoch": 0.67, "learning_rate": 0.00026470515123740683, "loss": 1.6405, "step": 8498 }, { "epoch": 0.67, "learning_rate": 0.0002646971864290672, "loss": 1.6993, "step": 8499 }, { "epoch": 0.67, "learning_rate": 0.00026468922084199706, "loss": 1.6868, "step": 8500 }, { "epoch": 0.67, "learning_rate": 0.00026468125447625036, "loss": 1.6091, "step": 8501 }, { "epoch": 0.67, "learning_rate": 0.00026467328733188126, "loss": 1.6344, "step": 8502 }, { "epoch": 0.67, "learning_rate": 0.0002646653194089438, "loss": 1.6538, "step": 8503 }, { "epoch": 0.67, "learning_rate": 0.0002646573507074921, "loss": 1.7218, "step": 8504 }, { "epoch": 0.67, "learning_rate": 0.00026464938122758026, "loss": 1.6765, "step": 8505 }, { "epoch": 0.67, "learning_rate": 0.0002646414109692624, "loss": 1.6668, "step": 8506 }, { "epoch": 0.67, "learning_rate": 0.0002646334399325926, "loss": 1.6509, "step": 8507 }, { "epoch": 0.67, "learning_rate": 0.000264625468117625, "loss": 1.6812, "step": 8508 }, { "epoch": 0.67, "learning_rate": 0.00026461749552441374, "loss": 1.6961, "step": 8509 }, { "epoch": 0.67, "learning_rate": 0.00026460952215301295, "loss": 1.6497, "step": 8510 }, { "epoch": 0.67, "learning_rate": 0.00026460154800347674, "loss": 1.68, "step": 8511 }, { "epoch": 0.67, "learning_rate": 0.00026459357307585926, "loss": 1.6464, "step": 8512 }, { "epoch": 0.67, "learning_rate": 0.0002645855973702146, "loss": 1.647, "step": 8513 }, { "epoch": 0.67, "learning_rate": 0.00026457762088659707, "loss": 1.6499, "step": 8514 }, { "epoch": 0.67, "learning_rate": 0.00026456964362506067, "loss": 1.6893, "step": 8515 }, { "epoch": 0.67, "learning_rate": 0.00026456166558565963, "loss": 1.6394, "step": 8516 }, { "epoch": 0.67, "learning_rate": 0.0002645536867684481, "loss": 1.6482, "step": 8517 }, { "epoch": 0.67, "learning_rate": 0.00026454570717348024, "loss": 1.6966, "step": 8518 }, { "epoch": 0.67, "learning_rate": 0.00026453772680081026, "loss": 1.6507, "step": 8519 }, { "epoch": 0.67, "learning_rate": 0.0002645297456504923, "loss": 1.6653, "step": 8520 }, { "epoch": 0.67, "learning_rate": 0.00026452176372258055, "loss": 1.6944, "step": 8521 }, { "epoch": 0.67, "learning_rate": 0.0002645137810171293, "loss": 1.6271, "step": 8522 }, { "epoch": 0.67, "learning_rate": 0.0002645057975341926, "loss": 1.6714, "step": 8523 }, { "epoch": 0.67, "learning_rate": 0.00026449781327382473, "loss": 1.6707, "step": 8524 }, { "epoch": 0.67, "learning_rate": 0.00026448982823607995, "loss": 1.6867, "step": 8525 }, { "epoch": 0.67, "learning_rate": 0.00026448184242101235, "loss": 1.6663, "step": 8526 }, { "epoch": 0.67, "learning_rate": 0.00026447385582867625, "loss": 1.6422, "step": 8527 }, { "epoch": 0.67, "learning_rate": 0.0002644658684591258, "loss": 1.7278, "step": 8528 }, { "epoch": 0.67, "learning_rate": 0.0002644578803124153, "loss": 1.6775, "step": 8529 }, { "epoch": 0.67, "learning_rate": 0.000264449891388599, "loss": 1.6381, "step": 8530 }, { "epoch": 0.67, "learning_rate": 0.00026444190168773107, "loss": 1.6752, "step": 8531 }, { "epoch": 0.67, "learning_rate": 0.00026443391120986576, "loss": 1.7161, "step": 8532 }, { "epoch": 0.67, "learning_rate": 0.0002644259199550573, "loss": 1.7003, "step": 8533 }, { "epoch": 0.67, "learning_rate": 0.0002644179279233601, "loss": 1.6784, "step": 8534 }, { "epoch": 0.67, "learning_rate": 0.00026440993511482825, "loss": 1.6909, "step": 8535 }, { "epoch": 0.67, "learning_rate": 0.0002644019415295161, "loss": 1.6109, "step": 8536 }, { "epoch": 0.67, "learning_rate": 0.00026439394716747783, "loss": 1.6494, "step": 8537 }, { "epoch": 0.67, "learning_rate": 0.00026438595202876784, "loss": 1.6344, "step": 8538 }, { "epoch": 0.67, "learning_rate": 0.0002643779561134403, "loss": 1.643, "step": 8539 }, { "epoch": 0.67, "learning_rate": 0.0002643699594215496, "loss": 1.6795, "step": 8540 }, { "epoch": 0.67, "learning_rate": 0.00026436196195315007, "loss": 1.6915, "step": 8541 }, { "epoch": 0.67, "learning_rate": 0.00026435396370829583, "loss": 1.6444, "step": 8542 }, { "epoch": 0.67, "learning_rate": 0.0002643459646870413, "loss": 1.6811, "step": 8543 }, { "epoch": 0.67, "learning_rate": 0.00026433796488944077, "loss": 1.661, "step": 8544 }, { "epoch": 0.67, "learning_rate": 0.0002643299643155486, "loss": 1.6509, "step": 8545 }, { "epoch": 0.67, "learning_rate": 0.000264321962965419, "loss": 1.6098, "step": 8546 }, { "epoch": 0.67, "learning_rate": 0.00026431396083910643, "loss": 1.672, "step": 8547 }, { "epoch": 0.67, "learning_rate": 0.00026430595793666505, "loss": 1.7108, "step": 8548 }, { "epoch": 0.67, "learning_rate": 0.00026429795425814937, "loss": 1.721, "step": 8549 }, { "epoch": 0.67, "learning_rate": 0.00026428994980361365, "loss": 1.6781, "step": 8550 }, { "epoch": 0.67, "learning_rate": 0.00026428194457311227, "loss": 1.6106, "step": 8551 }, { "epoch": 0.67, "learning_rate": 0.0002642739385666995, "loss": 1.6463, "step": 8552 }, { "epoch": 0.67, "learning_rate": 0.00026426593178442974, "loss": 1.6935, "step": 8553 }, { "epoch": 0.67, "learning_rate": 0.0002642579242263574, "loss": 1.6907, "step": 8554 }, { "epoch": 0.67, "learning_rate": 0.00026424991589253676, "loss": 1.6893, "step": 8555 }, { "epoch": 0.67, "learning_rate": 0.0002642419067830223, "loss": 1.6331, "step": 8556 }, { "epoch": 0.67, "learning_rate": 0.0002642338968978683, "loss": 1.6651, "step": 8557 }, { "epoch": 0.67, "learning_rate": 0.0002642258862371292, "loss": 1.6471, "step": 8558 }, { "epoch": 0.67, "learning_rate": 0.0002642178748008594, "loss": 1.6479, "step": 8559 }, { "epoch": 0.67, "learning_rate": 0.00026420986258911315, "loss": 1.633, "step": 8560 }, { "epoch": 0.67, "learning_rate": 0.00026420184960194504, "loss": 1.6699, "step": 8561 }, { "epoch": 0.67, "learning_rate": 0.0002641938358394094, "loss": 1.6401, "step": 8562 }, { "epoch": 0.67, "learning_rate": 0.00026418582130156057, "loss": 1.6835, "step": 8563 }, { "epoch": 0.67, "learning_rate": 0.0002641778059884531, "loss": 1.6368, "step": 8564 }, { "epoch": 0.67, "learning_rate": 0.0002641697899001413, "loss": 1.6757, "step": 8565 }, { "epoch": 0.67, "learning_rate": 0.0002641617730366796, "loss": 1.6136, "step": 8566 }, { "epoch": 0.67, "learning_rate": 0.00026415375539812246, "loss": 1.6893, "step": 8567 }, { "epoch": 0.67, "learning_rate": 0.0002641457369845244, "loss": 1.6831, "step": 8568 }, { "epoch": 0.67, "learning_rate": 0.0002641377177959397, "loss": 1.677, "step": 8569 }, { "epoch": 0.67, "learning_rate": 0.0002641296978324229, "loss": 1.6502, "step": 8570 }, { "epoch": 0.67, "learning_rate": 0.00026412167709402844, "loss": 1.6782, "step": 8571 }, { "epoch": 0.67, "learning_rate": 0.0002641136555808108, "loss": 1.683, "step": 8572 }, { "epoch": 0.67, "learning_rate": 0.00026410563329282437, "loss": 1.5964, "step": 8573 }, { "epoch": 0.67, "learning_rate": 0.0002640976102301237, "loss": 1.6773, "step": 8574 }, { "epoch": 0.67, "learning_rate": 0.00026408958639276313, "loss": 1.71, "step": 8575 }, { "epoch": 0.67, "learning_rate": 0.00026408156178079733, "loss": 1.6183, "step": 8576 }, { "epoch": 0.67, "learning_rate": 0.00026407353639428064, "loss": 1.6826, "step": 8577 }, { "epoch": 0.67, "learning_rate": 0.0002640655102332676, "loss": 1.6655, "step": 8578 }, { "epoch": 0.68, "learning_rate": 0.0002640574832978127, "loss": 1.6226, "step": 8579 }, { "epoch": 0.68, "learning_rate": 0.0002640494555879703, "loss": 1.6785, "step": 8580 }, { "epoch": 0.68, "learning_rate": 0.0002640414271037952, "loss": 1.6507, "step": 8581 }, { "epoch": 0.68, "learning_rate": 0.0002640333978453417, "loss": 1.7058, "step": 8582 }, { "epoch": 0.68, "learning_rate": 0.00026402536781266437, "loss": 1.6429, "step": 8583 }, { "epoch": 0.68, "learning_rate": 0.0002640173370058177, "loss": 1.6398, "step": 8584 }, { "epoch": 0.68, "learning_rate": 0.0002640093054248562, "loss": 1.6859, "step": 8585 }, { "epoch": 0.68, "learning_rate": 0.0002640012730698345, "loss": 1.6709, "step": 8586 }, { "epoch": 0.68, "learning_rate": 0.000263993239940807, "loss": 1.6681, "step": 8587 }, { "epoch": 0.68, "learning_rate": 0.0002639852060378283, "loss": 1.7115, "step": 8588 }, { "epoch": 0.68, "learning_rate": 0.000263977171360953, "loss": 1.6381, "step": 8589 }, { "epoch": 0.68, "learning_rate": 0.0002639691359102356, "loss": 1.6652, "step": 8590 }, { "epoch": 0.68, "learning_rate": 0.00026396109968573065, "loss": 1.6606, "step": 8591 }, { "epoch": 0.68, "learning_rate": 0.0002639530626874927, "loss": 1.6481, "step": 8592 }, { "epoch": 0.68, "learning_rate": 0.0002639450249155764, "loss": 1.6273, "step": 8593 }, { "epoch": 0.68, "learning_rate": 0.0002639369863700362, "loss": 1.6437, "step": 8594 }, { "epoch": 0.68, "learning_rate": 0.00026392894705092675, "loss": 1.6717, "step": 8595 }, { "epoch": 0.68, "learning_rate": 0.00026392090695830263, "loss": 1.7021, "step": 8596 }, { "epoch": 0.68, "learning_rate": 0.00026391286609221844, "loss": 1.6918, "step": 8597 }, { "epoch": 0.68, "learning_rate": 0.0002639048244527287, "loss": 1.6659, "step": 8598 }, { "epoch": 0.68, "learning_rate": 0.0002638967820398881, "loss": 1.6215, "step": 8599 }, { "epoch": 0.68, "learning_rate": 0.0002638887388537512, "loss": 1.6561, "step": 8600 }, { "epoch": 0.68, "learning_rate": 0.0002638806948943726, "loss": 1.6738, "step": 8601 }, { "epoch": 0.68, "learning_rate": 0.00026387265016180694, "loss": 1.7176, "step": 8602 }, { "epoch": 0.68, "learning_rate": 0.0002638646046561088, "loss": 1.6061, "step": 8603 }, { "epoch": 0.68, "learning_rate": 0.0002638565583773329, "loss": 1.6535, "step": 8604 }, { "epoch": 0.68, "learning_rate": 0.00026384851132553374, "loss": 1.6781, "step": 8605 }, { "epoch": 0.68, "learning_rate": 0.000263840463500766, "loss": 1.7042, "step": 8606 }, { "epoch": 0.68, "learning_rate": 0.00026383241490308436, "loss": 1.6322, "step": 8607 }, { "epoch": 0.68, "learning_rate": 0.0002638243655325435, "loss": 1.6831, "step": 8608 }, { "epoch": 0.68, "learning_rate": 0.0002638163153891979, "loss": 1.6606, "step": 8609 }, { "epoch": 0.68, "learning_rate": 0.00026380826447310236, "loss": 1.6275, "step": 8610 }, { "epoch": 0.68, "learning_rate": 0.00026380021278431156, "loss": 1.6614, "step": 8611 }, { "epoch": 0.68, "learning_rate": 0.0002637921603228801, "loss": 1.6566, "step": 8612 }, { "epoch": 0.68, "learning_rate": 0.00026378410708886266, "loss": 1.6713, "step": 8613 }, { "epoch": 0.68, "learning_rate": 0.0002637760530823139, "loss": 1.6528, "step": 8614 }, { "epoch": 0.68, "learning_rate": 0.00026376799830328854, "loss": 1.6974, "step": 8615 }, { "epoch": 0.68, "learning_rate": 0.00026375994275184124, "loss": 1.6293, "step": 8616 }, { "epoch": 0.68, "learning_rate": 0.0002637518864280267, "loss": 1.6755, "step": 8617 }, { "epoch": 0.68, "learning_rate": 0.00026374382933189963, "loss": 1.6758, "step": 8618 }, { "epoch": 0.68, "learning_rate": 0.00026373577146351473, "loss": 1.6582, "step": 8619 }, { "epoch": 0.68, "learning_rate": 0.0002637277128229268, "loss": 1.6893, "step": 8620 }, { "epoch": 0.68, "learning_rate": 0.0002637196534101903, "loss": 1.6503, "step": 8621 }, { "epoch": 0.68, "learning_rate": 0.00026371159322536024, "loss": 1.7044, "step": 8622 }, { "epoch": 0.68, "learning_rate": 0.00026370353226849117, "loss": 1.6636, "step": 8623 }, { "epoch": 0.68, "learning_rate": 0.00026369547053963784, "loss": 1.6077, "step": 8624 }, { "epoch": 0.68, "learning_rate": 0.000263687408038855, "loss": 1.6674, "step": 8625 }, { "epoch": 0.68, "learning_rate": 0.0002636793447661974, "loss": 1.6809, "step": 8626 }, { "epoch": 0.68, "learning_rate": 0.00026367128072171984, "loss": 1.5994, "step": 8627 }, { "epoch": 0.68, "learning_rate": 0.00026366321590547695, "loss": 1.6816, "step": 8628 }, { "epoch": 0.68, "learning_rate": 0.0002636551503175236, "loss": 1.608, "step": 8629 }, { "epoch": 0.68, "learning_rate": 0.00026364708395791445, "loss": 1.6375, "step": 8630 }, { "epoch": 0.68, "learning_rate": 0.00026363901682670434, "loss": 1.6741, "step": 8631 }, { "epoch": 0.68, "learning_rate": 0.00026363094892394804, "loss": 1.643, "step": 8632 }, { "epoch": 0.68, "learning_rate": 0.00026362288024970026, "loss": 1.6062, "step": 8633 }, { "epoch": 0.68, "learning_rate": 0.00026361481080401585, "loss": 1.6397, "step": 8634 }, { "epoch": 0.68, "learning_rate": 0.00026360674058694956, "loss": 1.608, "step": 8635 }, { "epoch": 0.68, "learning_rate": 0.0002635986695985562, "loss": 1.6925, "step": 8636 }, { "epoch": 0.68, "learning_rate": 0.0002635905978388906, "loss": 1.6409, "step": 8637 }, { "epoch": 0.68, "learning_rate": 0.0002635825253080075, "loss": 1.6401, "step": 8638 }, { "epoch": 0.68, "learning_rate": 0.00026357445200596167, "loss": 1.6671, "step": 8639 }, { "epoch": 0.68, "learning_rate": 0.00026356637793280806, "loss": 1.5894, "step": 8640 }, { "epoch": 0.68, "learning_rate": 0.0002635583030886014, "loss": 1.5897, "step": 8641 }, { "epoch": 0.68, "learning_rate": 0.0002635502274733965, "loss": 1.6346, "step": 8642 }, { "epoch": 0.68, "learning_rate": 0.00026354215108724825, "loss": 1.6903, "step": 8643 }, { "epoch": 0.68, "learning_rate": 0.00026353407393021145, "loss": 1.6523, "step": 8644 }, { "epoch": 0.68, "learning_rate": 0.0002635259960023409, "loss": 1.6415, "step": 8645 }, { "epoch": 0.68, "learning_rate": 0.0002635179173036915, "loss": 1.7182, "step": 8646 }, { "epoch": 0.68, "learning_rate": 0.00026350983783431813, "loss": 1.6995, "step": 8647 }, { "epoch": 0.68, "learning_rate": 0.0002635017575942756, "loss": 1.6414, "step": 8648 }, { "epoch": 0.68, "learning_rate": 0.0002634936765836187, "loss": 1.7108, "step": 8649 }, { "epoch": 0.68, "learning_rate": 0.0002634855948024024, "loss": 1.72, "step": 8650 }, { "epoch": 0.68, "learning_rate": 0.00026347751225068157, "loss": 1.6993, "step": 8651 }, { "epoch": 0.68, "learning_rate": 0.0002634694289285111, "loss": 1.6653, "step": 8652 }, { "epoch": 0.68, "learning_rate": 0.00026346134483594576, "loss": 1.7251, "step": 8653 }, { "epoch": 0.68, "learning_rate": 0.00026345325997304046, "loss": 1.6401, "step": 8654 }, { "epoch": 0.68, "learning_rate": 0.0002634451743398502, "loss": 1.6432, "step": 8655 }, { "epoch": 0.68, "learning_rate": 0.0002634370879364298, "loss": 1.6281, "step": 8656 }, { "epoch": 0.68, "learning_rate": 0.0002634290007628341, "loss": 1.6793, "step": 8657 }, { "epoch": 0.68, "learning_rate": 0.0002634209128191182, "loss": 1.6376, "step": 8658 }, { "epoch": 0.68, "learning_rate": 0.0002634128241053368, "loss": 1.6209, "step": 8659 }, { "epoch": 0.68, "learning_rate": 0.000263404734621545, "loss": 1.6903, "step": 8660 }, { "epoch": 0.68, "learning_rate": 0.0002633966443677975, "loss": 1.7004, "step": 8661 }, { "epoch": 0.68, "learning_rate": 0.00026338855334414945, "loss": 1.7039, "step": 8662 }, { "epoch": 0.68, "learning_rate": 0.00026338046155065573, "loss": 1.6571, "step": 8663 }, { "epoch": 0.68, "learning_rate": 0.00026337236898737115, "loss": 1.6774, "step": 8664 }, { "epoch": 0.68, "learning_rate": 0.00026336427565435083, "loss": 1.6875, "step": 8665 }, { "epoch": 0.68, "learning_rate": 0.00026335618155164955, "loss": 1.6614, "step": 8666 }, { "epoch": 0.68, "learning_rate": 0.00026334808667932247, "loss": 1.6347, "step": 8667 }, { "epoch": 0.68, "learning_rate": 0.00026333999103742435, "loss": 1.65, "step": 8668 }, { "epoch": 0.68, "learning_rate": 0.00026333189462601027, "loss": 1.6786, "step": 8669 }, { "epoch": 0.68, "learning_rate": 0.00026332379744513514, "loss": 1.6837, "step": 8670 }, { "epoch": 0.68, "learning_rate": 0.00026331569949485394, "loss": 1.6444, "step": 8671 }, { "epoch": 0.68, "learning_rate": 0.0002633076007752218, "loss": 1.6394, "step": 8672 }, { "epoch": 0.68, "learning_rate": 0.00026329950128629344, "loss": 1.6727, "step": 8673 }, { "epoch": 0.68, "learning_rate": 0.00026329140102812404, "loss": 1.6672, "step": 8674 }, { "epoch": 0.68, "learning_rate": 0.00026328330000076854, "loss": 1.6838, "step": 8675 }, { "epoch": 0.68, "learning_rate": 0.00026327519820428197, "loss": 1.6208, "step": 8676 }, { "epoch": 0.68, "learning_rate": 0.0002632670956387193, "loss": 1.6347, "step": 8677 }, { "epoch": 0.68, "learning_rate": 0.00026325899230413555, "loss": 1.6809, "step": 8678 }, { "epoch": 0.68, "learning_rate": 0.00026325088820058575, "loss": 1.6192, "step": 8679 }, { "epoch": 0.68, "learning_rate": 0.0002632427833281249, "loss": 1.6772, "step": 8680 }, { "epoch": 0.68, "learning_rate": 0.0002632346776868081, "loss": 1.698, "step": 8681 }, { "epoch": 0.68, "learning_rate": 0.0002632265712766902, "loss": 1.6756, "step": 8682 }, { "epoch": 0.68, "learning_rate": 0.00026321846409782653, "loss": 1.6565, "step": 8683 }, { "epoch": 0.68, "learning_rate": 0.0002632103561502718, "loss": 1.6132, "step": 8684 }, { "epoch": 0.68, "learning_rate": 0.0002632022474340814, "loss": 1.6934, "step": 8685 }, { "epoch": 0.68, "learning_rate": 0.0002631941379493101, "loss": 1.6907, "step": 8686 }, { "epoch": 0.68, "learning_rate": 0.00026318602769601307, "loss": 1.699, "step": 8687 }, { "epoch": 0.68, "learning_rate": 0.00026317791667424537, "loss": 1.7099, "step": 8688 }, { "epoch": 0.68, "learning_rate": 0.0002631698048840622, "loss": 1.6851, "step": 8689 }, { "epoch": 0.68, "learning_rate": 0.00026316169232551835, "loss": 1.6386, "step": 8690 }, { "epoch": 0.68, "learning_rate": 0.0002631535789986691, "loss": 1.6859, "step": 8691 }, { "epoch": 0.68, "learning_rate": 0.00026314546490356953, "loss": 1.6927, "step": 8692 }, { "epoch": 0.68, "learning_rate": 0.00026313735004027464, "loss": 1.6372, "step": 8693 }, { "epoch": 0.68, "learning_rate": 0.00026312923440883964, "loss": 1.6303, "step": 8694 }, { "epoch": 0.68, "learning_rate": 0.0002631211180093195, "loss": 1.662, "step": 8695 }, { "epoch": 0.68, "learning_rate": 0.00026311300084176946, "loss": 1.6187, "step": 8696 }, { "epoch": 0.68, "learning_rate": 0.00026310488290624454, "loss": 1.6637, "step": 8697 }, { "epoch": 0.68, "learning_rate": 0.0002630967642027999, "loss": 1.6895, "step": 8698 }, { "epoch": 0.68, "learning_rate": 0.00026308864473149055, "loss": 1.6791, "step": 8699 }, { "epoch": 0.68, "learning_rate": 0.0002630805244923718, "loss": 1.6612, "step": 8700 }, { "epoch": 0.68, "learning_rate": 0.0002630724034854987, "loss": 1.6512, "step": 8701 }, { "epoch": 0.68, "learning_rate": 0.0002630642817109263, "loss": 1.6444, "step": 8702 }, { "epoch": 0.68, "learning_rate": 0.00026305615916870985, "loss": 1.6451, "step": 8703 }, { "epoch": 0.68, "learning_rate": 0.0002630480358589045, "loss": 1.6203, "step": 8704 }, { "epoch": 0.68, "learning_rate": 0.00026303991178156536, "loss": 1.6664, "step": 8705 }, { "epoch": 0.68, "learning_rate": 0.00026303178693674764, "loss": 1.6894, "step": 8706 }, { "epoch": 0.69, "learning_rate": 0.00026302366132450637, "loss": 1.621, "step": 8707 }, { "epoch": 0.69, "learning_rate": 0.0002630155349448969, "loss": 1.6409, "step": 8708 }, { "epoch": 0.69, "learning_rate": 0.0002630074077979742, "loss": 1.7074, "step": 8709 }, { "epoch": 0.69, "learning_rate": 0.0002629992798837937, "loss": 1.7262, "step": 8710 }, { "epoch": 0.69, "learning_rate": 0.00026299115120241036, "loss": 1.6874, "step": 8711 }, { "epoch": 0.69, "learning_rate": 0.0002629830217538795, "loss": 1.6558, "step": 8712 }, { "epoch": 0.69, "learning_rate": 0.0002629748915382562, "loss": 1.6414, "step": 8713 }, { "epoch": 0.69, "learning_rate": 0.0002629667605555958, "loss": 1.6961, "step": 8714 }, { "epoch": 0.69, "learning_rate": 0.00026295862880595347, "loss": 1.6513, "step": 8715 }, { "epoch": 0.69, "learning_rate": 0.00026295049628938434, "loss": 1.6567, "step": 8716 }, { "epoch": 0.69, "learning_rate": 0.00026294236300594367, "loss": 1.6563, "step": 8717 }, { "epoch": 0.69, "learning_rate": 0.0002629342289556867, "loss": 1.6486, "step": 8718 }, { "epoch": 0.69, "learning_rate": 0.0002629260941386686, "loss": 1.6909, "step": 8719 }, { "epoch": 0.69, "learning_rate": 0.00026291795855494466, "loss": 1.6562, "step": 8720 }, { "epoch": 0.69, "learning_rate": 0.0002629098222045701, "loss": 1.6452, "step": 8721 }, { "epoch": 0.69, "learning_rate": 0.00026290168508760016, "loss": 1.7005, "step": 8722 }, { "epoch": 0.69, "learning_rate": 0.0002628935472040901, "loss": 1.652, "step": 8723 }, { "epoch": 0.69, "learning_rate": 0.0002628854085540951, "loss": 1.6648, "step": 8724 }, { "epoch": 0.69, "learning_rate": 0.00026287726913767044, "loss": 1.706, "step": 8725 }, { "epoch": 0.69, "learning_rate": 0.0002628691289548715, "loss": 1.6627, "step": 8726 }, { "epoch": 0.69, "learning_rate": 0.00026286098800575345, "loss": 1.6738, "step": 8727 }, { "epoch": 0.69, "learning_rate": 0.00026285284629037155, "loss": 1.6403, "step": 8728 }, { "epoch": 0.69, "learning_rate": 0.00026284470380878115, "loss": 1.7123, "step": 8729 }, { "epoch": 0.69, "learning_rate": 0.0002628365605610374, "loss": 1.691, "step": 8730 }, { "epoch": 0.69, "learning_rate": 0.0002628284165471957, "loss": 1.6401, "step": 8731 }, { "epoch": 0.69, "learning_rate": 0.0002628202717673113, "loss": 1.6364, "step": 8732 }, { "epoch": 0.69, "learning_rate": 0.00026281212622143957, "loss": 1.6665, "step": 8733 }, { "epoch": 0.69, "learning_rate": 0.00026280397990963573, "loss": 1.7127, "step": 8734 }, { "epoch": 0.69, "learning_rate": 0.0002627958328319551, "loss": 1.6302, "step": 8735 }, { "epoch": 0.69, "learning_rate": 0.00026278768498845306, "loss": 1.7086, "step": 8736 }, { "epoch": 0.69, "learning_rate": 0.00026277953637918487, "loss": 1.6277, "step": 8737 }, { "epoch": 0.69, "learning_rate": 0.00026277138700420583, "loss": 1.6057, "step": 8738 }, { "epoch": 0.69, "learning_rate": 0.00026276323686357135, "loss": 1.6379, "step": 8739 }, { "epoch": 0.69, "learning_rate": 0.0002627550859573366, "loss": 1.6342, "step": 8740 }, { "epoch": 0.69, "learning_rate": 0.0002627469342855572, "loss": 1.6334, "step": 8741 }, { "epoch": 0.69, "learning_rate": 0.00026273878184828825, "loss": 1.6526, "step": 8742 }, { "epoch": 0.69, "learning_rate": 0.0002627306286455852, "loss": 1.6416, "step": 8743 }, { "epoch": 0.69, "learning_rate": 0.00026272247467750337, "loss": 1.5685, "step": 8744 }, { "epoch": 0.69, "learning_rate": 0.00026271431994409817, "loss": 1.6743, "step": 8745 }, { "epoch": 0.69, "learning_rate": 0.0002627061644454249, "loss": 1.6429, "step": 8746 }, { "epoch": 0.69, "learning_rate": 0.00026269800818153906, "loss": 1.6921, "step": 8747 }, { "epoch": 0.69, "learning_rate": 0.00026268985115249585, "loss": 1.7483, "step": 8748 }, { "epoch": 0.69, "learning_rate": 0.0002626816933583508, "loss": 1.639, "step": 8749 }, { "epoch": 0.69, "learning_rate": 0.00026267353479915916, "loss": 1.6756, "step": 8750 }, { "epoch": 0.69, "learning_rate": 0.00026266537547497645, "loss": 1.6295, "step": 8751 }, { "epoch": 0.69, "learning_rate": 0.000262657215385858, "loss": 1.6294, "step": 8752 }, { "epoch": 0.69, "learning_rate": 0.0002626490545318592, "loss": 1.6263, "step": 8753 }, { "epoch": 0.69, "learning_rate": 0.0002626408929130355, "loss": 1.6534, "step": 8754 }, { "epoch": 0.69, "learning_rate": 0.00026263273052944233, "loss": 1.6365, "step": 8755 }, { "epoch": 0.69, "learning_rate": 0.00026262456738113506, "loss": 1.6568, "step": 8756 }, { "epoch": 0.69, "learning_rate": 0.00026261640346816916, "loss": 1.6515, "step": 8757 }, { "epoch": 0.69, "learning_rate": 0.0002626082387906, "loss": 1.6525, "step": 8758 }, { "epoch": 0.69, "learning_rate": 0.000262600073348483, "loss": 1.6226, "step": 8759 }, { "epoch": 0.69, "learning_rate": 0.00026259190714187367, "loss": 1.6437, "step": 8760 }, { "epoch": 0.69, "learning_rate": 0.0002625837401708274, "loss": 1.6137, "step": 8761 }, { "epoch": 0.69, "learning_rate": 0.0002625755724353997, "loss": 1.6618, "step": 8762 }, { "epoch": 0.69, "learning_rate": 0.000262567403935646, "loss": 1.6705, "step": 8763 }, { "epoch": 0.69, "learning_rate": 0.0002625592346716217, "loss": 1.634, "step": 8764 }, { "epoch": 0.69, "learning_rate": 0.00026255106464338236, "loss": 1.6698, "step": 8765 }, { "epoch": 0.69, "learning_rate": 0.00026254289385098335, "loss": 1.6321, "step": 8766 }, { "epoch": 0.69, "learning_rate": 0.0002625347222944803, "loss": 1.652, "step": 8767 }, { "epoch": 0.69, "learning_rate": 0.0002625265499739285, "loss": 1.6549, "step": 8768 }, { "epoch": 0.69, "learning_rate": 0.00026251837688938347, "loss": 1.6767, "step": 8769 }, { "epoch": 0.69, "learning_rate": 0.00026251020304090086, "loss": 1.6521, "step": 8770 }, { "epoch": 0.69, "learning_rate": 0.00026250202842853596, "loss": 1.5983, "step": 8771 }, { "epoch": 0.69, "learning_rate": 0.0002624938530523445, "loss": 1.6327, "step": 8772 }, { "epoch": 0.69, "learning_rate": 0.00026248567691238174, "loss": 1.7048, "step": 8773 }, { "epoch": 0.69, "learning_rate": 0.0002624775000087034, "loss": 1.681, "step": 8774 }, { "epoch": 0.69, "learning_rate": 0.00026246932234136485, "loss": 1.7397, "step": 8775 }, { "epoch": 0.69, "learning_rate": 0.00026246114391042163, "loss": 1.708, "step": 8776 }, { "epoch": 0.69, "learning_rate": 0.0002624529647159294, "loss": 1.6257, "step": 8777 }, { "epoch": 0.69, "learning_rate": 0.00026244478475794355, "loss": 1.6826, "step": 8778 }, { "epoch": 0.69, "learning_rate": 0.00026243660403651965, "loss": 1.6339, "step": 8779 }, { "epoch": 0.69, "learning_rate": 0.0002624284225517133, "loss": 1.6081, "step": 8780 }, { "epoch": 0.69, "learning_rate": 0.0002624202403035799, "loss": 1.6687, "step": 8781 }, { "epoch": 0.69, "learning_rate": 0.0002624120572921752, "loss": 1.7141, "step": 8782 }, { "epoch": 0.69, "learning_rate": 0.00026240387351755465, "loss": 1.6584, "step": 8783 }, { "epoch": 0.69, "learning_rate": 0.0002623956889797738, "loss": 1.6685, "step": 8784 }, { "epoch": 0.69, "learning_rate": 0.0002623875036788883, "loss": 1.6172, "step": 8785 }, { "epoch": 0.69, "learning_rate": 0.00026237931761495363, "loss": 1.6042, "step": 8786 }, { "epoch": 0.69, "learning_rate": 0.0002623711307880254, "loss": 1.6878, "step": 8787 }, { "epoch": 0.69, "learning_rate": 0.00026236294319815926, "loss": 1.699, "step": 8788 }, { "epoch": 0.69, "learning_rate": 0.00026235475484541064, "loss": 1.6354, "step": 8789 }, { "epoch": 0.69, "learning_rate": 0.00026234656572983537, "loss": 1.6744, "step": 8790 }, { "epoch": 0.69, "learning_rate": 0.00026233837585148886, "loss": 1.669, "step": 8791 }, { "epoch": 0.69, "learning_rate": 0.0002623301852104267, "loss": 1.6822, "step": 8792 }, { "epoch": 0.69, "learning_rate": 0.00026232199380670467, "loss": 1.6185, "step": 8793 }, { "epoch": 0.69, "learning_rate": 0.00026231380164037823, "loss": 1.7071, "step": 8794 }, { "epoch": 0.69, "learning_rate": 0.0002623056087115031, "loss": 1.6689, "step": 8795 }, { "epoch": 0.69, "learning_rate": 0.00026229741502013484, "loss": 1.6542, "step": 8796 }, { "epoch": 0.69, "learning_rate": 0.00026228922056632906, "loss": 1.5947, "step": 8797 }, { "epoch": 0.69, "learning_rate": 0.0002622810253501415, "loss": 1.659, "step": 8798 }, { "epoch": 0.69, "learning_rate": 0.0002622728293716277, "loss": 1.7103, "step": 8799 }, { "epoch": 0.69, "learning_rate": 0.0002622646326308434, "loss": 1.653, "step": 8800 }, { "epoch": 0.69, "learning_rate": 0.0002622564351278441, "loss": 1.6607, "step": 8801 }, { "epoch": 0.69, "learning_rate": 0.00026224823686268563, "loss": 1.7031, "step": 8802 }, { "epoch": 0.69, "learning_rate": 0.00026224003783542355, "loss": 1.6192, "step": 8803 }, { "epoch": 0.69, "learning_rate": 0.0002622318380461136, "loss": 1.6708, "step": 8804 }, { "epoch": 0.69, "learning_rate": 0.00026222363749481135, "loss": 1.6208, "step": 8805 }, { "epoch": 0.69, "learning_rate": 0.0002622154361815726, "loss": 1.6806, "step": 8806 }, { "epoch": 0.69, "learning_rate": 0.0002622072341064529, "loss": 1.605, "step": 8807 }, { "epoch": 0.69, "learning_rate": 0.000262199031269508, "loss": 1.6771, "step": 8808 }, { "epoch": 0.69, "learning_rate": 0.0002621908276707936, "loss": 1.633, "step": 8809 }, { "epoch": 0.69, "learning_rate": 0.0002621826233103654, "loss": 1.5956, "step": 8810 }, { "epoch": 0.69, "learning_rate": 0.0002621744181882791, "loss": 1.6823, "step": 8811 }, { "epoch": 0.69, "learning_rate": 0.0002621662123045904, "loss": 1.6577, "step": 8812 }, { "epoch": 0.69, "learning_rate": 0.000262158005659355, "loss": 1.7249, "step": 8813 }, { "epoch": 0.69, "learning_rate": 0.0002621497982526287, "loss": 1.6074, "step": 8814 }, { "epoch": 0.69, "learning_rate": 0.00026214159008446704, "loss": 1.6679, "step": 8815 }, { "epoch": 0.69, "learning_rate": 0.00026213338115492593, "loss": 1.6363, "step": 8816 }, { "epoch": 0.69, "learning_rate": 0.0002621251714640611, "loss": 1.6787, "step": 8817 }, { "epoch": 0.69, "learning_rate": 0.00026211696101192814, "loss": 1.6321, "step": 8818 }, { "epoch": 0.69, "learning_rate": 0.00026210874979858297, "loss": 1.7233, "step": 8819 }, { "epoch": 0.69, "learning_rate": 0.0002621005378240812, "loss": 1.6847, "step": 8820 }, { "epoch": 0.69, "learning_rate": 0.00026209232508847866, "loss": 1.6527, "step": 8821 }, { "epoch": 0.69, "learning_rate": 0.0002620841115918311, "loss": 1.6794, "step": 8822 }, { "epoch": 0.69, "learning_rate": 0.0002620758973341942, "loss": 1.6254, "step": 8823 }, { "epoch": 0.69, "learning_rate": 0.0002620676823156239, "loss": 1.6423, "step": 8824 }, { "epoch": 0.69, "learning_rate": 0.00026205946653617583, "loss": 1.6624, "step": 8825 }, { "epoch": 0.69, "learning_rate": 0.0002620512499959059, "loss": 1.7093, "step": 8826 }, { "epoch": 0.69, "learning_rate": 0.0002620430326948697, "loss": 1.6684, "step": 8827 }, { "epoch": 0.69, "learning_rate": 0.00026203481463312324, "loss": 1.6841, "step": 8828 }, { "epoch": 0.69, "learning_rate": 0.00026202659581072216, "loss": 1.6046, "step": 8829 }, { "epoch": 0.69, "learning_rate": 0.0002620183762277223, "loss": 1.6457, "step": 8830 }, { "epoch": 0.69, "learning_rate": 0.0002620101558841795, "loss": 1.7032, "step": 8831 }, { "epoch": 0.69, "learning_rate": 0.0002620019347801496, "loss": 1.6418, "step": 8832 }, { "epoch": 0.69, "learning_rate": 0.0002619937129156883, "loss": 1.6511, "step": 8833 }, { "epoch": 0.7, "learning_rate": 0.00026198549029085154, "loss": 1.6541, "step": 8834 }, { "epoch": 0.7, "learning_rate": 0.00026197726690569507, "loss": 1.642, "step": 8835 }, { "epoch": 0.7, "learning_rate": 0.00026196904276027473, "loss": 1.6489, "step": 8836 }, { "epoch": 0.7, "learning_rate": 0.00026196081785464647, "loss": 1.6572, "step": 8837 }, { "epoch": 0.7, "learning_rate": 0.000261952592188866, "loss": 1.7017, "step": 8838 }, { "epoch": 0.7, "learning_rate": 0.00026194436576298914, "loss": 1.6042, "step": 8839 }, { "epoch": 0.7, "learning_rate": 0.0002619361385770719, "loss": 1.6689, "step": 8840 }, { "epoch": 0.7, "learning_rate": 0.00026192791063117004, "loss": 1.6472, "step": 8841 }, { "epoch": 0.7, "learning_rate": 0.0002619196819253394, "loss": 1.6515, "step": 8842 }, { "epoch": 0.7, "learning_rate": 0.00026191145245963587, "loss": 1.7106, "step": 8843 }, { "epoch": 0.7, "learning_rate": 0.00026190322223411535, "loss": 1.6475, "step": 8844 }, { "epoch": 0.7, "learning_rate": 0.00026189499124883376, "loss": 1.6444, "step": 8845 }, { "epoch": 0.7, "learning_rate": 0.0002618867595038469, "loss": 1.6468, "step": 8846 }, { "epoch": 0.7, "learning_rate": 0.00026187852699921066, "loss": 1.6189, "step": 8847 }, { "epoch": 0.7, "learning_rate": 0.00026187029373498093, "loss": 1.6704, "step": 8848 }, { "epoch": 0.7, "learning_rate": 0.0002618620597112137, "loss": 1.6431, "step": 8849 }, { "epoch": 0.7, "learning_rate": 0.0002618538249279648, "loss": 1.6163, "step": 8850 }, { "epoch": 0.7, "learning_rate": 0.0002618455893852901, "loss": 1.6895, "step": 8851 }, { "epoch": 0.7, "learning_rate": 0.00026183735308324565, "loss": 1.6458, "step": 8852 }, { "epoch": 0.7, "learning_rate": 0.0002618291160218873, "loss": 1.6668, "step": 8853 }, { "epoch": 0.7, "learning_rate": 0.0002618208782012709, "loss": 1.6292, "step": 8854 }, { "epoch": 0.7, "learning_rate": 0.0002618126396214525, "loss": 1.7078, "step": 8855 }, { "epoch": 0.7, "learning_rate": 0.00026180440028248796, "loss": 1.628, "step": 8856 }, { "epoch": 0.7, "learning_rate": 0.0002617961601844332, "loss": 1.6727, "step": 8857 }, { "epoch": 0.7, "learning_rate": 0.0002617879193273442, "loss": 1.6696, "step": 8858 }, { "epoch": 0.7, "learning_rate": 0.00026177967771127703, "loss": 1.706, "step": 8859 }, { "epoch": 0.7, "learning_rate": 0.0002617714353362874, "loss": 1.6659, "step": 8860 }, { "epoch": 0.7, "learning_rate": 0.0002617631922024315, "loss": 1.5907, "step": 8861 }, { "epoch": 0.7, "learning_rate": 0.00026175494830976513, "loss": 1.6477, "step": 8862 }, { "epoch": 0.7, "learning_rate": 0.0002617467036583444, "loss": 1.6526, "step": 8863 }, { "epoch": 0.7, "learning_rate": 0.0002617384582482252, "loss": 1.6614, "step": 8864 }, { "epoch": 0.7, "learning_rate": 0.00026173021207946353, "loss": 1.6608, "step": 8865 }, { "epoch": 0.7, "learning_rate": 0.0002617219651521153, "loss": 1.6157, "step": 8866 }, { "epoch": 0.7, "learning_rate": 0.00026171371746623666, "loss": 1.6491, "step": 8867 }, { "epoch": 0.7, "learning_rate": 0.00026170546902188355, "loss": 1.751, "step": 8868 }, { "epoch": 0.7, "learning_rate": 0.0002616972198191119, "loss": 1.6584, "step": 8869 }, { "epoch": 0.7, "learning_rate": 0.0002616889698579778, "loss": 1.6008, "step": 8870 }, { "epoch": 0.7, "learning_rate": 0.00026168071913853716, "loss": 1.5715, "step": 8871 }, { "epoch": 0.7, "learning_rate": 0.00026167246766084615, "loss": 1.622, "step": 8872 }, { "epoch": 0.7, "learning_rate": 0.0002616642154249607, "loss": 1.628, "step": 8873 }, { "epoch": 0.7, "learning_rate": 0.0002616559624309368, "loss": 1.6638, "step": 8874 }, { "epoch": 0.7, "learning_rate": 0.0002616477086788305, "loss": 1.6578, "step": 8875 }, { "epoch": 0.7, "learning_rate": 0.00026163945416869796, "loss": 1.6256, "step": 8876 }, { "epoch": 0.7, "learning_rate": 0.0002616311989005951, "loss": 1.6469, "step": 8877 }, { "epoch": 0.7, "learning_rate": 0.00026162294287457804, "loss": 1.6976, "step": 8878 }, { "epoch": 0.7, "learning_rate": 0.00026161468609070277, "loss": 1.7056, "step": 8879 }, { "epoch": 0.7, "learning_rate": 0.00026160642854902537, "loss": 1.6637, "step": 8880 }, { "epoch": 0.7, "learning_rate": 0.0002615981702496019, "loss": 1.6656, "step": 8881 }, { "epoch": 0.7, "learning_rate": 0.0002615899111924884, "loss": 1.6816, "step": 8882 }, { "epoch": 0.7, "learning_rate": 0.000261581651377741, "loss": 1.6265, "step": 8883 }, { "epoch": 0.7, "learning_rate": 0.0002615733908054159, "loss": 1.6813, "step": 8884 }, { "epoch": 0.7, "learning_rate": 0.0002615651294755689, "loss": 1.6401, "step": 8885 }, { "epoch": 0.7, "learning_rate": 0.0002615568673882563, "loss": 1.6281, "step": 8886 }, { "epoch": 0.7, "learning_rate": 0.00026154860454353406, "loss": 1.693, "step": 8887 }, { "epoch": 0.7, "learning_rate": 0.00026154034094145844, "loss": 1.6396, "step": 8888 }, { "epoch": 0.7, "learning_rate": 0.00026153207658208543, "loss": 1.7, "step": 8889 }, { "epoch": 0.7, "learning_rate": 0.00026152381146547115, "loss": 1.6635, "step": 8890 }, { "epoch": 0.7, "learning_rate": 0.0002615155455916717, "loss": 1.6973, "step": 8891 }, { "epoch": 0.7, "learning_rate": 0.0002615072789607433, "loss": 1.6575, "step": 8892 }, { "epoch": 0.7, "learning_rate": 0.000261499011572742, "loss": 1.6669, "step": 8893 }, { "epoch": 0.7, "learning_rate": 0.0002614907434277239, "loss": 1.6565, "step": 8894 }, { "epoch": 0.7, "learning_rate": 0.0002614824745257452, "loss": 1.7059, "step": 8895 }, { "epoch": 0.7, "learning_rate": 0.00026147420486686207, "loss": 1.666, "step": 8896 }, { "epoch": 0.7, "learning_rate": 0.0002614659344511305, "loss": 1.6792, "step": 8897 }, { "epoch": 0.7, "learning_rate": 0.00026145766327860683, "loss": 1.6696, "step": 8898 }, { "epoch": 0.7, "learning_rate": 0.00026144939134934716, "loss": 1.6722, "step": 8899 }, { "epoch": 0.7, "learning_rate": 0.00026144111866340756, "loss": 1.6576, "step": 8900 }, { "epoch": 0.7, "learning_rate": 0.0002614328452208443, "loss": 1.6609, "step": 8901 }, { "epoch": 0.7, "learning_rate": 0.0002614245710217135, "loss": 1.6514, "step": 8902 }, { "epoch": 0.7, "learning_rate": 0.00026141629606607134, "loss": 1.6917, "step": 8903 }, { "epoch": 0.7, "learning_rate": 0.000261408020353974, "loss": 1.695, "step": 8904 }, { "epoch": 0.7, "learning_rate": 0.00026139974388547773, "loss": 1.6117, "step": 8905 }, { "epoch": 0.7, "learning_rate": 0.00026139146666063866, "loss": 1.6455, "step": 8906 }, { "epoch": 0.7, "learning_rate": 0.00026138318867951295, "loss": 1.6652, "step": 8907 }, { "epoch": 0.7, "learning_rate": 0.00026137490994215687, "loss": 1.6562, "step": 8908 }, { "epoch": 0.7, "learning_rate": 0.00026136663044862664, "loss": 1.6286, "step": 8909 }, { "epoch": 0.7, "learning_rate": 0.0002613583501989785, "loss": 1.6391, "step": 8910 }, { "epoch": 0.7, "learning_rate": 0.00026135006919326856, "loss": 1.6757, "step": 8911 }, { "epoch": 0.7, "learning_rate": 0.00026134178743155307, "loss": 1.6743, "step": 8912 }, { "epoch": 0.7, "learning_rate": 0.0002613335049138883, "loss": 1.6758, "step": 8913 }, { "epoch": 0.7, "learning_rate": 0.0002613252216403305, "loss": 1.6471, "step": 8914 }, { "epoch": 0.7, "learning_rate": 0.0002613169376109359, "loss": 1.6035, "step": 8915 }, { "epoch": 0.7, "learning_rate": 0.00026130865282576065, "loss": 1.6493, "step": 8916 }, { "epoch": 0.7, "learning_rate": 0.0002613003672848611, "loss": 1.6333, "step": 8917 }, { "epoch": 0.7, "learning_rate": 0.00026129208098829354, "loss": 1.6818, "step": 8918 }, { "epoch": 0.7, "learning_rate": 0.0002612837939361141, "loss": 1.6977, "step": 8919 }, { "epoch": 0.7, "learning_rate": 0.0002612755061283791, "loss": 1.7199, "step": 8920 }, { "epoch": 0.7, "learning_rate": 0.00026126721756514486, "loss": 1.6949, "step": 8921 }, { "epoch": 0.7, "learning_rate": 0.0002612589282464676, "loss": 1.6815, "step": 8922 }, { "epoch": 0.7, "learning_rate": 0.00026125063817240363, "loss": 1.6224, "step": 8923 }, { "epoch": 0.7, "learning_rate": 0.00026124234734300924, "loss": 1.5872, "step": 8924 }, { "epoch": 0.7, "learning_rate": 0.0002612340557583406, "loss": 1.6515, "step": 8925 }, { "epoch": 0.7, "learning_rate": 0.0002612257634184542, "loss": 1.6311, "step": 8926 }, { "epoch": 0.7, "learning_rate": 0.0002612174703234062, "loss": 1.6006, "step": 8927 }, { "epoch": 0.7, "learning_rate": 0.000261209176473253, "loss": 1.6888, "step": 8928 }, { "epoch": 0.7, "learning_rate": 0.0002612008818680508, "loss": 1.631, "step": 8929 }, { "epoch": 0.7, "learning_rate": 0.000261192586507856, "loss": 1.6433, "step": 8930 }, { "epoch": 0.7, "learning_rate": 0.0002611842903927249, "loss": 1.6595, "step": 8931 }, { "epoch": 0.7, "learning_rate": 0.00026117599352271385, "loss": 1.7044, "step": 8932 }, { "epoch": 0.7, "learning_rate": 0.0002611676958978791, "loss": 1.6102, "step": 8933 }, { "epoch": 0.7, "learning_rate": 0.0002611593975182771, "loss": 1.6546, "step": 8934 }, { "epoch": 0.7, "learning_rate": 0.0002611510983839641, "loss": 1.7387, "step": 8935 }, { "epoch": 0.7, "learning_rate": 0.00026114279849499654, "loss": 1.6446, "step": 8936 }, { "epoch": 0.7, "learning_rate": 0.00026113449785143065, "loss": 1.6597, "step": 8937 }, { "epoch": 0.7, "learning_rate": 0.00026112619645332283, "loss": 1.6834, "step": 8938 }, { "epoch": 0.7, "learning_rate": 0.0002611178943007295, "loss": 1.6538, "step": 8939 }, { "epoch": 0.7, "learning_rate": 0.000261109591393707, "loss": 1.7417, "step": 8940 }, { "epoch": 0.7, "learning_rate": 0.0002611012877323117, "loss": 1.6459, "step": 8941 }, { "epoch": 0.7, "learning_rate": 0.0002610929833165999, "loss": 1.6095, "step": 8942 }, { "epoch": 0.7, "learning_rate": 0.0002610846781466281, "loss": 1.6754, "step": 8943 }, { "epoch": 0.7, "learning_rate": 0.00026107637222245263, "loss": 1.6623, "step": 8944 }, { "epoch": 0.7, "learning_rate": 0.0002610680655441299, "loss": 1.6512, "step": 8945 }, { "epoch": 0.7, "learning_rate": 0.00026105975811171626, "loss": 1.6974, "step": 8946 }, { "epoch": 0.7, "learning_rate": 0.0002610514499252682, "loss": 1.6833, "step": 8947 }, { "epoch": 0.7, "learning_rate": 0.00026104314098484205, "loss": 1.6398, "step": 8948 }, { "epoch": 0.7, "learning_rate": 0.0002610348312904942, "loss": 1.6039, "step": 8949 }, { "epoch": 0.7, "learning_rate": 0.00026102652084228123, "loss": 1.67, "step": 8950 }, { "epoch": 0.7, "learning_rate": 0.0002610182096402594, "loss": 1.6378, "step": 8951 }, { "epoch": 0.7, "learning_rate": 0.00026100989768448516, "loss": 1.6719, "step": 8952 }, { "epoch": 0.7, "learning_rate": 0.000261001584975015, "loss": 1.6526, "step": 8953 }, { "epoch": 0.7, "learning_rate": 0.0002609932715119053, "loss": 1.6509, "step": 8954 }, { "epoch": 0.7, "learning_rate": 0.00026098495729521263, "loss": 1.7062, "step": 8955 }, { "epoch": 0.7, "learning_rate": 0.0002609766423249933, "loss": 1.6363, "step": 8956 }, { "epoch": 0.7, "learning_rate": 0.00026096832660130377, "loss": 1.6303, "step": 8957 }, { "epoch": 0.7, "learning_rate": 0.00026096001012420055, "loss": 1.6906, "step": 8958 }, { "epoch": 0.7, "learning_rate": 0.00026095169289374015, "loss": 1.695, "step": 8959 }, { "epoch": 0.7, "learning_rate": 0.00026094337490997896, "loss": 1.6024, "step": 8960 }, { "epoch": 0.71, "learning_rate": 0.00026093505617297345, "loss": 1.6761, "step": 8961 }, { "epoch": 0.71, "learning_rate": 0.00026092673668278013, "loss": 1.6675, "step": 8962 }, { "epoch": 0.71, "learning_rate": 0.0002609184164394555, "loss": 1.6458, "step": 8963 }, { "epoch": 0.71, "learning_rate": 0.00026091009544305607, "loss": 1.7007, "step": 8964 }, { "epoch": 0.71, "learning_rate": 0.0002609017736936382, "loss": 1.6425, "step": 8965 }, { "epoch": 0.71, "learning_rate": 0.00026089345119125856, "loss": 1.6744, "step": 8966 }, { "epoch": 0.71, "learning_rate": 0.0002608851279359736, "loss": 1.7085, "step": 8967 }, { "epoch": 0.71, "learning_rate": 0.0002608768039278397, "loss": 1.6471, "step": 8968 }, { "epoch": 0.71, "learning_rate": 0.00026086847916691365, "loss": 1.6222, "step": 8969 }, { "epoch": 0.71, "learning_rate": 0.00026086015365325165, "loss": 1.6444, "step": 8970 }, { "epoch": 0.71, "learning_rate": 0.0002608518273869105, "loss": 1.6697, "step": 8971 }, { "epoch": 0.71, "learning_rate": 0.00026084350036794654, "loss": 1.6015, "step": 8972 }, { "epoch": 0.71, "learning_rate": 0.00026083517259641644, "loss": 1.6528, "step": 8973 }, { "epoch": 0.71, "learning_rate": 0.00026082684407237664, "loss": 1.6863, "step": 8974 }, { "epoch": 0.71, "learning_rate": 0.0002608185147958838, "loss": 1.6691, "step": 8975 }, { "epoch": 0.71, "learning_rate": 0.0002608101847669943, "loss": 1.6282, "step": 8976 }, { "epoch": 0.71, "learning_rate": 0.0002608018539857648, "loss": 1.6683, "step": 8977 }, { "epoch": 0.71, "learning_rate": 0.0002607935224522519, "loss": 1.6365, "step": 8978 }, { "epoch": 0.71, "learning_rate": 0.0002607851901665122, "loss": 1.6099, "step": 8979 }, { "epoch": 0.71, "learning_rate": 0.0002607768571286021, "loss": 1.678, "step": 8980 }, { "epoch": 0.71, "learning_rate": 0.00026076852333857824, "loss": 1.6629, "step": 8981 }, { "epoch": 0.71, "learning_rate": 0.0002607601887964973, "loss": 1.656, "step": 8982 }, { "epoch": 0.71, "learning_rate": 0.0002607518535024158, "loss": 1.667, "step": 8983 }, { "epoch": 0.71, "learning_rate": 0.0002607435174563903, "loss": 1.6252, "step": 8984 }, { "epoch": 0.71, "learning_rate": 0.00026073518065847744, "loss": 1.6009, "step": 8985 }, { "epoch": 0.71, "learning_rate": 0.00026072684310873384, "loss": 1.6241, "step": 8986 }, { "epoch": 0.71, "learning_rate": 0.00026071850480721605, "loss": 1.7118, "step": 8987 }, { "epoch": 0.71, "learning_rate": 0.00026071016575398073, "loss": 1.5982, "step": 8988 }, { "epoch": 0.71, "learning_rate": 0.0002607018259490844, "loss": 1.6285, "step": 8989 }, { "epoch": 0.71, "learning_rate": 0.00026069348539258387, "loss": 1.6529, "step": 8990 }, { "epoch": 0.71, "learning_rate": 0.00026068514408453567, "loss": 1.626, "step": 8991 }, { "epoch": 0.71, "learning_rate": 0.0002606768020249963, "loss": 1.684, "step": 8992 }, { "epoch": 0.71, "learning_rate": 0.0002606684592140226, "loss": 1.7219, "step": 8993 }, { "epoch": 0.71, "learning_rate": 0.00026066011565167114, "loss": 1.6288, "step": 8994 }, { "epoch": 0.71, "learning_rate": 0.0002606517713379985, "loss": 1.6826, "step": 8995 }, { "epoch": 0.71, "learning_rate": 0.00026064342627306146, "loss": 1.6557, "step": 8996 }, { "epoch": 0.71, "learning_rate": 0.00026063508045691663, "loss": 1.654, "step": 8997 }, { "epoch": 0.71, "learning_rate": 0.00026062673388962065, "loss": 1.6171, "step": 8998 }, { "epoch": 0.71, "learning_rate": 0.0002606183865712301, "loss": 1.6659, "step": 8999 }, { "epoch": 0.71, "learning_rate": 0.0002606100385018019, "loss": 1.6526, "step": 9000 }, { "epoch": 0.71, "learning_rate": 0.00026060168968139246, "loss": 1.6561, "step": 9001 }, { "epoch": 0.71, "learning_rate": 0.00026059334011005865, "loss": 1.6565, "step": 9002 }, { "epoch": 0.71, "learning_rate": 0.00026058498978785705, "loss": 1.6448, "step": 9003 }, { "epoch": 0.71, "learning_rate": 0.00026057663871484435, "loss": 1.6793, "step": 9004 }, { "epoch": 0.71, "learning_rate": 0.0002605682868910774, "loss": 1.6565, "step": 9005 }, { "epoch": 0.71, "learning_rate": 0.00026055993431661274, "loss": 1.6452, "step": 9006 }, { "epoch": 0.71, "learning_rate": 0.00026055158099150716, "loss": 1.6375, "step": 9007 }, { "epoch": 0.71, "learning_rate": 0.0002605432269158173, "loss": 1.6418, "step": 9008 }, { "epoch": 0.71, "learning_rate": 0.0002605348720896, "loss": 1.6654, "step": 9009 }, { "epoch": 0.71, "learning_rate": 0.0002605265165129119, "loss": 1.6605, "step": 9010 }, { "epoch": 0.71, "learning_rate": 0.0002605181601858097, "loss": 1.6509, "step": 9011 }, { "epoch": 0.71, "learning_rate": 0.0002605098031083502, "loss": 1.6323, "step": 9012 }, { "epoch": 0.71, "learning_rate": 0.0002605014452805902, "loss": 1.6409, "step": 9013 }, { "epoch": 0.71, "learning_rate": 0.0002604930867025863, "loss": 1.6394, "step": 9014 }, { "epoch": 0.71, "learning_rate": 0.00026048472737439526, "loss": 1.6625, "step": 9015 }, { "epoch": 0.71, "learning_rate": 0.00026047636729607397, "loss": 1.6863, "step": 9016 }, { "epoch": 0.71, "learning_rate": 0.0002604680064676791, "loss": 1.6719, "step": 9017 }, { "epoch": 0.71, "learning_rate": 0.00026045964488926747, "loss": 1.674, "step": 9018 }, { "epoch": 0.71, "learning_rate": 0.0002604512825608957, "loss": 1.7074, "step": 9019 }, { "epoch": 0.71, "learning_rate": 0.00026044291948262074, "loss": 1.6664, "step": 9020 }, { "epoch": 0.71, "learning_rate": 0.00026043455565449933, "loss": 1.6716, "step": 9021 }, { "epoch": 0.71, "learning_rate": 0.00026042619107658816, "loss": 1.6631, "step": 9022 }, { "epoch": 0.71, "learning_rate": 0.00026041782574894414, "loss": 1.6812, "step": 9023 }, { "epoch": 0.71, "learning_rate": 0.00026040945967162397, "loss": 1.6625, "step": 9024 }, { "epoch": 0.71, "learning_rate": 0.0002604010928446846, "loss": 1.6647, "step": 9025 }, { "epoch": 0.71, "learning_rate": 0.0002603927252681826, "loss": 1.6525, "step": 9026 }, { "epoch": 0.71, "learning_rate": 0.00026038435694217504, "loss": 1.6624, "step": 9027 }, { "epoch": 0.71, "learning_rate": 0.0002603759878667185, "loss": 1.6841, "step": 9028 }, { "epoch": 0.71, "learning_rate": 0.00026036761804187, "loss": 1.6574, "step": 9029 }, { "epoch": 0.71, "learning_rate": 0.0002603592474676862, "loss": 1.6895, "step": 9030 }, { "epoch": 0.71, "learning_rate": 0.0002603508761442241, "loss": 1.6614, "step": 9031 }, { "epoch": 0.71, "learning_rate": 0.0002603425040715404, "loss": 1.6147, "step": 9032 }, { "epoch": 0.71, "learning_rate": 0.000260334131249692, "loss": 1.6085, "step": 9033 }, { "epoch": 0.71, "learning_rate": 0.0002603257576787357, "loss": 1.6495, "step": 9034 }, { "epoch": 0.71, "learning_rate": 0.0002603173833587284, "loss": 1.6233, "step": 9035 }, { "epoch": 0.71, "learning_rate": 0.000260309008289727, "loss": 1.655, "step": 9036 }, { "epoch": 0.71, "learning_rate": 0.00026030063247178825, "loss": 1.6711, "step": 9037 }, { "epoch": 0.71, "learning_rate": 0.0002602922559049691, "loss": 1.6406, "step": 9038 }, { "epoch": 0.71, "learning_rate": 0.0002602838785893264, "loss": 1.7259, "step": 9039 }, { "epoch": 0.71, "learning_rate": 0.000260275500524917, "loss": 1.6481, "step": 9040 }, { "epoch": 0.71, "learning_rate": 0.0002602671217117978, "loss": 1.6929, "step": 9041 }, { "epoch": 0.71, "learning_rate": 0.00026025874215002576, "loss": 1.6257, "step": 9042 }, { "epoch": 0.71, "learning_rate": 0.00026025036183965764, "loss": 1.6238, "step": 9043 }, { "epoch": 0.71, "learning_rate": 0.00026024198078075043, "loss": 1.6537, "step": 9044 }, { "epoch": 0.71, "learning_rate": 0.00026023359897336105, "loss": 1.6811, "step": 9045 }, { "epoch": 0.71, "learning_rate": 0.00026022521641754626, "loss": 1.6417, "step": 9046 }, { "epoch": 0.71, "learning_rate": 0.00026021683311336314, "loss": 1.6288, "step": 9047 }, { "epoch": 0.71, "learning_rate": 0.00026020844906086857, "loss": 1.6027, "step": 9048 }, { "epoch": 0.71, "learning_rate": 0.0002602000642601194, "loss": 1.7163, "step": 9049 }, { "epoch": 0.71, "learning_rate": 0.00026019167871117266, "loss": 1.6344, "step": 9050 }, { "epoch": 0.71, "learning_rate": 0.00026018329241408517, "loss": 1.7175, "step": 9051 }, { "epoch": 0.71, "learning_rate": 0.00026017490536891396, "loss": 1.6731, "step": 9052 }, { "epoch": 0.71, "learning_rate": 0.00026016651757571594, "loss": 1.6528, "step": 9053 }, { "epoch": 0.71, "learning_rate": 0.00026015812903454805, "loss": 1.6435, "step": 9054 }, { "epoch": 0.71, "learning_rate": 0.0002601497397454673, "loss": 1.6665, "step": 9055 }, { "epoch": 0.71, "learning_rate": 0.0002601413497085305, "loss": 1.6225, "step": 9056 }, { "epoch": 0.71, "learning_rate": 0.0002601329589237948, "loss": 1.6733, "step": 9057 }, { "epoch": 0.71, "learning_rate": 0.0002601245673913171, "loss": 1.6247, "step": 9058 }, { "epoch": 0.71, "learning_rate": 0.0002601161751111543, "loss": 1.6537, "step": 9059 }, { "epoch": 0.71, "learning_rate": 0.0002601077820833635, "loss": 1.6612, "step": 9060 }, { "epoch": 0.71, "learning_rate": 0.0002600993883080016, "loss": 1.6521, "step": 9061 }, { "epoch": 0.71, "learning_rate": 0.0002600909937851256, "loss": 1.6815, "step": 9062 }, { "epoch": 0.71, "learning_rate": 0.00026008259851479244, "loss": 1.6345, "step": 9063 }, { "epoch": 0.71, "learning_rate": 0.00026007420249705927, "loss": 1.7539, "step": 9064 }, { "epoch": 0.71, "learning_rate": 0.000260065805731983, "loss": 1.6421, "step": 9065 }, { "epoch": 0.71, "learning_rate": 0.00026005740821962066, "loss": 1.6663, "step": 9066 }, { "epoch": 0.71, "learning_rate": 0.00026004900996002916, "loss": 1.623, "step": 9067 }, { "epoch": 0.71, "learning_rate": 0.00026004061095326575, "loss": 1.6163, "step": 9068 }, { "epoch": 0.71, "learning_rate": 0.00026003221119938724, "loss": 1.7078, "step": 9069 }, { "epoch": 0.71, "learning_rate": 0.00026002381069845077, "loss": 1.6343, "step": 9070 }, { "epoch": 0.71, "learning_rate": 0.00026001540945051326, "loss": 1.6888, "step": 9071 }, { "epoch": 0.71, "learning_rate": 0.0002600070074556319, "loss": 1.5844, "step": 9072 }, { "epoch": 0.71, "learning_rate": 0.0002599986047138637, "loss": 1.6556, "step": 9073 }, { "epoch": 0.71, "learning_rate": 0.0002599902012252656, "loss": 1.6567, "step": 9074 }, { "epoch": 0.71, "learning_rate": 0.00025998179698989476, "loss": 1.6649, "step": 9075 }, { "epoch": 0.71, "learning_rate": 0.0002599733920078082, "loss": 1.6216, "step": 9076 }, { "epoch": 0.71, "learning_rate": 0.00025996498627906304, "loss": 1.6772, "step": 9077 }, { "epoch": 0.71, "learning_rate": 0.00025995657980371626, "loss": 1.6312, "step": 9078 }, { "epoch": 0.71, "learning_rate": 0.000259948172581825, "loss": 1.6783, "step": 9079 }, { "epoch": 0.71, "learning_rate": 0.00025993976461344634, "loss": 1.6155, "step": 9080 }, { "epoch": 0.71, "learning_rate": 0.0002599313558986373, "loss": 1.6538, "step": 9081 }, { "epoch": 0.71, "learning_rate": 0.00025992294643745504, "loss": 1.6371, "step": 9082 }, { "epoch": 0.71, "learning_rate": 0.0002599145362299567, "loss": 1.6404, "step": 9083 }, { "epoch": 0.71, "learning_rate": 0.0002599061252761992, "loss": 1.6661, "step": 9084 }, { "epoch": 0.71, "learning_rate": 0.00025989771357623985, "loss": 1.6511, "step": 9085 }, { "epoch": 0.71, "learning_rate": 0.0002598893011301356, "loss": 1.6207, "step": 9086 }, { "epoch": 0.71, "learning_rate": 0.0002598808879379437, "loss": 1.6139, "step": 9087 }, { "epoch": 0.72, "learning_rate": 0.00025987247399972117, "loss": 1.6654, "step": 9088 }, { "epoch": 0.72, "learning_rate": 0.0002598640593155252, "loss": 1.7312, "step": 9089 }, { "epoch": 0.72, "learning_rate": 0.0002598556438854129, "loss": 1.658, "step": 9090 }, { "epoch": 0.72, "learning_rate": 0.00025984722770944137, "loss": 1.6194, "step": 9091 }, { "epoch": 0.72, "learning_rate": 0.0002598388107876678, "loss": 1.6055, "step": 9092 }, { "epoch": 0.72, "learning_rate": 0.0002598303931201493, "loss": 1.6807, "step": 9093 }, { "epoch": 0.72, "learning_rate": 0.00025982197470694307, "loss": 1.697, "step": 9094 }, { "epoch": 0.72, "learning_rate": 0.00025981355554810623, "loss": 1.6156, "step": 9095 }, { "epoch": 0.72, "learning_rate": 0.0002598051356436959, "loss": 1.6719, "step": 9096 }, { "epoch": 0.72, "learning_rate": 0.0002597967149937694, "loss": 1.6373, "step": 9097 }, { "epoch": 0.72, "learning_rate": 0.0002597882935983837, "loss": 1.564, "step": 9098 }, { "epoch": 0.72, "learning_rate": 0.0002597798714575961, "loss": 1.6688, "step": 9099 }, { "epoch": 0.72, "learning_rate": 0.0002597714485714638, "loss": 1.71, "step": 9100 }, { "epoch": 0.72, "learning_rate": 0.0002597630249400439, "loss": 1.6507, "step": 9101 }, { "epoch": 0.72, "learning_rate": 0.00025975460056339356, "loss": 1.6694, "step": 9102 }, { "epoch": 0.72, "learning_rate": 0.00025974617544157017, "loss": 1.5786, "step": 9103 }, { "epoch": 0.72, "learning_rate": 0.0002597377495746308, "loss": 1.6727, "step": 9104 }, { "epoch": 0.72, "learning_rate": 0.0002597293229626326, "loss": 1.6504, "step": 9105 }, { "epoch": 0.72, "learning_rate": 0.00025972089560563286, "loss": 1.6621, "step": 9106 }, { "epoch": 0.72, "learning_rate": 0.0002597124675036888, "loss": 1.6422, "step": 9107 }, { "epoch": 0.72, "learning_rate": 0.0002597040386568577, "loss": 1.6938, "step": 9108 }, { "epoch": 0.72, "learning_rate": 0.00025969560906519666, "loss": 1.6691, "step": 9109 }, { "epoch": 0.72, "learning_rate": 0.00025968717872876295, "loss": 1.6524, "step": 9110 }, { "epoch": 0.72, "learning_rate": 0.00025967874764761385, "loss": 1.6284, "step": 9111 }, { "epoch": 0.72, "learning_rate": 0.00025967031582180657, "loss": 1.6297, "step": 9112 }, { "epoch": 0.72, "learning_rate": 0.0002596618832513984, "loss": 1.6665, "step": 9113 }, { "epoch": 0.72, "learning_rate": 0.0002596534499364465, "loss": 1.677, "step": 9114 }, { "epoch": 0.72, "learning_rate": 0.00025964501587700823, "loss": 1.7019, "step": 9115 }, { "epoch": 0.72, "learning_rate": 0.0002596365810731408, "loss": 1.6344, "step": 9116 }, { "epoch": 0.72, "learning_rate": 0.00025962814552490146, "loss": 1.6889, "step": 9117 }, { "epoch": 0.72, "learning_rate": 0.00025961970923234754, "loss": 1.631, "step": 9118 }, { "epoch": 0.72, "learning_rate": 0.00025961127219553627, "loss": 1.7323, "step": 9119 }, { "epoch": 0.72, "learning_rate": 0.000259602834414525, "loss": 1.6511, "step": 9120 }, { "epoch": 0.72, "learning_rate": 0.0002595943958893709, "loss": 1.649, "step": 9121 }, { "epoch": 0.72, "learning_rate": 0.00025958595662013136, "loss": 1.6245, "step": 9122 }, { "epoch": 0.72, "learning_rate": 0.0002595775166068636, "loss": 1.6179, "step": 9123 }, { "epoch": 0.72, "learning_rate": 0.00025956907584962505, "loss": 1.6475, "step": 9124 }, { "epoch": 0.72, "learning_rate": 0.00025956063434847294, "loss": 1.6281, "step": 9125 }, { "epoch": 0.72, "learning_rate": 0.00025955219210346456, "loss": 1.6681, "step": 9126 }, { "epoch": 0.72, "learning_rate": 0.00025954374911465723, "loss": 1.6144, "step": 9127 }, { "epoch": 0.72, "learning_rate": 0.0002595353053821083, "loss": 1.6572, "step": 9128 }, { "epoch": 0.72, "learning_rate": 0.0002595268609058751, "loss": 1.6698, "step": 9129 }, { "epoch": 0.72, "learning_rate": 0.000259518415686015, "loss": 1.699, "step": 9130 }, { "epoch": 0.72, "learning_rate": 0.0002595099697225852, "loss": 1.6393, "step": 9131 }, { "epoch": 0.72, "learning_rate": 0.00025950152301564325, "loss": 1.6871, "step": 9132 }, { "epoch": 0.72, "learning_rate": 0.0002594930755652463, "loss": 1.5913, "step": 9133 }, { "epoch": 0.72, "learning_rate": 0.0002594846273714518, "loss": 1.6742, "step": 9134 }, { "epoch": 0.72, "learning_rate": 0.00025947617843431715, "loss": 1.6972, "step": 9135 }, { "epoch": 0.72, "learning_rate": 0.00025946772875389966, "loss": 1.632, "step": 9136 }, { "epoch": 0.72, "learning_rate": 0.0002594592783302566, "loss": 1.5851, "step": 9137 }, { "epoch": 0.72, "learning_rate": 0.00025945082716344553, "loss": 1.643, "step": 9138 }, { "epoch": 0.72, "learning_rate": 0.00025944237525352376, "loss": 1.6444, "step": 9139 }, { "epoch": 0.72, "learning_rate": 0.00025943392260054863, "loss": 1.6631, "step": 9140 }, { "epoch": 0.72, "learning_rate": 0.00025942546920457757, "loss": 1.6615, "step": 9141 }, { "epoch": 0.72, "learning_rate": 0.00025941701506566796, "loss": 1.6073, "step": 9142 }, { "epoch": 0.72, "learning_rate": 0.00025940856018387713, "loss": 1.6571, "step": 9143 }, { "epoch": 0.72, "learning_rate": 0.00025940010455926263, "loss": 1.6594, "step": 9144 }, { "epoch": 0.72, "learning_rate": 0.00025939164819188177, "loss": 1.6599, "step": 9145 }, { "epoch": 0.72, "learning_rate": 0.000259383191081792, "loss": 1.6361, "step": 9146 }, { "epoch": 0.72, "learning_rate": 0.0002593747332290507, "loss": 1.6895, "step": 9147 }, { "epoch": 0.72, "learning_rate": 0.0002593662746337153, "loss": 1.5995, "step": 9148 }, { "epoch": 0.72, "learning_rate": 0.00025935781529584325, "loss": 1.6775, "step": 9149 }, { "epoch": 0.72, "learning_rate": 0.0002593493552154921, "loss": 1.666, "step": 9150 }, { "epoch": 0.72, "learning_rate": 0.000259340894392719, "loss": 1.6416, "step": 9151 }, { "epoch": 0.72, "learning_rate": 0.0002593324328275817, "loss": 1.6383, "step": 9152 }, { "epoch": 0.72, "learning_rate": 0.00025932397052013745, "loss": 1.6417, "step": 9153 }, { "epoch": 0.72, "learning_rate": 0.00025931550747044374, "loss": 1.6781, "step": 9154 }, { "epoch": 0.72, "learning_rate": 0.00025930704367855813, "loss": 1.655, "step": 9155 }, { "epoch": 0.72, "learning_rate": 0.00025929857914453803, "loss": 1.6359, "step": 9156 }, { "epoch": 0.72, "learning_rate": 0.0002592901138684408, "loss": 1.6645, "step": 9157 }, { "epoch": 0.72, "learning_rate": 0.0002592816478503241, "loss": 1.684, "step": 9158 }, { "epoch": 0.72, "learning_rate": 0.0002592731810902453, "loss": 1.6773, "step": 9159 }, { "epoch": 0.72, "learning_rate": 0.0002592647135882618, "loss": 1.6639, "step": 9160 }, { "epoch": 0.72, "learning_rate": 0.0002592562453444313, "loss": 1.6035, "step": 9161 }, { "epoch": 0.72, "learning_rate": 0.00025924777635881116, "loss": 1.6634, "step": 9162 }, { "epoch": 0.72, "learning_rate": 0.0002592393066314589, "loss": 1.5993, "step": 9163 }, { "epoch": 0.72, "learning_rate": 0.00025923083616243204, "loss": 1.6668, "step": 9164 }, { "epoch": 0.72, "learning_rate": 0.00025922236495178806, "loss": 1.6529, "step": 9165 }, { "epoch": 0.72, "learning_rate": 0.0002592138929995846, "loss": 1.6765, "step": 9166 }, { "epoch": 0.72, "learning_rate": 0.00025920542030587895, "loss": 1.6577, "step": 9167 }, { "epoch": 0.72, "learning_rate": 0.0002591969468707288, "loss": 1.6266, "step": 9168 }, { "epoch": 0.72, "learning_rate": 0.0002591884726941916, "loss": 1.612, "step": 9169 }, { "epoch": 0.72, "learning_rate": 0.000259179997776325, "loss": 1.6009, "step": 9170 }, { "epoch": 0.72, "learning_rate": 0.00025917152211718644, "loss": 1.6722, "step": 9171 }, { "epoch": 0.72, "learning_rate": 0.0002591630457168335, "loss": 1.6299, "step": 9172 }, { "epoch": 0.72, "learning_rate": 0.00025915456857532364, "loss": 1.6612, "step": 9173 }, { "epoch": 0.72, "learning_rate": 0.0002591460906927146, "loss": 1.635, "step": 9174 }, { "epoch": 0.72, "learning_rate": 0.0002591376120690638, "loss": 1.5988, "step": 9175 }, { "epoch": 0.72, "learning_rate": 0.0002591291327044288, "loss": 1.5817, "step": 9176 }, { "epoch": 0.72, "learning_rate": 0.00025912065259886725, "loss": 1.6906, "step": 9177 }, { "epoch": 0.72, "learning_rate": 0.0002591121717524367, "loss": 1.6217, "step": 9178 }, { "epoch": 0.72, "learning_rate": 0.0002591036901651947, "loss": 1.6797, "step": 9179 }, { "epoch": 0.72, "learning_rate": 0.0002590952078371988, "loss": 1.6872, "step": 9180 }, { "epoch": 0.72, "learning_rate": 0.0002590867247685067, "loss": 1.6424, "step": 9181 }, { "epoch": 0.72, "learning_rate": 0.000259078240959176, "loss": 1.6439, "step": 9182 }, { "epoch": 0.72, "learning_rate": 0.00025906975640926417, "loss": 1.6675, "step": 9183 }, { "epoch": 0.72, "learning_rate": 0.0002590612711188289, "loss": 1.6409, "step": 9184 }, { "epoch": 0.72, "learning_rate": 0.00025905278508792773, "loss": 1.6512, "step": 9185 }, { "epoch": 0.72, "learning_rate": 0.0002590442983166184, "loss": 1.6547, "step": 9186 }, { "epoch": 0.72, "learning_rate": 0.0002590358108049584, "loss": 1.5999, "step": 9187 }, { "epoch": 0.72, "learning_rate": 0.00025902732255300546, "loss": 1.7109, "step": 9188 }, { "epoch": 0.72, "learning_rate": 0.0002590188335608171, "loss": 1.6413, "step": 9189 }, { "epoch": 0.72, "learning_rate": 0.0002590103438284511, "loss": 1.6561, "step": 9190 }, { "epoch": 0.72, "learning_rate": 0.000259001853355965, "loss": 1.6222, "step": 9191 }, { "epoch": 0.72, "learning_rate": 0.00025899336214341644, "loss": 1.6511, "step": 9192 }, { "epoch": 0.72, "learning_rate": 0.00025898487019086313, "loss": 1.6193, "step": 9193 }, { "epoch": 0.72, "learning_rate": 0.0002589763774983627, "loss": 1.6628, "step": 9194 }, { "epoch": 0.72, "learning_rate": 0.0002589678840659728, "loss": 1.5718, "step": 9195 }, { "epoch": 0.72, "learning_rate": 0.0002589593898937511, "loss": 1.5932, "step": 9196 }, { "epoch": 0.72, "learning_rate": 0.00025895089498175524, "loss": 1.6387, "step": 9197 }, { "epoch": 0.72, "learning_rate": 0.00025894239933004295, "loss": 1.6281, "step": 9198 }, { "epoch": 0.72, "learning_rate": 0.0002589339029386719, "loss": 1.6678, "step": 9199 }, { "epoch": 0.72, "learning_rate": 0.00025892540580769975, "loss": 1.6482, "step": 9200 }, { "epoch": 0.72, "learning_rate": 0.0002589169079371842, "loss": 1.6333, "step": 9201 }, { "epoch": 0.72, "learning_rate": 0.00025890840932718296, "loss": 1.6474, "step": 9202 }, { "epoch": 0.72, "learning_rate": 0.00025889990997775373, "loss": 1.6992, "step": 9203 }, { "epoch": 0.72, "learning_rate": 0.0002588914098889542, "loss": 1.6659, "step": 9204 }, { "epoch": 0.72, "learning_rate": 0.00025888290906084206, "loss": 1.6143, "step": 9205 }, { "epoch": 0.72, "learning_rate": 0.0002588744074934751, "loss": 1.6828, "step": 9206 }, { "epoch": 0.72, "learning_rate": 0.00025886590518691094, "loss": 1.6334, "step": 9207 }, { "epoch": 0.72, "learning_rate": 0.0002588574021412074, "loss": 1.6734, "step": 9208 }, { "epoch": 0.72, "learning_rate": 0.00025884889835642213, "loss": 1.7054, "step": 9209 }, { "epoch": 0.72, "learning_rate": 0.000258840393832613, "loss": 1.6287, "step": 9210 }, { "epoch": 0.72, "learning_rate": 0.00025883188856983756, "loss": 1.7165, "step": 9211 }, { "epoch": 0.72, "learning_rate": 0.0002588233825681537, "loss": 1.66, "step": 9212 }, { "epoch": 0.72, "learning_rate": 0.0002588148758276191, "loss": 1.682, "step": 9213 }, { "epoch": 0.72, "learning_rate": 0.0002588063683482916, "loss": 1.6147, "step": 9214 }, { "epoch": 0.73, "learning_rate": 0.0002587978601302289, "loss": 1.6795, "step": 9215 }, { "epoch": 0.73, "learning_rate": 0.0002587893511734887, "loss": 1.6526, "step": 9216 }, { "epoch": 0.73, "learning_rate": 0.0002587808414781289, "loss": 1.6429, "step": 9217 }, { "epoch": 0.73, "learning_rate": 0.0002587723310442072, "loss": 1.7356, "step": 9218 }, { "epoch": 0.73, "learning_rate": 0.0002587638198717814, "loss": 1.6353, "step": 9219 }, { "epoch": 0.73, "learning_rate": 0.0002587553079609092, "loss": 1.6218, "step": 9220 }, { "epoch": 0.73, "learning_rate": 0.0002587467953116486, "loss": 1.6696, "step": 9221 }, { "epoch": 0.73, "learning_rate": 0.00025873828192405723, "loss": 1.72, "step": 9222 }, { "epoch": 0.73, "learning_rate": 0.00025872976779819294, "loss": 1.667, "step": 9223 }, { "epoch": 0.73, "learning_rate": 0.0002587212529341135, "loss": 1.6619, "step": 9224 }, { "epoch": 0.73, "learning_rate": 0.0002587127373318768, "loss": 1.648, "step": 9225 }, { "epoch": 0.73, "learning_rate": 0.0002587042209915405, "loss": 1.6519, "step": 9226 }, { "epoch": 0.73, "learning_rate": 0.0002586957039131626, "loss": 1.5704, "step": 9227 }, { "epoch": 0.73, "learning_rate": 0.0002586871860968009, "loss": 1.6081, "step": 9228 }, { "epoch": 0.73, "learning_rate": 0.0002586786675425131, "loss": 1.6455, "step": 9229 }, { "epoch": 0.73, "learning_rate": 0.00025867014825035716, "loss": 1.6406, "step": 9230 }, { "epoch": 0.73, "learning_rate": 0.0002586616282203909, "loss": 1.716, "step": 9231 }, { "epoch": 0.73, "learning_rate": 0.0002586531074526721, "loss": 1.6415, "step": 9232 }, { "epoch": 0.73, "learning_rate": 0.0002586445859472587, "loss": 1.677, "step": 9233 }, { "epoch": 0.73, "learning_rate": 0.0002586360637042085, "loss": 1.6245, "step": 9234 }, { "epoch": 0.73, "learning_rate": 0.00025862754072357934, "loss": 1.5997, "step": 9235 }, { "epoch": 0.73, "learning_rate": 0.0002586190170054292, "loss": 1.637, "step": 9236 }, { "epoch": 0.73, "learning_rate": 0.0002586104925498158, "loss": 1.6535, "step": 9237 }, { "epoch": 0.73, "learning_rate": 0.00025860196735679716, "loss": 1.6935, "step": 9238 }, { "epoch": 0.73, "learning_rate": 0.0002585934414264311, "loss": 1.6729, "step": 9239 }, { "epoch": 0.73, "learning_rate": 0.00025858491475877547, "loss": 1.6334, "step": 9240 }, { "epoch": 0.73, "learning_rate": 0.00025857638735388817, "loss": 1.6563, "step": 9241 }, { "epoch": 0.73, "learning_rate": 0.00025856785921182714, "loss": 1.6769, "step": 9242 }, { "epoch": 0.73, "learning_rate": 0.00025855933033265023, "loss": 1.6312, "step": 9243 }, { "epoch": 0.73, "learning_rate": 0.0002585508007164154, "loss": 1.6332, "step": 9244 }, { "epoch": 0.73, "learning_rate": 0.0002585422703631805, "loss": 1.6723, "step": 9245 }, { "epoch": 0.73, "learning_rate": 0.00025853373927300357, "loss": 1.6511, "step": 9246 }, { "epoch": 0.73, "learning_rate": 0.00025852520744594243, "loss": 1.6398, "step": 9247 }, { "epoch": 0.73, "learning_rate": 0.00025851667488205495, "loss": 1.6532, "step": 9248 }, { "epoch": 0.73, "learning_rate": 0.0002585081415813991, "loss": 1.6469, "step": 9249 }, { "epoch": 0.73, "learning_rate": 0.00025849960754403297, "loss": 1.6706, "step": 9250 }, { "epoch": 0.73, "learning_rate": 0.0002584910727700143, "loss": 1.6256, "step": 9251 }, { "epoch": 0.73, "learning_rate": 0.0002584825372594012, "loss": 1.7208, "step": 9252 }, { "epoch": 0.73, "learning_rate": 0.00025847400101225145, "loss": 1.5874, "step": 9253 }, { "epoch": 0.73, "learning_rate": 0.00025846546402862313, "loss": 1.6697, "step": 9254 }, { "epoch": 0.73, "learning_rate": 0.0002584569263085741, "loss": 1.6665, "step": 9255 }, { "epoch": 0.73, "learning_rate": 0.0002584483878521625, "loss": 1.6479, "step": 9256 }, { "epoch": 0.73, "learning_rate": 0.0002584398486594461, "loss": 1.6772, "step": 9257 }, { "epoch": 0.73, "learning_rate": 0.000258431308730483, "loss": 1.6175, "step": 9258 }, { "epoch": 0.73, "learning_rate": 0.0002584227680653312, "loss": 1.6519, "step": 9259 }, { "epoch": 0.73, "learning_rate": 0.0002584142266640486, "loss": 1.6939, "step": 9260 }, { "epoch": 0.73, "learning_rate": 0.0002584056845266932, "loss": 1.6035, "step": 9261 }, { "epoch": 0.73, "learning_rate": 0.0002583971416533231, "loss": 1.6902, "step": 9262 }, { "epoch": 0.73, "learning_rate": 0.00025838859804399613, "loss": 1.6106, "step": 9263 }, { "epoch": 0.73, "learning_rate": 0.0002583800536987705, "loss": 1.6893, "step": 9264 }, { "epoch": 0.73, "learning_rate": 0.000258371508617704, "loss": 1.6014, "step": 9265 }, { "epoch": 0.73, "learning_rate": 0.0002583629628008549, "loss": 1.6627, "step": 9266 }, { "epoch": 0.73, "learning_rate": 0.000258354416248281, "loss": 1.6264, "step": 9267 }, { "epoch": 0.73, "learning_rate": 0.00025834586896004036, "loss": 1.5965, "step": 9268 }, { "epoch": 0.73, "learning_rate": 0.0002583373209361911, "loss": 1.6227, "step": 9269 }, { "epoch": 0.73, "learning_rate": 0.00025832877217679126, "loss": 1.6105, "step": 9270 }, { "epoch": 0.73, "learning_rate": 0.0002583202226818988, "loss": 1.631, "step": 9271 }, { "epoch": 0.73, "learning_rate": 0.0002583116724515718, "loss": 1.6306, "step": 9272 }, { "epoch": 0.73, "learning_rate": 0.0002583031214858683, "loss": 1.6907, "step": 9273 }, { "epoch": 0.73, "learning_rate": 0.00025829456978484637, "loss": 1.6549, "step": 9274 }, { "epoch": 0.73, "learning_rate": 0.00025828601734856414, "loss": 1.5458, "step": 9275 }, { "epoch": 0.73, "learning_rate": 0.00025827746417707954, "loss": 1.6112, "step": 9276 }, { "epoch": 0.73, "learning_rate": 0.00025826891027045073, "loss": 1.588, "step": 9277 }, { "epoch": 0.73, "learning_rate": 0.0002582603556287358, "loss": 1.667, "step": 9278 }, { "epoch": 0.73, "learning_rate": 0.0002582518002519928, "loss": 1.601, "step": 9279 }, { "epoch": 0.73, "learning_rate": 0.0002582432441402798, "loss": 1.651, "step": 9280 }, { "epoch": 0.73, "learning_rate": 0.00025823468729365486, "loss": 1.6055, "step": 9281 }, { "epoch": 0.73, "learning_rate": 0.00025822612971217613, "loss": 1.6333, "step": 9282 }, { "epoch": 0.73, "learning_rate": 0.00025821757139590177, "loss": 1.6726, "step": 9283 }, { "epoch": 0.73, "learning_rate": 0.0002582090123448898, "loss": 1.6319, "step": 9284 }, { "epoch": 0.73, "learning_rate": 0.0002582004525591983, "loss": 1.6412, "step": 9285 }, { "epoch": 0.73, "learning_rate": 0.0002581918920388855, "loss": 1.6766, "step": 9286 }, { "epoch": 0.73, "learning_rate": 0.00025818333078400933, "loss": 1.6411, "step": 9287 }, { "epoch": 0.73, "learning_rate": 0.0002581747687946282, "loss": 1.6096, "step": 9288 }, { "epoch": 0.73, "learning_rate": 0.0002581662060708, "loss": 1.6663, "step": 9289 }, { "epoch": 0.73, "learning_rate": 0.000258157642612583, "loss": 1.6404, "step": 9290 }, { "epoch": 0.73, "learning_rate": 0.0002581490784200353, "loss": 1.6826, "step": 9291 }, { "epoch": 0.73, "learning_rate": 0.0002581405134932149, "loss": 1.7079, "step": 9292 }, { "epoch": 0.73, "learning_rate": 0.0002581319478321803, "loss": 1.6571, "step": 9293 }, { "epoch": 0.73, "learning_rate": 0.00025812338143698933, "loss": 1.6506, "step": 9294 }, { "epoch": 0.73, "learning_rate": 0.00025811481430770025, "loss": 1.6592, "step": 9295 }, { "epoch": 0.73, "learning_rate": 0.0002581062464443713, "loss": 1.6538, "step": 9296 }, { "epoch": 0.73, "learning_rate": 0.00025809767784706054, "loss": 1.594, "step": 9297 }, { "epoch": 0.73, "learning_rate": 0.00025808910851582624, "loss": 1.6945, "step": 9298 }, { "epoch": 0.73, "learning_rate": 0.00025808053845072655, "loss": 1.6327, "step": 9299 }, { "epoch": 0.73, "learning_rate": 0.00025807196765181964, "loss": 1.6707, "step": 9300 }, { "epoch": 0.73, "learning_rate": 0.0002580633961191637, "loss": 1.6326, "step": 9301 }, { "epoch": 0.73, "learning_rate": 0.00025805482385281693, "loss": 1.6356, "step": 9302 }, { "epoch": 0.73, "learning_rate": 0.00025804625085283753, "loss": 1.6218, "step": 9303 }, { "epoch": 0.73, "learning_rate": 0.0002580376771192837, "loss": 1.6191, "step": 9304 }, { "epoch": 0.73, "learning_rate": 0.00025802910265221367, "loss": 1.643, "step": 9305 }, { "epoch": 0.73, "learning_rate": 0.00025802052745168565, "loss": 1.6114, "step": 9306 }, { "epoch": 0.73, "learning_rate": 0.0002580119515177579, "loss": 1.5628, "step": 9307 }, { "epoch": 0.73, "learning_rate": 0.0002580033748504886, "loss": 1.6635, "step": 9308 }, { "epoch": 0.73, "learning_rate": 0.00025799479744993594, "loss": 1.6761, "step": 9309 }, { "epoch": 0.73, "learning_rate": 0.0002579862193161582, "loss": 1.6429, "step": 9310 }, { "epoch": 0.73, "learning_rate": 0.00025797764044921363, "loss": 1.6333, "step": 9311 }, { "epoch": 0.73, "learning_rate": 0.0002579690608491605, "loss": 1.6239, "step": 9312 }, { "epoch": 0.73, "learning_rate": 0.00025796048051605707, "loss": 1.6541, "step": 9313 }, { "epoch": 0.73, "learning_rate": 0.0002579518994499615, "loss": 1.619, "step": 9314 }, { "epoch": 0.73, "learning_rate": 0.00025794331765093204, "loss": 1.6147, "step": 9315 }, { "epoch": 0.73, "learning_rate": 0.00025793473511902715, "loss": 1.6362, "step": 9316 }, { "epoch": 0.73, "learning_rate": 0.0002579261518543049, "loss": 1.678, "step": 9317 }, { "epoch": 0.73, "learning_rate": 0.0002579175678568236, "loss": 1.5954, "step": 9318 }, { "epoch": 0.73, "learning_rate": 0.0002579089831266416, "loss": 1.6534, "step": 9319 }, { "epoch": 0.73, "learning_rate": 0.00025790039766381717, "loss": 1.6095, "step": 9320 }, { "epoch": 0.73, "learning_rate": 0.00025789181146840864, "loss": 1.6002, "step": 9321 }, { "epoch": 0.73, "learning_rate": 0.00025788322454047414, "loss": 1.7147, "step": 9322 }, { "epoch": 0.73, "learning_rate": 0.0002578746368800722, "loss": 1.662, "step": 9323 }, { "epoch": 0.73, "learning_rate": 0.0002578660484872609, "loss": 1.6388, "step": 9324 }, { "epoch": 0.73, "learning_rate": 0.0002578574593620987, "loss": 1.6497, "step": 9325 }, { "epoch": 0.73, "learning_rate": 0.0002578488695046438, "loss": 1.6855, "step": 9326 }, { "epoch": 0.73, "learning_rate": 0.0002578402789149547, "loss": 1.613, "step": 9327 }, { "epoch": 0.73, "learning_rate": 0.00025783168759308954, "loss": 1.6493, "step": 9328 }, { "epoch": 0.73, "learning_rate": 0.0002578230955391068, "loss": 1.6298, "step": 9329 }, { "epoch": 0.73, "learning_rate": 0.0002578145027530647, "loss": 1.6142, "step": 9330 }, { "epoch": 0.73, "learning_rate": 0.00025780590923502164, "loss": 1.7036, "step": 9331 }, { "epoch": 0.73, "learning_rate": 0.0002577973149850359, "loss": 1.6235, "step": 9332 }, { "epoch": 0.73, "learning_rate": 0.000257788720003166, "loss": 1.6238, "step": 9333 }, { "epoch": 0.73, "learning_rate": 0.00025778012428947003, "loss": 1.6397, "step": 9334 }, { "epoch": 0.73, "learning_rate": 0.0002577715278440065, "loss": 1.6434, "step": 9335 }, { "epoch": 0.73, "learning_rate": 0.0002577629306668339, "loss": 1.6767, "step": 9336 }, { "epoch": 0.73, "learning_rate": 0.0002577543327580104, "loss": 1.6495, "step": 9337 }, { "epoch": 0.73, "learning_rate": 0.0002577457341175944, "loss": 1.6751, "step": 9338 }, { "epoch": 0.73, "learning_rate": 0.0002577371347456444, "loss": 1.6886, "step": 9339 }, { "epoch": 0.73, "learning_rate": 0.00025772853464221866, "loss": 1.6487, "step": 9340 }, { "epoch": 0.73, "learning_rate": 0.0002577199338073756, "loss": 1.6072, "step": 9341 }, { "epoch": 0.74, "learning_rate": 0.0002577113322411737, "loss": 1.6424, "step": 9342 }, { "epoch": 0.74, "learning_rate": 0.0002577027299436712, "loss": 1.7073, "step": 9343 }, { "epoch": 0.74, "learning_rate": 0.0002576941269149267, "loss": 1.6375, "step": 9344 }, { "epoch": 0.74, "learning_rate": 0.00025768552315499844, "loss": 1.6525, "step": 9345 }, { "epoch": 0.74, "learning_rate": 0.0002576769186639449, "loss": 1.6632, "step": 9346 }, { "epoch": 0.74, "learning_rate": 0.0002576683134418246, "loss": 1.6034, "step": 9347 }, { "epoch": 0.74, "learning_rate": 0.00025765970748869576, "loss": 1.6727, "step": 9348 }, { "epoch": 0.74, "learning_rate": 0.00025765110080461695, "loss": 1.6676, "step": 9349 }, { "epoch": 0.74, "learning_rate": 0.0002576424933896466, "loss": 1.6025, "step": 9350 }, { "epoch": 0.74, "learning_rate": 0.0002576338852438431, "loss": 1.6342, "step": 9351 }, { "epoch": 0.74, "learning_rate": 0.00025762527636726494, "loss": 1.6012, "step": 9352 }, { "epoch": 0.74, "learning_rate": 0.0002576166667599705, "loss": 1.6663, "step": 9353 }, { "epoch": 0.74, "learning_rate": 0.0002576080564220183, "loss": 1.6901, "step": 9354 }, { "epoch": 0.74, "learning_rate": 0.0002575994453534668, "loss": 1.6622, "step": 9355 }, { "epoch": 0.74, "learning_rate": 0.00025759083355437443, "loss": 1.6178, "step": 9356 }, { "epoch": 0.74, "learning_rate": 0.00025758222102479966, "loss": 1.624, "step": 9357 }, { "epoch": 0.74, "learning_rate": 0.000257573607764801, "loss": 1.6266, "step": 9358 }, { "epoch": 0.74, "learning_rate": 0.0002575649937744369, "loss": 1.6231, "step": 9359 }, { "epoch": 0.74, "learning_rate": 0.00025755637905376585, "loss": 1.6476, "step": 9360 }, { "epoch": 0.74, "learning_rate": 0.0002575477636028463, "loss": 1.6596, "step": 9361 }, { "epoch": 0.74, "learning_rate": 0.00025753914742173686, "loss": 1.644, "step": 9362 }, { "epoch": 0.74, "learning_rate": 0.00025753053051049595, "loss": 1.6581, "step": 9363 }, { "epoch": 0.74, "learning_rate": 0.000257521912869182, "loss": 1.7045, "step": 9364 }, { "epoch": 0.74, "learning_rate": 0.00025751329449785363, "loss": 1.6992, "step": 9365 }, { "epoch": 0.74, "learning_rate": 0.0002575046753965694, "loss": 1.7043, "step": 9366 }, { "epoch": 0.74, "learning_rate": 0.00025749605556538765, "loss": 1.6134, "step": 9367 }, { "epoch": 0.74, "learning_rate": 0.00025748743500436704, "loss": 1.6249, "step": 9368 }, { "epoch": 0.74, "learning_rate": 0.00025747881371356604, "loss": 1.6291, "step": 9369 }, { "epoch": 0.74, "learning_rate": 0.00025747019169304326, "loss": 1.6428, "step": 9370 }, { "epoch": 0.74, "learning_rate": 0.00025746156894285713, "loss": 1.6166, "step": 9371 }, { "epoch": 0.74, "learning_rate": 0.00025745294546306626, "loss": 1.6357, "step": 9372 }, { "epoch": 0.74, "learning_rate": 0.0002574443212537292, "loss": 1.6442, "step": 9373 }, { "epoch": 0.74, "learning_rate": 0.00025743569631490453, "loss": 1.6947, "step": 9374 }, { "epoch": 0.74, "learning_rate": 0.0002574270706466507, "loss": 1.6768, "step": 9375 }, { "epoch": 0.74, "learning_rate": 0.0002574184442490264, "loss": 1.6101, "step": 9376 }, { "epoch": 0.74, "learning_rate": 0.0002574098171220901, "loss": 1.662, "step": 9377 }, { "epoch": 0.74, "learning_rate": 0.0002574011892659004, "loss": 1.5979, "step": 9378 }, { "epoch": 0.74, "learning_rate": 0.00025739256068051596, "loss": 1.6701, "step": 9379 }, { "epoch": 0.74, "learning_rate": 0.0002573839313659953, "loss": 1.6393, "step": 9380 }, { "epoch": 0.74, "learning_rate": 0.00025737530132239695, "loss": 1.6494, "step": 9381 }, { "epoch": 0.74, "learning_rate": 0.0002573666705497796, "loss": 1.6254, "step": 9382 }, { "epoch": 0.74, "learning_rate": 0.00025735803904820175, "loss": 1.5853, "step": 9383 }, { "epoch": 0.74, "learning_rate": 0.0002573494068177221, "loss": 1.5814, "step": 9384 }, { "epoch": 0.74, "learning_rate": 0.0002573407738583992, "loss": 1.6095, "step": 9385 }, { "epoch": 0.74, "learning_rate": 0.00025733214017029175, "loss": 1.6405, "step": 9386 }, { "epoch": 0.74, "learning_rate": 0.0002573235057534582, "loss": 1.6024, "step": 9387 }, { "epoch": 0.74, "learning_rate": 0.0002573148706079573, "loss": 1.637, "step": 9388 }, { "epoch": 0.74, "learning_rate": 0.0002573062347338477, "loss": 1.6071, "step": 9389 }, { "epoch": 0.74, "learning_rate": 0.0002572975981311879, "loss": 1.6468, "step": 9390 }, { "epoch": 0.74, "learning_rate": 0.0002572889608000367, "loss": 1.6522, "step": 9391 }, { "epoch": 0.74, "learning_rate": 0.00025728032274045267, "loss": 1.6509, "step": 9392 }, { "epoch": 0.74, "learning_rate": 0.00025727168395249436, "loss": 1.6017, "step": 9393 }, { "epoch": 0.74, "learning_rate": 0.0002572630444362205, "loss": 1.6609, "step": 9394 }, { "epoch": 0.74, "learning_rate": 0.0002572544041916899, "loss": 1.6176, "step": 9395 }, { "epoch": 0.74, "learning_rate": 0.00025724576321896103, "loss": 1.6375, "step": 9396 }, { "epoch": 0.74, "learning_rate": 0.0002572371215180926, "loss": 1.6279, "step": 9397 }, { "epoch": 0.74, "learning_rate": 0.0002572284790891432, "loss": 1.6346, "step": 9398 }, { "epoch": 0.74, "learning_rate": 0.00025721983593217173, "loss": 1.6364, "step": 9399 }, { "epoch": 0.74, "learning_rate": 0.0002572111920472367, "loss": 1.6754, "step": 9400 }, { "epoch": 0.74, "learning_rate": 0.00025720254743439685, "loss": 1.6645, "step": 9401 }, { "epoch": 0.74, "learning_rate": 0.00025719390209371084, "loss": 1.6954, "step": 9402 }, { "epoch": 0.74, "learning_rate": 0.0002571852560252374, "loss": 1.6239, "step": 9403 }, { "epoch": 0.74, "learning_rate": 0.00025717660922903524, "loss": 1.6634, "step": 9404 }, { "epoch": 0.74, "learning_rate": 0.000257167961705163, "loss": 1.5995, "step": 9405 }, { "epoch": 0.74, "learning_rate": 0.0002571593134536795, "loss": 1.5917, "step": 9406 }, { "epoch": 0.74, "learning_rate": 0.0002571506644746433, "loss": 1.6333, "step": 9407 }, { "epoch": 0.74, "learning_rate": 0.0002571420147681133, "loss": 1.6679, "step": 9408 }, { "epoch": 0.74, "learning_rate": 0.0002571333643341482, "loss": 1.6279, "step": 9409 }, { "epoch": 0.74, "learning_rate": 0.0002571247131728065, "loss": 1.6714, "step": 9410 }, { "epoch": 0.74, "learning_rate": 0.00025711606128414724, "loss": 1.6613, "step": 9411 }, { "epoch": 0.74, "learning_rate": 0.00025710740866822905, "loss": 1.6571, "step": 9412 }, { "epoch": 0.74, "learning_rate": 0.0002570987553251106, "loss": 1.6772, "step": 9413 }, { "epoch": 0.74, "learning_rate": 0.00025709010125485077, "loss": 1.7034, "step": 9414 }, { "epoch": 0.74, "learning_rate": 0.0002570814464575082, "loss": 1.6535, "step": 9415 }, { "epoch": 0.74, "learning_rate": 0.0002570727909331417, "loss": 1.642, "step": 9416 }, { "epoch": 0.74, "learning_rate": 0.00025706413468181, "loss": 1.6637, "step": 9417 }, { "epoch": 0.74, "learning_rate": 0.000257055477703572, "loss": 1.627, "step": 9418 }, { "epoch": 0.74, "learning_rate": 0.00025704681999848635, "loss": 1.635, "step": 9419 }, { "epoch": 0.74, "learning_rate": 0.00025703816156661183, "loss": 1.583, "step": 9420 }, { "epoch": 0.74, "learning_rate": 0.0002570295024080073, "loss": 1.6586, "step": 9421 }, { "epoch": 0.74, "learning_rate": 0.00025702084252273154, "loss": 1.6425, "step": 9422 }, { "epoch": 0.74, "learning_rate": 0.00025701218191084325, "loss": 1.6309, "step": 9423 }, { "epoch": 0.74, "learning_rate": 0.0002570035205724013, "loss": 1.6165, "step": 9424 }, { "epoch": 0.74, "learning_rate": 0.0002569948585074646, "loss": 1.6181, "step": 9425 }, { "epoch": 0.74, "learning_rate": 0.0002569861957160918, "loss": 1.6797, "step": 9426 }, { "epoch": 0.74, "learning_rate": 0.0002569775321983417, "loss": 1.652, "step": 9427 }, { "epoch": 0.74, "learning_rate": 0.00025696886795427323, "loss": 1.6208, "step": 9428 }, { "epoch": 0.74, "learning_rate": 0.00025696020298394517, "loss": 1.6162, "step": 9429 }, { "epoch": 0.74, "learning_rate": 0.00025695153728741644, "loss": 1.6784, "step": 9430 }, { "epoch": 0.74, "learning_rate": 0.00025694287086474573, "loss": 1.6748, "step": 9431 }, { "epoch": 0.74, "learning_rate": 0.0002569342037159919, "loss": 1.6339, "step": 9432 }, { "epoch": 0.74, "learning_rate": 0.00025692553584121387, "loss": 1.6266, "step": 9433 }, { "epoch": 0.74, "learning_rate": 0.00025691686724047045, "loss": 1.66, "step": 9434 }, { "epoch": 0.74, "learning_rate": 0.00025690819791382056, "loss": 1.7077, "step": 9435 }, { "epoch": 0.74, "learning_rate": 0.00025689952786132295, "loss": 1.6514, "step": 9436 }, { "epoch": 0.74, "learning_rate": 0.00025689085708303656, "loss": 1.6615, "step": 9437 }, { "epoch": 0.74, "learning_rate": 0.00025688218557902025, "loss": 1.6472, "step": 9438 }, { "epoch": 0.74, "learning_rate": 0.00025687351334933284, "loss": 1.6222, "step": 9439 }, { "epoch": 0.74, "learning_rate": 0.00025686484039403327, "loss": 1.6696, "step": 9440 }, { "epoch": 0.74, "learning_rate": 0.0002568561667131804, "loss": 1.6974, "step": 9441 }, { "epoch": 0.74, "learning_rate": 0.00025684749230683315, "loss": 1.6765, "step": 9442 }, { "epoch": 0.74, "learning_rate": 0.00025683881717505035, "loss": 1.6058, "step": 9443 }, { "epoch": 0.74, "learning_rate": 0.000256830141317891, "loss": 1.665, "step": 9444 }, { "epoch": 0.74, "learning_rate": 0.0002568214647354139, "loss": 1.6209, "step": 9445 }, { "epoch": 0.74, "learning_rate": 0.000256812787427678, "loss": 1.7226, "step": 9446 }, { "epoch": 0.74, "learning_rate": 0.00025680410939474225, "loss": 1.714, "step": 9447 }, { "epoch": 0.74, "learning_rate": 0.0002567954306366655, "loss": 1.6508, "step": 9448 }, { "epoch": 0.74, "learning_rate": 0.0002567867511535067, "loss": 1.649, "step": 9449 }, { "epoch": 0.74, "learning_rate": 0.00025677807094532485, "loss": 1.6203, "step": 9450 }, { "epoch": 0.74, "learning_rate": 0.0002567693900121788, "loss": 1.6089, "step": 9451 }, { "epoch": 0.74, "learning_rate": 0.0002567607083541275, "loss": 1.6443, "step": 9452 }, { "epoch": 0.74, "learning_rate": 0.0002567520259712299, "loss": 1.7145, "step": 9453 }, { "epoch": 0.74, "learning_rate": 0.000256743342863545, "loss": 1.6294, "step": 9454 }, { "epoch": 0.74, "learning_rate": 0.00025673465903113164, "loss": 1.6134, "step": 9455 }, { "epoch": 0.74, "learning_rate": 0.00025672597447404884, "loss": 1.67, "step": 9456 }, { "epoch": 0.74, "learning_rate": 0.0002567172891923556, "loss": 1.6105, "step": 9457 }, { "epoch": 0.74, "learning_rate": 0.0002567086031861109, "loss": 1.6071, "step": 9458 }, { "epoch": 0.74, "learning_rate": 0.00025669991645537366, "loss": 1.6357, "step": 9459 }, { "epoch": 0.74, "learning_rate": 0.00025669122900020283, "loss": 1.6547, "step": 9460 }, { "epoch": 0.74, "learning_rate": 0.0002566825408206574, "loss": 1.624, "step": 9461 }, { "epoch": 0.74, "learning_rate": 0.0002566738519167965, "loss": 1.6285, "step": 9462 }, { "epoch": 0.74, "learning_rate": 0.0002566651622886789, "loss": 1.613, "step": 9463 }, { "epoch": 0.74, "learning_rate": 0.00025665647193636376, "loss": 1.6308, "step": 9464 }, { "epoch": 0.74, "learning_rate": 0.0002566477808599101, "loss": 1.6337, "step": 9465 }, { "epoch": 0.74, "learning_rate": 0.00025663908905937676, "loss": 1.6759, "step": 9466 }, { "epoch": 0.74, "learning_rate": 0.00025663039653482287, "loss": 1.6724, "step": 9467 }, { "epoch": 0.74, "learning_rate": 0.00025662170328630745, "loss": 1.653, "step": 9468 }, { "epoch": 0.75, "learning_rate": 0.0002566130093138895, "loss": 1.6451, "step": 9469 }, { "epoch": 0.75, "learning_rate": 0.0002566043146176281, "loss": 1.6252, "step": 9470 }, { "epoch": 0.75, "learning_rate": 0.00025659561919758213, "loss": 1.6451, "step": 9471 }, { "epoch": 0.75, "learning_rate": 0.0002565869230538108, "loss": 1.6036, "step": 9472 }, { "epoch": 0.75, "learning_rate": 0.00025657822618637305, "loss": 1.6617, "step": 9473 }, { "epoch": 0.75, "learning_rate": 0.000256569528595328, "loss": 1.6595, "step": 9474 }, { "epoch": 0.75, "learning_rate": 0.00025656083028073465, "loss": 1.6857, "step": 9475 }, { "epoch": 0.75, "learning_rate": 0.00025655213124265206, "loss": 1.5927, "step": 9476 }, { "epoch": 0.75, "learning_rate": 0.00025654343148113926, "loss": 1.6721, "step": 9477 }, { "epoch": 0.75, "learning_rate": 0.0002565347309962554, "loss": 1.627, "step": 9478 }, { "epoch": 0.75, "learning_rate": 0.0002565260297880595, "loss": 1.6703, "step": 9479 }, { "epoch": 0.75, "learning_rate": 0.0002565173278566106, "loss": 1.5977, "step": 9480 }, { "epoch": 0.75, "learning_rate": 0.0002565086252019679, "loss": 1.6515, "step": 9481 }, { "epoch": 0.75, "learning_rate": 0.0002564999218241904, "loss": 1.6059, "step": 9482 }, { "epoch": 0.75, "learning_rate": 0.00025649121772333716, "loss": 1.5629, "step": 9483 }, { "epoch": 0.75, "learning_rate": 0.00025648251289946735, "loss": 1.6215, "step": 9484 }, { "epoch": 0.75, "learning_rate": 0.00025647380735264005, "loss": 1.6362, "step": 9485 }, { "epoch": 0.75, "learning_rate": 0.00025646510108291433, "loss": 1.6645, "step": 9486 }, { "epoch": 0.75, "learning_rate": 0.0002564563940903493, "loss": 1.6572, "step": 9487 }, { "epoch": 0.75, "learning_rate": 0.0002564476863750041, "loss": 1.6768, "step": 9488 }, { "epoch": 0.75, "learning_rate": 0.0002564389779369379, "loss": 1.7057, "step": 9489 }, { "epoch": 0.75, "learning_rate": 0.0002564302687762098, "loss": 1.6803, "step": 9490 }, { "epoch": 0.75, "learning_rate": 0.0002564215588928788, "loss": 1.6749, "step": 9491 }, { "epoch": 0.75, "learning_rate": 0.00025641284828700425, "loss": 1.6229, "step": 9492 }, { "epoch": 0.75, "learning_rate": 0.00025640413695864517, "loss": 1.6393, "step": 9493 }, { "epoch": 0.75, "learning_rate": 0.00025639542490786066, "loss": 1.5823, "step": 9494 }, { "epoch": 0.75, "learning_rate": 0.00025638671213471, "loss": 1.6195, "step": 9495 }, { "epoch": 0.75, "learning_rate": 0.0002563779986392522, "loss": 1.6502, "step": 9496 }, { "epoch": 0.75, "learning_rate": 0.0002563692844215466, "loss": 1.6771, "step": 9497 }, { "epoch": 0.75, "learning_rate": 0.0002563605694816522, "loss": 1.6691, "step": 9498 }, { "epoch": 0.75, "learning_rate": 0.00025635185381962816, "loss": 1.6629, "step": 9499 }, { "epoch": 0.75, "learning_rate": 0.0002563431374355338, "loss": 1.6426, "step": 9500 }, { "epoch": 0.75, "learning_rate": 0.0002563344203294282, "loss": 1.6461, "step": 9501 }, { "epoch": 0.75, "learning_rate": 0.00025632570250137056, "loss": 1.6834, "step": 9502 }, { "epoch": 0.75, "learning_rate": 0.0002563169839514201, "loss": 1.6385, "step": 9503 }, { "epoch": 0.75, "learning_rate": 0.0002563082646796359, "loss": 1.6594, "step": 9504 }, { "epoch": 0.75, "learning_rate": 0.00025629954468607736, "loss": 1.584, "step": 9505 }, { "epoch": 0.75, "learning_rate": 0.00025629082397080353, "loss": 1.6648, "step": 9506 }, { "epoch": 0.75, "learning_rate": 0.0002562821025338737, "loss": 1.6392, "step": 9507 }, { "epoch": 0.75, "learning_rate": 0.00025627338037534695, "loss": 1.6983, "step": 9508 }, { "epoch": 0.75, "learning_rate": 0.0002562646574952827, "loss": 1.5595, "step": 9509 }, { "epoch": 0.75, "learning_rate": 0.00025625593389374, "loss": 1.689, "step": 9510 }, { "epoch": 0.75, "learning_rate": 0.0002562472095707782, "loss": 1.6213, "step": 9511 }, { "epoch": 0.75, "learning_rate": 0.0002562384845264564, "loss": 1.6277, "step": 9512 }, { "epoch": 0.75, "learning_rate": 0.00025622975876083396, "loss": 1.711, "step": 9513 }, { "epoch": 0.75, "learning_rate": 0.0002562210322739701, "loss": 1.6344, "step": 9514 }, { "epoch": 0.75, "learning_rate": 0.000256212305065924, "loss": 1.6043, "step": 9515 }, { "epoch": 0.75, "learning_rate": 0.000256203577136755, "loss": 1.6551, "step": 9516 }, { "epoch": 0.75, "learning_rate": 0.0002561948484865223, "loss": 1.6325, "step": 9517 }, { "epoch": 0.75, "learning_rate": 0.0002561861191152852, "loss": 1.6426, "step": 9518 }, { "epoch": 0.75, "learning_rate": 0.00025617738902310297, "loss": 1.6386, "step": 9519 }, { "epoch": 0.75, "learning_rate": 0.00025616865821003485, "loss": 1.628, "step": 9520 }, { "epoch": 0.75, "learning_rate": 0.0002561599266761401, "loss": 1.6573, "step": 9521 }, { "epoch": 0.75, "learning_rate": 0.0002561511944214781, "loss": 1.6564, "step": 9522 }, { "epoch": 0.75, "learning_rate": 0.00025614246144610794, "loss": 1.661, "step": 9523 }, { "epoch": 0.75, "learning_rate": 0.00025613372775008916, "loss": 1.6444, "step": 9524 }, { "epoch": 0.75, "learning_rate": 0.0002561249933334809, "loss": 1.62, "step": 9525 }, { "epoch": 0.75, "learning_rate": 0.0002561162581963425, "loss": 1.7062, "step": 9526 }, { "epoch": 0.75, "learning_rate": 0.00025610752233873324, "loss": 1.5972, "step": 9527 }, { "epoch": 0.75, "learning_rate": 0.0002560987857607125, "loss": 1.6606, "step": 9528 }, { "epoch": 0.75, "learning_rate": 0.0002560900484623395, "loss": 1.6608, "step": 9529 }, { "epoch": 0.75, "learning_rate": 0.00025608131044367366, "loss": 1.6243, "step": 9530 }, { "epoch": 0.75, "learning_rate": 0.0002560725717047742, "loss": 1.6919, "step": 9531 }, { "epoch": 0.75, "learning_rate": 0.0002560638322457006, "loss": 1.6706, "step": 9532 }, { "epoch": 0.75, "learning_rate": 0.00025605509206651206, "loss": 1.6167, "step": 9533 }, { "epoch": 0.75, "learning_rate": 0.000256046351167268, "loss": 1.6491, "step": 9534 }, { "epoch": 0.75, "learning_rate": 0.00025603760954802775, "loss": 1.6767, "step": 9535 }, { "epoch": 0.75, "learning_rate": 0.0002560288672088506, "loss": 1.7025, "step": 9536 }, { "epoch": 0.75, "learning_rate": 0.000256020124149796, "loss": 1.629, "step": 9537 }, { "epoch": 0.75, "learning_rate": 0.00025601138037092323, "loss": 1.6343, "step": 9538 }, { "epoch": 0.75, "learning_rate": 0.0002560026358722917, "loss": 1.5996, "step": 9539 }, { "epoch": 0.75, "learning_rate": 0.0002559938906539608, "loss": 1.6066, "step": 9540 }, { "epoch": 0.75, "learning_rate": 0.0002559851447159898, "loss": 1.598, "step": 9541 }, { "epoch": 0.75, "learning_rate": 0.0002559763980584382, "loss": 1.654, "step": 9542 }, { "epoch": 0.75, "learning_rate": 0.00025596765068136535, "loss": 1.644, "step": 9543 }, { "epoch": 0.75, "learning_rate": 0.0002559589025848306, "loss": 1.6181, "step": 9544 }, { "epoch": 0.75, "learning_rate": 0.00025595015376889336, "loss": 1.6445, "step": 9545 }, { "epoch": 0.75, "learning_rate": 0.0002559414042336131, "loss": 1.6641, "step": 9546 }, { "epoch": 0.75, "learning_rate": 0.00025593265397904914, "loss": 1.6509, "step": 9547 }, { "epoch": 0.75, "learning_rate": 0.000255923903005261, "loss": 1.5853, "step": 9548 }, { "epoch": 0.75, "learning_rate": 0.0002559151513123079, "loss": 1.6062, "step": 9549 }, { "epoch": 0.75, "learning_rate": 0.0002559063989002494, "loss": 1.6664, "step": 9550 }, { "epoch": 0.75, "learning_rate": 0.0002558976457691449, "loss": 1.6467, "step": 9551 }, { "epoch": 0.75, "learning_rate": 0.00025588889191905376, "loss": 1.588, "step": 9552 }, { "epoch": 0.75, "learning_rate": 0.0002558801373500356, "loss": 1.6682, "step": 9553 }, { "epoch": 0.75, "learning_rate": 0.0002558713820621497, "loss": 1.7259, "step": 9554 }, { "epoch": 0.75, "learning_rate": 0.0002558626260554555, "loss": 1.6362, "step": 9555 }, { "epoch": 0.75, "learning_rate": 0.0002558538693300125, "loss": 1.5731, "step": 9556 }, { "epoch": 0.75, "learning_rate": 0.00025584511188588016, "loss": 1.6404, "step": 9557 }, { "epoch": 0.75, "learning_rate": 0.0002558363537231179, "loss": 1.6105, "step": 9558 }, { "epoch": 0.75, "learning_rate": 0.00025582759484178523, "loss": 1.6522, "step": 9559 }, { "epoch": 0.75, "learning_rate": 0.0002558188352419416, "loss": 1.5901, "step": 9560 }, { "epoch": 0.75, "learning_rate": 0.0002558100749236464, "loss": 1.6351, "step": 9561 }, { "epoch": 0.75, "learning_rate": 0.00025580131388695923, "loss": 1.6793, "step": 9562 }, { "epoch": 0.75, "learning_rate": 0.0002557925521319396, "loss": 1.7318, "step": 9563 }, { "epoch": 0.75, "learning_rate": 0.00025578378965864684, "loss": 1.6722, "step": 9564 }, { "epoch": 0.75, "learning_rate": 0.0002557750264671405, "loss": 1.6551, "step": 9565 }, { "epoch": 0.75, "learning_rate": 0.00025576626255748014, "loss": 1.6481, "step": 9566 }, { "epoch": 0.75, "learning_rate": 0.00025575749792972524, "loss": 1.6268, "step": 9567 }, { "epoch": 0.75, "learning_rate": 0.0002557487325839352, "loss": 1.6126, "step": 9568 }, { "epoch": 0.75, "learning_rate": 0.0002557399665201697, "loss": 1.6057, "step": 9569 }, { "epoch": 0.75, "learning_rate": 0.0002557311997384882, "loss": 1.5909, "step": 9570 }, { "epoch": 0.75, "learning_rate": 0.00025572243223895015, "loss": 1.675, "step": 9571 }, { "epoch": 0.75, "learning_rate": 0.0002557136640216152, "loss": 1.5954, "step": 9572 }, { "epoch": 0.75, "learning_rate": 0.0002557048950865428, "loss": 1.6247, "step": 9573 }, { "epoch": 0.75, "learning_rate": 0.0002556961254337924, "loss": 1.6738, "step": 9574 }, { "epoch": 0.75, "learning_rate": 0.0002556873550634237, "loss": 1.6445, "step": 9575 }, { "epoch": 0.75, "learning_rate": 0.0002556785839754962, "loss": 1.6575, "step": 9576 }, { "epoch": 0.75, "learning_rate": 0.0002556698121700694, "loss": 1.6498, "step": 9577 }, { "epoch": 0.75, "learning_rate": 0.0002556610396472029, "loss": 1.6673, "step": 9578 }, { "epoch": 0.75, "learning_rate": 0.00025565226640695627, "loss": 1.6275, "step": 9579 }, { "epoch": 0.75, "learning_rate": 0.000255643492449389, "loss": 1.6272, "step": 9580 }, { "epoch": 0.75, "learning_rate": 0.00025563471777456073, "loss": 1.6504, "step": 9581 }, { "epoch": 0.75, "learning_rate": 0.00025562594238253105, "loss": 1.5866, "step": 9582 }, { "epoch": 0.75, "learning_rate": 0.0002556171662733595, "loss": 1.6618, "step": 9583 }, { "epoch": 0.75, "learning_rate": 0.00025560838944710564, "loss": 1.6393, "step": 9584 }, { "epoch": 0.75, "learning_rate": 0.00025559961190382916, "loss": 1.632, "step": 9585 }, { "epoch": 0.75, "learning_rate": 0.0002555908336435896, "loss": 1.6841, "step": 9586 }, { "epoch": 0.75, "learning_rate": 0.00025558205466644647, "loss": 1.6379, "step": 9587 }, { "epoch": 0.75, "learning_rate": 0.0002555732749724595, "loss": 1.628, "step": 9588 }, { "epoch": 0.75, "learning_rate": 0.0002555644945616882, "loss": 1.682, "step": 9589 }, { "epoch": 0.75, "learning_rate": 0.0002555557134341923, "loss": 1.5826, "step": 9590 }, { "epoch": 0.75, "learning_rate": 0.00025554693159003135, "loss": 1.6276, "step": 9591 }, { "epoch": 0.75, "learning_rate": 0.0002555381490292649, "loss": 1.6212, "step": 9592 }, { "epoch": 0.75, "learning_rate": 0.0002555293657519528, "loss": 1.6263, "step": 9593 }, { "epoch": 0.75, "learning_rate": 0.0002555205817581545, "loss": 1.6143, "step": 9594 }, { "epoch": 0.75, "learning_rate": 0.0002555117970479296, "loss": 1.7097, "step": 9595 }, { "epoch": 0.76, "learning_rate": 0.00025550301162133787, "loss": 1.637, "step": 9596 }, { "epoch": 0.76, "learning_rate": 0.0002554942254784389, "loss": 1.679, "step": 9597 }, { "epoch": 0.76, "learning_rate": 0.00025548543861929243, "loss": 1.6444, "step": 9598 }, { "epoch": 0.76, "learning_rate": 0.0002554766510439579, "loss": 1.6785, "step": 9599 }, { "epoch": 0.76, "learning_rate": 0.00025546786275249526, "loss": 1.6596, "step": 9600 }, { "epoch": 0.76, "learning_rate": 0.00025545907374496395, "loss": 1.6154, "step": 9601 }, { "epoch": 0.76, "learning_rate": 0.0002554502840214238, "loss": 1.6279, "step": 9602 }, { "epoch": 0.76, "learning_rate": 0.00025544149358193435, "loss": 1.5644, "step": 9603 }, { "epoch": 0.76, "learning_rate": 0.00025543270242655533, "loss": 1.6215, "step": 9604 }, { "epoch": 0.76, "learning_rate": 0.0002554239105553465, "loss": 1.6363, "step": 9605 }, { "epoch": 0.76, "learning_rate": 0.0002554151179683675, "loss": 1.641, "step": 9606 }, { "epoch": 0.76, "learning_rate": 0.00025540632466567793, "loss": 1.6561, "step": 9607 }, { "epoch": 0.76, "learning_rate": 0.0002553975306473377, "loss": 1.6628, "step": 9608 }, { "epoch": 0.76, "learning_rate": 0.0002553887359134063, "loss": 1.6631, "step": 9609 }, { "epoch": 0.76, "learning_rate": 0.0002553799404639436, "loss": 1.6133, "step": 9610 }, { "epoch": 0.76, "learning_rate": 0.00025537114429900927, "loss": 1.6597, "step": 9611 }, { "epoch": 0.76, "learning_rate": 0.00025536234741866293, "loss": 1.6245, "step": 9612 }, { "epoch": 0.76, "learning_rate": 0.0002553535498229645, "loss": 1.6156, "step": 9613 }, { "epoch": 0.76, "learning_rate": 0.0002553447515119736, "loss": 1.6079, "step": 9614 }, { "epoch": 0.76, "learning_rate": 0.00025533595248574987, "loss": 1.6254, "step": 9615 }, { "epoch": 0.76, "learning_rate": 0.00025532715274435326, "loss": 1.6248, "step": 9616 }, { "epoch": 0.76, "learning_rate": 0.00025531835228784336, "loss": 1.6734, "step": 9617 }, { "epoch": 0.76, "learning_rate": 0.00025530955111627995, "loss": 1.5941, "step": 9618 }, { "epoch": 0.76, "learning_rate": 0.00025530074922972283, "loss": 1.6318, "step": 9619 }, { "epoch": 0.76, "learning_rate": 0.00025529194662823174, "loss": 1.6748, "step": 9620 }, { "epoch": 0.76, "learning_rate": 0.0002552831433118664, "loss": 1.6341, "step": 9621 }, { "epoch": 0.76, "learning_rate": 0.00025527433928068666, "loss": 1.619, "step": 9622 }, { "epoch": 0.76, "learning_rate": 0.0002552655345347522, "loss": 1.6899, "step": 9623 }, { "epoch": 0.76, "learning_rate": 0.0002552567290741229, "loss": 1.6555, "step": 9624 }, { "epoch": 0.76, "learning_rate": 0.00025524792289885847, "loss": 1.6555, "step": 9625 }, { "epoch": 0.76, "learning_rate": 0.0002552391160090188, "loss": 1.6343, "step": 9626 }, { "epoch": 0.76, "learning_rate": 0.0002552303084046635, "loss": 1.6542, "step": 9627 }, { "epoch": 0.76, "learning_rate": 0.00025522150008585253, "loss": 1.6352, "step": 9628 }, { "epoch": 0.76, "learning_rate": 0.0002552126910526456, "loss": 1.6423, "step": 9629 }, { "epoch": 0.76, "learning_rate": 0.0002552038813051026, "loss": 1.7127, "step": 9630 }, { "epoch": 0.76, "learning_rate": 0.0002551950708432833, "loss": 1.6042, "step": 9631 }, { "epoch": 0.76, "learning_rate": 0.00025518625966724747, "loss": 1.5996, "step": 9632 }, { "epoch": 0.76, "learning_rate": 0.00025517744777705506, "loss": 1.6575, "step": 9633 }, { "epoch": 0.76, "learning_rate": 0.00025516863517276574, "loss": 1.6607, "step": 9634 }, { "epoch": 0.76, "learning_rate": 0.00025515982185443946, "loss": 1.7121, "step": 9635 }, { "epoch": 0.76, "learning_rate": 0.00025515100782213607, "loss": 1.6651, "step": 9636 }, { "epoch": 0.76, "learning_rate": 0.0002551421930759153, "loss": 1.6351, "step": 9637 }, { "epoch": 0.76, "learning_rate": 0.0002551333776158371, "loss": 1.666, "step": 9638 }, { "epoch": 0.76, "learning_rate": 0.00025512456144196125, "loss": 1.6706, "step": 9639 }, { "epoch": 0.76, "learning_rate": 0.0002551157445543477, "loss": 1.629, "step": 9640 }, { "epoch": 0.76, "learning_rate": 0.0002551069269530562, "loss": 1.6601, "step": 9641 }, { "epoch": 0.76, "learning_rate": 0.00025509810863814664, "loss": 1.6217, "step": 9642 }, { "epoch": 0.76, "learning_rate": 0.00025508928960967897, "loss": 1.6161, "step": 9643 }, { "epoch": 0.76, "learning_rate": 0.000255080469867713, "loss": 1.6374, "step": 9644 }, { "epoch": 0.76, "learning_rate": 0.00025507164941230865, "loss": 1.6543, "step": 9645 }, { "epoch": 0.76, "learning_rate": 0.00025506282824352576, "loss": 1.5965, "step": 9646 }, { "epoch": 0.76, "learning_rate": 0.0002550540063614243, "loss": 1.6635, "step": 9647 }, { "epoch": 0.76, "learning_rate": 0.000255045183766064, "loss": 1.5928, "step": 9648 }, { "epoch": 0.76, "learning_rate": 0.0002550363604575049, "loss": 1.5873, "step": 9649 }, { "epoch": 0.76, "learning_rate": 0.00025502753643580697, "loss": 1.6661, "step": 9650 }, { "epoch": 0.76, "learning_rate": 0.00025501871170102995, "loss": 1.6655, "step": 9651 }, { "epoch": 0.76, "learning_rate": 0.0002550098862532339, "loss": 1.6379, "step": 9652 }, { "epoch": 0.76, "learning_rate": 0.0002550010600924786, "loss": 1.6657, "step": 9653 }, { "epoch": 0.76, "learning_rate": 0.0002549922332188241, "loss": 1.6863, "step": 9654 }, { "epoch": 0.76, "learning_rate": 0.0002549834056323302, "loss": 1.6679, "step": 9655 }, { "epoch": 0.76, "learning_rate": 0.00025497457733305695, "loss": 1.6642, "step": 9656 }, { "epoch": 0.76, "learning_rate": 0.00025496574832106425, "loss": 1.5723, "step": 9657 }, { "epoch": 0.76, "learning_rate": 0.0002549569185964121, "loss": 1.6933, "step": 9658 }, { "epoch": 0.76, "learning_rate": 0.0002549480881591603, "loss": 1.6433, "step": 9659 }, { "epoch": 0.76, "learning_rate": 0.0002549392570093689, "loss": 1.6258, "step": 9660 }, { "epoch": 0.76, "learning_rate": 0.0002549304251470979, "loss": 1.6024, "step": 9661 }, { "epoch": 0.76, "learning_rate": 0.00025492159257240723, "loss": 1.6621, "step": 9662 }, { "epoch": 0.76, "learning_rate": 0.0002549127592853568, "loss": 1.6083, "step": 9663 }, { "epoch": 0.76, "learning_rate": 0.0002549039252860066, "loss": 1.6221, "step": 9664 }, { "epoch": 0.76, "learning_rate": 0.0002548950905744168, "loss": 1.6719, "step": 9665 }, { "epoch": 0.76, "learning_rate": 0.0002548862551506471, "loss": 1.6607, "step": 9666 }, { "epoch": 0.76, "learning_rate": 0.0002548774190147576, "loss": 1.6223, "step": 9667 }, { "epoch": 0.76, "learning_rate": 0.00025486858216680836, "loss": 1.6071, "step": 9668 }, { "epoch": 0.76, "learning_rate": 0.00025485974460685926, "loss": 1.6483, "step": 9669 }, { "epoch": 0.76, "learning_rate": 0.0002548509063349704, "loss": 1.6689, "step": 9670 }, { "epoch": 0.76, "learning_rate": 0.00025484206735120173, "loss": 1.6371, "step": 9671 }, { "epoch": 0.76, "learning_rate": 0.00025483322765561326, "loss": 1.6573, "step": 9672 }, { "epoch": 0.76, "learning_rate": 0.00025482438724826504, "loss": 1.637, "step": 9673 }, { "epoch": 0.76, "learning_rate": 0.00025481554612921713, "loss": 1.6956, "step": 9674 }, { "epoch": 0.76, "learning_rate": 0.00025480670429852944, "loss": 1.642, "step": 9675 }, { "epoch": 0.76, "learning_rate": 0.0002547978617562621, "loss": 1.5925, "step": 9676 }, { "epoch": 0.76, "learning_rate": 0.00025478901850247505, "loss": 1.6282, "step": 9677 }, { "epoch": 0.76, "learning_rate": 0.00025478017453722844, "loss": 1.6162, "step": 9678 }, { "epoch": 0.76, "learning_rate": 0.0002547713298605823, "loss": 1.6518, "step": 9679 }, { "epoch": 0.76, "learning_rate": 0.0002547624844725966, "loss": 1.6392, "step": 9680 }, { "epoch": 0.76, "learning_rate": 0.00025475363837333144, "loss": 1.6447, "step": 9681 }, { "epoch": 0.76, "learning_rate": 0.0002547447915628469, "loss": 1.6759, "step": 9682 }, { "epoch": 0.76, "learning_rate": 0.00025473594404120303, "loss": 1.6511, "step": 9683 }, { "epoch": 0.76, "learning_rate": 0.0002547270958084599, "loss": 1.6472, "step": 9684 }, { "epoch": 0.76, "learning_rate": 0.00025471824686467754, "loss": 1.669, "step": 9685 }, { "epoch": 0.76, "learning_rate": 0.0002547093972099161, "loss": 1.5841, "step": 9686 }, { "epoch": 0.76, "learning_rate": 0.00025470054684423565, "loss": 1.6598, "step": 9687 }, { "epoch": 0.76, "learning_rate": 0.0002546916957676963, "loss": 1.6581, "step": 9688 }, { "epoch": 0.76, "learning_rate": 0.00025468284398035804, "loss": 1.6306, "step": 9689 }, { "epoch": 0.76, "learning_rate": 0.00025467399148228106, "loss": 1.6237, "step": 9690 }, { "epoch": 0.76, "learning_rate": 0.00025466513827352544, "loss": 1.6269, "step": 9691 }, { "epoch": 0.76, "learning_rate": 0.00025465628435415136, "loss": 1.5991, "step": 9692 }, { "epoch": 0.76, "learning_rate": 0.00025464742972421876, "loss": 1.6411, "step": 9693 }, { "epoch": 0.76, "learning_rate": 0.0002546385743837879, "loss": 1.5873, "step": 9694 }, { "epoch": 0.76, "learning_rate": 0.0002546297183329189, "loss": 1.6348, "step": 9695 }, { "epoch": 0.76, "learning_rate": 0.0002546208615716718, "loss": 1.6981, "step": 9696 }, { "epoch": 0.76, "learning_rate": 0.0002546120041001068, "loss": 1.6029, "step": 9697 }, { "epoch": 0.76, "learning_rate": 0.0002546031459182841, "loss": 1.5729, "step": 9698 }, { "epoch": 0.76, "learning_rate": 0.0002545942870262636, "loss": 1.672, "step": 9699 }, { "epoch": 0.76, "learning_rate": 0.0002545854274241057, "loss": 1.6119, "step": 9700 }, { "epoch": 0.76, "learning_rate": 0.0002545765671118705, "loss": 1.6961, "step": 9701 }, { "epoch": 0.76, "learning_rate": 0.00025456770608961807, "loss": 1.6354, "step": 9702 }, { "epoch": 0.76, "learning_rate": 0.00025455884435740864, "loss": 1.6242, "step": 9703 }, { "epoch": 0.76, "learning_rate": 0.00025454998191530234, "loss": 1.6182, "step": 9704 }, { "epoch": 0.76, "learning_rate": 0.0002545411187633594, "loss": 1.6413, "step": 9705 }, { "epoch": 0.76, "learning_rate": 0.0002545322549016399, "loss": 1.633, "step": 9706 }, { "epoch": 0.76, "learning_rate": 0.00025452339033020413, "loss": 1.6686, "step": 9707 }, { "epoch": 0.76, "learning_rate": 0.00025451452504911216, "loss": 1.6491, "step": 9708 }, { "epoch": 0.76, "learning_rate": 0.00025450565905842424, "loss": 1.5971, "step": 9709 }, { "epoch": 0.76, "learning_rate": 0.00025449679235820064, "loss": 1.6227, "step": 9710 }, { "epoch": 0.76, "learning_rate": 0.00025448792494850144, "loss": 1.6747, "step": 9711 }, { "epoch": 0.76, "learning_rate": 0.0002544790568293869, "loss": 1.6427, "step": 9712 }, { "epoch": 0.76, "learning_rate": 0.0002544701880009172, "loss": 1.6548, "step": 9713 }, { "epoch": 0.76, "learning_rate": 0.0002544613184631526, "loss": 1.6909, "step": 9714 }, { "epoch": 0.76, "learning_rate": 0.0002544524482161533, "loss": 1.6594, "step": 9715 }, { "epoch": 0.76, "learning_rate": 0.0002544435772599795, "loss": 1.7044, "step": 9716 }, { "epoch": 0.76, "learning_rate": 0.00025443470559469145, "loss": 1.6197, "step": 9717 }, { "epoch": 0.76, "learning_rate": 0.00025442583322034934, "loss": 1.6892, "step": 9718 }, { "epoch": 0.76, "learning_rate": 0.0002544169601370135, "loss": 1.5759, "step": 9719 }, { "epoch": 0.76, "learning_rate": 0.0002544080863447441, "loss": 1.6388, "step": 9720 }, { "epoch": 0.76, "learning_rate": 0.00025439921184360146, "loss": 1.5918, "step": 9721 }, { "epoch": 0.76, "learning_rate": 0.0002543903366336457, "loss": 1.6443, "step": 9722 }, { "epoch": 0.77, "learning_rate": 0.00025438146071493726, "loss": 1.7043, "step": 9723 }, { "epoch": 0.77, "learning_rate": 0.0002543725840875362, "loss": 1.6361, "step": 9724 }, { "epoch": 0.77, "learning_rate": 0.00025436370675150293, "loss": 1.6582, "step": 9725 }, { "epoch": 0.77, "learning_rate": 0.00025435482870689774, "loss": 1.6169, "step": 9726 }, { "epoch": 0.77, "learning_rate": 0.0002543459499537808, "loss": 1.6677, "step": 9727 }, { "epoch": 0.77, "learning_rate": 0.0002543370704922125, "loss": 1.5837, "step": 9728 }, { "epoch": 0.77, "learning_rate": 0.000254328190322253, "loss": 1.6246, "step": 9729 }, { "epoch": 0.77, "learning_rate": 0.00025431930944396267, "loss": 1.6578, "step": 9730 }, { "epoch": 0.77, "learning_rate": 0.0002543104278574018, "loss": 1.6404, "step": 9731 }, { "epoch": 0.77, "learning_rate": 0.0002543015455626307, "loss": 1.6684, "step": 9732 }, { "epoch": 0.77, "learning_rate": 0.00025429266255970966, "loss": 1.5891, "step": 9733 }, { "epoch": 0.77, "learning_rate": 0.00025428377884869897, "loss": 1.6174, "step": 9734 }, { "epoch": 0.77, "learning_rate": 0.000254274894429659, "loss": 1.6629, "step": 9735 }, { "epoch": 0.77, "learning_rate": 0.00025426600930265, "loss": 1.6106, "step": 9736 }, { "epoch": 0.77, "learning_rate": 0.0002542571234677324, "loss": 1.7018, "step": 9737 }, { "epoch": 0.77, "learning_rate": 0.00025424823692496646, "loss": 1.66, "step": 9738 }, { "epoch": 0.77, "learning_rate": 0.0002542393496744125, "loss": 1.587, "step": 9739 }, { "epoch": 0.77, "learning_rate": 0.00025423046171613086, "loss": 1.6167, "step": 9740 }, { "epoch": 0.77, "learning_rate": 0.00025422157305018196, "loss": 1.6314, "step": 9741 }, { "epoch": 0.77, "learning_rate": 0.000254212683676626, "loss": 1.5735, "step": 9742 }, { "epoch": 0.77, "learning_rate": 0.0002542037935955235, "loss": 1.644, "step": 9743 }, { "epoch": 0.77, "learning_rate": 0.00025419490280693475, "loss": 1.6274, "step": 9744 }, { "epoch": 0.77, "learning_rate": 0.0002541860113109201, "loss": 1.6451, "step": 9745 }, { "epoch": 0.77, "learning_rate": 0.0002541771191075399, "loss": 1.6827, "step": 9746 }, { "epoch": 0.77, "learning_rate": 0.0002541682261968545, "loss": 1.6851, "step": 9747 }, { "epoch": 0.77, "learning_rate": 0.0002541593325789244, "loss": 1.6555, "step": 9748 }, { "epoch": 0.77, "learning_rate": 0.00025415043825380995, "loss": 1.6241, "step": 9749 }, { "epoch": 0.77, "learning_rate": 0.00025414154322157145, "loss": 1.6426, "step": 9750 }, { "epoch": 0.77, "learning_rate": 0.0002541326474822693, "loss": 1.6054, "step": 9751 }, { "epoch": 0.77, "learning_rate": 0.00025412375103596403, "loss": 1.5867, "step": 9752 }, { "epoch": 0.77, "learning_rate": 0.0002541148538827159, "loss": 1.6157, "step": 9753 }, { "epoch": 0.77, "learning_rate": 0.0002541059560225854, "loss": 1.6574, "step": 9754 }, { "epoch": 0.77, "learning_rate": 0.00025409705745563287, "loss": 1.6497, "step": 9755 }, { "epoch": 0.77, "learning_rate": 0.0002540881581819187, "loss": 1.6385, "step": 9756 }, { "epoch": 0.77, "learning_rate": 0.0002540792582015035, "loss": 1.6697, "step": 9757 }, { "epoch": 0.77, "learning_rate": 0.00025407035751444753, "loss": 1.6583, "step": 9758 }, { "epoch": 0.77, "learning_rate": 0.00025406145612081124, "loss": 1.6391, "step": 9759 }, { "epoch": 0.77, "learning_rate": 0.00025405255402065514, "loss": 1.6065, "step": 9760 }, { "epoch": 0.77, "learning_rate": 0.0002540436512140396, "loss": 1.7021, "step": 9761 }, { "epoch": 0.77, "learning_rate": 0.00025403474770102505, "loss": 1.6498, "step": 9762 }, { "epoch": 0.77, "learning_rate": 0.000254025843481672, "loss": 1.6466, "step": 9763 }, { "epoch": 0.77, "learning_rate": 0.00025401693855604086, "loss": 1.6077, "step": 9764 }, { "epoch": 0.77, "learning_rate": 0.00025400803292419214, "loss": 1.681, "step": 9765 }, { "epoch": 0.77, "learning_rate": 0.00025399912658618623, "loss": 1.6487, "step": 9766 }, { "epoch": 0.77, "learning_rate": 0.0002539902195420837, "loss": 1.7237, "step": 9767 }, { "epoch": 0.77, "learning_rate": 0.00025398131179194493, "loss": 1.6566, "step": 9768 }, { "epoch": 0.77, "learning_rate": 0.00025397240333583043, "loss": 1.6331, "step": 9769 }, { "epoch": 0.77, "learning_rate": 0.0002539634941738007, "loss": 1.6513, "step": 9770 }, { "epoch": 0.77, "learning_rate": 0.0002539545843059162, "loss": 1.6744, "step": 9771 }, { "epoch": 0.77, "learning_rate": 0.0002539456737322375, "loss": 1.6496, "step": 9772 }, { "epoch": 0.77, "learning_rate": 0.00025393676245282496, "loss": 1.6309, "step": 9773 }, { "epoch": 0.77, "learning_rate": 0.0002539278504677392, "loss": 1.6008, "step": 9774 }, { "epoch": 0.77, "learning_rate": 0.00025391893777704065, "loss": 1.6719, "step": 9775 }, { "epoch": 0.77, "learning_rate": 0.0002539100243807899, "loss": 1.6404, "step": 9776 }, { "epoch": 0.77, "learning_rate": 0.0002539011102790474, "loss": 1.6289, "step": 9777 }, { "epoch": 0.77, "learning_rate": 0.00025389219547187374, "loss": 1.6535, "step": 9778 }, { "epoch": 0.77, "learning_rate": 0.0002538832799593294, "loss": 1.6366, "step": 9779 }, { "epoch": 0.77, "learning_rate": 0.00025387436374147484, "loss": 1.6491, "step": 9780 }, { "epoch": 0.77, "learning_rate": 0.00025386544681837075, "loss": 1.6007, "step": 9781 }, { "epoch": 0.77, "learning_rate": 0.00025385652919007756, "loss": 1.6356, "step": 9782 }, { "epoch": 0.77, "learning_rate": 0.00025384761085665586, "loss": 1.6392, "step": 9783 }, { "epoch": 0.77, "learning_rate": 0.0002538386918181662, "loss": 1.6005, "step": 9784 }, { "epoch": 0.77, "learning_rate": 0.00025382977207466913, "loss": 1.6328, "step": 9785 }, { "epoch": 0.77, "learning_rate": 0.0002538208516262252, "loss": 1.678, "step": 9786 }, { "epoch": 0.77, "learning_rate": 0.00025381193047289497, "loss": 1.6879, "step": 9787 }, { "epoch": 0.77, "learning_rate": 0.000253803008614739, "loss": 1.5845, "step": 9788 }, { "epoch": 0.77, "learning_rate": 0.0002537940860518179, "loss": 1.6472, "step": 9789 }, { "epoch": 0.77, "learning_rate": 0.00025378516278419224, "loss": 1.6726, "step": 9790 }, { "epoch": 0.77, "learning_rate": 0.0002537762388119226, "loss": 1.6118, "step": 9791 }, { "epoch": 0.77, "learning_rate": 0.0002537673141350696, "loss": 1.6442, "step": 9792 }, { "epoch": 0.77, "learning_rate": 0.00025375838875369377, "loss": 1.6566, "step": 9793 }, { "epoch": 0.77, "learning_rate": 0.0002537494626678557, "loss": 1.6641, "step": 9794 }, { "epoch": 0.77, "learning_rate": 0.00025374053587761606, "loss": 1.6335, "step": 9795 }, { "epoch": 0.77, "learning_rate": 0.00025373160838303545, "loss": 1.6321, "step": 9796 }, { "epoch": 0.77, "learning_rate": 0.00025372268018417445, "loss": 1.698, "step": 9797 }, { "epoch": 0.77, "learning_rate": 0.0002537137512810937, "loss": 1.5871, "step": 9798 }, { "epoch": 0.77, "learning_rate": 0.0002537048216738538, "loss": 1.6422, "step": 9799 }, { "epoch": 0.77, "learning_rate": 0.0002536958913625154, "loss": 1.6444, "step": 9800 }, { "epoch": 0.77, "learning_rate": 0.00025368696034713914, "loss": 1.639, "step": 9801 }, { "epoch": 0.77, "learning_rate": 0.0002536780286277856, "loss": 1.613, "step": 9802 }, { "epoch": 0.77, "learning_rate": 0.0002536690962045154, "loss": 1.6757, "step": 9803 }, { "epoch": 0.77, "learning_rate": 0.0002536601630773894, "loss": 1.5951, "step": 9804 }, { "epoch": 0.77, "learning_rate": 0.000253651229246468, "loss": 1.6058, "step": 9805 }, { "epoch": 0.77, "learning_rate": 0.00025364229471181197, "loss": 1.5853, "step": 9806 }, { "epoch": 0.77, "learning_rate": 0.000253633359473482, "loss": 1.5803, "step": 9807 }, { "epoch": 0.77, "learning_rate": 0.0002536244235315386, "loss": 1.5994, "step": 9808 }, { "epoch": 0.77, "learning_rate": 0.0002536154868860426, "loss": 1.6554, "step": 9809 }, { "epoch": 0.77, "learning_rate": 0.00025360654953705467, "loss": 1.6389, "step": 9810 }, { "epoch": 0.77, "learning_rate": 0.0002535976114846354, "loss": 1.6269, "step": 9811 }, { "epoch": 0.77, "learning_rate": 0.0002535886727288455, "loss": 1.627, "step": 9812 }, { "epoch": 0.77, "learning_rate": 0.00025357973326974574, "loss": 1.6624, "step": 9813 }, { "epoch": 0.77, "learning_rate": 0.0002535707931073967, "loss": 1.6222, "step": 9814 }, { "epoch": 0.77, "learning_rate": 0.00025356185224185914, "loss": 1.6306, "step": 9815 }, { "epoch": 0.77, "learning_rate": 0.00025355291067319374, "loss": 1.6162, "step": 9816 }, { "epoch": 0.77, "learning_rate": 0.0002535439684014613, "loss": 1.6218, "step": 9817 }, { "epoch": 0.77, "learning_rate": 0.0002535350254267224, "loss": 1.6344, "step": 9818 }, { "epoch": 0.77, "learning_rate": 0.0002535260817490377, "loss": 1.6543, "step": 9819 }, { "epoch": 0.77, "learning_rate": 0.0002535171373684682, "loss": 1.656, "step": 9820 }, { "epoch": 0.77, "learning_rate": 0.0002535081922850744, "loss": 1.6397, "step": 9821 }, { "epoch": 0.77, "learning_rate": 0.0002534992464989171, "loss": 1.6015, "step": 9822 }, { "epoch": 0.77, "learning_rate": 0.00025349030001005704, "loss": 1.5913, "step": 9823 }, { "epoch": 0.77, "learning_rate": 0.0002534813528185549, "loss": 1.6197, "step": 9824 }, { "epoch": 0.77, "learning_rate": 0.0002534724049244716, "loss": 1.6501, "step": 9825 }, { "epoch": 0.77, "learning_rate": 0.0002534634563278677, "loss": 1.6027, "step": 9826 }, { "epoch": 0.77, "learning_rate": 0.000253454507028804, "loss": 1.6394, "step": 9827 }, { "epoch": 0.77, "learning_rate": 0.00025344555702734134, "loss": 1.625, "step": 9828 }, { "epoch": 0.77, "learning_rate": 0.00025343660632354037, "loss": 1.6405, "step": 9829 }, { "epoch": 0.77, "learning_rate": 0.000253427654917462, "loss": 1.6031, "step": 9830 }, { "epoch": 0.77, "learning_rate": 0.00025341870280916687, "loss": 1.6182, "step": 9831 }, { "epoch": 0.77, "learning_rate": 0.0002534097499987158, "loss": 1.6727, "step": 9832 }, { "epoch": 0.77, "learning_rate": 0.00025340079648616964, "loss": 1.6344, "step": 9833 }, { "epoch": 0.77, "learning_rate": 0.00025339184227158917, "loss": 1.6037, "step": 9834 }, { "epoch": 0.77, "learning_rate": 0.00025338288735503507, "loss": 1.6178, "step": 9835 }, { "epoch": 0.77, "learning_rate": 0.00025337393173656826, "loss": 1.6172, "step": 9836 }, { "epoch": 0.77, "learning_rate": 0.0002533649754162495, "loss": 1.6257, "step": 9837 }, { "epoch": 0.77, "learning_rate": 0.00025335601839413956, "loss": 1.6197, "step": 9838 }, { "epoch": 0.77, "learning_rate": 0.00025334706067029936, "loss": 1.6611, "step": 9839 }, { "epoch": 0.77, "learning_rate": 0.0002533381022447896, "loss": 1.6142, "step": 9840 }, { "epoch": 0.77, "learning_rate": 0.00025332914311767114, "loss": 1.644, "step": 9841 }, { "epoch": 0.77, "learning_rate": 0.00025332018328900487, "loss": 1.6601, "step": 9842 }, { "epoch": 0.77, "learning_rate": 0.00025331122275885155, "loss": 1.6393, "step": 9843 }, { "epoch": 0.77, "learning_rate": 0.00025330226152727196, "loss": 1.6447, "step": 9844 }, { "epoch": 0.77, "learning_rate": 0.00025329329959432713, "loss": 1.6414, "step": 9845 }, { "epoch": 0.77, "learning_rate": 0.0002532843369600778, "loss": 1.6585, "step": 9846 }, { "epoch": 0.77, "learning_rate": 0.00025327537362458474, "loss": 1.6589, "step": 9847 }, { "epoch": 0.77, "learning_rate": 0.000253266409587909, "loss": 1.645, "step": 9848 }, { "epoch": 0.77, "learning_rate": 0.0002532574448501112, "loss": 1.6615, "step": 9849 }, { "epoch": 0.78, "learning_rate": 0.00025324847941125237, "loss": 1.6608, "step": 9850 }, { "epoch": 0.78, "learning_rate": 0.00025323951327139337, "loss": 1.6374, "step": 9851 }, { "epoch": 0.78, "learning_rate": 0.000253230546430595, "loss": 1.5417, "step": 9852 }, { "epoch": 0.78, "learning_rate": 0.0002532215788889183, "loss": 1.6529, "step": 9853 }, { "epoch": 0.78, "learning_rate": 0.0002532126106464239, "loss": 1.6876, "step": 9854 }, { "epoch": 0.78, "learning_rate": 0.0002532036417031729, "loss": 1.6503, "step": 9855 }, { "epoch": 0.78, "learning_rate": 0.00025319467205922613, "loss": 1.6668, "step": 9856 }, { "epoch": 0.78, "learning_rate": 0.0002531857017146445, "loss": 1.6805, "step": 9857 }, { "epoch": 0.78, "learning_rate": 0.0002531767306694888, "loss": 1.6033, "step": 9858 }, { "epoch": 0.78, "learning_rate": 0.00025316775892382016, "loss": 1.6172, "step": 9859 }, { "epoch": 0.78, "learning_rate": 0.0002531587864776993, "loss": 1.6401, "step": 9860 }, { "epoch": 0.78, "learning_rate": 0.0002531498133311872, "loss": 1.5894, "step": 9861 }, { "epoch": 0.78, "learning_rate": 0.00025314083948434484, "loss": 1.5757, "step": 9862 }, { "epoch": 0.78, "learning_rate": 0.00025313186493723303, "loss": 1.5893, "step": 9863 }, { "epoch": 0.78, "learning_rate": 0.0002531228896899129, "loss": 1.6112, "step": 9864 }, { "epoch": 0.78, "learning_rate": 0.00025311391374244517, "loss": 1.6891, "step": 9865 }, { "epoch": 0.78, "learning_rate": 0.0002531049370948908, "loss": 1.6286, "step": 9866 }, { "epoch": 0.78, "learning_rate": 0.00025309595974731087, "loss": 1.5937, "step": 9867 }, { "epoch": 0.78, "learning_rate": 0.00025308698169976626, "loss": 1.654, "step": 9868 }, { "epoch": 0.78, "learning_rate": 0.000253078002952318, "loss": 1.6459, "step": 9869 }, { "epoch": 0.78, "learning_rate": 0.0002530690235050269, "loss": 1.6533, "step": 9870 }, { "epoch": 0.78, "learning_rate": 0.00025306004335795405, "loss": 1.6334, "step": 9871 }, { "epoch": 0.78, "learning_rate": 0.0002530510625111603, "loss": 1.6456, "step": 9872 }, { "epoch": 0.78, "learning_rate": 0.0002530420809647068, "loss": 1.6829, "step": 9873 }, { "epoch": 0.78, "learning_rate": 0.0002530330987186544, "loss": 1.6514, "step": 9874 }, { "epoch": 0.78, "learning_rate": 0.0002530241157730641, "loss": 1.6087, "step": 9875 }, { "epoch": 0.78, "learning_rate": 0.00025301513212799695, "loss": 1.6606, "step": 9876 }, { "epoch": 0.78, "learning_rate": 0.0002530061477835139, "loss": 1.6232, "step": 9877 }, { "epoch": 0.78, "learning_rate": 0.00025299716273967593, "loss": 1.6669, "step": 9878 }, { "epoch": 0.78, "learning_rate": 0.00025298817699654405, "loss": 1.6416, "step": 9879 }, { "epoch": 0.78, "learning_rate": 0.0002529791905541793, "loss": 1.6208, "step": 9880 }, { "epoch": 0.78, "learning_rate": 0.0002529702034126426, "loss": 1.6346, "step": 9881 }, { "epoch": 0.78, "learning_rate": 0.00025296121557199516, "loss": 1.6296, "step": 9882 }, { "epoch": 0.78, "learning_rate": 0.00025295222703229783, "loss": 1.6466, "step": 9883 }, { "epoch": 0.78, "learning_rate": 0.00025294323779361167, "loss": 1.6257, "step": 9884 }, { "epoch": 0.78, "learning_rate": 0.0002529342478559978, "loss": 1.6281, "step": 9885 }, { "epoch": 0.78, "learning_rate": 0.00025292525721951715, "loss": 1.6077, "step": 9886 }, { "epoch": 0.78, "learning_rate": 0.00025291626588423076, "loss": 1.6291, "step": 9887 }, { "epoch": 0.78, "learning_rate": 0.0002529072738501998, "loss": 1.6721, "step": 9888 }, { "epoch": 0.78, "learning_rate": 0.0002528982811174852, "loss": 1.6356, "step": 9889 }, { "epoch": 0.78, "learning_rate": 0.000252889287686148, "loss": 1.6524, "step": 9890 }, { "epoch": 0.78, "learning_rate": 0.00025288029355624944, "loss": 1.63, "step": 9891 }, { "epoch": 0.78, "learning_rate": 0.00025287129872785034, "loss": 1.5954, "step": 9892 }, { "epoch": 0.78, "learning_rate": 0.00025286230320101195, "loss": 1.646, "step": 9893 }, { "epoch": 0.78, "learning_rate": 0.0002528533069757953, "loss": 1.6826, "step": 9894 }, { "epoch": 0.78, "learning_rate": 0.00025284431005226143, "loss": 1.6308, "step": 9895 }, { "epoch": 0.78, "learning_rate": 0.00025283531243047144, "loss": 1.638, "step": 9896 }, { "epoch": 0.78, "learning_rate": 0.0002528263141104865, "loss": 1.5817, "step": 9897 }, { "epoch": 0.78, "learning_rate": 0.0002528173150923675, "loss": 1.6102, "step": 9898 }, { "epoch": 0.78, "learning_rate": 0.0002528083153761758, "loss": 1.6224, "step": 9899 }, { "epoch": 0.78, "learning_rate": 0.00025279931496197225, "loss": 1.6339, "step": 9900 }, { "epoch": 0.78, "learning_rate": 0.0002527903138498182, "loss": 1.642, "step": 9901 }, { "epoch": 0.78, "learning_rate": 0.0002527813120397746, "loss": 1.669, "step": 9902 }, { "epoch": 0.78, "learning_rate": 0.00025277230953190256, "loss": 1.6684, "step": 9903 }, { "epoch": 0.78, "learning_rate": 0.00025276330632626327, "loss": 1.6488, "step": 9904 }, { "epoch": 0.78, "learning_rate": 0.0002527543024229179, "loss": 1.6556, "step": 9905 }, { "epoch": 0.78, "learning_rate": 0.00025274529782192746, "loss": 1.6682, "step": 9906 }, { "epoch": 0.78, "learning_rate": 0.0002527362925233532, "loss": 1.6943, "step": 9907 }, { "epoch": 0.78, "learning_rate": 0.00025272728652725614, "loss": 1.6391, "step": 9908 }, { "epoch": 0.78, "learning_rate": 0.00025271827983369753, "loss": 1.6611, "step": 9909 }, { "epoch": 0.78, "learning_rate": 0.0002527092724427385, "loss": 1.6065, "step": 9910 }, { "epoch": 0.78, "learning_rate": 0.0002527002643544402, "loss": 1.5877, "step": 9911 }, { "epoch": 0.78, "learning_rate": 0.00025269125556886374, "loss": 1.6806, "step": 9912 }, { "epoch": 0.78, "learning_rate": 0.0002526822460860703, "loss": 1.6543, "step": 9913 }, { "epoch": 0.78, "learning_rate": 0.00025267323590612116, "loss": 1.6563, "step": 9914 }, { "epoch": 0.78, "learning_rate": 0.00025266422502907734, "loss": 1.6231, "step": 9915 }, { "epoch": 0.78, "learning_rate": 0.0002526552134550001, "loss": 1.5978, "step": 9916 }, { "epoch": 0.78, "learning_rate": 0.00025264620118395066, "loss": 1.6202, "step": 9917 }, { "epoch": 0.78, "learning_rate": 0.0002526371882159901, "loss": 1.6703, "step": 9918 }, { "epoch": 0.78, "learning_rate": 0.0002526281745511797, "loss": 1.6678, "step": 9919 }, { "epoch": 0.78, "learning_rate": 0.0002526191601895806, "loss": 1.6353, "step": 9920 }, { "epoch": 0.78, "learning_rate": 0.0002526101451312541, "loss": 1.6215, "step": 9921 }, { "epoch": 0.78, "learning_rate": 0.00025260112937626125, "loss": 1.5686, "step": 9922 }, { "epoch": 0.78, "learning_rate": 0.0002525921129246634, "loss": 1.6025, "step": 9923 }, { "epoch": 0.78, "learning_rate": 0.0002525830957765217, "loss": 1.5978, "step": 9924 }, { "epoch": 0.78, "learning_rate": 0.0002525740779318974, "loss": 1.576, "step": 9925 }, { "epoch": 0.78, "learning_rate": 0.0002525650593908517, "loss": 1.6686, "step": 9926 }, { "epoch": 0.78, "learning_rate": 0.00025255604015344586, "loss": 1.6339, "step": 9927 }, { "epoch": 0.78, "learning_rate": 0.00025254702021974113, "loss": 1.5895, "step": 9928 }, { "epoch": 0.78, "learning_rate": 0.00025253799958979874, "loss": 1.6514, "step": 9929 }, { "epoch": 0.78, "learning_rate": 0.0002525289782636799, "loss": 1.6111, "step": 9930 }, { "epoch": 0.78, "learning_rate": 0.0002525199562414458, "loss": 1.6311, "step": 9931 }, { "epoch": 0.78, "learning_rate": 0.00025251093352315787, "loss": 1.6423, "step": 9932 }, { "epoch": 0.78, "learning_rate": 0.00025250191010887723, "loss": 1.5924, "step": 9933 }, { "epoch": 0.78, "learning_rate": 0.00025249288599866516, "loss": 1.6353, "step": 9934 }, { "epoch": 0.78, "learning_rate": 0.000252483861192583, "loss": 1.6059, "step": 9935 }, { "epoch": 0.78, "learning_rate": 0.000252474835690692, "loss": 1.6467, "step": 9936 }, { "epoch": 0.78, "learning_rate": 0.0002524658094930533, "loss": 1.6218, "step": 9937 }, { "epoch": 0.78, "learning_rate": 0.00025245678259972837, "loss": 1.6273, "step": 9938 }, { "epoch": 0.78, "learning_rate": 0.00025244775501077844, "loss": 1.7123, "step": 9939 }, { "epoch": 0.78, "learning_rate": 0.0002524387267262648, "loss": 1.6276, "step": 9940 }, { "epoch": 0.78, "learning_rate": 0.00025242969774624867, "loss": 1.5701, "step": 9941 }, { "epoch": 0.78, "learning_rate": 0.0002524206680707915, "loss": 1.633, "step": 9942 }, { "epoch": 0.78, "learning_rate": 0.0002524116376999545, "loss": 1.6244, "step": 9943 }, { "epoch": 0.78, "learning_rate": 0.00025240260663379895, "loss": 1.6001, "step": 9944 }, { "epoch": 0.78, "learning_rate": 0.0002523935748723862, "loss": 1.6827, "step": 9945 }, { "epoch": 0.78, "learning_rate": 0.00025238454241577763, "loss": 1.6135, "step": 9946 }, { "epoch": 0.78, "learning_rate": 0.0002523755092640345, "loss": 1.6474, "step": 9947 }, { "epoch": 0.78, "learning_rate": 0.00025236647541721814, "loss": 1.6361, "step": 9948 }, { "epoch": 0.78, "learning_rate": 0.00025235744087538994, "loss": 1.5966, "step": 9949 }, { "epoch": 0.78, "learning_rate": 0.0002523484056386112, "loss": 1.6746, "step": 9950 }, { "epoch": 0.78, "learning_rate": 0.0002523393697069432, "loss": 1.6676, "step": 9951 }, { "epoch": 0.78, "learning_rate": 0.00025233033308044744, "loss": 1.663, "step": 9952 }, { "epoch": 0.78, "learning_rate": 0.0002523212957591851, "loss": 1.619, "step": 9953 }, { "epoch": 0.78, "learning_rate": 0.0002523122577432177, "loss": 1.5789, "step": 9954 }, { "epoch": 0.78, "learning_rate": 0.00025230321903260656, "loss": 1.6237, "step": 9955 }, { "epoch": 0.78, "learning_rate": 0.00025229417962741295, "loss": 1.6701, "step": 9956 }, { "epoch": 0.78, "learning_rate": 0.00025228513952769836, "loss": 1.631, "step": 9957 }, { "epoch": 0.78, "learning_rate": 0.000252276098733524, "loss": 1.6207, "step": 9958 }, { "epoch": 0.78, "learning_rate": 0.00025226705724495154, "loss": 1.7025, "step": 9959 }, { "epoch": 0.78, "learning_rate": 0.0002522580150620421, "loss": 1.6403, "step": 9960 }, { "epoch": 0.78, "learning_rate": 0.0002522489721848572, "loss": 1.5593, "step": 9961 }, { "epoch": 0.78, "learning_rate": 0.0002522399286134582, "loss": 1.631, "step": 9962 }, { "epoch": 0.78, "learning_rate": 0.00025223088434790647, "loss": 1.7165, "step": 9963 }, { "epoch": 0.78, "learning_rate": 0.0002522218393882635, "loss": 1.591, "step": 9964 }, { "epoch": 0.78, "learning_rate": 0.00025221279373459056, "loss": 1.6474, "step": 9965 }, { "epoch": 0.78, "learning_rate": 0.00025220374738694926, "loss": 1.6229, "step": 9966 }, { "epoch": 0.78, "learning_rate": 0.0002521947003454009, "loss": 1.6252, "step": 9967 }, { "epoch": 0.78, "learning_rate": 0.00025218565261000687, "loss": 1.6168, "step": 9968 }, { "epoch": 0.78, "learning_rate": 0.00025217660418082864, "loss": 1.604, "step": 9969 }, { "epoch": 0.78, "learning_rate": 0.0002521675550579277, "loss": 1.6043, "step": 9970 }, { "epoch": 0.78, "learning_rate": 0.00025215850524136545, "loss": 1.6321, "step": 9971 }, { "epoch": 0.78, "learning_rate": 0.0002521494547312033, "loss": 1.6393, "step": 9972 }, { "epoch": 0.78, "learning_rate": 0.00025214040352750273, "loss": 1.6368, "step": 9973 }, { "epoch": 0.78, "learning_rate": 0.00025213135163032523, "loss": 1.6984, "step": 9974 }, { "epoch": 0.78, "learning_rate": 0.0002521222990397322, "loss": 1.6534, "step": 9975 }, { "epoch": 0.78, "learning_rate": 0.000252113245755785, "loss": 1.6166, "step": 9976 }, { "epoch": 0.79, "learning_rate": 0.0002521041917785453, "loss": 1.6103, "step": 9977 }, { "epoch": 0.79, "learning_rate": 0.0002520951371080745, "loss": 1.6582, "step": 9978 }, { "epoch": 0.79, "learning_rate": 0.00025208608174443403, "loss": 1.6321, "step": 9979 }, { "epoch": 0.79, "learning_rate": 0.0002520770256876854, "loss": 1.6216, "step": 9980 }, { "epoch": 0.79, "learning_rate": 0.0002520679689378902, "loss": 1.6158, "step": 9981 }, { "epoch": 0.79, "learning_rate": 0.0002520589114951097, "loss": 1.6443, "step": 9982 }, { "epoch": 0.79, "learning_rate": 0.0002520498533594055, "loss": 1.6112, "step": 9983 }, { "epoch": 0.79, "learning_rate": 0.00025204079453083916, "loss": 1.6406, "step": 9984 }, { "epoch": 0.79, "learning_rate": 0.00025203173500947207, "loss": 1.6527, "step": 9985 }, { "epoch": 0.79, "learning_rate": 0.0002520226747953659, "loss": 1.6293, "step": 9986 }, { "epoch": 0.79, "learning_rate": 0.00025201361388858205, "loss": 1.6078, "step": 9987 }, { "epoch": 0.79, "learning_rate": 0.000252004552289182, "loss": 1.6494, "step": 9988 }, { "epoch": 0.79, "learning_rate": 0.0002519954899972274, "loss": 1.6354, "step": 9989 }, { "epoch": 0.79, "learning_rate": 0.0002519864270127796, "loss": 1.6767, "step": 9990 }, { "epoch": 0.79, "learning_rate": 0.0002519773633359004, "loss": 1.6468, "step": 9991 }, { "epoch": 0.79, "learning_rate": 0.00025196829896665106, "loss": 1.6471, "step": 9992 }, { "epoch": 0.79, "learning_rate": 0.00025195923390509327, "loss": 1.6442, "step": 9993 }, { "epoch": 0.79, "learning_rate": 0.00025195016815128855, "loss": 1.6649, "step": 9994 }, { "epoch": 0.79, "learning_rate": 0.00025194110170529847, "loss": 1.6648, "step": 9995 }, { "epoch": 0.79, "learning_rate": 0.0002519320345671845, "loss": 1.6528, "step": 9996 }, { "epoch": 0.79, "learning_rate": 0.0002519229667370084, "loss": 1.6444, "step": 9997 }, { "epoch": 0.79, "learning_rate": 0.0002519138982148315, "loss": 1.599, "step": 9998 }, { "epoch": 0.79, "learning_rate": 0.00025190482900071547, "loss": 1.5904, "step": 9999 }, { "epoch": 0.79, "learning_rate": 0.00025189575909472195, "loss": 1.654, "step": 10000 }, { "epoch": 0.79, "learning_rate": 0.00025188668849691236, "loss": 1.6002, "step": 10001 }, { "epoch": 0.79, "learning_rate": 0.00025187761720734845, "loss": 1.6263, "step": 10002 }, { "epoch": 0.79, "learning_rate": 0.0002518685452260917, "loss": 1.5878, "step": 10003 }, { "epoch": 0.79, "learning_rate": 0.00025185947255320376, "loss": 1.6261, "step": 10004 }, { "epoch": 0.79, "learning_rate": 0.00025185039918874626, "loss": 1.603, "step": 10005 }, { "epoch": 0.79, "learning_rate": 0.0002518413251327807, "loss": 1.5935, "step": 10006 }, { "epoch": 0.79, "learning_rate": 0.00025183225038536875, "loss": 1.6658, "step": 10007 }, { "epoch": 0.79, "learning_rate": 0.000251823174946572, "loss": 1.6301, "step": 10008 }, { "epoch": 0.79, "learning_rate": 0.0002518140988164521, "loss": 1.6646, "step": 10009 }, { "epoch": 0.79, "learning_rate": 0.0002518050219950707, "loss": 1.6806, "step": 10010 }, { "epoch": 0.79, "learning_rate": 0.0002517959444824893, "loss": 1.6207, "step": 10011 }, { "epoch": 0.79, "learning_rate": 0.00025178686627876963, "loss": 1.5972, "step": 10012 }, { "epoch": 0.79, "learning_rate": 0.00025177778738397336, "loss": 1.6324, "step": 10013 }, { "epoch": 0.79, "learning_rate": 0.0002517687077981621, "loss": 1.6589, "step": 10014 }, { "epoch": 0.79, "learning_rate": 0.0002517596275213974, "loss": 1.6607, "step": 10015 }, { "epoch": 0.79, "learning_rate": 0.000251750546553741, "loss": 1.6457, "step": 10016 }, { "epoch": 0.79, "learning_rate": 0.00025174146489525455, "loss": 1.5953, "step": 10017 }, { "epoch": 0.79, "learning_rate": 0.00025173238254599966, "loss": 1.695, "step": 10018 }, { "epoch": 0.79, "learning_rate": 0.0002517232995060381, "loss": 1.6151, "step": 10019 }, { "epoch": 0.79, "learning_rate": 0.0002517142157754314, "loss": 1.6627, "step": 10020 }, { "epoch": 0.79, "learning_rate": 0.0002517051313542414, "loss": 1.6726, "step": 10021 }, { "epoch": 0.79, "learning_rate": 0.0002516960462425296, "loss": 1.6536, "step": 10022 }, { "epoch": 0.79, "learning_rate": 0.00025168696044035777, "loss": 1.6269, "step": 10023 }, { "epoch": 0.79, "learning_rate": 0.00025167787394778763, "loss": 1.6275, "step": 10024 }, { "epoch": 0.79, "learning_rate": 0.00025166878676488087, "loss": 1.6424, "step": 10025 }, { "epoch": 0.79, "learning_rate": 0.0002516596988916991, "loss": 1.6627, "step": 10026 }, { "epoch": 0.79, "learning_rate": 0.0002516506103283041, "loss": 1.6303, "step": 10027 }, { "epoch": 0.79, "learning_rate": 0.00025164152107475755, "loss": 1.6747, "step": 10028 }, { "epoch": 0.79, "learning_rate": 0.00025163243113112115, "loss": 1.588, "step": 10029 }, { "epoch": 0.79, "learning_rate": 0.00025162334049745665, "loss": 1.6829, "step": 10030 }, { "epoch": 0.79, "learning_rate": 0.00025161424917382566, "loss": 1.6407, "step": 10031 }, { "epoch": 0.79, "learning_rate": 0.0002516051571602901, "loss": 1.648, "step": 10032 }, { "epoch": 0.79, "learning_rate": 0.0002515960644569116, "loss": 1.6028, "step": 10033 }, { "epoch": 0.79, "learning_rate": 0.0002515869710637518, "loss": 1.6749, "step": 10034 }, { "epoch": 0.79, "learning_rate": 0.00025157787698087253, "loss": 1.6478, "step": 10035 }, { "epoch": 0.79, "learning_rate": 0.0002515687822083356, "loss": 1.6423, "step": 10036 }, { "epoch": 0.79, "learning_rate": 0.0002515596867462027, "loss": 1.6349, "step": 10037 }, { "epoch": 0.79, "learning_rate": 0.0002515505905945355, "loss": 1.6696, "step": 10038 }, { "epoch": 0.79, "learning_rate": 0.00025154149375339584, "loss": 1.6285, "step": 10039 }, { "epoch": 0.79, "learning_rate": 0.0002515323962228455, "loss": 1.5725, "step": 10040 }, { "epoch": 0.79, "learning_rate": 0.0002515232980029462, "loss": 1.6946, "step": 10041 }, { "epoch": 0.79, "learning_rate": 0.00025151419909375975, "loss": 1.586, "step": 10042 }, { "epoch": 0.79, "learning_rate": 0.0002515050994953479, "loss": 1.6994, "step": 10043 }, { "epoch": 0.79, "learning_rate": 0.0002514959992077725, "loss": 1.6336, "step": 10044 }, { "epoch": 0.79, "learning_rate": 0.0002514868982310952, "loss": 1.605, "step": 10045 }, { "epoch": 0.79, "learning_rate": 0.00025147779656537785, "loss": 1.579, "step": 10046 }, { "epoch": 0.79, "learning_rate": 0.0002514686942106823, "loss": 1.6186, "step": 10047 }, { "epoch": 0.79, "learning_rate": 0.00025145959116707026, "loss": 1.6482, "step": 10048 }, { "epoch": 0.79, "learning_rate": 0.00025145048743460365, "loss": 1.6443, "step": 10049 }, { "epoch": 0.79, "learning_rate": 0.0002514413830133442, "loss": 1.6166, "step": 10050 }, { "epoch": 0.79, "learning_rate": 0.00025143227790335376, "loss": 1.6514, "step": 10051 }, { "epoch": 0.79, "learning_rate": 0.0002514231721046941, "loss": 1.589, "step": 10052 }, { "epoch": 0.79, "learning_rate": 0.0002514140656174271, "loss": 1.6676, "step": 10053 }, { "epoch": 0.79, "learning_rate": 0.0002514049584416146, "loss": 1.6502, "step": 10054 }, { "epoch": 0.79, "learning_rate": 0.00025139585057731823, "loss": 1.6539, "step": 10055 }, { "epoch": 0.79, "learning_rate": 0.00025138674202460017, "loss": 1.6495, "step": 10056 }, { "epoch": 0.79, "learning_rate": 0.0002513776327835219, "loss": 1.6763, "step": 10057 }, { "epoch": 0.79, "learning_rate": 0.0002513685228541456, "loss": 1.5691, "step": 10058 }, { "epoch": 0.79, "learning_rate": 0.00025135941223653293, "loss": 1.6192, "step": 10059 }, { "epoch": 0.79, "learning_rate": 0.0002513503009307458, "loss": 1.6168, "step": 10060 }, { "epoch": 0.79, "learning_rate": 0.00025134118893684596, "loss": 1.5989, "step": 10061 }, { "epoch": 0.79, "learning_rate": 0.00025133207625489546, "loss": 1.6539, "step": 10062 }, { "epoch": 0.79, "learning_rate": 0.00025132296288495607, "loss": 1.6331, "step": 10063 }, { "epoch": 0.79, "learning_rate": 0.00025131384882708964, "loss": 1.6229, "step": 10064 }, { "epoch": 0.79, "learning_rate": 0.00025130473408135814, "loss": 1.6618, "step": 10065 }, { "epoch": 0.79, "learning_rate": 0.00025129561864782336, "loss": 1.6681, "step": 10066 }, { "epoch": 0.79, "learning_rate": 0.0002512865025265473, "loss": 1.6782, "step": 10067 }, { "epoch": 0.79, "learning_rate": 0.0002512773857175917, "loss": 1.6112, "step": 10068 }, { "epoch": 0.79, "learning_rate": 0.00025126826822101855, "loss": 1.6413, "step": 10069 }, { "epoch": 0.79, "learning_rate": 0.0002512591500368898, "loss": 1.6467, "step": 10070 }, { "epoch": 0.79, "learning_rate": 0.0002512500311652672, "loss": 1.6493, "step": 10071 }, { "epoch": 0.79, "learning_rate": 0.0002512409116062129, "loss": 1.6486, "step": 10072 }, { "epoch": 0.79, "learning_rate": 0.00025123179135978855, "loss": 1.5876, "step": 10073 }, { "epoch": 0.79, "learning_rate": 0.00025122267042605625, "loss": 1.626, "step": 10074 }, { "epoch": 0.79, "learning_rate": 0.0002512135488050779, "loss": 1.6247, "step": 10075 }, { "epoch": 0.79, "learning_rate": 0.0002512044264969154, "loss": 1.6778, "step": 10076 }, { "epoch": 0.79, "learning_rate": 0.0002511953035016307, "loss": 1.6138, "step": 10077 }, { "epoch": 0.79, "learning_rate": 0.0002511861798192857, "loss": 1.6636, "step": 10078 }, { "epoch": 0.79, "learning_rate": 0.0002511770554499424, "loss": 1.6899, "step": 10079 }, { "epoch": 0.79, "learning_rate": 0.0002511679303936627, "loss": 1.6298, "step": 10080 }, { "epoch": 0.79, "learning_rate": 0.00025115880465050863, "loss": 1.6691, "step": 10081 }, { "epoch": 0.79, "learning_rate": 0.00025114967822054206, "loss": 1.6169, "step": 10082 }, { "epoch": 0.79, "learning_rate": 0.000251140551103825, "loss": 1.5936, "step": 10083 }, { "epoch": 0.79, "learning_rate": 0.00025113142330041943, "loss": 1.6064, "step": 10084 }, { "epoch": 0.79, "learning_rate": 0.00025112229481038726, "loss": 1.6599, "step": 10085 }, { "epoch": 0.79, "learning_rate": 0.00025111316563379056, "loss": 1.6275, "step": 10086 }, { "epoch": 0.79, "learning_rate": 0.00025110403577069125, "loss": 1.6195, "step": 10087 }, { "epoch": 0.79, "learning_rate": 0.0002510949052211514, "loss": 1.6368, "step": 10088 }, { "epoch": 0.79, "learning_rate": 0.0002510857739852328, "loss": 1.58, "step": 10089 }, { "epoch": 0.79, "learning_rate": 0.00025107664206299764, "loss": 1.6505, "step": 10090 }, { "epoch": 0.79, "learning_rate": 0.0002510675094545079, "loss": 1.6389, "step": 10091 }, { "epoch": 0.79, "learning_rate": 0.00025105837615982553, "loss": 1.5669, "step": 10092 }, { "epoch": 0.79, "learning_rate": 0.00025104924217901245, "loss": 1.6718, "step": 10093 }, { "epoch": 0.79, "learning_rate": 0.0002510401075121309, "loss": 1.6295, "step": 10094 }, { "epoch": 0.79, "learning_rate": 0.00025103097215924277, "loss": 1.6544, "step": 10095 }, { "epoch": 0.79, "learning_rate": 0.00025102183612041003, "loss": 1.6742, "step": 10096 }, { "epoch": 0.79, "learning_rate": 0.0002510126993956948, "loss": 1.603, "step": 10097 }, { "epoch": 0.79, "learning_rate": 0.00025100356198515906, "loss": 1.6313, "step": 10098 }, { "epoch": 0.79, "learning_rate": 0.00025099442388886497, "loss": 1.5884, "step": 10099 }, { "epoch": 0.79, "learning_rate": 0.00025098528510687437, "loss": 1.6543, "step": 10100 }, { "epoch": 0.79, "learning_rate": 0.00025097614563924944, "loss": 1.6313, "step": 10101 }, { "epoch": 0.79, "learning_rate": 0.0002509670054860522, "loss": 1.6464, "step": 10102 }, { "epoch": 0.79, "learning_rate": 0.0002509578646473447, "loss": 1.606, "step": 10103 }, { "epoch": 0.79, "learning_rate": 0.00025094872312318906, "loss": 1.6089, "step": 10104 }, { "epoch": 0.8, "learning_rate": 0.0002509395809136473, "loss": 1.6314, "step": 10105 }, { "epoch": 0.8, "learning_rate": 0.0002509304380187814, "loss": 1.6213, "step": 10106 }, { "epoch": 0.8, "learning_rate": 0.00025092129443865367, "loss": 1.6265, "step": 10107 }, { "epoch": 0.8, "learning_rate": 0.0002509121501733259, "loss": 1.6282, "step": 10108 }, { "epoch": 0.8, "learning_rate": 0.0002509030052228604, "loss": 1.6688, "step": 10109 }, { "epoch": 0.8, "learning_rate": 0.00025089385958731916, "loss": 1.6208, "step": 10110 }, { "epoch": 0.8, "learning_rate": 0.0002508847132667643, "loss": 1.6259, "step": 10111 }, { "epoch": 0.8, "learning_rate": 0.0002508755662612579, "loss": 1.67, "step": 10112 }, { "epoch": 0.8, "learning_rate": 0.00025086641857086203, "loss": 1.6712, "step": 10113 }, { "epoch": 0.8, "learning_rate": 0.0002508572701956389, "loss": 1.6967, "step": 10114 }, { "epoch": 0.8, "learning_rate": 0.0002508481211356506, "loss": 1.6542, "step": 10115 }, { "epoch": 0.8, "learning_rate": 0.00025083897139095907, "loss": 1.6085, "step": 10116 }, { "epoch": 0.8, "learning_rate": 0.0002508298209616267, "loss": 1.6193, "step": 10117 }, { "epoch": 0.8, "learning_rate": 0.00025082066984771545, "loss": 1.5484, "step": 10118 }, { "epoch": 0.8, "learning_rate": 0.0002508115180492874, "loss": 1.6168, "step": 10119 }, { "epoch": 0.8, "learning_rate": 0.0002508023655664049, "loss": 1.6547, "step": 10120 }, { "epoch": 0.8, "learning_rate": 0.0002507932123991299, "loss": 1.5679, "step": 10121 }, { "epoch": 0.8, "learning_rate": 0.0002507840585475247, "loss": 1.5841, "step": 10122 }, { "epoch": 0.8, "learning_rate": 0.00025077490401165123, "loss": 1.6318, "step": 10123 }, { "epoch": 0.8, "learning_rate": 0.00025076574879157184, "loss": 1.656, "step": 10124 }, { "epoch": 0.8, "learning_rate": 0.00025075659288734863, "loss": 1.6334, "step": 10125 }, { "epoch": 0.8, "learning_rate": 0.00025074743629904377, "loss": 1.5925, "step": 10126 }, { "epoch": 0.8, "learning_rate": 0.00025073827902671934, "loss": 1.689, "step": 10127 }, { "epoch": 0.8, "learning_rate": 0.0002507291210704377, "loss": 1.6409, "step": 10128 }, { "epoch": 0.8, "learning_rate": 0.0002507199624302608, "loss": 1.6264, "step": 10129 }, { "epoch": 0.8, "learning_rate": 0.00025071080310625095, "loss": 1.6052, "step": 10130 }, { "epoch": 0.8, "learning_rate": 0.0002507016430984704, "loss": 1.6008, "step": 10131 }, { "epoch": 0.8, "learning_rate": 0.00025069248240698123, "loss": 1.5993, "step": 10132 }, { "epoch": 0.8, "learning_rate": 0.00025068332103184566, "loss": 1.6479, "step": 10133 }, { "epoch": 0.8, "learning_rate": 0.0002506741589731259, "loss": 1.6592, "step": 10134 }, { "epoch": 0.8, "learning_rate": 0.0002506649962308842, "loss": 1.6674, "step": 10135 }, { "epoch": 0.8, "learning_rate": 0.0002506558328051827, "loss": 1.6219, "step": 10136 }, { "epoch": 0.8, "learning_rate": 0.0002506466686960836, "loss": 1.5928, "step": 10137 }, { "epoch": 0.8, "learning_rate": 0.00025063750390364923, "loss": 1.6456, "step": 10138 }, { "epoch": 0.8, "learning_rate": 0.00025062833842794173, "loss": 1.6035, "step": 10139 }, { "epoch": 0.8, "learning_rate": 0.0002506191722690233, "loss": 1.6215, "step": 10140 }, { "epoch": 0.8, "learning_rate": 0.00025061000542695626, "loss": 1.6035, "step": 10141 }, { "epoch": 0.8, "learning_rate": 0.00025060083790180276, "loss": 1.6415, "step": 10142 }, { "epoch": 0.8, "learning_rate": 0.00025059166969362514, "loss": 1.6273, "step": 10143 }, { "epoch": 0.8, "learning_rate": 0.00025058250080248553, "loss": 1.6016, "step": 10144 }, { "epoch": 0.8, "learning_rate": 0.00025057333122844634, "loss": 1.6676, "step": 10145 }, { "epoch": 0.8, "learning_rate": 0.0002505641609715696, "loss": 1.6379, "step": 10146 }, { "epoch": 0.8, "learning_rate": 0.0002505549900319178, "loss": 1.6112, "step": 10147 }, { "epoch": 0.8, "learning_rate": 0.00025054581840955315, "loss": 1.6722, "step": 10148 }, { "epoch": 0.8, "learning_rate": 0.00025053664610453775, "loss": 1.6416, "step": 10149 }, { "epoch": 0.8, "learning_rate": 0.0002505274731169341, "loss": 1.6447, "step": 10150 }, { "epoch": 0.8, "learning_rate": 0.0002505182994468043, "loss": 1.5935, "step": 10151 }, { "epoch": 0.8, "learning_rate": 0.0002505091250942108, "loss": 1.6231, "step": 10152 }, { "epoch": 0.8, "learning_rate": 0.00025049995005921576, "loss": 1.6422, "step": 10153 }, { "epoch": 0.8, "learning_rate": 0.00025049077434188155, "loss": 1.6101, "step": 10154 }, { "epoch": 0.8, "learning_rate": 0.0002504815979422704, "loss": 1.6412, "step": 10155 }, { "epoch": 0.8, "learning_rate": 0.0002504724208604447, "loss": 1.6513, "step": 10156 }, { "epoch": 0.8, "learning_rate": 0.0002504632430964667, "loss": 1.653, "step": 10157 }, { "epoch": 0.8, "learning_rate": 0.0002504540646503987, "loss": 1.6498, "step": 10158 }, { "epoch": 0.8, "learning_rate": 0.000250444885522303, "loss": 1.5949, "step": 10159 }, { "epoch": 0.8, "learning_rate": 0.000250435705712242, "loss": 1.6507, "step": 10160 }, { "epoch": 0.8, "learning_rate": 0.00025042652522027796, "loss": 1.6116, "step": 10161 }, { "epoch": 0.8, "learning_rate": 0.0002504173440464733, "loss": 1.6095, "step": 10162 }, { "epoch": 0.8, "learning_rate": 0.0002504081621908902, "loss": 1.609, "step": 10163 }, { "epoch": 0.8, "learning_rate": 0.00025039897965359114, "loss": 1.601, "step": 10164 }, { "epoch": 0.8, "learning_rate": 0.0002503897964346384, "loss": 1.5861, "step": 10165 }, { "epoch": 0.8, "learning_rate": 0.0002503806125340943, "loss": 1.5656, "step": 10166 }, { "epoch": 0.8, "learning_rate": 0.0002503714279520213, "loss": 1.6471, "step": 10167 }, { "epoch": 0.8, "learning_rate": 0.0002503622426884817, "loss": 1.6659, "step": 10168 }, { "epoch": 0.8, "learning_rate": 0.0002503530567435378, "loss": 1.6197, "step": 10169 }, { "epoch": 0.8, "learning_rate": 0.00025034387011725205, "loss": 1.6274, "step": 10170 }, { "epoch": 0.8, "learning_rate": 0.0002503346828096868, "loss": 1.6228, "step": 10171 }, { "epoch": 0.8, "learning_rate": 0.00025032549482090444, "loss": 1.6337, "step": 10172 }, { "epoch": 0.8, "learning_rate": 0.00025031630615096726, "loss": 1.6254, "step": 10173 }, { "epoch": 0.8, "learning_rate": 0.00025030711679993785, "loss": 1.6521, "step": 10174 }, { "epoch": 0.8, "learning_rate": 0.00025029792676787833, "loss": 1.6457, "step": 10175 }, { "epoch": 0.8, "learning_rate": 0.00025028873605485133, "loss": 1.6417, "step": 10176 }, { "epoch": 0.8, "learning_rate": 0.00025027954466091913, "loss": 1.5928, "step": 10177 }, { "epoch": 0.8, "learning_rate": 0.0002502703525861442, "loss": 1.613, "step": 10178 }, { "epoch": 0.8, "learning_rate": 0.0002502611598305888, "loss": 1.6554, "step": 10179 }, { "epoch": 0.8, "learning_rate": 0.0002502519663943156, "loss": 1.6299, "step": 10180 }, { "epoch": 0.8, "learning_rate": 0.00025024277227738676, "loss": 1.6315, "step": 10181 }, { "epoch": 0.8, "learning_rate": 0.0002502335774798648, "loss": 1.6219, "step": 10182 }, { "epoch": 0.8, "learning_rate": 0.0002502243820018123, "loss": 1.6696, "step": 10183 }, { "epoch": 0.8, "learning_rate": 0.0002502151858432914, "loss": 1.6736, "step": 10184 }, { "epoch": 0.8, "learning_rate": 0.00025020598900436477, "loss": 1.602, "step": 10185 }, { "epoch": 0.8, "learning_rate": 0.00025019679148509475, "loss": 1.6459, "step": 10186 }, { "epoch": 0.8, "learning_rate": 0.0002501875932855438, "loss": 1.6394, "step": 10187 }, { "epoch": 0.8, "learning_rate": 0.0002501783944057744, "loss": 1.6569, "step": 10188 }, { "epoch": 0.8, "learning_rate": 0.000250169194845849, "loss": 1.6204, "step": 10189 }, { "epoch": 0.8, "learning_rate": 0.00025015999460583, "loss": 1.6379, "step": 10190 }, { "epoch": 0.8, "learning_rate": 0.00025015079368577995, "loss": 1.7212, "step": 10191 }, { "epoch": 0.8, "learning_rate": 0.0002501415920857613, "loss": 1.6307, "step": 10192 }, { "epoch": 0.8, "learning_rate": 0.0002501323898058365, "loss": 1.6606, "step": 10193 }, { "epoch": 0.8, "learning_rate": 0.00025012318684606796, "loss": 1.6279, "step": 10194 }, { "epoch": 0.8, "learning_rate": 0.0002501139832065183, "loss": 1.6407, "step": 10195 }, { "epoch": 0.8, "learning_rate": 0.0002501047788872499, "loss": 1.6133, "step": 10196 }, { "epoch": 0.8, "learning_rate": 0.0002500955738883253, "loss": 1.5868, "step": 10197 }, { "epoch": 0.8, "learning_rate": 0.00025008636820980705, "loss": 1.6254, "step": 10198 }, { "epoch": 0.8, "learning_rate": 0.0002500771618517575, "loss": 1.6394, "step": 10199 }, { "epoch": 0.8, "learning_rate": 0.0002500679548142393, "loss": 1.6037, "step": 10200 }, { "epoch": 0.8, "learning_rate": 0.0002500587470973149, "loss": 1.6315, "step": 10201 }, { "epoch": 0.8, "learning_rate": 0.00025004953870104684, "loss": 1.6575, "step": 10202 }, { "epoch": 0.8, "learning_rate": 0.00025004032962549756, "loss": 1.6316, "step": 10203 }, { "epoch": 0.8, "learning_rate": 0.0002500311198707297, "loss": 1.6834, "step": 10204 }, { "epoch": 0.8, "learning_rate": 0.00025002190943680577, "loss": 1.6102, "step": 10205 }, { "epoch": 0.8, "learning_rate": 0.0002500126983237882, "loss": 1.6391, "step": 10206 }, { "epoch": 0.8, "learning_rate": 0.00025000348653173964, "loss": 1.6632, "step": 10207 }, { "epoch": 0.8, "learning_rate": 0.00024999427406072265, "loss": 1.644, "step": 10208 }, { "epoch": 0.8, "learning_rate": 0.0002499850609107996, "loss": 1.5916, "step": 10209 }, { "epoch": 0.8, "learning_rate": 0.00024997584708203325, "loss": 1.613, "step": 10210 }, { "epoch": 0.8, "learning_rate": 0.0002499666325744861, "loss": 1.6362, "step": 10211 }, { "epoch": 0.8, "learning_rate": 0.00024995741738822054, "loss": 1.602, "step": 10212 }, { "epoch": 0.8, "learning_rate": 0.0002499482015232994, "loss": 1.6242, "step": 10213 }, { "epoch": 0.8, "learning_rate": 0.0002499389849797851, "loss": 1.6291, "step": 10214 }, { "epoch": 0.8, "learning_rate": 0.0002499297677577402, "loss": 1.6223, "step": 10215 }, { "epoch": 0.8, "learning_rate": 0.00024992054985722734, "loss": 1.6419, "step": 10216 }, { "epoch": 0.8, "learning_rate": 0.0002499113312783091, "loss": 1.5666, "step": 10217 }, { "epoch": 0.8, "learning_rate": 0.00024990211202104807, "loss": 1.6546, "step": 10218 }, { "epoch": 0.8, "learning_rate": 0.0002498928920855068, "loss": 1.5836, "step": 10219 }, { "epoch": 0.8, "learning_rate": 0.00024988367147174795, "loss": 1.6507, "step": 10220 }, { "epoch": 0.8, "learning_rate": 0.0002498744501798341, "loss": 1.6941, "step": 10221 }, { "epoch": 0.8, "learning_rate": 0.00024986522820982776, "loss": 1.645, "step": 10222 }, { "epoch": 0.8, "learning_rate": 0.00024985600556179176, "loss": 1.6526, "step": 10223 }, { "epoch": 0.8, "learning_rate": 0.0002498467822357885, "loss": 1.6633, "step": 10224 }, { "epoch": 0.8, "learning_rate": 0.0002498375582318807, "loss": 1.6638, "step": 10225 }, { "epoch": 0.8, "learning_rate": 0.000249828333550131, "loss": 1.6014, "step": 10226 }, { "epoch": 0.8, "learning_rate": 0.00024981910819060196, "loss": 1.6581, "step": 10227 }, { "epoch": 0.8, "learning_rate": 0.0002498098821533563, "loss": 1.6274, "step": 10228 }, { "epoch": 0.8, "learning_rate": 0.0002498006554384566, "loss": 1.6462, "step": 10229 }, { "epoch": 0.8, "learning_rate": 0.00024979142804596556, "loss": 1.6353, "step": 10230 }, { "epoch": 0.8, "learning_rate": 0.0002497821999759458, "loss": 1.6946, "step": 10231 }, { "epoch": 0.81, "learning_rate": 0.0002497729712284599, "loss": 1.5386, "step": 10232 }, { "epoch": 0.81, "learning_rate": 0.0002497637418035706, "loss": 1.621, "step": 10233 }, { "epoch": 0.81, "learning_rate": 0.00024975451170134057, "loss": 1.6191, "step": 10234 }, { "epoch": 0.81, "learning_rate": 0.00024974528092183246, "loss": 1.6295, "step": 10235 }, { "epoch": 0.81, "learning_rate": 0.0002497360494651089, "loss": 1.6314, "step": 10236 }, { "epoch": 0.81, "learning_rate": 0.00024972681733123267, "loss": 1.6444, "step": 10237 }, { "epoch": 0.81, "learning_rate": 0.00024971758452026633, "loss": 1.634, "step": 10238 }, { "epoch": 0.81, "learning_rate": 0.0002497083510322726, "loss": 1.6913, "step": 10239 }, { "epoch": 0.81, "learning_rate": 0.00024969911686731426, "loss": 1.6672, "step": 10240 }, { "epoch": 0.81, "learning_rate": 0.0002496898820254539, "loss": 1.6124, "step": 10241 }, { "epoch": 0.81, "learning_rate": 0.0002496806465067543, "loss": 1.6211, "step": 10242 }, { "epoch": 0.81, "learning_rate": 0.00024967141031127804, "loss": 1.6096, "step": 10243 }, { "epoch": 0.81, "learning_rate": 0.0002496621734390879, "loss": 1.6653, "step": 10244 }, { "epoch": 0.81, "learning_rate": 0.00024965293589024665, "loss": 1.6133, "step": 10245 }, { "epoch": 0.81, "learning_rate": 0.00024964369766481694, "loss": 1.5657, "step": 10246 }, { "epoch": 0.81, "learning_rate": 0.0002496344587628615, "loss": 1.6451, "step": 10247 }, { "epoch": 0.81, "learning_rate": 0.0002496252191844431, "loss": 1.6769, "step": 10248 }, { "epoch": 0.81, "learning_rate": 0.00024961597892962444, "loss": 1.5898, "step": 10249 }, { "epoch": 0.81, "learning_rate": 0.00024960673799846825, "loss": 1.6459, "step": 10250 }, { "epoch": 0.81, "learning_rate": 0.00024959749639103727, "loss": 1.6452, "step": 10251 }, { "epoch": 0.81, "learning_rate": 0.0002495882541073942, "loss": 1.6829, "step": 10252 }, { "epoch": 0.81, "learning_rate": 0.000249579011147602, "loss": 1.623, "step": 10253 }, { "epoch": 0.81, "learning_rate": 0.0002495697675117231, "loss": 1.65, "step": 10254 }, { "epoch": 0.81, "learning_rate": 0.00024956052319982045, "loss": 1.6303, "step": 10255 }, { "epoch": 0.81, "learning_rate": 0.0002495512782119569, "loss": 1.6017, "step": 10256 }, { "epoch": 0.81, "learning_rate": 0.00024954203254819505, "loss": 1.5902, "step": 10257 }, { "epoch": 0.81, "learning_rate": 0.00024953278620859764, "loss": 1.6055, "step": 10258 }, { "epoch": 0.81, "learning_rate": 0.00024952353919322764, "loss": 1.6643, "step": 10259 }, { "epoch": 0.81, "learning_rate": 0.00024951429150214767, "loss": 1.6386, "step": 10260 }, { "epoch": 0.81, "learning_rate": 0.0002495050431354206, "loss": 1.6394, "step": 10261 }, { "epoch": 0.81, "learning_rate": 0.00024949579409310927, "loss": 1.6698, "step": 10262 }, { "epoch": 0.81, "learning_rate": 0.0002494865443752763, "loss": 1.6076, "step": 10263 }, { "epoch": 0.81, "learning_rate": 0.00024947729398198465, "loss": 1.6299, "step": 10264 }, { "epoch": 0.81, "learning_rate": 0.000249468042913297, "loss": 1.6926, "step": 10265 }, { "epoch": 0.81, "learning_rate": 0.00024945879116927634, "loss": 1.5842, "step": 10266 }, { "epoch": 0.81, "learning_rate": 0.0002494495387499853, "loss": 1.5986, "step": 10267 }, { "epoch": 0.81, "learning_rate": 0.0002494402856554868, "loss": 1.6211, "step": 10268 }, { "epoch": 0.81, "learning_rate": 0.0002494310318858437, "loss": 1.6445, "step": 10269 }, { "epoch": 0.81, "learning_rate": 0.00024942177744111864, "loss": 1.6264, "step": 10270 }, { "epoch": 0.81, "learning_rate": 0.00024941252232137465, "loss": 1.5929, "step": 10271 }, { "epoch": 0.81, "learning_rate": 0.0002494032665266744, "loss": 1.5775, "step": 10272 }, { "epoch": 0.81, "learning_rate": 0.00024939401005708093, "loss": 1.5879, "step": 10273 }, { "epoch": 0.81, "learning_rate": 0.000249384752912657, "loss": 1.6206, "step": 10274 }, { "epoch": 0.81, "learning_rate": 0.00024937549509346533, "loss": 1.5847, "step": 10275 }, { "epoch": 0.81, "learning_rate": 0.000249366236599569, "loss": 1.6303, "step": 10276 }, { "epoch": 0.81, "learning_rate": 0.0002493569774310307, "loss": 1.591, "step": 10277 }, { "epoch": 0.81, "learning_rate": 0.0002493477175879134, "loss": 1.6504, "step": 10278 }, { "epoch": 0.81, "learning_rate": 0.00024933845707027984, "loss": 1.653, "step": 10279 }, { "epoch": 0.81, "learning_rate": 0.000249329195878193, "loss": 1.5981, "step": 10280 }, { "epoch": 0.81, "learning_rate": 0.0002493199340117158, "loss": 1.6321, "step": 10281 }, { "epoch": 0.81, "learning_rate": 0.00024931067147091103, "loss": 1.5791, "step": 10282 }, { "epoch": 0.81, "learning_rate": 0.0002493014082558415, "loss": 1.6164, "step": 10283 }, { "epoch": 0.81, "learning_rate": 0.00024929214436657037, "loss": 1.6462, "step": 10284 }, { "epoch": 0.81, "learning_rate": 0.00024928287980316026, "loss": 1.6594, "step": 10285 }, { "epoch": 0.81, "learning_rate": 0.0002492736145656742, "loss": 1.5804, "step": 10286 }, { "epoch": 0.81, "learning_rate": 0.0002492643486541751, "loss": 1.7146, "step": 10287 }, { "epoch": 0.81, "learning_rate": 0.0002492550820687259, "loss": 1.6673, "step": 10288 }, { "epoch": 0.81, "learning_rate": 0.00024924581480938944, "loss": 1.5741, "step": 10289 }, { "epoch": 0.81, "learning_rate": 0.00024923654687622867, "loss": 1.5524, "step": 10290 }, { "epoch": 0.81, "learning_rate": 0.0002492272782693064, "loss": 1.6475, "step": 10291 }, { "epoch": 0.81, "learning_rate": 0.0002492180089886858, "loss": 1.5954, "step": 10292 }, { "epoch": 0.81, "learning_rate": 0.00024920873903442963, "loss": 1.6295, "step": 10293 }, { "epoch": 0.81, "learning_rate": 0.00024919946840660086, "loss": 1.5909, "step": 10294 }, { "epoch": 0.81, "learning_rate": 0.00024919019710526244, "loss": 1.6308, "step": 10295 }, { "epoch": 0.81, "learning_rate": 0.0002491809251304773, "loss": 1.59, "step": 10296 }, { "epoch": 0.81, "learning_rate": 0.0002491716524823085, "loss": 1.6316, "step": 10297 }, { "epoch": 0.81, "learning_rate": 0.00024916237916081883, "loss": 1.6635, "step": 10298 }, { "epoch": 0.81, "learning_rate": 0.00024915310516607133, "loss": 1.5833, "step": 10299 }, { "epoch": 0.81, "learning_rate": 0.000249143830498129, "loss": 1.6275, "step": 10300 }, { "epoch": 0.81, "learning_rate": 0.00024913455515705474, "loss": 1.6459, "step": 10301 }, { "epoch": 0.81, "learning_rate": 0.0002491252791429116, "loss": 1.6657, "step": 10302 }, { "epoch": 0.81, "learning_rate": 0.0002491160024557625, "loss": 1.651, "step": 10303 }, { "epoch": 0.81, "learning_rate": 0.0002491067250956704, "loss": 1.6584, "step": 10304 }, { "epoch": 0.81, "learning_rate": 0.0002490974470626984, "loss": 1.5902, "step": 10305 }, { "epoch": 0.81, "learning_rate": 0.0002490881683569093, "loss": 1.5894, "step": 10306 }, { "epoch": 0.81, "learning_rate": 0.0002490788889783663, "loss": 1.6923, "step": 10307 }, { "epoch": 0.81, "learning_rate": 0.00024906960892713233, "loss": 1.6321, "step": 10308 }, { "epoch": 0.81, "learning_rate": 0.00024906032820327034, "loss": 1.6504, "step": 10309 }, { "epoch": 0.81, "learning_rate": 0.0002490510468068435, "loss": 1.6041, "step": 10310 }, { "epoch": 0.81, "learning_rate": 0.00024904176473791457, "loss": 1.5962, "step": 10311 }, { "epoch": 0.81, "learning_rate": 0.0002490324819965468, "loss": 1.633, "step": 10312 }, { "epoch": 0.81, "learning_rate": 0.0002490231985828031, "loss": 1.684, "step": 10313 }, { "epoch": 0.81, "learning_rate": 0.0002490139144967465, "loss": 1.6404, "step": 10314 }, { "epoch": 0.81, "learning_rate": 0.0002490046297384401, "loss": 1.5674, "step": 10315 }, { "epoch": 0.81, "learning_rate": 0.0002489953443079469, "loss": 1.6638, "step": 10316 }, { "epoch": 0.81, "learning_rate": 0.0002489860582053299, "loss": 1.6151, "step": 10317 }, { "epoch": 0.81, "learning_rate": 0.00024897677143065225, "loss": 1.5942, "step": 10318 }, { "epoch": 0.81, "learning_rate": 0.0002489674839839769, "loss": 1.6343, "step": 10319 }, { "epoch": 0.81, "learning_rate": 0.00024895819586536697, "loss": 1.6573, "step": 10320 }, { "epoch": 0.81, "learning_rate": 0.0002489489070748855, "loss": 1.6239, "step": 10321 }, { "epoch": 0.81, "learning_rate": 0.00024893961761259556, "loss": 1.6005, "step": 10322 }, { "epoch": 0.81, "learning_rate": 0.0002489303274785602, "loss": 1.5907, "step": 10323 }, { "epoch": 0.81, "learning_rate": 0.00024892103667284254, "loss": 1.6033, "step": 10324 }, { "epoch": 0.81, "learning_rate": 0.00024891174519550555, "loss": 1.5833, "step": 10325 }, { "epoch": 0.81, "learning_rate": 0.00024890245304661244, "loss": 1.5881, "step": 10326 }, { "epoch": 0.81, "learning_rate": 0.00024889316022622625, "loss": 1.6523, "step": 10327 }, { "epoch": 0.81, "learning_rate": 0.0002488838667344101, "loss": 1.6488, "step": 10328 }, { "epoch": 0.81, "learning_rate": 0.0002488745725712271, "loss": 1.6693, "step": 10329 }, { "epoch": 0.81, "learning_rate": 0.0002488652777367402, "loss": 1.6297, "step": 10330 }, { "epoch": 0.81, "learning_rate": 0.0002488559822310127, "loss": 1.61, "step": 10331 }, { "epoch": 0.81, "learning_rate": 0.00024884668605410767, "loss": 1.609, "step": 10332 }, { "epoch": 0.81, "learning_rate": 0.0002488373892060881, "loss": 1.5955, "step": 10333 }, { "epoch": 0.81, "learning_rate": 0.00024882809168701723, "loss": 1.5537, "step": 10334 }, { "epoch": 0.81, "learning_rate": 0.00024881879349695823, "loss": 1.6213, "step": 10335 }, { "epoch": 0.81, "learning_rate": 0.00024880949463597406, "loss": 1.5846, "step": 10336 }, { "epoch": 0.81, "learning_rate": 0.000248800195104128, "loss": 1.6184, "step": 10337 }, { "epoch": 0.81, "learning_rate": 0.0002487908949014831, "loss": 1.6538, "step": 10338 }, { "epoch": 0.81, "learning_rate": 0.00024878159402810253, "loss": 1.5953, "step": 10339 }, { "epoch": 0.81, "learning_rate": 0.0002487722924840495, "loss": 1.6489, "step": 10340 }, { "epoch": 0.81, "learning_rate": 0.0002487629902693871, "loss": 1.6203, "step": 10341 }, { "epoch": 0.81, "learning_rate": 0.0002487536873841785, "loss": 1.6155, "step": 10342 }, { "epoch": 0.81, "learning_rate": 0.0002487443838284868, "loss": 1.6888, "step": 10343 }, { "epoch": 0.81, "learning_rate": 0.0002487350796023753, "loss": 1.6329, "step": 10344 }, { "epoch": 0.81, "learning_rate": 0.0002487257747059071, "loss": 1.6105, "step": 10345 }, { "epoch": 0.81, "learning_rate": 0.0002487164691391453, "loss": 1.6389, "step": 10346 }, { "epoch": 0.81, "learning_rate": 0.00024870716290215317, "loss": 1.6382, "step": 10347 }, { "epoch": 0.81, "learning_rate": 0.0002486978559949939, "loss": 1.6708, "step": 10348 }, { "epoch": 0.81, "learning_rate": 0.00024868854841773066, "loss": 1.6504, "step": 10349 }, { "epoch": 0.81, "learning_rate": 0.00024867924017042665, "loss": 1.6178, "step": 10350 }, { "epoch": 0.81, "learning_rate": 0.00024866993125314505, "loss": 1.6635, "step": 10351 }, { "epoch": 0.81, "learning_rate": 0.000248660621665949, "loss": 1.6435, "step": 10352 }, { "epoch": 0.81, "learning_rate": 0.00024865131140890183, "loss": 1.6513, "step": 10353 }, { "epoch": 0.81, "learning_rate": 0.0002486420004820667, "loss": 1.6711, "step": 10354 }, { "epoch": 0.81, "learning_rate": 0.00024863268888550684, "loss": 1.6316, "step": 10355 }, { "epoch": 0.81, "learning_rate": 0.00024862337661928535, "loss": 1.5965, "step": 10356 }, { "epoch": 0.81, "learning_rate": 0.00024861406368346565, "loss": 1.5897, "step": 10357 }, { "epoch": 0.81, "learning_rate": 0.0002486047500781109, "loss": 1.6115, "step": 10358 }, { "epoch": 0.82, "learning_rate": 0.00024859543580328425, "loss": 1.6249, "step": 10359 }, { "epoch": 0.82, "learning_rate": 0.00024858612085904903, "loss": 1.6275, "step": 10360 }, { "epoch": 0.82, "learning_rate": 0.0002485768052454684, "loss": 1.6167, "step": 10361 }, { "epoch": 0.82, "learning_rate": 0.0002485674889626057, "loss": 1.6526, "step": 10362 }, { "epoch": 0.82, "learning_rate": 0.00024855817201052417, "loss": 1.6357, "step": 10363 }, { "epoch": 0.82, "learning_rate": 0.00024854885438928704, "loss": 1.6354, "step": 10364 }, { "epoch": 0.82, "learning_rate": 0.00024853953609895753, "loss": 1.6685, "step": 10365 }, { "epoch": 0.82, "learning_rate": 0.000248530217139599, "loss": 1.5874, "step": 10366 }, { "epoch": 0.82, "learning_rate": 0.0002485208975112746, "loss": 1.6174, "step": 10367 }, { "epoch": 0.82, "learning_rate": 0.00024851157721404775, "loss": 1.6466, "step": 10368 }, { "epoch": 0.82, "learning_rate": 0.0002485022562479816, "loss": 1.6589, "step": 10369 }, { "epoch": 0.82, "learning_rate": 0.0002484929346131395, "loss": 1.6488, "step": 10370 }, { "epoch": 0.82, "learning_rate": 0.00024848361230958473, "loss": 1.6246, "step": 10371 }, { "epoch": 0.82, "learning_rate": 0.0002484742893373806, "loss": 1.6233, "step": 10372 }, { "epoch": 0.82, "learning_rate": 0.0002484649656965904, "loss": 1.6057, "step": 10373 }, { "epoch": 0.82, "learning_rate": 0.0002484556413872774, "loss": 1.6329, "step": 10374 }, { "epoch": 0.82, "learning_rate": 0.0002484463164095049, "loss": 1.6548, "step": 10375 }, { "epoch": 0.82, "learning_rate": 0.0002484369907633362, "loss": 1.561, "step": 10376 }, { "epoch": 0.82, "learning_rate": 0.0002484276644488347, "loss": 1.6881, "step": 10377 }, { "epoch": 0.82, "learning_rate": 0.00024841833746606375, "loss": 1.6296, "step": 10378 }, { "epoch": 0.82, "learning_rate": 0.0002484090098150865, "loss": 1.6959, "step": 10379 }, { "epoch": 0.82, "learning_rate": 0.00024839968149596643, "loss": 1.5989, "step": 10380 }, { "epoch": 0.82, "learning_rate": 0.00024839035250876683, "loss": 1.6362, "step": 10381 }, { "epoch": 0.82, "learning_rate": 0.000248381022853551, "loss": 1.5572, "step": 10382 }, { "epoch": 0.82, "learning_rate": 0.0002483716925303824, "loss": 1.6238, "step": 10383 }, { "epoch": 0.82, "learning_rate": 0.00024836236153932416, "loss": 1.6682, "step": 10384 }, { "epoch": 0.82, "learning_rate": 0.0002483530298804398, "loss": 1.6107, "step": 10385 }, { "epoch": 0.82, "learning_rate": 0.0002483436975537927, "loss": 1.6678, "step": 10386 }, { "epoch": 0.82, "learning_rate": 0.0002483343645594461, "loss": 1.6359, "step": 10387 }, { "epoch": 0.82, "learning_rate": 0.0002483250308974635, "loss": 1.6547, "step": 10388 }, { "epoch": 0.82, "learning_rate": 0.0002483156965679082, "loss": 1.6564, "step": 10389 }, { "epoch": 0.82, "learning_rate": 0.00024830636157084353, "loss": 1.6306, "step": 10390 }, { "epoch": 0.82, "learning_rate": 0.00024829702590633293, "loss": 1.5826, "step": 10391 }, { "epoch": 0.82, "learning_rate": 0.0002482876895744398, "loss": 1.6388, "step": 10392 }, { "epoch": 0.82, "learning_rate": 0.0002482783525752274, "loss": 1.6416, "step": 10393 }, { "epoch": 0.82, "learning_rate": 0.0002482690149087593, "loss": 1.5643, "step": 10394 }, { "epoch": 0.82, "learning_rate": 0.0002482596765750988, "loss": 1.621, "step": 10395 }, { "epoch": 0.82, "learning_rate": 0.0002482503375743093, "loss": 1.6226, "step": 10396 }, { "epoch": 0.82, "learning_rate": 0.0002482409979064543, "loss": 1.6402, "step": 10397 }, { "epoch": 0.82, "learning_rate": 0.00024823165757159707, "loss": 1.6264, "step": 10398 }, { "epoch": 0.82, "learning_rate": 0.0002482223165698011, "loss": 1.6129, "step": 10399 }, { "epoch": 0.82, "learning_rate": 0.00024821297490112986, "loss": 1.6707, "step": 10400 }, { "epoch": 0.82, "learning_rate": 0.00024820363256564663, "loss": 1.5628, "step": 10401 }, { "epoch": 0.82, "learning_rate": 0.00024819428956341494, "loss": 1.6365, "step": 10402 }, { "epoch": 0.82, "learning_rate": 0.0002481849458944983, "loss": 1.6021, "step": 10403 }, { "epoch": 0.82, "learning_rate": 0.00024817560155896, "loss": 1.6001, "step": 10404 }, { "epoch": 0.82, "learning_rate": 0.00024816625655686356, "loss": 1.5812, "step": 10405 }, { "epoch": 0.82, "learning_rate": 0.0002481569108882724, "loss": 1.6191, "step": 10406 }, { "epoch": 0.82, "learning_rate": 0.00024814756455324995, "loss": 1.62, "step": 10407 }, { "epoch": 0.82, "learning_rate": 0.00024813821755185973, "loss": 1.6198, "step": 10408 }, { "epoch": 0.82, "learning_rate": 0.0002481288698841652, "loss": 1.6742, "step": 10409 }, { "epoch": 0.82, "learning_rate": 0.00024811952155022975, "loss": 1.5715, "step": 10410 }, { "epoch": 0.82, "learning_rate": 0.00024811017255011694, "loss": 1.6134, "step": 10411 }, { "epoch": 0.82, "learning_rate": 0.0002481008228838901, "loss": 1.6122, "step": 10412 }, { "epoch": 0.82, "learning_rate": 0.00024809147255161295, "loss": 1.6376, "step": 10413 }, { "epoch": 0.82, "learning_rate": 0.00024808212155334877, "loss": 1.6379, "step": 10414 }, { "epoch": 0.82, "learning_rate": 0.00024807276988916106, "loss": 1.6737, "step": 10415 }, { "epoch": 0.82, "learning_rate": 0.0002480634175591134, "loss": 1.604, "step": 10416 }, { "epoch": 0.82, "learning_rate": 0.0002480540645632693, "loss": 1.666, "step": 10417 }, { "epoch": 0.82, "learning_rate": 0.00024804471090169217, "loss": 1.6892, "step": 10418 }, { "epoch": 0.82, "learning_rate": 0.00024803535657444555, "loss": 1.6135, "step": 10419 }, { "epoch": 0.82, "learning_rate": 0.00024802600158159297, "loss": 1.6464, "step": 10420 }, { "epoch": 0.82, "learning_rate": 0.00024801664592319795, "loss": 1.5874, "step": 10421 }, { "epoch": 0.82, "learning_rate": 0.0002480072895993239, "loss": 1.632, "step": 10422 }, { "epoch": 0.82, "learning_rate": 0.00024799793261003457, "loss": 1.5667, "step": 10423 }, { "epoch": 0.82, "learning_rate": 0.0002479885749553933, "loss": 1.6417, "step": 10424 }, { "epoch": 0.82, "learning_rate": 0.0002479792166354637, "loss": 1.704, "step": 10425 }, { "epoch": 0.82, "learning_rate": 0.0002479698576503093, "loss": 1.6589, "step": 10426 }, { "epoch": 0.82, "learning_rate": 0.00024796049799999354, "loss": 1.6197, "step": 10427 }, { "epoch": 0.82, "learning_rate": 0.00024795113768458015, "loss": 1.6582, "step": 10428 }, { "epoch": 0.82, "learning_rate": 0.00024794177670413255, "loss": 1.5955, "step": 10429 }, { "epoch": 0.82, "learning_rate": 0.00024793241505871436, "loss": 1.656, "step": 10430 }, { "epoch": 0.82, "learning_rate": 0.0002479230527483891, "loss": 1.602, "step": 10431 }, { "epoch": 0.82, "learning_rate": 0.00024791368977322036, "loss": 1.6424, "step": 10432 }, { "epoch": 0.82, "learning_rate": 0.00024790432613327166, "loss": 1.6084, "step": 10433 }, { "epoch": 0.82, "learning_rate": 0.00024789496182860664, "loss": 1.6183, "step": 10434 }, { "epoch": 0.82, "learning_rate": 0.00024788559685928887, "loss": 1.6459, "step": 10435 }, { "epoch": 0.82, "learning_rate": 0.0002478762312253819, "loss": 1.5827, "step": 10436 }, { "epoch": 0.82, "learning_rate": 0.00024786686492694936, "loss": 1.6309, "step": 10437 }, { "epoch": 0.82, "learning_rate": 0.00024785749796405474, "loss": 1.6323, "step": 10438 }, { "epoch": 0.82, "learning_rate": 0.0002478481303367618, "loss": 1.6207, "step": 10439 }, { "epoch": 0.82, "learning_rate": 0.000247838762045134, "loss": 1.6147, "step": 10440 }, { "epoch": 0.82, "learning_rate": 0.00024782939308923497, "loss": 1.5662, "step": 10441 }, { "epoch": 0.82, "learning_rate": 0.00024782002346912844, "loss": 1.6108, "step": 10442 }, { "epoch": 0.82, "learning_rate": 0.0002478106531848778, "loss": 1.5805, "step": 10443 }, { "epoch": 0.82, "learning_rate": 0.0002478012822365469, "loss": 1.6186, "step": 10444 }, { "epoch": 0.82, "learning_rate": 0.0002477919106241993, "loss": 1.626, "step": 10445 }, { "epoch": 0.82, "learning_rate": 0.00024778253834789853, "loss": 1.6657, "step": 10446 }, { "epoch": 0.82, "learning_rate": 0.00024777316540770827, "loss": 1.6604, "step": 10447 }, { "epoch": 0.82, "learning_rate": 0.0002477637918036922, "loss": 1.6212, "step": 10448 }, { "epoch": 0.82, "learning_rate": 0.0002477544175359139, "loss": 1.6588, "step": 10449 }, { "epoch": 0.82, "learning_rate": 0.00024774504260443713, "loss": 1.599, "step": 10450 }, { "epoch": 0.82, "learning_rate": 0.0002477356670093254, "loss": 1.6432, "step": 10451 }, { "epoch": 0.82, "learning_rate": 0.0002477262907506424, "loss": 1.5343, "step": 10452 }, { "epoch": 0.82, "learning_rate": 0.0002477169138284519, "loss": 1.6062, "step": 10453 }, { "epoch": 0.82, "learning_rate": 0.0002477075362428174, "loss": 1.6556, "step": 10454 }, { "epoch": 0.82, "learning_rate": 0.0002476981579938027, "loss": 1.5922, "step": 10455 }, { "epoch": 0.82, "learning_rate": 0.0002476887790814714, "loss": 1.6326, "step": 10456 }, { "epoch": 0.82, "learning_rate": 0.0002476793995058872, "loss": 1.623, "step": 10457 }, { "epoch": 0.82, "learning_rate": 0.0002476700192671138, "loss": 1.6714, "step": 10458 }, { "epoch": 0.82, "learning_rate": 0.0002476606383652148, "loss": 1.6145, "step": 10459 }, { "epoch": 0.82, "learning_rate": 0.00024765125680025407, "loss": 1.6241, "step": 10460 }, { "epoch": 0.82, "learning_rate": 0.0002476418745722951, "loss": 1.6531, "step": 10461 }, { "epoch": 0.82, "learning_rate": 0.0002476324916814017, "loss": 1.5746, "step": 10462 }, { "epoch": 0.82, "learning_rate": 0.0002476231081276376, "loss": 1.7025, "step": 10463 }, { "epoch": 0.82, "learning_rate": 0.00024761372391106644, "loss": 1.5585, "step": 10464 }, { "epoch": 0.82, "learning_rate": 0.000247604339031752, "loss": 1.6161, "step": 10465 }, { "epoch": 0.82, "learning_rate": 0.0002475949534897579, "loss": 1.6408, "step": 10466 }, { "epoch": 0.82, "learning_rate": 0.000247585567285148, "loss": 1.6947, "step": 10467 }, { "epoch": 0.82, "learning_rate": 0.0002475761804179859, "loss": 1.6043, "step": 10468 }, { "epoch": 0.82, "learning_rate": 0.00024756679288833535, "loss": 1.6242, "step": 10469 }, { "epoch": 0.82, "learning_rate": 0.0002475574046962602, "loss": 1.6444, "step": 10470 }, { "epoch": 0.82, "learning_rate": 0.000247548015841824, "loss": 1.6158, "step": 10471 }, { "epoch": 0.82, "learning_rate": 0.0002475386263250907, "loss": 1.6472, "step": 10472 }, { "epoch": 0.82, "learning_rate": 0.0002475292361461239, "loss": 1.6665, "step": 10473 }, { "epoch": 0.82, "learning_rate": 0.00024751984530498744, "loss": 1.6441, "step": 10474 }, { "epoch": 0.82, "learning_rate": 0.00024751045380174504, "loss": 1.5899, "step": 10475 }, { "epoch": 0.82, "learning_rate": 0.00024750106163646044, "loss": 1.5887, "step": 10476 }, { "epoch": 0.82, "learning_rate": 0.00024749166880919744, "loss": 1.6362, "step": 10477 }, { "epoch": 0.82, "learning_rate": 0.00024748227532001986, "loss": 1.5889, "step": 10478 }, { "epoch": 0.82, "learning_rate": 0.0002474728811689914, "loss": 1.586, "step": 10479 }, { "epoch": 0.82, "learning_rate": 0.00024746348635617583, "loss": 1.615, "step": 10480 }, { "epoch": 0.82, "learning_rate": 0.000247454090881637, "loss": 1.6085, "step": 10481 }, { "epoch": 0.82, "learning_rate": 0.00024744469474543873, "loss": 1.6911, "step": 10482 }, { "epoch": 0.82, "learning_rate": 0.0002474352979476447, "loss": 1.6556, "step": 10483 }, { "epoch": 0.82, "learning_rate": 0.00024742590048831874, "loss": 1.6309, "step": 10484 }, { "epoch": 0.82, "learning_rate": 0.0002474165023675247, "loss": 1.696, "step": 10485 }, { "epoch": 0.83, "learning_rate": 0.0002474071035853264, "loss": 1.6186, "step": 10486 }, { "epoch": 0.83, "learning_rate": 0.0002473977041417876, "loss": 1.6554, "step": 10487 }, { "epoch": 0.83, "learning_rate": 0.0002473883040369721, "loss": 1.571, "step": 10488 }, { "epoch": 0.83, "learning_rate": 0.0002473789032709438, "loss": 1.6298, "step": 10489 }, { "epoch": 0.83, "learning_rate": 0.0002473695018437665, "loss": 1.5881, "step": 10490 }, { "epoch": 0.83, "learning_rate": 0.000247360099755504, "loss": 1.6179, "step": 10491 }, { "epoch": 0.83, "learning_rate": 0.0002473506970062202, "loss": 1.6041, "step": 10492 }, { "epoch": 0.83, "learning_rate": 0.0002473412935959788, "loss": 1.641, "step": 10493 }, { "epoch": 0.83, "learning_rate": 0.00024733188952484375, "loss": 1.6003, "step": 10494 }, { "epoch": 0.83, "learning_rate": 0.0002473224847928789, "loss": 1.6533, "step": 10495 }, { "epoch": 0.83, "learning_rate": 0.00024731307940014806, "loss": 1.6206, "step": 10496 }, { "epoch": 0.83, "learning_rate": 0.0002473036733467152, "loss": 1.6211, "step": 10497 }, { "epoch": 0.83, "learning_rate": 0.000247294266632644, "loss": 1.6474, "step": 10498 }, { "epoch": 0.83, "learning_rate": 0.0002472848592579985, "loss": 1.6377, "step": 10499 }, { "epoch": 0.83, "learning_rate": 0.00024727545122284244, "loss": 1.6255, "step": 10500 }, { "epoch": 0.83, "learning_rate": 0.0002472660425272397, "loss": 1.5508, "step": 10501 }, { "epoch": 0.83, "learning_rate": 0.0002472566331712543, "loss": 1.6346, "step": 10502 }, { "epoch": 0.83, "learning_rate": 0.00024724722315494995, "loss": 1.5986, "step": 10503 }, { "epoch": 0.83, "learning_rate": 0.0002472378124783907, "loss": 1.5762, "step": 10504 }, { "epoch": 0.83, "learning_rate": 0.0002472284011416403, "loss": 1.5907, "step": 10505 }, { "epoch": 0.83, "learning_rate": 0.00024721898914476274, "loss": 1.5958, "step": 10506 }, { "epoch": 0.83, "learning_rate": 0.0002472095764878219, "loss": 1.6476, "step": 10507 }, { "epoch": 0.83, "learning_rate": 0.0002472001631708817, "loss": 1.6862, "step": 10508 }, { "epoch": 0.83, "learning_rate": 0.000247190749194006, "loss": 1.6772, "step": 10509 }, { "epoch": 0.83, "learning_rate": 0.00024718133455725876, "loss": 1.605, "step": 10510 }, { "epoch": 0.83, "learning_rate": 0.0002471719192607038, "loss": 1.6246, "step": 10511 }, { "epoch": 0.83, "learning_rate": 0.00024716250330440525, "loss": 1.6305, "step": 10512 }, { "epoch": 0.83, "learning_rate": 0.00024715308668842685, "loss": 1.6475, "step": 10513 }, { "epoch": 0.83, "learning_rate": 0.00024714366941283264, "loss": 1.5987, "step": 10514 }, { "epoch": 0.83, "learning_rate": 0.00024713425147768653, "loss": 1.6348, "step": 10515 }, { "epoch": 0.83, "learning_rate": 0.0002471248328830525, "loss": 1.6646, "step": 10516 }, { "epoch": 0.83, "learning_rate": 0.00024711541362899435, "loss": 1.6414, "step": 10517 }, { "epoch": 0.83, "learning_rate": 0.0002471059937155762, "loss": 1.6121, "step": 10518 }, { "epoch": 0.83, "learning_rate": 0.00024709657314286187, "loss": 1.6139, "step": 10519 }, { "epoch": 0.83, "learning_rate": 0.0002470871519109155, "loss": 1.6175, "step": 10520 }, { "epoch": 0.83, "learning_rate": 0.00024707773001980086, "loss": 1.6037, "step": 10521 }, { "epoch": 0.83, "learning_rate": 0.00024706830746958205, "loss": 1.631, "step": 10522 }, { "epoch": 0.83, "learning_rate": 0.000247058884260323, "loss": 1.5745, "step": 10523 }, { "epoch": 0.83, "learning_rate": 0.0002470494603920877, "loss": 1.6489, "step": 10524 }, { "epoch": 0.83, "learning_rate": 0.00024704003586494005, "loss": 1.6287, "step": 10525 }, { "epoch": 0.83, "learning_rate": 0.00024703061067894407, "loss": 1.6327, "step": 10526 }, { "epoch": 0.83, "learning_rate": 0.0002470211848341639, "loss": 1.5643, "step": 10527 }, { "epoch": 0.83, "learning_rate": 0.0002470117583306634, "loss": 1.6344, "step": 10528 }, { "epoch": 0.83, "learning_rate": 0.00024700233116850664, "loss": 1.6104, "step": 10529 }, { "epoch": 0.83, "learning_rate": 0.0002469929033477575, "loss": 1.5754, "step": 10530 }, { "epoch": 0.83, "learning_rate": 0.00024698347486848014, "loss": 1.6104, "step": 10531 }, { "epoch": 0.83, "learning_rate": 0.00024697404573073843, "loss": 1.6257, "step": 10532 }, { "epoch": 0.83, "learning_rate": 0.00024696461593459653, "loss": 1.6036, "step": 10533 }, { "epoch": 0.83, "learning_rate": 0.00024695518548011833, "loss": 1.5932, "step": 10534 }, { "epoch": 0.83, "learning_rate": 0.000246945754367368, "loss": 1.6235, "step": 10535 }, { "epoch": 0.83, "learning_rate": 0.0002469363225964094, "loss": 1.6138, "step": 10536 }, { "epoch": 0.83, "learning_rate": 0.00024692689016730674, "loss": 1.6864, "step": 10537 }, { "epoch": 0.83, "learning_rate": 0.00024691745708012395, "loss": 1.615, "step": 10538 }, { "epoch": 0.83, "learning_rate": 0.0002469080233349252, "loss": 1.5858, "step": 10539 }, { "epoch": 0.83, "learning_rate": 0.00024689858893177434, "loss": 1.6444, "step": 10540 }, { "epoch": 0.83, "learning_rate": 0.00024688915387073557, "loss": 1.6261, "step": 10541 }, { "epoch": 0.83, "learning_rate": 0.0002468797181518729, "loss": 1.612, "step": 10542 }, { "epoch": 0.83, "learning_rate": 0.00024687028177525043, "loss": 1.5781, "step": 10543 }, { "epoch": 0.83, "learning_rate": 0.0002468608447409322, "loss": 1.6224, "step": 10544 }, { "epoch": 0.83, "learning_rate": 0.0002468514070489823, "loss": 1.6185, "step": 10545 }, { "epoch": 0.83, "learning_rate": 0.00024684196869946475, "loss": 1.5924, "step": 10546 }, { "epoch": 0.83, "learning_rate": 0.0002468325296924437, "loss": 1.6439, "step": 10547 }, { "epoch": 0.83, "learning_rate": 0.00024682309002798324, "loss": 1.6115, "step": 10548 }, { "epoch": 0.83, "learning_rate": 0.0002468136497061474, "loss": 1.6478, "step": 10549 }, { "epoch": 0.83, "learning_rate": 0.0002468042087270003, "loss": 1.6429, "step": 10550 }, { "epoch": 0.83, "learning_rate": 0.00024679476709060604, "loss": 1.6017, "step": 10551 }, { "epoch": 0.83, "learning_rate": 0.0002467853247970287, "loss": 1.5684, "step": 10552 }, { "epoch": 0.83, "learning_rate": 0.0002467758818463325, "loss": 1.6515, "step": 10553 }, { "epoch": 0.83, "learning_rate": 0.00024676643823858137, "loss": 1.6213, "step": 10554 }, { "epoch": 0.83, "learning_rate": 0.0002467569939738396, "loss": 1.6192, "step": 10555 }, { "epoch": 0.83, "learning_rate": 0.0002467475490521712, "loss": 1.5982, "step": 10556 }, { "epoch": 0.83, "learning_rate": 0.00024673810347364034, "loss": 1.6295, "step": 10557 }, { "epoch": 0.83, "learning_rate": 0.0002467286572383111, "loss": 1.6645, "step": 10558 }, { "epoch": 0.83, "learning_rate": 0.00024671921034624775, "loss": 1.6792, "step": 10559 }, { "epoch": 0.83, "learning_rate": 0.00024670976279751424, "loss": 1.6391, "step": 10560 }, { "epoch": 0.83, "learning_rate": 0.0002467003145921749, "loss": 1.6445, "step": 10561 }, { "epoch": 0.83, "learning_rate": 0.00024669086573029375, "loss": 1.5876, "step": 10562 }, { "epoch": 0.83, "learning_rate": 0.000246681416211935, "loss": 1.6571, "step": 10563 }, { "epoch": 0.83, "learning_rate": 0.0002466719660371627, "loss": 1.6069, "step": 10564 }, { "epoch": 0.83, "learning_rate": 0.0002466625152060412, "loss": 1.6412, "step": 10565 }, { "epoch": 0.83, "learning_rate": 0.00024665306371863453, "loss": 1.5863, "step": 10566 }, { "epoch": 0.83, "learning_rate": 0.00024664361157500684, "loss": 1.6378, "step": 10567 }, { "epoch": 0.83, "learning_rate": 0.00024663415877522243, "loss": 1.6003, "step": 10568 }, { "epoch": 0.83, "learning_rate": 0.0002466247053193454, "loss": 1.6358, "step": 10569 }, { "epoch": 0.83, "learning_rate": 0.00024661525120743994, "loss": 1.5882, "step": 10570 }, { "epoch": 0.83, "learning_rate": 0.00024660579643957017, "loss": 1.6512, "step": 10571 }, { "epoch": 0.83, "learning_rate": 0.0002465963410158004, "loss": 1.5953, "step": 10572 }, { "epoch": 0.83, "learning_rate": 0.0002465868849361948, "loss": 1.5958, "step": 10573 }, { "epoch": 0.83, "learning_rate": 0.00024657742820081757, "loss": 1.643, "step": 10574 }, { "epoch": 0.83, "learning_rate": 0.0002465679708097329, "loss": 1.622, "step": 10575 }, { "epoch": 0.83, "learning_rate": 0.000246558512763005, "loss": 1.5472, "step": 10576 }, { "epoch": 0.83, "learning_rate": 0.00024654905406069807, "loss": 1.615, "step": 10577 }, { "epoch": 0.83, "learning_rate": 0.0002465395947028763, "loss": 1.562, "step": 10578 }, { "epoch": 0.83, "learning_rate": 0.000246530134689604, "loss": 1.6205, "step": 10579 }, { "epoch": 0.83, "learning_rate": 0.0002465206740209453, "loss": 1.6268, "step": 10580 }, { "epoch": 0.83, "learning_rate": 0.0002465112126969645, "loss": 1.62, "step": 10581 }, { "epoch": 0.83, "learning_rate": 0.0002465017507177259, "loss": 1.6576, "step": 10582 }, { "epoch": 0.83, "learning_rate": 0.00024649228808329367, "loss": 1.62, "step": 10583 }, { "epoch": 0.83, "learning_rate": 0.0002464828247937319, "loss": 1.6337, "step": 10584 }, { "epoch": 0.83, "learning_rate": 0.00024647336084910514, "loss": 1.6303, "step": 10585 }, { "epoch": 0.83, "learning_rate": 0.00024646389624947745, "loss": 1.5828, "step": 10586 }, { "epoch": 0.83, "learning_rate": 0.0002464544309949132, "loss": 1.6597, "step": 10587 }, { "epoch": 0.83, "learning_rate": 0.0002464449650854765, "loss": 1.6094, "step": 10588 }, { "epoch": 0.83, "learning_rate": 0.00024643549852123176, "loss": 1.5932, "step": 10589 }, { "epoch": 0.83, "learning_rate": 0.0002464260313022432, "loss": 1.5889, "step": 10590 }, { "epoch": 0.83, "learning_rate": 0.00024641656342857507, "loss": 1.6032, "step": 10591 }, { "epoch": 0.83, "learning_rate": 0.0002464070949002917, "loss": 1.6832, "step": 10592 }, { "epoch": 0.83, "learning_rate": 0.0002463976257174574, "loss": 1.6094, "step": 10593 }, { "epoch": 0.83, "learning_rate": 0.0002463881558801363, "loss": 1.642, "step": 10594 }, { "epoch": 0.83, "learning_rate": 0.0002463786853883929, "loss": 1.6202, "step": 10595 }, { "epoch": 0.83, "learning_rate": 0.0002463692142422914, "loss": 1.6453, "step": 10596 }, { "epoch": 0.83, "learning_rate": 0.00024635974244189613, "loss": 1.6056, "step": 10597 }, { "epoch": 0.83, "learning_rate": 0.00024635026998727136, "loss": 1.6014, "step": 10598 }, { "epoch": 0.83, "learning_rate": 0.00024634079687848144, "loss": 1.5702, "step": 10599 }, { "epoch": 0.83, "learning_rate": 0.0002463313231155907, "loss": 1.5687, "step": 10600 }, { "epoch": 0.83, "learning_rate": 0.0002463218486986634, "loss": 1.6229, "step": 10601 }, { "epoch": 0.83, "learning_rate": 0.0002463123736277639, "loss": 1.611, "step": 10602 }, { "epoch": 0.83, "learning_rate": 0.0002463028979029566, "loss": 1.6946, "step": 10603 }, { "epoch": 0.83, "learning_rate": 0.00024629342152430566, "loss": 1.6511, "step": 10604 }, { "epoch": 0.83, "learning_rate": 0.0002462839444918756, "loss": 1.6539, "step": 10605 }, { "epoch": 0.83, "learning_rate": 0.0002462744668057306, "loss": 1.6213, "step": 10606 }, { "epoch": 0.83, "learning_rate": 0.00024626498846593524, "loss": 1.6162, "step": 10607 }, { "epoch": 0.83, "learning_rate": 0.00024625550947255363, "loss": 1.6472, "step": 10608 }, { "epoch": 0.83, "learning_rate": 0.00024624602982565024, "loss": 1.6182, "step": 10609 }, { "epoch": 0.83, "learning_rate": 0.00024623654952528947, "loss": 1.6376, "step": 10610 }, { "epoch": 0.83, "learning_rate": 0.0002462270685715356, "loss": 1.6051, "step": 10611 }, { "epoch": 0.83, "learning_rate": 0.0002462175869644531, "loss": 1.6109, "step": 10612 }, { "epoch": 0.84, "learning_rate": 0.00024620810470410616, "loss": 1.6034, "step": 10613 }, { "epoch": 0.84, "learning_rate": 0.00024619862179055935, "loss": 1.5749, "step": 10614 }, { "epoch": 0.84, "learning_rate": 0.00024618913822387696, "loss": 1.6334, "step": 10615 }, { "epoch": 0.84, "learning_rate": 0.00024617965400412344, "loss": 1.6357, "step": 10616 }, { "epoch": 0.84, "learning_rate": 0.00024617016913136314, "loss": 1.5843, "step": 10617 }, { "epoch": 0.84, "learning_rate": 0.00024616068360566046, "loss": 1.5852, "step": 10618 }, { "epoch": 0.84, "learning_rate": 0.0002461511974270798, "loss": 1.6438, "step": 10619 }, { "epoch": 0.84, "learning_rate": 0.00024614171059568555, "loss": 1.6329, "step": 10620 }, { "epoch": 0.84, "learning_rate": 0.00024613222311154213, "loss": 1.6375, "step": 10621 }, { "epoch": 0.84, "learning_rate": 0.000246122734974714, "loss": 1.6241, "step": 10622 }, { "epoch": 0.84, "learning_rate": 0.00024611324618526554, "loss": 1.6383, "step": 10623 }, { "epoch": 0.84, "learning_rate": 0.0002461037567432612, "loss": 1.619, "step": 10624 }, { "epoch": 0.84, "learning_rate": 0.00024609426664876533, "loss": 1.6096, "step": 10625 }, { "epoch": 0.84, "learning_rate": 0.00024608477590184243, "loss": 1.603, "step": 10626 }, { "epoch": 0.84, "learning_rate": 0.000246075284502557, "loss": 1.6982, "step": 10627 }, { "epoch": 0.84, "learning_rate": 0.0002460657924509733, "loss": 1.6756, "step": 10628 }, { "epoch": 0.84, "learning_rate": 0.00024605629974715595, "loss": 1.6809, "step": 10629 }, { "epoch": 0.84, "learning_rate": 0.0002460468063911693, "loss": 1.6082, "step": 10630 }, { "epoch": 0.84, "learning_rate": 0.00024603731238307785, "loss": 1.6366, "step": 10631 }, { "epoch": 0.84, "learning_rate": 0.00024602781772294606, "loss": 1.6115, "step": 10632 }, { "epoch": 0.84, "learning_rate": 0.0002460183224108384, "loss": 1.6051, "step": 10633 }, { "epoch": 0.84, "learning_rate": 0.00024600882644681927, "loss": 1.6337, "step": 10634 }, { "epoch": 0.84, "learning_rate": 0.0002459993298309532, "loss": 1.6, "step": 10635 }, { "epoch": 0.84, "learning_rate": 0.0002459898325633047, "loss": 1.6575, "step": 10636 }, { "epoch": 0.84, "learning_rate": 0.0002459803346439382, "loss": 1.5803, "step": 10637 }, { "epoch": 0.84, "learning_rate": 0.0002459708360729181, "loss": 1.5759, "step": 10638 }, { "epoch": 0.84, "learning_rate": 0.00024596133685030904, "loss": 1.5602, "step": 10639 }, { "epoch": 0.84, "learning_rate": 0.0002459518369761755, "loss": 1.6136, "step": 10640 }, { "epoch": 0.84, "learning_rate": 0.00024594233645058194, "loss": 1.6296, "step": 10641 }, { "epoch": 0.84, "learning_rate": 0.00024593283527359283, "loss": 1.6157, "step": 10642 }, { "epoch": 0.84, "learning_rate": 0.0002459233334452727, "loss": 1.6435, "step": 10643 }, { "epoch": 0.84, "learning_rate": 0.0002459138309656861, "loss": 1.696, "step": 10644 }, { "epoch": 0.84, "learning_rate": 0.0002459043278348975, "loss": 1.621, "step": 10645 }, { "epoch": 0.84, "learning_rate": 0.0002458948240529714, "loss": 1.6032, "step": 10646 }, { "epoch": 0.84, "learning_rate": 0.0002458853196199724, "loss": 1.652, "step": 10647 }, { "epoch": 0.84, "learning_rate": 0.000245875814535965, "loss": 1.6174, "step": 10648 }, { "epoch": 0.84, "learning_rate": 0.0002458663088010137, "loss": 1.6717, "step": 10649 }, { "epoch": 0.84, "learning_rate": 0.0002458568024151831, "loss": 1.608, "step": 10650 }, { "epoch": 0.84, "learning_rate": 0.0002458472953785377, "loss": 1.6119, "step": 10651 }, { "epoch": 0.84, "learning_rate": 0.000245837787691142, "loss": 1.6885, "step": 10652 }, { "epoch": 0.84, "learning_rate": 0.0002458282793530607, "loss": 1.5951, "step": 10653 }, { "epoch": 0.84, "learning_rate": 0.00024581877036435827, "loss": 1.626, "step": 10654 }, { "epoch": 0.84, "learning_rate": 0.00024580926072509916, "loss": 1.6319, "step": 10655 }, { "epoch": 0.84, "learning_rate": 0.00024579975043534814, "loss": 1.6293, "step": 10656 }, { "epoch": 0.84, "learning_rate": 0.00024579023949516964, "loss": 1.6328, "step": 10657 }, { "epoch": 0.84, "learning_rate": 0.0002457807279046283, "loss": 1.6206, "step": 10658 }, { "epoch": 0.84, "learning_rate": 0.0002457712156637887, "loss": 1.6346, "step": 10659 }, { "epoch": 0.84, "learning_rate": 0.00024576170277271534, "loss": 1.6369, "step": 10660 }, { "epoch": 0.84, "learning_rate": 0.00024575218923147285, "loss": 1.6512, "step": 10661 }, { "epoch": 0.84, "learning_rate": 0.00024574267504012587, "loss": 1.5709, "step": 10662 }, { "epoch": 0.84, "learning_rate": 0.00024573316019873897, "loss": 1.6029, "step": 10663 }, { "epoch": 0.84, "learning_rate": 0.0002457236447073767, "loss": 1.6144, "step": 10664 }, { "epoch": 0.84, "learning_rate": 0.00024571412856610374, "loss": 1.5998, "step": 10665 }, { "epoch": 0.84, "learning_rate": 0.00024570461177498464, "loss": 1.6662, "step": 10666 }, { "epoch": 0.84, "learning_rate": 0.0002456950943340841, "loss": 1.6148, "step": 10667 }, { "epoch": 0.84, "learning_rate": 0.0002456855762434666, "loss": 1.6033, "step": 10668 }, { "epoch": 0.84, "learning_rate": 0.00024567605750319693, "loss": 1.6293, "step": 10669 }, { "epoch": 0.84, "learning_rate": 0.00024566653811333955, "loss": 1.6092, "step": 10670 }, { "epoch": 0.84, "learning_rate": 0.0002456570180739592, "loss": 1.5749, "step": 10671 }, { "epoch": 0.84, "learning_rate": 0.0002456474973851205, "loss": 1.632, "step": 10672 }, { "epoch": 0.84, "learning_rate": 0.00024563797604688805, "loss": 1.6777, "step": 10673 }, { "epoch": 0.84, "learning_rate": 0.00024562845405932656, "loss": 1.6087, "step": 10674 }, { "epoch": 0.84, "learning_rate": 0.00024561893142250056, "loss": 1.5964, "step": 10675 }, { "epoch": 0.84, "learning_rate": 0.00024560940813647485, "loss": 1.6184, "step": 10676 }, { "epoch": 0.84, "learning_rate": 0.000245599884201314, "loss": 1.5609, "step": 10677 }, { "epoch": 0.84, "learning_rate": 0.0002455903596170827, "loss": 1.6143, "step": 10678 }, { "epoch": 0.84, "learning_rate": 0.0002455808343838456, "loss": 1.6414, "step": 10679 }, { "epoch": 0.84, "learning_rate": 0.0002455713085016674, "loss": 1.5834, "step": 10680 }, { "epoch": 0.84, "learning_rate": 0.0002455617819706127, "loss": 1.5915, "step": 10681 }, { "epoch": 0.84, "learning_rate": 0.0002455522547907463, "loss": 1.5851, "step": 10682 }, { "epoch": 0.84, "learning_rate": 0.00024554272696213276, "loss": 1.6117, "step": 10683 }, { "epoch": 0.84, "learning_rate": 0.0002455331984848369, "loss": 1.666, "step": 10684 }, { "epoch": 0.84, "learning_rate": 0.0002455236693589233, "loss": 1.6239, "step": 10685 }, { "epoch": 0.84, "learning_rate": 0.0002455141395844567, "loss": 1.6108, "step": 10686 }, { "epoch": 0.84, "learning_rate": 0.0002455046091615018, "loss": 1.6311, "step": 10687 }, { "epoch": 0.84, "learning_rate": 0.0002454950780901233, "loss": 1.6663, "step": 10688 }, { "epoch": 0.84, "learning_rate": 0.00024548554637038593, "loss": 1.5973, "step": 10689 }, { "epoch": 0.84, "learning_rate": 0.00024547601400235446, "loss": 1.6517, "step": 10690 }, { "epoch": 0.84, "learning_rate": 0.00024546648098609347, "loss": 1.5831, "step": 10691 }, { "epoch": 0.84, "learning_rate": 0.00024545694732166774, "loss": 1.6043, "step": 10692 }, { "epoch": 0.84, "learning_rate": 0.000245447413009142, "loss": 1.6285, "step": 10693 }, { "epoch": 0.84, "learning_rate": 0.0002454378780485811, "loss": 1.5969, "step": 10694 }, { "epoch": 0.84, "learning_rate": 0.0002454283424400496, "loss": 1.6412, "step": 10695 }, { "epoch": 0.84, "learning_rate": 0.00024541880618361234, "loss": 1.5868, "step": 10696 }, { "epoch": 0.84, "learning_rate": 0.000245409269279334, "loss": 1.5944, "step": 10697 }, { "epoch": 0.84, "learning_rate": 0.00024539973172727945, "loss": 1.5695, "step": 10698 }, { "epoch": 0.84, "learning_rate": 0.0002453901935275133, "loss": 1.6491, "step": 10699 }, { "epoch": 0.84, "learning_rate": 0.0002453806546801004, "loss": 1.5824, "step": 10700 }, { "epoch": 0.84, "learning_rate": 0.00024537111518510546, "loss": 1.6178, "step": 10701 }, { "epoch": 0.84, "learning_rate": 0.00024536157504259333, "loss": 1.6246, "step": 10702 }, { "epoch": 0.84, "learning_rate": 0.00024535203425262873, "loss": 1.6019, "step": 10703 }, { "epoch": 0.84, "learning_rate": 0.0002453424928152764, "loss": 1.6469, "step": 10704 }, { "epoch": 0.84, "learning_rate": 0.00024533295073060114, "loss": 1.6462, "step": 10705 }, { "epoch": 0.84, "learning_rate": 0.0002453234079986678, "loss": 1.5728, "step": 10706 }, { "epoch": 0.84, "learning_rate": 0.0002453138646195411, "loss": 1.6356, "step": 10707 }, { "epoch": 0.84, "learning_rate": 0.00024530432059328587, "loss": 1.6306, "step": 10708 }, { "epoch": 0.84, "learning_rate": 0.0002452947759199669, "loss": 1.6125, "step": 10709 }, { "epoch": 0.84, "learning_rate": 0.000245285230599649, "loss": 1.6168, "step": 10710 }, { "epoch": 0.84, "learning_rate": 0.00024527568463239693, "loss": 1.6708, "step": 10711 }, { "epoch": 0.84, "learning_rate": 0.0002452661380182756, "loss": 1.6014, "step": 10712 }, { "epoch": 0.84, "learning_rate": 0.0002452565907573497, "loss": 1.6564, "step": 10713 }, { "epoch": 0.84, "learning_rate": 0.0002452470428496841, "loss": 1.6433, "step": 10714 }, { "epoch": 0.84, "learning_rate": 0.00024523749429534373, "loss": 1.5943, "step": 10715 }, { "epoch": 0.84, "learning_rate": 0.00024522794509439325, "loss": 1.6305, "step": 10716 }, { "epoch": 0.84, "learning_rate": 0.0002452183952468976, "loss": 1.6691, "step": 10717 }, { "epoch": 0.84, "learning_rate": 0.0002452088447529216, "loss": 1.6348, "step": 10718 }, { "epoch": 0.84, "learning_rate": 0.0002451992936125301, "loss": 1.6678, "step": 10719 }, { "epoch": 0.84, "learning_rate": 0.0002451897418257879, "loss": 1.5795, "step": 10720 }, { "epoch": 0.84, "learning_rate": 0.0002451801893927599, "loss": 1.6431, "step": 10721 }, { "epoch": 0.84, "learning_rate": 0.00024517063631351095, "loss": 1.6643, "step": 10722 }, { "epoch": 0.84, "learning_rate": 0.0002451610825881059, "loss": 1.6607, "step": 10723 }, { "epoch": 0.84, "learning_rate": 0.0002451515282166096, "loss": 1.5883, "step": 10724 }, { "epoch": 0.84, "learning_rate": 0.0002451419731990869, "loss": 1.6269, "step": 10725 }, { "epoch": 0.84, "learning_rate": 0.00024513241753560273, "loss": 1.59, "step": 10726 }, { "epoch": 0.84, "learning_rate": 0.00024512286122622197, "loss": 1.5918, "step": 10727 }, { "epoch": 0.84, "learning_rate": 0.0002451133042710094, "loss": 1.6047, "step": 10728 }, { "epoch": 0.84, "learning_rate": 0.0002451037466700301, "loss": 1.6223, "step": 10729 }, { "epoch": 0.84, "learning_rate": 0.00024509418842334876, "loss": 1.6913, "step": 10730 }, { "epoch": 0.84, "learning_rate": 0.00024508462953103035, "loss": 1.6253, "step": 10731 }, { "epoch": 0.84, "learning_rate": 0.0002450750699931398, "loss": 1.6128, "step": 10732 }, { "epoch": 0.84, "learning_rate": 0.00024506550980974204, "loss": 1.6036, "step": 10733 }, { "epoch": 0.84, "learning_rate": 0.0002450559489809019, "loss": 1.5934, "step": 10734 }, { "epoch": 0.84, "learning_rate": 0.0002450463875066843, "loss": 1.5938, "step": 10735 }, { "epoch": 0.84, "learning_rate": 0.00024503682538715415, "loss": 1.5813, "step": 10736 }, { "epoch": 0.84, "learning_rate": 0.00024502726262237647, "loss": 1.63, "step": 10737 }, { "epoch": 0.84, "learning_rate": 0.0002450176992124161, "loss": 1.5974, "step": 10738 }, { "epoch": 0.84, "learning_rate": 0.00024500813515733797, "loss": 1.6253, "step": 10739 }, { "epoch": 0.85, "learning_rate": 0.00024499857045720704, "loss": 1.6165, "step": 10740 }, { "epoch": 0.85, "learning_rate": 0.0002449890051120882, "loss": 1.6921, "step": 10741 }, { "epoch": 0.85, "learning_rate": 0.0002449794391220465, "loss": 1.6072, "step": 10742 }, { "epoch": 0.85, "learning_rate": 0.00024496987248714676, "loss": 1.6374, "step": 10743 }, { "epoch": 0.85, "learning_rate": 0.00024496030520745405, "loss": 1.6548, "step": 10744 }, { "epoch": 0.85, "learning_rate": 0.00024495073728303325, "loss": 1.6236, "step": 10745 }, { "epoch": 0.85, "learning_rate": 0.0002449411687139493, "loss": 1.6049, "step": 10746 }, { "epoch": 0.85, "learning_rate": 0.0002449315995002673, "loss": 1.6494, "step": 10747 }, { "epoch": 0.85, "learning_rate": 0.00024492202964205206, "loss": 1.6144, "step": 10748 }, { "epoch": 0.85, "learning_rate": 0.00024491245913936863, "loss": 1.5757, "step": 10749 }, { "epoch": 0.85, "learning_rate": 0.000244902887992282, "loss": 1.6518, "step": 10750 }, { "epoch": 0.85, "learning_rate": 0.00024489331620085715, "loss": 1.6279, "step": 10751 }, { "epoch": 0.85, "learning_rate": 0.000244883743765159, "loss": 1.6818, "step": 10752 }, { "epoch": 0.85, "learning_rate": 0.0002448741706852526, "loss": 1.6197, "step": 10753 }, { "epoch": 0.85, "learning_rate": 0.00024486459696120293, "loss": 1.5947, "step": 10754 }, { "epoch": 0.85, "learning_rate": 0.000244855022593075, "loss": 1.6167, "step": 10755 }, { "epoch": 0.85, "learning_rate": 0.0002448454475809339, "loss": 1.6389, "step": 10756 }, { "epoch": 0.85, "learning_rate": 0.00024483587192484444, "loss": 1.573, "step": 10757 }, { "epoch": 0.85, "learning_rate": 0.00024482629562487177, "loss": 1.5916, "step": 10758 }, { "epoch": 0.85, "learning_rate": 0.0002448167186810809, "loss": 1.5879, "step": 10759 }, { "epoch": 0.85, "learning_rate": 0.00024480714109353685, "loss": 1.5431, "step": 10760 }, { "epoch": 0.85, "learning_rate": 0.0002447975628623046, "loss": 1.6437, "step": 10761 }, { "epoch": 0.85, "learning_rate": 0.0002447879839874492, "loss": 1.6539, "step": 10762 }, { "epoch": 0.85, "learning_rate": 0.0002447784044690357, "loss": 1.6104, "step": 10763 }, { "epoch": 0.85, "learning_rate": 0.0002447688243071292, "loss": 1.6271, "step": 10764 }, { "epoch": 0.85, "learning_rate": 0.0002447592435017946, "loss": 1.6113, "step": 10765 }, { "epoch": 0.85, "learning_rate": 0.0002447496620530971, "loss": 1.5952, "step": 10766 }, { "epoch": 0.85, "learning_rate": 0.0002447400799611016, "loss": 1.6723, "step": 10767 }, { "epoch": 0.85, "learning_rate": 0.00024473049722587335, "loss": 1.6803, "step": 10768 }, { "epoch": 0.85, "learning_rate": 0.0002447209138474772, "loss": 1.5897, "step": 10769 }, { "epoch": 0.85, "learning_rate": 0.0002447113298259783, "loss": 1.7135, "step": 10770 }, { "epoch": 0.85, "learning_rate": 0.00024470174516144183, "loss": 1.6495, "step": 10771 }, { "epoch": 0.85, "learning_rate": 0.00024469215985393274, "loss": 1.6001, "step": 10772 }, { "epoch": 0.85, "learning_rate": 0.00024468257390351615, "loss": 1.6298, "step": 10773 }, { "epoch": 0.85, "learning_rate": 0.00024467298731025713, "loss": 1.6449, "step": 10774 }, { "epoch": 0.85, "learning_rate": 0.0002446634000742207, "loss": 1.6511, "step": 10775 }, { "epoch": 0.85, "learning_rate": 0.0002446538121954721, "loss": 1.6044, "step": 10776 }, { "epoch": 0.85, "learning_rate": 0.0002446442236740763, "loss": 1.6014, "step": 10777 }, { "epoch": 0.85, "learning_rate": 0.00024463463451009846, "loss": 1.636, "step": 10778 }, { "epoch": 0.85, "learning_rate": 0.0002446250447036037, "loss": 1.6081, "step": 10779 }, { "epoch": 0.85, "learning_rate": 0.00024461545425465717, "loss": 1.5777, "step": 10780 }, { "epoch": 0.85, "learning_rate": 0.0002446058631633238, "loss": 1.6303, "step": 10781 }, { "epoch": 0.85, "learning_rate": 0.00024459627142966886, "loss": 1.5998, "step": 10782 }, { "epoch": 0.85, "learning_rate": 0.0002445866790537575, "loss": 1.6021, "step": 10783 }, { "epoch": 0.85, "learning_rate": 0.0002445770860356547, "loss": 1.5616, "step": 10784 }, { "epoch": 0.85, "learning_rate": 0.00024456749237542576, "loss": 1.6641, "step": 10785 }, { "epoch": 0.85, "learning_rate": 0.00024455789807313567, "loss": 1.5882, "step": 10786 }, { "epoch": 0.85, "learning_rate": 0.00024454830312884963, "loss": 1.656, "step": 10787 }, { "epoch": 0.85, "learning_rate": 0.0002445387075426328, "loss": 1.6259, "step": 10788 }, { "epoch": 0.85, "learning_rate": 0.00024452911131455035, "loss": 1.6744, "step": 10789 }, { "epoch": 0.85, "learning_rate": 0.0002445195144446674, "loss": 1.6455, "step": 10790 }, { "epoch": 0.85, "learning_rate": 0.00024450991693304903, "loss": 1.5925, "step": 10791 }, { "epoch": 0.85, "learning_rate": 0.00024450031877976054, "loss": 1.5766, "step": 10792 }, { "epoch": 0.85, "learning_rate": 0.000244490719984867, "loss": 1.6776, "step": 10793 }, { "epoch": 0.85, "learning_rate": 0.00024448112054843365, "loss": 1.6405, "step": 10794 }, { "epoch": 0.85, "learning_rate": 0.00024447152047052563, "loss": 1.6261, "step": 10795 }, { "epoch": 0.85, "learning_rate": 0.00024446191975120815, "loss": 1.6678, "step": 10796 }, { "epoch": 0.85, "learning_rate": 0.00024445231839054633, "loss": 1.6168, "step": 10797 }, { "epoch": 0.85, "learning_rate": 0.0002444427163886054, "loss": 1.6218, "step": 10798 }, { "epoch": 0.85, "learning_rate": 0.0002444331137454505, "loss": 1.6053, "step": 10799 }, { "epoch": 0.85, "learning_rate": 0.0002444235104611469, "loss": 1.5836, "step": 10800 }, { "epoch": 0.85, "learning_rate": 0.0002444139065357598, "loss": 1.6298, "step": 10801 }, { "epoch": 0.85, "learning_rate": 0.00024440430196935435, "loss": 1.5817, "step": 10802 }, { "epoch": 0.85, "learning_rate": 0.00024439469676199575, "loss": 1.6021, "step": 10803 }, { "epoch": 0.85, "learning_rate": 0.0002443850909137493, "loss": 1.6549, "step": 10804 }, { "epoch": 0.85, "learning_rate": 0.00024437548442468013, "loss": 1.6498, "step": 10805 }, { "epoch": 0.85, "learning_rate": 0.0002443658772948536, "loss": 1.628, "step": 10806 }, { "epoch": 0.85, "learning_rate": 0.00024435626952433475, "loss": 1.584, "step": 10807 }, { "epoch": 0.85, "learning_rate": 0.0002443466611131889, "loss": 1.6582, "step": 10808 }, { "epoch": 0.85, "learning_rate": 0.0002443370520614813, "loss": 1.5935, "step": 10809 }, { "epoch": 0.85, "learning_rate": 0.0002443274423692772, "loss": 1.5968, "step": 10810 }, { "epoch": 0.85, "learning_rate": 0.00024431783203664176, "loss": 1.5911, "step": 10811 }, { "epoch": 0.85, "learning_rate": 0.0002443082210636403, "loss": 1.5845, "step": 10812 }, { "epoch": 0.85, "learning_rate": 0.0002442986094503381, "loss": 1.6288, "step": 10813 }, { "epoch": 0.85, "learning_rate": 0.0002442889971968004, "loss": 1.6597, "step": 10814 }, { "epoch": 0.85, "learning_rate": 0.0002442793843030924, "loss": 1.5725, "step": 10815 }, { "epoch": 0.85, "learning_rate": 0.00024426977076927943, "loss": 1.6095, "step": 10816 }, { "epoch": 0.85, "learning_rate": 0.00024426015659542667, "loss": 1.6436, "step": 10817 }, { "epoch": 0.85, "learning_rate": 0.00024425054178159956, "loss": 1.6499, "step": 10818 }, { "epoch": 0.85, "learning_rate": 0.0002442409263278632, "loss": 1.6414, "step": 10819 }, { "epoch": 0.85, "learning_rate": 0.00024423131023428306, "loss": 1.5894, "step": 10820 }, { "epoch": 0.85, "learning_rate": 0.0002442216935009243, "loss": 1.6073, "step": 10821 }, { "epoch": 0.85, "learning_rate": 0.0002442120761278522, "loss": 1.5992, "step": 10822 }, { "epoch": 0.85, "learning_rate": 0.0002442024581151321, "loss": 1.591, "step": 10823 }, { "epoch": 0.85, "learning_rate": 0.0002441928394628293, "loss": 1.6298, "step": 10824 }, { "epoch": 0.85, "learning_rate": 0.00024418322017100906, "loss": 1.6241, "step": 10825 }, { "epoch": 0.85, "learning_rate": 0.00024417360023973675, "loss": 1.5991, "step": 10826 }, { "epoch": 0.85, "learning_rate": 0.00024416397966907767, "loss": 1.6237, "step": 10827 }, { "epoch": 0.85, "learning_rate": 0.00024415435845909716, "loss": 1.6533, "step": 10828 }, { "epoch": 0.85, "learning_rate": 0.00024414473660986047, "loss": 1.6058, "step": 10829 }, { "epoch": 0.85, "learning_rate": 0.000244135114121433, "loss": 1.6555, "step": 10830 }, { "epoch": 0.85, "learning_rate": 0.00024412549099388006, "loss": 1.641, "step": 10831 }, { "epoch": 0.85, "learning_rate": 0.00024411586722726696, "loss": 1.6234, "step": 10832 }, { "epoch": 0.85, "learning_rate": 0.00024410624282165903, "loss": 1.6187, "step": 10833 }, { "epoch": 0.85, "learning_rate": 0.0002440966177771217, "loss": 1.6239, "step": 10834 }, { "epoch": 0.85, "learning_rate": 0.0002440869920937202, "loss": 1.6142, "step": 10835 }, { "epoch": 0.85, "learning_rate": 0.00024407736577152002, "loss": 1.6712, "step": 10836 }, { "epoch": 0.85, "learning_rate": 0.00024406773881058643, "loss": 1.6387, "step": 10837 }, { "epoch": 0.85, "learning_rate": 0.00024405811121098474, "loss": 1.5795, "step": 10838 }, { "epoch": 0.85, "learning_rate": 0.00024404848297278044, "loss": 1.6307, "step": 10839 }, { "epoch": 0.85, "learning_rate": 0.00024403885409603882, "loss": 1.6143, "step": 10840 }, { "epoch": 0.85, "learning_rate": 0.00024402922458082528, "loss": 1.5821, "step": 10841 }, { "epoch": 0.85, "learning_rate": 0.0002440195944272052, "loss": 1.6382, "step": 10842 }, { "epoch": 0.85, "learning_rate": 0.00024400996363524395, "loss": 1.587, "step": 10843 }, { "epoch": 0.85, "learning_rate": 0.00024400033220500693, "loss": 1.62, "step": 10844 }, { "epoch": 0.85, "learning_rate": 0.00024399070013655954, "loss": 1.5773, "step": 10845 }, { "epoch": 0.85, "learning_rate": 0.00024398106742996715, "loss": 1.5738, "step": 10846 }, { "epoch": 0.85, "learning_rate": 0.00024397143408529516, "loss": 1.5982, "step": 10847 }, { "epoch": 0.85, "learning_rate": 0.000243961800102609, "loss": 1.6033, "step": 10848 }, { "epoch": 0.85, "learning_rate": 0.0002439521654819741, "loss": 1.6069, "step": 10849 }, { "epoch": 0.85, "learning_rate": 0.00024394253022345578, "loss": 1.6098, "step": 10850 }, { "epoch": 0.85, "learning_rate": 0.0002439328943271196, "loss": 1.6557, "step": 10851 }, { "epoch": 0.85, "learning_rate": 0.00024392325779303085, "loss": 1.5736, "step": 10852 }, { "epoch": 0.85, "learning_rate": 0.00024391362062125502, "loss": 1.5942, "step": 10853 }, { "epoch": 0.85, "learning_rate": 0.00024390398281185754, "loss": 1.6391, "step": 10854 }, { "epoch": 0.85, "learning_rate": 0.00024389434436490384, "loss": 1.5838, "step": 10855 }, { "epoch": 0.85, "learning_rate": 0.00024388470528045937, "loss": 1.6247, "step": 10856 }, { "epoch": 0.85, "learning_rate": 0.0002438750655585895, "loss": 1.6158, "step": 10857 }, { "epoch": 0.85, "learning_rate": 0.00024386542519935978, "loss": 1.6416, "step": 10858 }, { "epoch": 0.85, "learning_rate": 0.00024385578420283563, "loss": 1.6354, "step": 10859 }, { "epoch": 0.85, "learning_rate": 0.00024384614256908253, "loss": 1.6486, "step": 10860 }, { "epoch": 0.85, "learning_rate": 0.00024383650029816584, "loss": 1.5926, "step": 10861 }, { "epoch": 0.85, "learning_rate": 0.00024382685739015117, "loss": 1.6439, "step": 10862 }, { "epoch": 0.85, "learning_rate": 0.00024381721384510383, "loss": 1.6247, "step": 10863 }, { "epoch": 0.85, "learning_rate": 0.00024380756966308945, "loss": 1.6154, "step": 10864 }, { "epoch": 0.85, "learning_rate": 0.0002437979248441734, "loss": 1.5977, "step": 10865 }, { "epoch": 0.85, "learning_rate": 0.00024378827938842122, "loss": 1.6247, "step": 10866 }, { "epoch": 0.86, "learning_rate": 0.00024377863329589836, "loss": 1.558, "step": 10867 }, { "epoch": 0.86, "learning_rate": 0.0002437689865666704, "loss": 1.5943, "step": 10868 }, { "epoch": 0.86, "learning_rate": 0.0002437593392008027, "loss": 1.6325, "step": 10869 }, { "epoch": 0.86, "learning_rate": 0.00024374969119836086, "loss": 1.6148, "step": 10870 }, { "epoch": 0.86, "learning_rate": 0.0002437400425594103, "loss": 1.6162, "step": 10871 }, { "epoch": 0.86, "learning_rate": 0.0002437303932840166, "loss": 1.5701, "step": 10872 }, { "epoch": 0.86, "learning_rate": 0.00024372074337224527, "loss": 1.6461, "step": 10873 }, { "epoch": 0.86, "learning_rate": 0.00024371109282416182, "loss": 1.6232, "step": 10874 }, { "epoch": 0.86, "learning_rate": 0.00024370144163983175, "loss": 1.5422, "step": 10875 }, { "epoch": 0.86, "learning_rate": 0.00024369178981932063, "loss": 1.6549, "step": 10876 }, { "epoch": 0.86, "learning_rate": 0.00024368213736269395, "loss": 1.6033, "step": 10877 }, { "epoch": 0.86, "learning_rate": 0.00024367248427001722, "loss": 1.6638, "step": 10878 }, { "epoch": 0.86, "learning_rate": 0.00024366283054135605, "loss": 1.636, "step": 10879 }, { "epoch": 0.86, "learning_rate": 0.00024365317617677592, "loss": 1.6129, "step": 10880 }, { "epoch": 0.86, "learning_rate": 0.00024364352117634244, "loss": 1.6716, "step": 10881 }, { "epoch": 0.86, "learning_rate": 0.00024363386554012112, "loss": 1.661, "step": 10882 }, { "epoch": 0.86, "learning_rate": 0.0002436242092681775, "loss": 1.6482, "step": 10883 }, { "epoch": 0.86, "learning_rate": 0.00024361455236057716, "loss": 1.6345, "step": 10884 }, { "epoch": 0.86, "learning_rate": 0.0002436048948173857, "loss": 1.6189, "step": 10885 }, { "epoch": 0.86, "learning_rate": 0.00024359523663866866, "loss": 1.6153, "step": 10886 }, { "epoch": 0.86, "learning_rate": 0.00024358557782449162, "loss": 1.5983, "step": 10887 }, { "epoch": 0.86, "learning_rate": 0.0002435759183749201, "loss": 1.6228, "step": 10888 }, { "epoch": 0.86, "learning_rate": 0.0002435662582900198, "loss": 1.6621, "step": 10889 }, { "epoch": 0.86, "learning_rate": 0.00024355659756985617, "loss": 1.6146, "step": 10890 }, { "epoch": 0.86, "learning_rate": 0.0002435469362144949, "loss": 1.6192, "step": 10891 }, { "epoch": 0.86, "learning_rate": 0.00024353727422400158, "loss": 1.5741, "step": 10892 }, { "epoch": 0.86, "learning_rate": 0.00024352761159844181, "loss": 1.567, "step": 10893 }, { "epoch": 0.86, "learning_rate": 0.0002435179483378811, "loss": 1.6012, "step": 10894 }, { "epoch": 0.86, "learning_rate": 0.00024350828444238517, "loss": 1.5872, "step": 10895 }, { "epoch": 0.86, "learning_rate": 0.0002434986199120196, "loss": 1.6136, "step": 10896 }, { "epoch": 0.86, "learning_rate": 0.00024348895474684995, "loss": 1.6398, "step": 10897 }, { "epoch": 0.86, "learning_rate": 0.0002434792889469419, "loss": 1.58, "step": 10898 }, { "epoch": 0.86, "learning_rate": 0.00024346962251236109, "loss": 1.69, "step": 10899 }, { "epoch": 0.86, "learning_rate": 0.0002434599554431731, "loss": 1.6065, "step": 10900 }, { "epoch": 0.86, "learning_rate": 0.0002434502877394436, "loss": 1.5887, "step": 10901 }, { "epoch": 0.86, "learning_rate": 0.00024344061940123824, "loss": 1.6324, "step": 10902 }, { "epoch": 0.86, "learning_rate": 0.00024343095042862262, "loss": 1.6537, "step": 10903 }, { "epoch": 0.86, "learning_rate": 0.0002434212808216624, "loss": 1.6594, "step": 10904 }, { "epoch": 0.86, "learning_rate": 0.00024341161058042323, "loss": 1.6473, "step": 10905 }, { "epoch": 0.86, "learning_rate": 0.0002434019397049708, "loss": 1.5956, "step": 10906 }, { "epoch": 0.86, "learning_rate": 0.00024339226819537074, "loss": 1.5811, "step": 10907 }, { "epoch": 0.86, "learning_rate": 0.00024338259605168871, "loss": 1.5784, "step": 10908 }, { "epoch": 0.86, "learning_rate": 0.00024337292327399036, "loss": 1.6222, "step": 10909 }, { "epoch": 0.86, "learning_rate": 0.00024336324986234142, "loss": 1.6289, "step": 10910 }, { "epoch": 0.86, "learning_rate": 0.0002433535758168075, "loss": 1.5911, "step": 10911 }, { "epoch": 0.86, "learning_rate": 0.00024334390113745437, "loss": 1.6125, "step": 10912 }, { "epoch": 0.86, "learning_rate": 0.0002433342258243476, "loss": 1.633, "step": 10913 }, { "epoch": 0.86, "learning_rate": 0.000243324549877553, "loss": 1.6574, "step": 10914 }, { "epoch": 0.86, "learning_rate": 0.0002433148732971362, "loss": 1.6109, "step": 10915 }, { "epoch": 0.86, "learning_rate": 0.0002433051960831629, "loss": 1.596, "step": 10916 }, { "epoch": 0.86, "learning_rate": 0.00024329551823569875, "loss": 1.6062, "step": 10917 }, { "epoch": 0.86, "learning_rate": 0.0002432858397548096, "loss": 1.648, "step": 10918 }, { "epoch": 0.86, "learning_rate": 0.000243276160640561, "loss": 1.6647, "step": 10919 }, { "epoch": 0.86, "learning_rate": 0.0002432664808930188, "loss": 1.6204, "step": 10920 }, { "epoch": 0.86, "learning_rate": 0.00024325680051224866, "loss": 1.6211, "step": 10921 }, { "epoch": 0.86, "learning_rate": 0.00024324711949831628, "loss": 1.6118, "step": 10922 }, { "epoch": 0.86, "learning_rate": 0.00024323743785128744, "loss": 1.6318, "step": 10923 }, { "epoch": 0.86, "learning_rate": 0.00024322775557122787, "loss": 1.624, "step": 10924 }, { "epoch": 0.86, "learning_rate": 0.00024321807265820325, "loss": 1.6374, "step": 10925 }, { "epoch": 0.86, "learning_rate": 0.00024320838911227936, "loss": 1.6134, "step": 10926 }, { "epoch": 0.86, "learning_rate": 0.00024319870493352195, "loss": 1.5472, "step": 10927 }, { "epoch": 0.86, "learning_rate": 0.00024318902012199678, "loss": 1.622, "step": 10928 }, { "epoch": 0.86, "learning_rate": 0.00024317933467776954, "loss": 1.585, "step": 10929 }, { "epoch": 0.86, "learning_rate": 0.00024316964860090609, "loss": 1.5608, "step": 10930 }, { "epoch": 0.86, "learning_rate": 0.0002431599618914721, "loss": 1.5804, "step": 10931 }, { "epoch": 0.86, "learning_rate": 0.00024315027454953345, "loss": 1.6444, "step": 10932 }, { "epoch": 0.86, "learning_rate": 0.0002431405865751558, "loss": 1.6544, "step": 10933 }, { "epoch": 0.86, "learning_rate": 0.00024313089796840494, "loss": 1.598, "step": 10934 }, { "epoch": 0.86, "learning_rate": 0.0002431212087293467, "loss": 1.6491, "step": 10935 }, { "epoch": 0.86, "learning_rate": 0.00024311151885804684, "loss": 1.6483, "step": 10936 }, { "epoch": 0.86, "learning_rate": 0.00024310182835457112, "loss": 1.5891, "step": 10937 }, { "epoch": 0.86, "learning_rate": 0.00024309213721898545, "loss": 1.6446, "step": 10938 }, { "epoch": 0.86, "learning_rate": 0.00024308244545135548, "loss": 1.6153, "step": 10939 }, { "epoch": 0.86, "learning_rate": 0.00024307275305174707, "loss": 1.5836, "step": 10940 }, { "epoch": 0.86, "learning_rate": 0.00024306306002022603, "loss": 1.5294, "step": 10941 }, { "epoch": 0.86, "learning_rate": 0.0002430533663568582, "loss": 1.5866, "step": 10942 }, { "epoch": 0.86, "learning_rate": 0.00024304367206170929, "loss": 1.6164, "step": 10943 }, { "epoch": 0.86, "learning_rate": 0.00024303397713484526, "loss": 1.6086, "step": 10944 }, { "epoch": 0.86, "learning_rate": 0.00024302428157633183, "loss": 1.6246, "step": 10945 }, { "epoch": 0.86, "learning_rate": 0.00024301458538623488, "loss": 1.6202, "step": 10946 }, { "epoch": 0.86, "learning_rate": 0.00024300488856462025, "loss": 1.5638, "step": 10947 }, { "epoch": 0.86, "learning_rate": 0.00024299519111155372, "loss": 1.6145, "step": 10948 }, { "epoch": 0.86, "learning_rate": 0.00024298549302710117, "loss": 1.6074, "step": 10949 }, { "epoch": 0.86, "learning_rate": 0.00024297579431132842, "loss": 1.5933, "step": 10950 }, { "epoch": 0.86, "learning_rate": 0.00024296609496430132, "loss": 1.5895, "step": 10951 }, { "epoch": 0.86, "learning_rate": 0.00024295639498608573, "loss": 1.6108, "step": 10952 }, { "epoch": 0.86, "learning_rate": 0.0002429466943767476, "loss": 1.5989, "step": 10953 }, { "epoch": 0.86, "learning_rate": 0.00024293699313635266, "loss": 1.6189, "step": 10954 }, { "epoch": 0.86, "learning_rate": 0.00024292729126496683, "loss": 1.6355, "step": 10955 }, { "epoch": 0.86, "learning_rate": 0.00024291758876265594, "loss": 1.6195, "step": 10956 }, { "epoch": 0.86, "learning_rate": 0.00024290788562948592, "loss": 1.5841, "step": 10957 }, { "epoch": 0.86, "learning_rate": 0.00024289818186552263, "loss": 1.6679, "step": 10958 }, { "epoch": 0.86, "learning_rate": 0.00024288847747083197, "loss": 1.6538, "step": 10959 }, { "epoch": 0.86, "learning_rate": 0.0002428787724454798, "loss": 1.5647, "step": 10960 }, { "epoch": 0.86, "learning_rate": 0.00024286906678953202, "loss": 1.6234, "step": 10961 }, { "epoch": 0.86, "learning_rate": 0.0002428593605030545, "loss": 1.5553, "step": 10962 }, { "epoch": 0.86, "learning_rate": 0.00024284965358611316, "loss": 1.5744, "step": 10963 }, { "epoch": 0.86, "learning_rate": 0.00024283994603877397, "loss": 1.6459, "step": 10964 }, { "epoch": 0.86, "learning_rate": 0.00024283023786110273, "loss": 1.5688, "step": 10965 }, { "epoch": 0.86, "learning_rate": 0.00024282052905316538, "loss": 1.6502, "step": 10966 }, { "epoch": 0.86, "learning_rate": 0.00024281081961502793, "loss": 1.5617, "step": 10967 }, { "epoch": 0.86, "learning_rate": 0.0002428011095467562, "loss": 1.6131, "step": 10968 }, { "epoch": 0.86, "learning_rate": 0.00024279139884841611, "loss": 1.6286, "step": 10969 }, { "epoch": 0.86, "learning_rate": 0.0002427816875200737, "loss": 1.5963, "step": 10970 }, { "epoch": 0.86, "learning_rate": 0.00024277197556179478, "loss": 1.5818, "step": 10971 }, { "epoch": 0.86, "learning_rate": 0.00024276226297364537, "loss": 1.5591, "step": 10972 }, { "epoch": 0.86, "learning_rate": 0.00024275254975569138, "loss": 1.6313, "step": 10973 }, { "epoch": 0.86, "learning_rate": 0.00024274283590799872, "loss": 1.6386, "step": 10974 }, { "epoch": 0.86, "learning_rate": 0.00024273312143063342, "loss": 1.6174, "step": 10975 }, { "epoch": 0.86, "learning_rate": 0.00024272340632366143, "loss": 1.6124, "step": 10976 }, { "epoch": 0.86, "learning_rate": 0.00024271369058714864, "loss": 1.5646, "step": 10977 }, { "epoch": 0.86, "learning_rate": 0.00024270397422116106, "loss": 1.5862, "step": 10978 }, { "epoch": 0.86, "learning_rate": 0.00024269425722576467, "loss": 1.6312, "step": 10979 }, { "epoch": 0.86, "learning_rate": 0.00024268453960102538, "loss": 1.588, "step": 10980 }, { "epoch": 0.86, "learning_rate": 0.00024267482134700927, "loss": 1.5916, "step": 10981 }, { "epoch": 0.86, "learning_rate": 0.00024266510246378223, "loss": 1.5888, "step": 10982 }, { "epoch": 0.86, "learning_rate": 0.00024265538295141032, "loss": 1.5994, "step": 10983 }, { "epoch": 0.86, "learning_rate": 0.00024264566280995944, "loss": 1.6544, "step": 10984 }, { "epoch": 0.86, "learning_rate": 0.00024263594203949567, "loss": 1.5419, "step": 10985 }, { "epoch": 0.86, "learning_rate": 0.00024262622064008494, "loss": 1.6299, "step": 10986 }, { "epoch": 0.86, "learning_rate": 0.00024261649861179334, "loss": 1.6187, "step": 10987 }, { "epoch": 0.86, "learning_rate": 0.0002426067759546868, "loss": 1.5761, "step": 10988 }, { "epoch": 0.86, "learning_rate": 0.0002425970526688314, "loss": 1.5964, "step": 10989 }, { "epoch": 0.86, "learning_rate": 0.00024258732875429302, "loss": 1.5997, "step": 10990 }, { "epoch": 0.86, "learning_rate": 0.0002425776042111378, "loss": 1.649, "step": 10991 }, { "epoch": 0.86, "learning_rate": 0.00024256787903943172, "loss": 1.6075, "step": 10992 }, { "epoch": 0.86, "learning_rate": 0.00024255815323924088, "loss": 1.5818, "step": 10993 }, { "epoch": 0.87, "learning_rate": 0.00024254842681063128, "loss": 1.5734, "step": 10994 }, { "epoch": 0.87, "learning_rate": 0.00024253869975366884, "loss": 1.6722, "step": 10995 }, { "epoch": 0.87, "learning_rate": 0.00024252897206841976, "loss": 1.5994, "step": 10996 }, { "epoch": 0.87, "learning_rate": 0.00024251924375495, "loss": 1.6722, "step": 10997 }, { "epoch": 0.87, "learning_rate": 0.00024250951481332561, "loss": 1.612, "step": 10998 }, { "epoch": 0.87, "learning_rate": 0.0002424997852436127, "loss": 1.6224, "step": 10999 }, { "epoch": 0.87, "learning_rate": 0.0002424900550458773, "loss": 1.6593, "step": 11000 }, { "epoch": 0.87, "learning_rate": 0.00024248032422018547, "loss": 1.5982, "step": 11001 }, { "epoch": 0.87, "learning_rate": 0.00024247059276660325, "loss": 1.6075, "step": 11002 }, { "epoch": 0.87, "learning_rate": 0.00024246086068519673, "loss": 1.6609, "step": 11003 }, { "epoch": 0.87, "learning_rate": 0.00024245112797603203, "loss": 1.6728, "step": 11004 }, { "epoch": 0.87, "learning_rate": 0.00024244139463917513, "loss": 1.5893, "step": 11005 }, { "epoch": 0.87, "learning_rate": 0.0002424316606746922, "loss": 1.62, "step": 11006 }, { "epoch": 0.87, "learning_rate": 0.0002424219260826493, "loss": 1.6114, "step": 11007 }, { "epoch": 0.87, "learning_rate": 0.00024241219086311251, "loss": 1.6555, "step": 11008 }, { "epoch": 0.87, "learning_rate": 0.00024240245501614796, "loss": 1.6058, "step": 11009 }, { "epoch": 0.87, "learning_rate": 0.0002423927185418218, "loss": 1.6214, "step": 11010 }, { "epoch": 0.87, "learning_rate": 0.0002423829814402, "loss": 1.6611, "step": 11011 }, { "epoch": 0.87, "learning_rate": 0.00024237324371134873, "loss": 1.6162, "step": 11012 }, { "epoch": 0.87, "learning_rate": 0.00024236350535533407, "loss": 1.6297, "step": 11013 }, { "epoch": 0.87, "learning_rate": 0.00024235376637222222, "loss": 1.6052, "step": 11014 }, { "epoch": 0.87, "learning_rate": 0.0002423440267620793, "loss": 1.6225, "step": 11015 }, { "epoch": 0.87, "learning_rate": 0.00024233428652497137, "loss": 1.6672, "step": 11016 }, { "epoch": 0.87, "learning_rate": 0.00024232454566096458, "loss": 1.6585, "step": 11017 }, { "epoch": 0.87, "learning_rate": 0.00024231480417012511, "loss": 1.5782, "step": 11018 }, { "epoch": 0.87, "learning_rate": 0.00024230506205251903, "loss": 1.6485, "step": 11019 }, { "epoch": 0.87, "learning_rate": 0.0002422953193082125, "loss": 1.5799, "step": 11020 }, { "epoch": 0.87, "learning_rate": 0.0002422855759372717, "loss": 1.6171, "step": 11021 }, { "epoch": 0.87, "learning_rate": 0.0002422758319397628, "loss": 1.608, "step": 11022 }, { "epoch": 0.87, "learning_rate": 0.00024226608731575187, "loss": 1.6681, "step": 11023 }, { "epoch": 0.87, "learning_rate": 0.00024225634206530514, "loss": 1.569, "step": 11024 }, { "epoch": 0.87, "learning_rate": 0.00024224659618848877, "loss": 1.6273, "step": 11025 }, { "epoch": 0.87, "learning_rate": 0.00024223684968536892, "loss": 1.6502, "step": 11026 }, { "epoch": 0.87, "learning_rate": 0.00024222710255601178, "loss": 1.6239, "step": 11027 }, { "epoch": 0.87, "learning_rate": 0.00024221735480048348, "loss": 1.5972, "step": 11028 }, { "epoch": 0.87, "learning_rate": 0.0002422076064188502, "loss": 1.6249, "step": 11029 }, { "epoch": 0.87, "learning_rate": 0.00024219785741117823, "loss": 1.6236, "step": 11030 }, { "epoch": 0.87, "learning_rate": 0.00024218810777753365, "loss": 1.6115, "step": 11031 }, { "epoch": 0.87, "learning_rate": 0.00024217835751798268, "loss": 1.6321, "step": 11032 }, { "epoch": 0.87, "learning_rate": 0.00024216860663259153, "loss": 1.6355, "step": 11033 }, { "epoch": 0.87, "learning_rate": 0.0002421588551214264, "loss": 1.6416, "step": 11034 }, { "epoch": 0.87, "learning_rate": 0.00024214910298455354, "loss": 1.6129, "step": 11035 }, { "epoch": 0.87, "learning_rate": 0.0002421393502220391, "loss": 1.6787, "step": 11036 }, { "epoch": 0.87, "learning_rate": 0.00024212959683394929, "loss": 1.5931, "step": 11037 }, { "epoch": 0.87, "learning_rate": 0.0002421198428203504, "loss": 1.6508, "step": 11038 }, { "epoch": 0.87, "learning_rate": 0.0002421100881813086, "loss": 1.637, "step": 11039 }, { "epoch": 0.87, "learning_rate": 0.00024210033291689016, "loss": 1.5627, "step": 11040 }, { "epoch": 0.87, "learning_rate": 0.00024209057702716125, "loss": 1.6017, "step": 11041 }, { "epoch": 0.87, "learning_rate": 0.00024208082051218815, "loss": 1.6246, "step": 11042 }, { "epoch": 0.87, "learning_rate": 0.0002420710633720371, "loss": 1.5897, "step": 11043 }, { "epoch": 0.87, "learning_rate": 0.00024206130560677433, "loss": 1.6566, "step": 11044 }, { "epoch": 0.87, "learning_rate": 0.0002420515472164661, "loss": 1.5771, "step": 11045 }, { "epoch": 0.87, "learning_rate": 0.00024204178820117864, "loss": 1.6203, "step": 11046 }, { "epoch": 0.87, "learning_rate": 0.00024203202856097822, "loss": 1.6005, "step": 11047 }, { "epoch": 0.87, "learning_rate": 0.00024202226829593117, "loss": 1.636, "step": 11048 }, { "epoch": 0.87, "learning_rate": 0.0002420125074061037, "loss": 1.5595, "step": 11049 }, { "epoch": 0.87, "learning_rate": 0.00024200274589156206, "loss": 1.611, "step": 11050 }, { "epoch": 0.87, "learning_rate": 0.00024199298375237254, "loss": 1.6096, "step": 11051 }, { "epoch": 0.87, "learning_rate": 0.00024198322098860142, "loss": 1.6202, "step": 11052 }, { "epoch": 0.87, "learning_rate": 0.000241973457600315, "loss": 1.6055, "step": 11053 }, { "epoch": 0.87, "learning_rate": 0.00024196369358757956, "loss": 1.5777, "step": 11054 }, { "epoch": 0.87, "learning_rate": 0.00024195392895046141, "loss": 1.6325, "step": 11055 }, { "epoch": 0.87, "learning_rate": 0.0002419441636890268, "loss": 1.5823, "step": 11056 }, { "epoch": 0.87, "learning_rate": 0.00024193439780334207, "loss": 1.6212, "step": 11057 }, { "epoch": 0.87, "learning_rate": 0.0002419246312934735, "loss": 1.6108, "step": 11058 }, { "epoch": 0.87, "learning_rate": 0.00024191486415948743, "loss": 1.5527, "step": 11059 }, { "epoch": 0.87, "learning_rate": 0.00024190509640145013, "loss": 1.633, "step": 11060 }, { "epoch": 0.87, "learning_rate": 0.00024189532801942795, "loss": 1.6111, "step": 11061 }, { "epoch": 0.87, "learning_rate": 0.00024188555901348717, "loss": 1.6389, "step": 11062 }, { "epoch": 0.87, "learning_rate": 0.00024187578938369422, "loss": 1.5961, "step": 11063 }, { "epoch": 0.87, "learning_rate": 0.00024186601913011533, "loss": 1.6371, "step": 11064 }, { "epoch": 0.87, "learning_rate": 0.00024185624825281686, "loss": 1.6363, "step": 11065 }, { "epoch": 0.87, "learning_rate": 0.00024184647675186521, "loss": 1.6277, "step": 11066 }, { "epoch": 0.87, "learning_rate": 0.0002418367046273266, "loss": 1.6119, "step": 11067 }, { "epoch": 0.87, "learning_rate": 0.00024182693187926746, "loss": 1.5937, "step": 11068 }, { "epoch": 0.87, "learning_rate": 0.00024181715850775417, "loss": 1.616, "step": 11069 }, { "epoch": 0.87, "learning_rate": 0.00024180738451285295, "loss": 1.6139, "step": 11070 }, { "epoch": 0.87, "learning_rate": 0.00024179760989463035, "loss": 1.6296, "step": 11071 }, { "epoch": 0.87, "learning_rate": 0.00024178783465315256, "loss": 1.6283, "step": 11072 }, { "epoch": 0.87, "learning_rate": 0.0002417780587884861, "loss": 1.5892, "step": 11073 }, { "epoch": 0.87, "learning_rate": 0.00024176828230069723, "loss": 1.5874, "step": 11074 }, { "epoch": 0.87, "learning_rate": 0.00024175850518985234, "loss": 1.612, "step": 11075 }, { "epoch": 0.87, "learning_rate": 0.00024174872745601789, "loss": 1.5765, "step": 11076 }, { "epoch": 0.87, "learning_rate": 0.00024173894909926017, "loss": 1.6183, "step": 11077 }, { "epoch": 0.87, "learning_rate": 0.00024172917011964563, "loss": 1.6212, "step": 11078 }, { "epoch": 0.87, "learning_rate": 0.0002417193905172406, "loss": 1.669, "step": 11079 }, { "epoch": 0.87, "learning_rate": 0.00024170961029211158, "loss": 1.6459, "step": 11080 }, { "epoch": 0.87, "learning_rate": 0.0002416998294443249, "loss": 1.634, "step": 11081 }, { "epoch": 0.87, "learning_rate": 0.00024169004797394702, "loss": 1.658, "step": 11082 }, { "epoch": 0.87, "learning_rate": 0.00024168026588104426, "loss": 1.6377, "step": 11083 }, { "epoch": 0.87, "learning_rate": 0.00024167048316568306, "loss": 1.6101, "step": 11084 }, { "epoch": 0.87, "learning_rate": 0.00024166069982792994, "loss": 1.5828, "step": 11085 }, { "epoch": 0.87, "learning_rate": 0.00024165091586785122, "loss": 1.6031, "step": 11086 }, { "epoch": 0.87, "learning_rate": 0.00024164113128551334, "loss": 1.5942, "step": 11087 }, { "epoch": 0.87, "learning_rate": 0.00024163134608098276, "loss": 1.6409, "step": 11088 }, { "epoch": 0.87, "learning_rate": 0.00024162156025432595, "loss": 1.629, "step": 11089 }, { "epoch": 0.87, "learning_rate": 0.00024161177380560927, "loss": 1.6838, "step": 11090 }, { "epoch": 0.87, "learning_rate": 0.0002416019867348992, "loss": 1.6122, "step": 11091 }, { "epoch": 0.87, "learning_rate": 0.00024159219904226216, "loss": 1.6247, "step": 11092 }, { "epoch": 0.87, "learning_rate": 0.00024158241072776468, "loss": 1.6191, "step": 11093 }, { "epoch": 0.87, "learning_rate": 0.00024157262179147314, "loss": 1.6421, "step": 11094 }, { "epoch": 0.87, "learning_rate": 0.0002415628322334541, "loss": 1.6294, "step": 11095 }, { "epoch": 0.87, "learning_rate": 0.0002415530420537739, "loss": 1.6342, "step": 11096 }, { "epoch": 0.87, "learning_rate": 0.00024154325125249905, "loss": 1.5836, "step": 11097 }, { "epoch": 0.87, "learning_rate": 0.0002415334598296961, "loss": 1.5217, "step": 11098 }, { "epoch": 0.87, "learning_rate": 0.0002415236677854314, "loss": 1.5885, "step": 11099 }, { "epoch": 0.87, "learning_rate": 0.00024151387511977157, "loss": 1.6705, "step": 11100 }, { "epoch": 0.87, "learning_rate": 0.00024150408183278298, "loss": 1.6544, "step": 11101 }, { "epoch": 0.87, "learning_rate": 0.0002414942879245322, "loss": 1.5796, "step": 11102 }, { "epoch": 0.87, "learning_rate": 0.00024148449339508565, "loss": 1.6512, "step": 11103 }, { "epoch": 0.87, "learning_rate": 0.00024147469824450994, "loss": 1.5832, "step": 11104 }, { "epoch": 0.87, "learning_rate": 0.0002414649024728715, "loss": 1.5627, "step": 11105 }, { "epoch": 0.87, "learning_rate": 0.00024145510608023678, "loss": 1.6442, "step": 11106 }, { "epoch": 0.87, "learning_rate": 0.00024144530906667245, "loss": 1.5958, "step": 11107 }, { "epoch": 0.87, "learning_rate": 0.00024143551143224486, "loss": 1.6585, "step": 11108 }, { "epoch": 0.87, "learning_rate": 0.00024142571317702064, "loss": 1.6667, "step": 11109 }, { "epoch": 0.87, "learning_rate": 0.00024141591430106626, "loss": 1.5954, "step": 11110 }, { "epoch": 0.87, "learning_rate": 0.00024140611480444828, "loss": 1.5957, "step": 11111 }, { "epoch": 0.87, "learning_rate": 0.00024139631468723325, "loss": 1.5929, "step": 11112 }, { "epoch": 0.87, "learning_rate": 0.00024138651394948766, "loss": 1.5659, "step": 11113 }, { "epoch": 0.87, "learning_rate": 0.00024137671259127807, "loss": 1.6026, "step": 11114 }, { "epoch": 0.87, "learning_rate": 0.000241366910612671, "loss": 1.637, "step": 11115 }, { "epoch": 0.87, "learning_rate": 0.00024135710801373304, "loss": 1.6419, "step": 11116 }, { "epoch": 0.87, "learning_rate": 0.00024134730479453078, "loss": 1.6255, "step": 11117 }, { "epoch": 0.87, "learning_rate": 0.00024133750095513067, "loss": 1.6021, "step": 11118 }, { "epoch": 0.87, "learning_rate": 0.0002413276964955994, "loss": 1.6005, "step": 11119 }, { "epoch": 0.87, "learning_rate": 0.0002413178914160034, "loss": 1.609, "step": 11120 }, { "epoch": 0.88, "learning_rate": 0.00024130808571640934, "loss": 1.6062, "step": 11121 }, { "epoch": 0.88, "learning_rate": 0.00024129827939688375, "loss": 1.6143, "step": 11122 }, { "epoch": 0.88, "learning_rate": 0.00024128847245749322, "loss": 1.5732, "step": 11123 }, { "epoch": 0.88, "learning_rate": 0.00024127866489830437, "loss": 1.5496, "step": 11124 }, { "epoch": 0.88, "learning_rate": 0.00024126885671938377, "loss": 1.6169, "step": 11125 }, { "epoch": 0.88, "learning_rate": 0.000241259047920798, "loss": 1.6087, "step": 11126 }, { "epoch": 0.88, "learning_rate": 0.0002412492385026136, "loss": 1.6081, "step": 11127 }, { "epoch": 0.88, "learning_rate": 0.00024123942846489727, "loss": 1.5741, "step": 11128 }, { "epoch": 0.88, "learning_rate": 0.00024122961780771558, "loss": 1.5678, "step": 11129 }, { "epoch": 0.88, "learning_rate": 0.00024121980653113507, "loss": 1.6017, "step": 11130 }, { "epoch": 0.88, "learning_rate": 0.00024120999463522242, "loss": 1.6645, "step": 11131 }, { "epoch": 0.88, "learning_rate": 0.00024120018212004431, "loss": 1.6178, "step": 11132 }, { "epoch": 0.88, "learning_rate": 0.0002411903689856672, "loss": 1.6119, "step": 11133 }, { "epoch": 0.88, "learning_rate": 0.0002411805552321579, "loss": 1.5741, "step": 11134 }, { "epoch": 0.88, "learning_rate": 0.0002411707408595829, "loss": 1.574, "step": 11135 }, { "epoch": 0.88, "learning_rate": 0.00024116092586800892, "loss": 1.6379, "step": 11136 }, { "epoch": 0.88, "learning_rate": 0.00024115111025750253, "loss": 1.5832, "step": 11137 }, { "epoch": 0.88, "learning_rate": 0.00024114129402813038, "loss": 1.6383, "step": 11138 }, { "epoch": 0.88, "learning_rate": 0.00024113147717995915, "loss": 1.6275, "step": 11139 }, { "epoch": 0.88, "learning_rate": 0.0002411216597130555, "loss": 1.6401, "step": 11140 }, { "epoch": 0.88, "learning_rate": 0.00024111184162748604, "loss": 1.6499, "step": 11141 }, { "epoch": 0.88, "learning_rate": 0.0002411020229233175, "loss": 1.5724, "step": 11142 }, { "epoch": 0.88, "learning_rate": 0.00024109220360061644, "loss": 1.5918, "step": 11143 }, { "epoch": 0.88, "learning_rate": 0.00024108238365944964, "loss": 1.5522, "step": 11144 }, { "epoch": 0.88, "learning_rate": 0.0002410725630998837, "loss": 1.5375, "step": 11145 }, { "epoch": 0.88, "learning_rate": 0.00024106274192198533, "loss": 1.6458, "step": 11146 }, { "epoch": 0.88, "learning_rate": 0.00024105292012582117, "loss": 1.5791, "step": 11147 }, { "epoch": 0.88, "learning_rate": 0.00024104309771145793, "loss": 1.5612, "step": 11148 }, { "epoch": 0.88, "learning_rate": 0.00024103327467896228, "loss": 1.6115, "step": 11149 }, { "epoch": 0.88, "learning_rate": 0.00024102345102840095, "loss": 1.6747, "step": 11150 }, { "epoch": 0.88, "learning_rate": 0.00024101362675984066, "loss": 1.6345, "step": 11151 }, { "epoch": 0.88, "learning_rate": 0.00024100380187334802, "loss": 1.5654, "step": 11152 }, { "epoch": 0.88, "learning_rate": 0.00024099397636898978, "loss": 1.6005, "step": 11153 }, { "epoch": 0.88, "learning_rate": 0.00024098415024683268, "loss": 1.5749, "step": 11154 }, { "epoch": 0.88, "learning_rate": 0.0002409743235069434, "loss": 1.5834, "step": 11155 }, { "epoch": 0.88, "learning_rate": 0.0002409644961493887, "loss": 1.6048, "step": 11156 }, { "epoch": 0.88, "learning_rate": 0.0002409546681742352, "loss": 1.6022, "step": 11157 }, { "epoch": 0.88, "learning_rate": 0.00024094483958154973, "loss": 1.6187, "step": 11158 }, { "epoch": 0.88, "learning_rate": 0.000240935010371399, "loss": 1.5612, "step": 11159 }, { "epoch": 0.88, "learning_rate": 0.00024092518054384972, "loss": 1.577, "step": 11160 }, { "epoch": 0.88, "learning_rate": 0.00024091535009896866, "loss": 1.6369, "step": 11161 }, { "epoch": 0.88, "learning_rate": 0.00024090551903682253, "loss": 1.5824, "step": 11162 }, { "epoch": 0.88, "learning_rate": 0.00024089568735747807, "loss": 1.6228, "step": 11163 }, { "epoch": 0.88, "learning_rate": 0.00024088585506100207, "loss": 1.6131, "step": 11164 }, { "epoch": 0.88, "learning_rate": 0.00024087602214746128, "loss": 1.634, "step": 11165 }, { "epoch": 0.88, "learning_rate": 0.0002408661886169224, "loss": 1.6416, "step": 11166 }, { "epoch": 0.88, "learning_rate": 0.00024085635446945234, "loss": 1.6045, "step": 11167 }, { "epoch": 0.88, "learning_rate": 0.00024084651970511772, "loss": 1.6165, "step": 11168 }, { "epoch": 0.88, "learning_rate": 0.00024083668432398536, "loss": 1.5882, "step": 11169 }, { "epoch": 0.88, "learning_rate": 0.00024082684832612202, "loss": 1.6203, "step": 11170 }, { "epoch": 0.88, "learning_rate": 0.0002408170117115945, "loss": 1.6181, "step": 11171 }, { "epoch": 0.88, "learning_rate": 0.00024080717448046962, "loss": 1.6201, "step": 11172 }, { "epoch": 0.88, "learning_rate": 0.00024079733663281413, "loss": 1.6258, "step": 11173 }, { "epoch": 0.88, "learning_rate": 0.00024078749816869484, "loss": 1.6196, "step": 11174 }, { "epoch": 0.88, "learning_rate": 0.00024077765908817853, "loss": 1.6341, "step": 11175 }, { "epoch": 0.88, "learning_rate": 0.00024076781939133201, "loss": 1.6723, "step": 11176 }, { "epoch": 0.88, "learning_rate": 0.0002407579790782221, "loss": 1.6355, "step": 11177 }, { "epoch": 0.88, "learning_rate": 0.00024074813814891556, "loss": 1.6496, "step": 11178 }, { "epoch": 0.88, "learning_rate": 0.00024073829660347927, "loss": 1.6015, "step": 11179 }, { "epoch": 0.88, "learning_rate": 0.00024072845444198, "loss": 1.6202, "step": 11180 }, { "epoch": 0.88, "learning_rate": 0.00024071861166448464, "loss": 1.6076, "step": 11181 }, { "epoch": 0.88, "learning_rate": 0.00024070876827105987, "loss": 1.6017, "step": 11182 }, { "epoch": 0.88, "learning_rate": 0.0002406989242617727, "loss": 1.5539, "step": 11183 }, { "epoch": 0.88, "learning_rate": 0.0002406890796366899, "loss": 1.5802, "step": 11184 }, { "epoch": 0.88, "learning_rate": 0.00024067923439587824, "loss": 1.6066, "step": 11185 }, { "epoch": 0.88, "learning_rate": 0.00024066938853940464, "loss": 1.6228, "step": 11186 }, { "epoch": 0.88, "learning_rate": 0.00024065954206733592, "loss": 1.5727, "step": 11187 }, { "epoch": 0.88, "learning_rate": 0.00024064969497973894, "loss": 1.6016, "step": 11188 }, { "epoch": 0.88, "learning_rate": 0.0002406398472766806, "loss": 1.6232, "step": 11189 }, { "epoch": 0.88, "learning_rate": 0.00024062999895822765, "loss": 1.5939, "step": 11190 }, { "epoch": 0.88, "learning_rate": 0.00024062015002444709, "loss": 1.6172, "step": 11191 }, { "epoch": 0.88, "learning_rate": 0.0002406103004754057, "loss": 1.5981, "step": 11192 }, { "epoch": 0.88, "learning_rate": 0.00024060045031117034, "loss": 1.6426, "step": 11193 }, { "epoch": 0.88, "learning_rate": 0.00024059059953180793, "loss": 1.5578, "step": 11194 }, { "epoch": 0.88, "learning_rate": 0.00024058074813738533, "loss": 1.6006, "step": 11195 }, { "epoch": 0.88, "learning_rate": 0.00024057089612796945, "loss": 1.6082, "step": 11196 }, { "epoch": 0.88, "learning_rate": 0.00024056104350362716, "loss": 1.6283, "step": 11197 }, { "epoch": 0.88, "learning_rate": 0.00024055119026442543, "loss": 1.605, "step": 11198 }, { "epoch": 0.88, "learning_rate": 0.000240541336410431, "loss": 1.6037, "step": 11199 }, { "epoch": 0.88, "learning_rate": 0.00024053148194171087, "loss": 1.5952, "step": 11200 }, { "epoch": 0.88, "learning_rate": 0.00024052162685833198, "loss": 1.6169, "step": 11201 }, { "epoch": 0.88, "learning_rate": 0.00024051177116036116, "loss": 1.5987, "step": 11202 }, { "epoch": 0.88, "learning_rate": 0.00024050191484786538, "loss": 1.6703, "step": 11203 }, { "epoch": 0.88, "learning_rate": 0.00024049205792091156, "loss": 1.565, "step": 11204 }, { "epoch": 0.88, "learning_rate": 0.00024048220037956657, "loss": 1.6087, "step": 11205 }, { "epoch": 0.88, "learning_rate": 0.00024047234222389737, "loss": 1.5867, "step": 11206 }, { "epoch": 0.88, "learning_rate": 0.0002404624834539709, "loss": 1.618, "step": 11207 }, { "epoch": 0.88, "learning_rate": 0.0002404526240698541, "loss": 1.559, "step": 11208 }, { "epoch": 0.88, "learning_rate": 0.0002404427640716139, "loss": 1.5937, "step": 11209 }, { "epoch": 0.88, "learning_rate": 0.00024043290345931724, "loss": 1.6289, "step": 11210 }, { "epoch": 0.88, "learning_rate": 0.00024042304223303104, "loss": 1.5809, "step": 11211 }, { "epoch": 0.88, "learning_rate": 0.00024041318039282232, "loss": 1.5888, "step": 11212 }, { "epoch": 0.88, "learning_rate": 0.00024040331793875799, "loss": 1.5769, "step": 11213 }, { "epoch": 0.88, "learning_rate": 0.00024039345487090504, "loss": 1.6093, "step": 11214 }, { "epoch": 0.88, "learning_rate": 0.0002403835911893304, "loss": 1.6149, "step": 11215 }, { "epoch": 0.88, "learning_rate": 0.000240373726894101, "loss": 1.5835, "step": 11216 }, { "epoch": 0.88, "learning_rate": 0.00024036386198528393, "loss": 1.612, "step": 11217 }, { "epoch": 0.88, "learning_rate": 0.00024035399646294607, "loss": 1.5382, "step": 11218 }, { "epoch": 0.88, "learning_rate": 0.00024034413032715445, "loss": 1.601, "step": 11219 }, { "epoch": 0.88, "learning_rate": 0.0002403342635779761, "loss": 1.6222, "step": 11220 }, { "epoch": 0.88, "learning_rate": 0.00024032439621547786, "loss": 1.5884, "step": 11221 }, { "epoch": 0.88, "learning_rate": 0.00024031452823972685, "loss": 1.5299, "step": 11222 }, { "epoch": 0.88, "learning_rate": 0.00024030465965079004, "loss": 1.6656, "step": 11223 }, { "epoch": 0.88, "learning_rate": 0.0002402947904487344, "loss": 1.5758, "step": 11224 }, { "epoch": 0.88, "learning_rate": 0.00024028492063362698, "loss": 1.6135, "step": 11225 }, { "epoch": 0.88, "learning_rate": 0.0002402750502055348, "loss": 1.5665, "step": 11226 }, { "epoch": 0.88, "learning_rate": 0.0002402651791645248, "loss": 1.6702, "step": 11227 }, { "epoch": 0.88, "learning_rate": 0.00024025530751066405, "loss": 1.6292, "step": 11228 }, { "epoch": 0.88, "learning_rate": 0.00024024543524401963, "loss": 1.5687, "step": 11229 }, { "epoch": 0.88, "learning_rate": 0.00024023556236465844, "loss": 1.6109, "step": 11230 }, { "epoch": 0.88, "learning_rate": 0.0002402256888726476, "loss": 1.6124, "step": 11231 }, { "epoch": 0.88, "learning_rate": 0.00024021581476805408, "loss": 1.5829, "step": 11232 }, { "epoch": 0.88, "learning_rate": 0.00024020594005094503, "loss": 1.6157, "step": 11233 }, { "epoch": 0.88, "learning_rate": 0.0002401960647213874, "loss": 1.6545, "step": 11234 }, { "epoch": 0.88, "learning_rate": 0.0002401861887794483, "loss": 1.6087, "step": 11235 }, { "epoch": 0.88, "learning_rate": 0.00024017631222519469, "loss": 1.6269, "step": 11236 }, { "epoch": 0.88, "learning_rate": 0.00024016643505869368, "loss": 1.6178, "step": 11237 }, { "epoch": 0.88, "learning_rate": 0.00024015655728001236, "loss": 1.6249, "step": 11238 }, { "epoch": 0.88, "learning_rate": 0.0002401466788892178, "loss": 1.647, "step": 11239 }, { "epoch": 0.88, "learning_rate": 0.00024013679988637703, "loss": 1.622, "step": 11240 }, { "epoch": 0.88, "learning_rate": 0.00024012692027155705, "loss": 1.5836, "step": 11241 }, { "epoch": 0.88, "learning_rate": 0.00024011704004482507, "loss": 1.5313, "step": 11242 }, { "epoch": 0.88, "learning_rate": 0.00024010715920624816, "loss": 1.607, "step": 11243 }, { "epoch": 0.88, "learning_rate": 0.0002400972777558933, "loss": 1.6103, "step": 11244 }, { "epoch": 0.88, "learning_rate": 0.00024008739569382766, "loss": 1.6137, "step": 11245 }, { "epoch": 0.88, "learning_rate": 0.00024007751302011836, "loss": 1.6107, "step": 11246 }, { "epoch": 0.88, "learning_rate": 0.0002400676297348324, "loss": 1.636, "step": 11247 }, { "epoch": 0.89, "learning_rate": 0.00024005774583803696, "loss": 1.6596, "step": 11248 }, { "epoch": 0.89, "learning_rate": 0.0002400478613297991, "loss": 1.631, "step": 11249 }, { "epoch": 0.89, "learning_rate": 0.00024003797621018598, "loss": 1.6387, "step": 11250 }, { "epoch": 0.89, "learning_rate": 0.00024002809047926472, "loss": 1.6506, "step": 11251 }, { "epoch": 0.89, "learning_rate": 0.00024001820413710237, "loss": 1.6187, "step": 11252 }, { "epoch": 0.89, "learning_rate": 0.0002400083171837661, "loss": 1.6068, "step": 11253 }, { "epoch": 0.89, "learning_rate": 0.00023999842961932303, "loss": 1.61, "step": 11254 }, { "epoch": 0.89, "learning_rate": 0.00023998854144384026, "loss": 1.5818, "step": 11255 }, { "epoch": 0.89, "learning_rate": 0.000239978652657385, "loss": 1.5759, "step": 11256 }, { "epoch": 0.89, "learning_rate": 0.0002399687632600243, "loss": 1.5945, "step": 11257 }, { "epoch": 0.89, "learning_rate": 0.00023995887325182537, "loss": 1.6797, "step": 11258 }, { "epoch": 0.89, "learning_rate": 0.00023994898263285535, "loss": 1.5869, "step": 11259 }, { "epoch": 0.89, "learning_rate": 0.00023993909140318132, "loss": 1.5934, "step": 11260 }, { "epoch": 0.89, "learning_rate": 0.00023992919956287051, "loss": 1.6329, "step": 11261 }, { "epoch": 0.89, "learning_rate": 0.0002399193071119901, "loss": 1.5595, "step": 11262 }, { "epoch": 0.89, "learning_rate": 0.0002399094140506072, "loss": 1.6069, "step": 11263 }, { "epoch": 0.89, "learning_rate": 0.00023989952037878898, "loss": 1.6138, "step": 11264 }, { "epoch": 0.89, "learning_rate": 0.00023988962609660262, "loss": 1.6082, "step": 11265 }, { "epoch": 0.89, "learning_rate": 0.00023987973120411532, "loss": 1.6145, "step": 11266 }, { "epoch": 0.89, "learning_rate": 0.0002398698357013942, "loss": 1.6266, "step": 11267 }, { "epoch": 0.89, "learning_rate": 0.00023985993958850656, "loss": 1.6292, "step": 11268 }, { "epoch": 0.89, "learning_rate": 0.0002398500428655195, "loss": 1.5959, "step": 11269 }, { "epoch": 0.89, "learning_rate": 0.00023984014553250026, "loss": 1.5823, "step": 11270 }, { "epoch": 0.89, "learning_rate": 0.00023983024758951596, "loss": 1.6635, "step": 11271 }, { "epoch": 0.89, "learning_rate": 0.00023982034903663387, "loss": 1.5589, "step": 11272 }, { "epoch": 0.89, "learning_rate": 0.00023981044987392112, "loss": 1.5891, "step": 11273 }, { "epoch": 0.89, "learning_rate": 0.00023980055010144508, "loss": 1.5997, "step": 11274 }, { "epoch": 0.89, "learning_rate": 0.0002397906497192728, "loss": 1.6442, "step": 11275 }, { "epoch": 0.89, "learning_rate": 0.00023978074872747158, "loss": 1.625, "step": 11276 }, { "epoch": 0.89, "learning_rate": 0.00023977084712610862, "loss": 1.6188, "step": 11277 }, { "epoch": 0.89, "learning_rate": 0.00023976094491525113, "loss": 1.5332, "step": 11278 }, { "epoch": 0.89, "learning_rate": 0.00023975104209496634, "loss": 1.6206, "step": 11279 }, { "epoch": 0.89, "learning_rate": 0.00023974113866532154, "loss": 1.5756, "step": 11280 }, { "epoch": 0.89, "learning_rate": 0.00023973123462638389, "loss": 1.6257, "step": 11281 }, { "epoch": 0.89, "learning_rate": 0.00023972132997822072, "loss": 1.567, "step": 11282 }, { "epoch": 0.89, "learning_rate": 0.00023971142472089922, "loss": 1.6107, "step": 11283 }, { "epoch": 0.89, "learning_rate": 0.00023970151885448668, "loss": 1.6339, "step": 11284 }, { "epoch": 0.89, "learning_rate": 0.0002396916123790503, "loss": 1.6176, "step": 11285 }, { "epoch": 0.89, "learning_rate": 0.00023968170529465734, "loss": 1.6626, "step": 11286 }, { "epoch": 0.89, "learning_rate": 0.0002396717976013751, "loss": 1.59, "step": 11287 }, { "epoch": 0.89, "learning_rate": 0.00023966188929927087, "loss": 1.6095, "step": 11288 }, { "epoch": 0.89, "learning_rate": 0.00023965198038841188, "loss": 1.624, "step": 11289 }, { "epoch": 0.89, "learning_rate": 0.00023964207086886542, "loss": 1.5775, "step": 11290 }, { "epoch": 0.89, "learning_rate": 0.00023963216074069876, "loss": 1.6203, "step": 11291 }, { "epoch": 0.89, "learning_rate": 0.0002396222500039792, "loss": 1.6078, "step": 11292 }, { "epoch": 0.89, "learning_rate": 0.000239612338658774, "loss": 1.576, "step": 11293 }, { "epoch": 0.89, "learning_rate": 0.0002396024267051505, "loss": 1.5565, "step": 11294 }, { "epoch": 0.89, "learning_rate": 0.00023959251414317596, "loss": 1.5867, "step": 11295 }, { "epoch": 0.89, "learning_rate": 0.00023958260097291768, "loss": 1.607, "step": 11296 }, { "epoch": 0.89, "learning_rate": 0.000239572687194443, "loss": 1.5743, "step": 11297 }, { "epoch": 0.89, "learning_rate": 0.0002395627728078192, "loss": 1.6087, "step": 11298 }, { "epoch": 0.89, "learning_rate": 0.00023955285781311356, "loss": 1.5946, "step": 11299 }, { "epoch": 0.89, "learning_rate": 0.00023954294221039342, "loss": 1.5776, "step": 11300 }, { "epoch": 0.89, "learning_rate": 0.00023953302599972616, "loss": 1.6585, "step": 11301 }, { "epoch": 0.89, "learning_rate": 0.0002395231091811791, "loss": 1.5594, "step": 11302 }, { "epoch": 0.89, "learning_rate": 0.0002395131917548195, "loss": 1.5933, "step": 11303 }, { "epoch": 0.89, "learning_rate": 0.0002395032737207147, "loss": 1.6031, "step": 11304 }, { "epoch": 0.89, "learning_rate": 0.00023949335507893207, "loss": 1.6679, "step": 11305 }, { "epoch": 0.89, "learning_rate": 0.00023948343582953893, "loss": 1.5418, "step": 11306 }, { "epoch": 0.89, "learning_rate": 0.00023947351597260267, "loss": 1.5369, "step": 11307 }, { "epoch": 0.89, "learning_rate": 0.00023946359550819062, "loss": 1.6042, "step": 11308 }, { "epoch": 0.89, "learning_rate": 0.00023945367443637013, "loss": 1.6443, "step": 11309 }, { "epoch": 0.89, "learning_rate": 0.00023944375275720853, "loss": 1.5994, "step": 11310 }, { "epoch": 0.89, "learning_rate": 0.00023943383047077323, "loss": 1.6244, "step": 11311 }, { "epoch": 0.89, "learning_rate": 0.00023942390757713153, "loss": 1.6, "step": 11312 }, { "epoch": 0.89, "learning_rate": 0.00023941398407635088, "loss": 1.6228, "step": 11313 }, { "epoch": 0.89, "learning_rate": 0.00023940405996849862, "loss": 1.6429, "step": 11314 }, { "epoch": 0.89, "learning_rate": 0.00023939413525364214, "loss": 1.6167, "step": 11315 }, { "epoch": 0.89, "learning_rate": 0.0002393842099318488, "loss": 1.5846, "step": 11316 }, { "epoch": 0.89, "learning_rate": 0.000239374284003186, "loss": 1.5714, "step": 11317 }, { "epoch": 0.89, "learning_rate": 0.00023936435746772113, "loss": 1.6067, "step": 11318 }, { "epoch": 0.89, "learning_rate": 0.0002393544303255216, "loss": 1.6121, "step": 11319 }, { "epoch": 0.89, "learning_rate": 0.00023934450257665478, "loss": 1.5986, "step": 11320 }, { "epoch": 0.89, "learning_rate": 0.00023933457422118808, "loss": 1.6232, "step": 11321 }, { "epoch": 0.89, "learning_rate": 0.00023932464525918898, "loss": 1.6356, "step": 11322 }, { "epoch": 0.89, "learning_rate": 0.00023931471569072478, "loss": 1.5961, "step": 11323 }, { "epoch": 0.89, "learning_rate": 0.000239304785515863, "loss": 1.6255, "step": 11324 }, { "epoch": 0.89, "learning_rate": 0.00023929485473467093, "loss": 1.6289, "step": 11325 }, { "epoch": 0.89, "learning_rate": 0.0002392849233472161, "loss": 1.6528, "step": 11326 }, { "epoch": 0.89, "learning_rate": 0.00023927499135356593, "loss": 1.6195, "step": 11327 }, { "epoch": 0.89, "learning_rate": 0.00023926505875378787, "loss": 1.6592, "step": 11328 }, { "epoch": 0.89, "learning_rate": 0.00023925512554794927, "loss": 1.6012, "step": 11329 }, { "epoch": 0.89, "learning_rate": 0.00023924519173611761, "loss": 1.568, "step": 11330 }, { "epoch": 0.89, "learning_rate": 0.0002392352573183604, "loss": 1.6183, "step": 11331 }, { "epoch": 0.89, "learning_rate": 0.000239225322294745, "loss": 1.6011, "step": 11332 }, { "epoch": 0.89, "learning_rate": 0.0002392153866653389, "loss": 1.5986, "step": 11333 }, { "epoch": 0.89, "learning_rate": 0.00023920545043020958, "loss": 1.5718, "step": 11334 }, { "epoch": 0.89, "learning_rate": 0.0002391955135894245, "loss": 1.6246, "step": 11335 }, { "epoch": 0.89, "learning_rate": 0.00023918557614305104, "loss": 1.6241, "step": 11336 }, { "epoch": 0.89, "learning_rate": 0.00023917563809115676, "loss": 1.5754, "step": 11337 }, { "epoch": 0.89, "learning_rate": 0.00023916569943380913, "loss": 1.5849, "step": 11338 }, { "epoch": 0.89, "learning_rate": 0.0002391557601710756, "loss": 1.5969, "step": 11339 }, { "epoch": 0.89, "learning_rate": 0.00023914582030302363, "loss": 1.5802, "step": 11340 }, { "epoch": 0.89, "learning_rate": 0.00023913587982972076, "loss": 1.6619, "step": 11341 }, { "epoch": 0.89, "learning_rate": 0.00023912593875123446, "loss": 1.6128, "step": 11342 }, { "epoch": 0.89, "learning_rate": 0.00023911599706763224, "loss": 1.6128, "step": 11343 }, { "epoch": 0.89, "learning_rate": 0.0002391060547789815, "loss": 1.5779, "step": 11344 }, { "epoch": 0.89, "learning_rate": 0.0002390961118853499, "loss": 1.6012, "step": 11345 }, { "epoch": 0.89, "learning_rate": 0.00023908616838680483, "loss": 1.58, "step": 11346 }, { "epoch": 0.89, "learning_rate": 0.00023907622428341385, "loss": 1.6072, "step": 11347 }, { "epoch": 0.89, "learning_rate": 0.00023906627957524446, "loss": 1.5984, "step": 11348 }, { "epoch": 0.89, "learning_rate": 0.0002390563342623642, "loss": 1.6394, "step": 11349 }, { "epoch": 0.89, "learning_rate": 0.00023904638834484055, "loss": 1.5807, "step": 11350 }, { "epoch": 0.89, "learning_rate": 0.00023903644182274105, "loss": 1.59, "step": 11351 }, { "epoch": 0.89, "learning_rate": 0.00023902649469613327, "loss": 1.6012, "step": 11352 }, { "epoch": 0.89, "learning_rate": 0.0002390165469650847, "loss": 1.6341, "step": 11353 }, { "epoch": 0.89, "learning_rate": 0.00023900659862966292, "loss": 1.5974, "step": 11354 }, { "epoch": 0.89, "learning_rate": 0.00023899664968993545, "loss": 1.6587, "step": 11355 }, { "epoch": 0.89, "learning_rate": 0.00023898670014596985, "loss": 1.6249, "step": 11356 }, { "epoch": 0.89, "learning_rate": 0.00023897674999783365, "loss": 1.574, "step": 11357 }, { "epoch": 0.89, "learning_rate": 0.00023896679924559442, "loss": 1.6153, "step": 11358 }, { "epoch": 0.89, "learning_rate": 0.0002389568478893197, "loss": 1.595, "step": 11359 }, { "epoch": 0.89, "learning_rate": 0.00023894689592907707, "loss": 1.6091, "step": 11360 }, { "epoch": 0.89, "learning_rate": 0.00023893694336493416, "loss": 1.646, "step": 11361 }, { "epoch": 0.89, "learning_rate": 0.00023892699019695845, "loss": 1.5539, "step": 11362 }, { "epoch": 0.89, "learning_rate": 0.00023891703642521753, "loss": 1.5854, "step": 11363 }, { "epoch": 0.89, "learning_rate": 0.00023890708204977903, "loss": 1.6038, "step": 11364 }, { "epoch": 0.89, "learning_rate": 0.00023889712707071052, "loss": 1.538, "step": 11365 }, { "epoch": 0.89, "learning_rate": 0.00023888717148807956, "loss": 1.5985, "step": 11366 }, { "epoch": 0.89, "learning_rate": 0.0002388772153019537, "loss": 1.6071, "step": 11367 }, { "epoch": 0.89, "learning_rate": 0.00023886725851240064, "loss": 1.6156, "step": 11368 }, { "epoch": 0.89, "learning_rate": 0.00023885730111948797, "loss": 1.6079, "step": 11369 }, { "epoch": 0.89, "learning_rate": 0.00023884734312328322, "loss": 1.5805, "step": 11370 }, { "epoch": 0.89, "learning_rate": 0.00023883738452385405, "loss": 1.5816, "step": 11371 }, { "epoch": 0.89, "learning_rate": 0.00023882742532126808, "loss": 1.5992, "step": 11372 }, { "epoch": 0.89, "learning_rate": 0.00023881746551559287, "loss": 1.5749, "step": 11373 }, { "epoch": 0.89, "learning_rate": 0.00023880750510689612, "loss": 1.621, "step": 11374 }, { "epoch": 0.89, "learning_rate": 0.00023879754409524535, "loss": 1.6244, "step": 11375 }, { "epoch": 0.9, "learning_rate": 0.00023878758248070838, "loss": 1.5995, "step": 11376 }, { "epoch": 0.9, "learning_rate": 0.00023877762026335266, "loss": 1.6238, "step": 11377 }, { "epoch": 0.9, "learning_rate": 0.0002387676574432459, "loss": 1.6344, "step": 11378 }, { "epoch": 0.9, "learning_rate": 0.0002387576940204557, "loss": 1.578, "step": 11379 }, { "epoch": 0.9, "learning_rate": 0.00023874772999504972, "loss": 1.6303, "step": 11380 }, { "epoch": 0.9, "learning_rate": 0.00023873776536709567, "loss": 1.5849, "step": 11381 }, { "epoch": 0.9, "learning_rate": 0.00023872780013666118, "loss": 1.6229, "step": 11382 }, { "epoch": 0.9, "learning_rate": 0.00023871783430381386, "loss": 1.5879, "step": 11383 }, { "epoch": 0.9, "learning_rate": 0.00023870786786862143, "loss": 1.5597, "step": 11384 }, { "epoch": 0.9, "learning_rate": 0.00023869790083115146, "loss": 1.5984, "step": 11385 }, { "epoch": 0.9, "learning_rate": 0.00023868793319147176, "loss": 1.5796, "step": 11386 }, { "epoch": 0.9, "learning_rate": 0.00023867796494964993, "loss": 1.5724, "step": 11387 }, { "epoch": 0.9, "learning_rate": 0.00023866799610575368, "loss": 1.6178, "step": 11388 }, { "epoch": 0.9, "learning_rate": 0.0002386580266598506, "loss": 1.5786, "step": 11389 }, { "epoch": 0.9, "learning_rate": 0.00023864805661200848, "loss": 1.6317, "step": 11390 }, { "epoch": 0.9, "learning_rate": 0.00023863808596229495, "loss": 1.6439, "step": 11391 }, { "epoch": 0.9, "learning_rate": 0.00023862811471077775, "loss": 1.5945, "step": 11392 }, { "epoch": 0.9, "learning_rate": 0.00023861814285752454, "loss": 1.6104, "step": 11393 }, { "epoch": 0.9, "learning_rate": 0.0002386081704026031, "loss": 1.5834, "step": 11394 }, { "epoch": 0.9, "learning_rate": 0.00023859819734608104, "loss": 1.5618, "step": 11395 }, { "epoch": 0.9, "learning_rate": 0.0002385882236880261, "loss": 1.6528, "step": 11396 }, { "epoch": 0.9, "learning_rate": 0.00023857824942850604, "loss": 1.6021, "step": 11397 }, { "epoch": 0.9, "learning_rate": 0.00023856827456758854, "loss": 1.5696, "step": 11398 }, { "epoch": 0.9, "learning_rate": 0.00023855829910534129, "loss": 1.5791, "step": 11399 }, { "epoch": 0.9, "learning_rate": 0.00023854832304183213, "loss": 1.605, "step": 11400 }, { "epoch": 0.9, "learning_rate": 0.0002385383463771287, "loss": 1.6216, "step": 11401 }, { "epoch": 0.9, "learning_rate": 0.00023852836911129874, "loss": 1.6024, "step": 11402 }, { "epoch": 0.9, "learning_rate": 0.00023851839124441, "loss": 1.572, "step": 11403 }, { "epoch": 0.9, "learning_rate": 0.00023850841277653023, "loss": 1.5959, "step": 11404 }, { "epoch": 0.9, "learning_rate": 0.00023849843370772722, "loss": 1.6027, "step": 11405 }, { "epoch": 0.9, "learning_rate": 0.00023848845403806861, "loss": 1.5828, "step": 11406 }, { "epoch": 0.9, "learning_rate": 0.0002384784737676223, "loss": 1.6424, "step": 11407 }, { "epoch": 0.9, "learning_rate": 0.00023846849289645597, "loss": 1.6418, "step": 11408 }, { "epoch": 0.9, "learning_rate": 0.00023845851142463738, "loss": 1.6646, "step": 11409 }, { "epoch": 0.9, "learning_rate": 0.00023844852935223432, "loss": 1.6414, "step": 11410 }, { "epoch": 0.9, "learning_rate": 0.00023843854667931458, "loss": 1.5635, "step": 11411 }, { "epoch": 0.9, "learning_rate": 0.00023842856340594584, "loss": 1.5628, "step": 11412 }, { "epoch": 0.9, "learning_rate": 0.00023841857953219597, "loss": 1.5487, "step": 11413 }, { "epoch": 0.9, "learning_rate": 0.0002384085950581328, "loss": 1.583, "step": 11414 }, { "epoch": 0.9, "learning_rate": 0.000238398609983824, "loss": 1.6302, "step": 11415 }, { "epoch": 0.9, "learning_rate": 0.00023838862430933746, "loss": 1.6011, "step": 11416 }, { "epoch": 0.9, "learning_rate": 0.00023837863803474093, "loss": 1.6312, "step": 11417 }, { "epoch": 0.9, "learning_rate": 0.0002383686511601022, "loss": 1.5743, "step": 11418 }, { "epoch": 0.9, "learning_rate": 0.0002383586636854891, "loss": 1.5912, "step": 11419 }, { "epoch": 0.9, "learning_rate": 0.00023834867561096942, "loss": 1.6466, "step": 11420 }, { "epoch": 0.9, "learning_rate": 0.00023833868693661102, "loss": 1.5784, "step": 11421 }, { "epoch": 0.9, "learning_rate": 0.00023832869766248166, "loss": 1.5011, "step": 11422 }, { "epoch": 0.9, "learning_rate": 0.0002383187077886492, "loss": 1.6176, "step": 11423 }, { "epoch": 0.9, "learning_rate": 0.0002383087173151814, "loss": 1.5669, "step": 11424 }, { "epoch": 0.9, "learning_rate": 0.00023829872624214621, "loss": 1.6743, "step": 11425 }, { "epoch": 0.9, "learning_rate": 0.0002382887345696114, "loss": 1.638, "step": 11426 }, { "epoch": 0.9, "learning_rate": 0.0002382787422976448, "loss": 1.6161, "step": 11427 }, { "epoch": 0.9, "learning_rate": 0.00023826874942631425, "loss": 1.5575, "step": 11428 }, { "epoch": 0.9, "learning_rate": 0.00023825875595568754, "loss": 1.6281, "step": 11429 }, { "epoch": 0.9, "learning_rate": 0.00023824876188583268, "loss": 1.6094, "step": 11430 }, { "epoch": 0.9, "learning_rate": 0.0002382387672168173, "loss": 1.5718, "step": 11431 }, { "epoch": 0.9, "learning_rate": 0.0002382287719487095, "loss": 1.5855, "step": 11432 }, { "epoch": 0.9, "learning_rate": 0.000238218776081577, "loss": 1.5739, "step": 11433 }, { "epoch": 0.9, "learning_rate": 0.00023820877961548768, "loss": 1.5873, "step": 11434 }, { "epoch": 0.9, "learning_rate": 0.00023819878255050943, "loss": 1.5763, "step": 11435 }, { "epoch": 0.9, "learning_rate": 0.0002381887848867101, "loss": 1.6288, "step": 11436 }, { "epoch": 0.9, "learning_rate": 0.00023817878662415763, "loss": 1.5942, "step": 11437 }, { "epoch": 0.9, "learning_rate": 0.0002381687877629198, "loss": 1.6023, "step": 11438 }, { "epoch": 0.9, "learning_rate": 0.0002381587883030646, "loss": 1.668, "step": 11439 }, { "epoch": 0.9, "learning_rate": 0.00023814878824465985, "loss": 1.538, "step": 11440 }, { "epoch": 0.9, "learning_rate": 0.00023813878758777352, "loss": 1.6285, "step": 11441 }, { "epoch": 0.9, "learning_rate": 0.0002381287863324734, "loss": 1.6789, "step": 11442 }, { "epoch": 0.9, "learning_rate": 0.0002381187844788275, "loss": 1.5073, "step": 11443 }, { "epoch": 0.9, "learning_rate": 0.0002381087820269037, "loss": 1.6241, "step": 11444 }, { "epoch": 0.9, "learning_rate": 0.00023809877897676982, "loss": 1.5689, "step": 11445 }, { "epoch": 0.9, "learning_rate": 0.00023808877532849386, "loss": 1.639, "step": 11446 }, { "epoch": 0.9, "learning_rate": 0.0002380787710821438, "loss": 1.6095, "step": 11447 }, { "epoch": 0.9, "learning_rate": 0.0002380687662377874, "loss": 1.6306, "step": 11448 }, { "epoch": 0.9, "learning_rate": 0.00023805876079549274, "loss": 1.6142, "step": 11449 }, { "epoch": 0.9, "learning_rate": 0.0002380487547553277, "loss": 1.6166, "step": 11450 }, { "epoch": 0.9, "learning_rate": 0.00023803874811736015, "loss": 1.587, "step": 11451 }, { "epoch": 0.9, "learning_rate": 0.0002380287408816581, "loss": 1.6306, "step": 11452 }, { "epoch": 0.9, "learning_rate": 0.0002380187330482895, "loss": 1.6395, "step": 11453 }, { "epoch": 0.9, "learning_rate": 0.00023800872461732226, "loss": 1.6021, "step": 11454 }, { "epoch": 0.9, "learning_rate": 0.00023799871558882434, "loss": 1.6366, "step": 11455 }, { "epoch": 0.9, "learning_rate": 0.0002379887059628637, "loss": 1.6077, "step": 11456 }, { "epoch": 0.9, "learning_rate": 0.00023797869573950834, "loss": 1.6287, "step": 11457 }, { "epoch": 0.9, "learning_rate": 0.00023796868491882613, "loss": 1.6274, "step": 11458 }, { "epoch": 0.9, "learning_rate": 0.00023795867350088514, "loss": 1.6095, "step": 11459 }, { "epoch": 0.9, "learning_rate": 0.0002379486614857533, "loss": 1.5744, "step": 11460 }, { "epoch": 0.9, "learning_rate": 0.00023793864887349854, "loss": 1.6564, "step": 11461 }, { "epoch": 0.9, "learning_rate": 0.0002379286356641889, "loss": 1.5879, "step": 11462 }, { "epoch": 0.9, "learning_rate": 0.00023791862185789238, "loss": 1.6144, "step": 11463 }, { "epoch": 0.9, "learning_rate": 0.0002379086074546769, "loss": 1.6189, "step": 11464 }, { "epoch": 0.9, "learning_rate": 0.00023789859245461052, "loss": 1.6119, "step": 11465 }, { "epoch": 0.9, "learning_rate": 0.00023788857685776117, "loss": 1.6139, "step": 11466 }, { "epoch": 0.9, "learning_rate": 0.0002378785606641969, "loss": 1.5566, "step": 11467 }, { "epoch": 0.9, "learning_rate": 0.00023786854387398566, "loss": 1.6245, "step": 11468 }, { "epoch": 0.9, "learning_rate": 0.00023785852648719553, "loss": 1.6436, "step": 11469 }, { "epoch": 0.9, "learning_rate": 0.00023784850850389449, "loss": 1.5784, "step": 11470 }, { "epoch": 0.9, "learning_rate": 0.00023783848992415052, "loss": 1.5852, "step": 11471 }, { "epoch": 0.9, "learning_rate": 0.00023782847074803177, "loss": 1.5777, "step": 11472 }, { "epoch": 0.9, "learning_rate": 0.0002378184509756061, "loss": 1.5757, "step": 11473 }, { "epoch": 0.9, "learning_rate": 0.00023780843060694162, "loss": 1.6092, "step": 11474 }, { "epoch": 0.9, "learning_rate": 0.00023779840964210637, "loss": 1.5575, "step": 11475 }, { "epoch": 0.9, "learning_rate": 0.00023778838808116836, "loss": 1.5998, "step": 11476 }, { "epoch": 0.9, "learning_rate": 0.0002377783659241956, "loss": 1.612, "step": 11477 }, { "epoch": 0.9, "learning_rate": 0.00023776834317125624, "loss": 1.6555, "step": 11478 }, { "epoch": 0.9, "learning_rate": 0.00023775831982241825, "loss": 1.5781, "step": 11479 }, { "epoch": 0.9, "learning_rate": 0.00023774829587774966, "loss": 1.6357, "step": 11480 }, { "epoch": 0.9, "learning_rate": 0.0002377382713373186, "loss": 1.6817, "step": 11481 }, { "epoch": 0.9, "learning_rate": 0.00023772824620119307, "loss": 1.6128, "step": 11482 }, { "epoch": 0.9, "learning_rate": 0.0002377182204694412, "loss": 1.5811, "step": 11483 }, { "epoch": 0.9, "learning_rate": 0.000237708194142131, "loss": 1.6499, "step": 11484 }, { "epoch": 0.9, "learning_rate": 0.00023769816721933056, "loss": 1.6027, "step": 11485 }, { "epoch": 0.9, "learning_rate": 0.00023768813970110792, "loss": 1.5468, "step": 11486 }, { "epoch": 0.9, "learning_rate": 0.00023767811158753124, "loss": 1.5542, "step": 11487 }, { "epoch": 0.9, "learning_rate": 0.00023766808287866857, "loss": 1.5499, "step": 11488 }, { "epoch": 0.9, "learning_rate": 0.000237658053574588, "loss": 1.5858, "step": 11489 }, { "epoch": 0.9, "learning_rate": 0.00023764802367535765, "loss": 1.593, "step": 11490 }, { "epoch": 0.9, "learning_rate": 0.0002376379931810455, "loss": 1.6311, "step": 11491 }, { "epoch": 0.9, "learning_rate": 0.0002376279620917198, "loss": 1.6422, "step": 11492 }, { "epoch": 0.9, "learning_rate": 0.0002376179304074486, "loss": 1.6225, "step": 11493 }, { "epoch": 0.9, "learning_rate": 0.00023760789812829998, "loss": 1.6113, "step": 11494 }, { "epoch": 0.9, "learning_rate": 0.0002375978652543421, "loss": 1.6251, "step": 11495 }, { "epoch": 0.9, "learning_rate": 0.00023758783178564304, "loss": 1.65, "step": 11496 }, { "epoch": 0.9, "learning_rate": 0.0002375777977222709, "loss": 1.6421, "step": 11497 }, { "epoch": 0.9, "learning_rate": 0.00023756776306429393, "loss": 1.6146, "step": 11498 }, { "epoch": 0.9, "learning_rate": 0.00023755772781178008, "loss": 1.6307, "step": 11499 }, { "epoch": 0.9, "learning_rate": 0.00023754769196479764, "loss": 1.6146, "step": 11500 }, { "epoch": 0.9, "learning_rate": 0.00023753765552341467, "loss": 1.5878, "step": 11501 }, { "epoch": 0.9, "learning_rate": 0.0002375276184876993, "loss": 1.6898, "step": 11502 }, { "epoch": 0.91, "learning_rate": 0.00023751758085771975, "loss": 1.6026, "step": 11503 }, { "epoch": 0.91, "learning_rate": 0.00023750754263354408, "loss": 1.5907, "step": 11504 }, { "epoch": 0.91, "learning_rate": 0.0002374975038152405, "loss": 1.58, "step": 11505 }, { "epoch": 0.91, "learning_rate": 0.00023748746440287717, "loss": 1.6177, "step": 11506 }, { "epoch": 0.91, "learning_rate": 0.0002374774243965222, "loss": 1.59, "step": 11507 }, { "epoch": 0.91, "learning_rate": 0.00023746738379624383, "loss": 1.5938, "step": 11508 }, { "epoch": 0.91, "learning_rate": 0.00023745734260211017, "loss": 1.6202, "step": 11509 }, { "epoch": 0.91, "learning_rate": 0.0002374473008141894, "loss": 1.6404, "step": 11510 }, { "epoch": 0.91, "learning_rate": 0.00023743725843254976, "loss": 1.5898, "step": 11511 }, { "epoch": 0.91, "learning_rate": 0.00023742721545725936, "loss": 1.614, "step": 11512 }, { "epoch": 0.91, "learning_rate": 0.00023741717188838644, "loss": 1.5938, "step": 11513 }, { "epoch": 0.91, "learning_rate": 0.00023740712772599913, "loss": 1.5829, "step": 11514 }, { "epoch": 0.91, "learning_rate": 0.00023739708297016565, "loss": 1.5808, "step": 11515 }, { "epoch": 0.91, "learning_rate": 0.00023738703762095424, "loss": 1.5961, "step": 11516 }, { "epoch": 0.91, "learning_rate": 0.00023737699167843305, "loss": 1.5825, "step": 11517 }, { "epoch": 0.91, "learning_rate": 0.00023736694514267032, "loss": 1.5999, "step": 11518 }, { "epoch": 0.91, "learning_rate": 0.00023735689801373424, "loss": 1.6014, "step": 11519 }, { "epoch": 0.91, "learning_rate": 0.00023734685029169305, "loss": 1.6506, "step": 11520 }, { "epoch": 0.91, "learning_rate": 0.0002373368019766149, "loss": 1.5498, "step": 11521 }, { "epoch": 0.91, "learning_rate": 0.0002373267530685681, "loss": 1.581, "step": 11522 }, { "epoch": 0.91, "learning_rate": 0.00023731670356762083, "loss": 1.5555, "step": 11523 }, { "epoch": 0.91, "learning_rate": 0.0002373066534738413, "loss": 1.6258, "step": 11524 }, { "epoch": 0.91, "learning_rate": 0.00023729660278729782, "loss": 1.5373, "step": 11525 }, { "epoch": 0.91, "learning_rate": 0.00023728655150805856, "loss": 1.6758, "step": 11526 }, { "epoch": 0.91, "learning_rate": 0.00023727649963619176, "loss": 1.6311, "step": 11527 }, { "epoch": 0.91, "learning_rate": 0.0002372664471717657, "loss": 1.6034, "step": 11528 }, { "epoch": 0.91, "learning_rate": 0.00023725639411484865, "loss": 1.561, "step": 11529 }, { "epoch": 0.91, "learning_rate": 0.0002372463404655088, "loss": 1.6037, "step": 11530 }, { "epoch": 0.91, "learning_rate": 0.0002372362862238145, "loss": 1.5488, "step": 11531 }, { "epoch": 0.91, "learning_rate": 0.0002372262313898339, "loss": 1.6326, "step": 11532 }, { "epoch": 0.91, "learning_rate": 0.00023721617596363535, "loss": 1.5522, "step": 11533 }, { "epoch": 0.91, "learning_rate": 0.00023720611994528708, "loss": 1.5797, "step": 11534 }, { "epoch": 0.91, "learning_rate": 0.00023719606333485736, "loss": 1.5801, "step": 11535 }, { "epoch": 0.91, "learning_rate": 0.00023718600613241452, "loss": 1.5963, "step": 11536 }, { "epoch": 0.91, "learning_rate": 0.00023717594833802685, "loss": 1.6089, "step": 11537 }, { "epoch": 0.91, "learning_rate": 0.00023716588995176255, "loss": 1.6494, "step": 11538 }, { "epoch": 0.91, "learning_rate": 0.00023715583097369, "loss": 1.6217, "step": 11539 }, { "epoch": 0.91, "learning_rate": 0.00023714577140387737, "loss": 1.6328, "step": 11540 }, { "epoch": 0.91, "learning_rate": 0.00023713571124239313, "loss": 1.628, "step": 11541 }, { "epoch": 0.91, "learning_rate": 0.00023712565048930544, "loss": 1.5788, "step": 11542 }, { "epoch": 0.91, "learning_rate": 0.00023711558914468267, "loss": 1.5909, "step": 11543 }, { "epoch": 0.91, "learning_rate": 0.00023710552720859312, "loss": 1.6136, "step": 11544 }, { "epoch": 0.91, "learning_rate": 0.00023709546468110514, "loss": 1.5654, "step": 11545 }, { "epoch": 0.91, "learning_rate": 0.00023708540156228703, "loss": 1.6195, "step": 11546 }, { "epoch": 0.91, "learning_rate": 0.0002370753378522071, "loss": 1.5893, "step": 11547 }, { "epoch": 0.91, "learning_rate": 0.00023706527355093362, "loss": 1.6455, "step": 11548 }, { "epoch": 0.91, "learning_rate": 0.000237055208658535, "loss": 1.5679, "step": 11549 }, { "epoch": 0.91, "learning_rate": 0.00023704514317507958, "loss": 1.5588, "step": 11550 }, { "epoch": 0.91, "learning_rate": 0.00023703507710063566, "loss": 1.5775, "step": 11551 }, { "epoch": 0.91, "learning_rate": 0.0002370250104352716, "loss": 1.5967, "step": 11552 }, { "epoch": 0.91, "learning_rate": 0.00023701494317905574, "loss": 1.5907, "step": 11553 }, { "epoch": 0.91, "learning_rate": 0.00023700487533205645, "loss": 1.6458, "step": 11554 }, { "epoch": 0.91, "learning_rate": 0.00023699480689434206, "loss": 1.5948, "step": 11555 }, { "epoch": 0.91, "learning_rate": 0.00023698473786598094, "loss": 1.6164, "step": 11556 }, { "epoch": 0.91, "learning_rate": 0.00023697466824704143, "loss": 1.6076, "step": 11557 }, { "epoch": 0.91, "learning_rate": 0.00023696459803759193, "loss": 1.6092, "step": 11558 }, { "epoch": 0.91, "learning_rate": 0.00023695452723770079, "loss": 1.6054, "step": 11559 }, { "epoch": 0.91, "learning_rate": 0.00023694445584743643, "loss": 1.5407, "step": 11560 }, { "epoch": 0.91, "learning_rate": 0.00023693438386686717, "loss": 1.6246, "step": 11561 }, { "epoch": 0.91, "learning_rate": 0.00023692431129606142, "loss": 1.6089, "step": 11562 }, { "epoch": 0.91, "learning_rate": 0.00023691423813508762, "loss": 1.7036, "step": 11563 }, { "epoch": 0.91, "learning_rate": 0.00023690416438401402, "loss": 1.6066, "step": 11564 }, { "epoch": 0.91, "learning_rate": 0.00023689409004290914, "loss": 1.616, "step": 11565 }, { "epoch": 0.91, "learning_rate": 0.00023688401511184133, "loss": 1.5739, "step": 11566 }, { "epoch": 0.91, "learning_rate": 0.000236873939590879, "loss": 1.6029, "step": 11567 }, { "epoch": 0.91, "learning_rate": 0.0002368638634800906, "loss": 1.5968, "step": 11568 }, { "epoch": 0.91, "learning_rate": 0.00023685378677954449, "loss": 1.5495, "step": 11569 }, { "epoch": 0.91, "learning_rate": 0.00023684370948930905, "loss": 1.5316, "step": 11570 }, { "epoch": 0.91, "learning_rate": 0.00023683363160945277, "loss": 1.6172, "step": 11571 }, { "epoch": 0.91, "learning_rate": 0.00023682355314004407, "loss": 1.6294, "step": 11572 }, { "epoch": 0.91, "learning_rate": 0.00023681347408115137, "loss": 1.6345, "step": 11573 }, { "epoch": 0.91, "learning_rate": 0.00023680339443284305, "loss": 1.559, "step": 11574 }, { "epoch": 0.91, "learning_rate": 0.0002367933141951876, "loss": 1.5339, "step": 11575 }, { "epoch": 0.91, "learning_rate": 0.00023678323336825342, "loss": 1.5619, "step": 11576 }, { "epoch": 0.91, "learning_rate": 0.00023677315195210904, "loss": 1.5978, "step": 11577 }, { "epoch": 0.91, "learning_rate": 0.00023676306994682277, "loss": 1.5164, "step": 11578 }, { "epoch": 0.91, "learning_rate": 0.00023675298735246315, "loss": 1.6016, "step": 11579 }, { "epoch": 0.91, "learning_rate": 0.00023674290416909866, "loss": 1.6059, "step": 11580 }, { "epoch": 0.91, "learning_rate": 0.00023673282039679772, "loss": 1.5943, "step": 11581 }, { "epoch": 0.91, "learning_rate": 0.00023672273603562874, "loss": 1.5852, "step": 11582 }, { "epoch": 0.91, "learning_rate": 0.0002367126510856603, "loss": 1.6039, "step": 11583 }, { "epoch": 0.91, "learning_rate": 0.00023670256554696076, "loss": 1.5636, "step": 11584 }, { "epoch": 0.91, "learning_rate": 0.00023669247941959868, "loss": 1.593, "step": 11585 }, { "epoch": 0.91, "learning_rate": 0.00023668239270364252, "loss": 1.5866, "step": 11586 }, { "epoch": 0.91, "learning_rate": 0.00023667230539916066, "loss": 1.5395, "step": 11587 }, { "epoch": 0.91, "learning_rate": 0.00023666221750622175, "loss": 1.571, "step": 11588 }, { "epoch": 0.91, "learning_rate": 0.0002366521290248942, "loss": 1.6096, "step": 11589 }, { "epoch": 0.91, "learning_rate": 0.0002366420399552465, "loss": 1.6102, "step": 11590 }, { "epoch": 0.91, "learning_rate": 0.0002366319502973472, "loss": 1.6356, "step": 11591 }, { "epoch": 0.91, "learning_rate": 0.0002366218600512647, "loss": 1.6123, "step": 11592 }, { "epoch": 0.91, "learning_rate": 0.0002366117692170676, "loss": 1.6392, "step": 11593 }, { "epoch": 0.91, "learning_rate": 0.00023660167779482444, "loss": 1.6046, "step": 11594 }, { "epoch": 0.91, "learning_rate": 0.0002365915857846036, "loss": 1.5837, "step": 11595 }, { "epoch": 0.91, "learning_rate": 0.0002365814931864737, "loss": 1.5807, "step": 11596 }, { "epoch": 0.91, "learning_rate": 0.00023657140000050327, "loss": 1.5478, "step": 11597 }, { "epoch": 0.91, "learning_rate": 0.0002365613062267608, "loss": 1.6194, "step": 11598 }, { "epoch": 0.91, "learning_rate": 0.0002365512118653148, "loss": 1.6623, "step": 11599 }, { "epoch": 0.91, "learning_rate": 0.00023654111691623385, "loss": 1.6768, "step": 11600 }, { "epoch": 0.91, "learning_rate": 0.00023653102137958647, "loss": 1.6164, "step": 11601 }, { "epoch": 0.91, "learning_rate": 0.00023652092525544124, "loss": 1.6425, "step": 11602 }, { "epoch": 0.91, "learning_rate": 0.0002365108285438666, "loss": 1.548, "step": 11603 }, { "epoch": 0.91, "learning_rate": 0.00023650073124493123, "loss": 1.5832, "step": 11604 }, { "epoch": 0.91, "learning_rate": 0.0002364906333587036, "loss": 1.6284, "step": 11605 }, { "epoch": 0.91, "learning_rate": 0.00023648053488525234, "loss": 1.5669, "step": 11606 }, { "epoch": 0.91, "learning_rate": 0.00023647043582464595, "loss": 1.6663, "step": 11607 }, { "epoch": 0.91, "learning_rate": 0.000236460336176953, "loss": 1.5609, "step": 11608 }, { "epoch": 0.91, "learning_rate": 0.0002364502359422421, "loss": 1.6292, "step": 11609 }, { "epoch": 0.91, "learning_rate": 0.0002364401351205818, "loss": 1.6125, "step": 11610 }, { "epoch": 0.91, "learning_rate": 0.00023643003371204068, "loss": 1.5857, "step": 11611 }, { "epoch": 0.91, "learning_rate": 0.0002364199317166873, "loss": 1.5755, "step": 11612 }, { "epoch": 0.91, "learning_rate": 0.00023640982913459036, "loss": 1.6658, "step": 11613 }, { "epoch": 0.91, "learning_rate": 0.00023639972596581831, "loss": 1.6047, "step": 11614 }, { "epoch": 0.91, "learning_rate": 0.0002363896222104398, "loss": 1.6337, "step": 11615 }, { "epoch": 0.91, "learning_rate": 0.00023637951786852345, "loss": 1.5597, "step": 11616 }, { "epoch": 0.91, "learning_rate": 0.0002363694129401378, "loss": 1.5994, "step": 11617 }, { "epoch": 0.91, "learning_rate": 0.00023635930742535154, "loss": 1.6088, "step": 11618 }, { "epoch": 0.91, "learning_rate": 0.0002363492013242332, "loss": 1.6576, "step": 11619 }, { "epoch": 0.91, "learning_rate": 0.00023633909463685148, "loss": 1.594, "step": 11620 }, { "epoch": 0.91, "learning_rate": 0.0002363289873632749, "loss": 1.6213, "step": 11621 }, { "epoch": 0.91, "learning_rate": 0.00023631887950357217, "loss": 1.6, "step": 11622 }, { "epoch": 0.91, "learning_rate": 0.00023630877105781188, "loss": 1.616, "step": 11623 }, { "epoch": 0.91, "learning_rate": 0.00023629866202606268, "loss": 1.5863, "step": 11624 }, { "epoch": 0.91, "learning_rate": 0.00023628855240839314, "loss": 1.6373, "step": 11625 }, { "epoch": 0.91, "learning_rate": 0.00023627844220487198, "loss": 1.5659, "step": 11626 }, { "epoch": 0.91, "learning_rate": 0.00023626833141556782, "loss": 1.5961, "step": 11627 }, { "epoch": 0.91, "learning_rate": 0.00023625822004054927, "loss": 1.6479, "step": 11628 }, { "epoch": 0.91, "learning_rate": 0.00023624810807988504, "loss": 1.6202, "step": 11629 }, { "epoch": 0.92, "learning_rate": 0.00023623799553364373, "loss": 1.651, "step": 11630 }, { "epoch": 0.92, "learning_rate": 0.000236227882401894, "loss": 1.5609, "step": 11631 }, { "epoch": 0.92, "learning_rate": 0.00023621776868470458, "loss": 1.6076, "step": 11632 }, { "epoch": 0.92, "learning_rate": 0.00023620765438214406, "loss": 1.6447, "step": 11633 }, { "epoch": 0.92, "learning_rate": 0.00023619753949428115, "loss": 1.6212, "step": 11634 }, { "epoch": 0.92, "learning_rate": 0.0002361874240211845, "loss": 1.6699, "step": 11635 }, { "epoch": 0.92, "learning_rate": 0.00023617730796292283, "loss": 1.6344, "step": 11636 }, { "epoch": 0.92, "learning_rate": 0.00023616719131956478, "loss": 1.6268, "step": 11637 }, { "epoch": 0.92, "learning_rate": 0.00023615707409117904, "loss": 1.6005, "step": 11638 }, { "epoch": 0.92, "learning_rate": 0.0002361469562778343, "loss": 1.6236, "step": 11639 }, { "epoch": 0.92, "learning_rate": 0.00023613683787959932, "loss": 1.5976, "step": 11640 }, { "epoch": 0.92, "learning_rate": 0.00023612671889654271, "loss": 1.5778, "step": 11641 }, { "epoch": 0.92, "learning_rate": 0.0002361165993287332, "loss": 1.5658, "step": 11642 }, { "epoch": 0.92, "learning_rate": 0.00023610647917623955, "loss": 1.5113, "step": 11643 }, { "epoch": 0.92, "learning_rate": 0.00023609635843913038, "loss": 1.6214, "step": 11644 }, { "epoch": 0.92, "learning_rate": 0.00023608623711747446, "loss": 1.6737, "step": 11645 }, { "epoch": 0.92, "learning_rate": 0.00023607611521134046, "loss": 1.6033, "step": 11646 }, { "epoch": 0.92, "learning_rate": 0.00023606599272079723, "loss": 1.5772, "step": 11647 }, { "epoch": 0.92, "learning_rate": 0.00023605586964591332, "loss": 1.6151, "step": 11648 }, { "epoch": 0.92, "learning_rate": 0.00023604574598675755, "loss": 1.6165, "step": 11649 }, { "epoch": 0.92, "learning_rate": 0.0002360356217433987, "loss": 1.6165, "step": 11650 }, { "epoch": 0.92, "learning_rate": 0.00023602549691590543, "loss": 1.6176, "step": 11651 }, { "epoch": 0.92, "learning_rate": 0.00023601537150434647, "loss": 1.5869, "step": 11652 }, { "epoch": 0.92, "learning_rate": 0.00023600524550879067, "loss": 1.6145, "step": 11653 }, { "epoch": 0.92, "learning_rate": 0.00023599511892930666, "loss": 1.6153, "step": 11654 }, { "epoch": 0.92, "learning_rate": 0.00023598499176596328, "loss": 1.6333, "step": 11655 }, { "epoch": 0.92, "learning_rate": 0.0002359748640188293, "loss": 1.4794, "step": 11656 }, { "epoch": 0.92, "learning_rate": 0.00023596473568797337, "loss": 1.6229, "step": 11657 }, { "epoch": 0.92, "learning_rate": 0.00023595460677346434, "loss": 1.5977, "step": 11658 }, { "epoch": 0.92, "learning_rate": 0.00023594447727537095, "loss": 1.6453, "step": 11659 }, { "epoch": 0.92, "learning_rate": 0.000235934347193762, "loss": 1.6182, "step": 11660 }, { "epoch": 0.92, "learning_rate": 0.00023592421652870625, "loss": 1.6196, "step": 11661 }, { "epoch": 0.92, "learning_rate": 0.00023591408528027253, "loss": 1.5761, "step": 11662 }, { "epoch": 0.92, "learning_rate": 0.00023590395344852953, "loss": 1.6637, "step": 11663 }, { "epoch": 0.92, "learning_rate": 0.00023589382103354612, "loss": 1.6194, "step": 11664 }, { "epoch": 0.92, "learning_rate": 0.00023588368803539105, "loss": 1.5611, "step": 11665 }, { "epoch": 0.92, "learning_rate": 0.00023587355445413313, "loss": 1.6235, "step": 11666 }, { "epoch": 0.92, "learning_rate": 0.00023586342028984115, "loss": 1.6085, "step": 11667 }, { "epoch": 0.92, "learning_rate": 0.00023585328554258397, "loss": 1.6316, "step": 11668 }, { "epoch": 0.92, "learning_rate": 0.00023584315021243034, "loss": 1.5609, "step": 11669 }, { "epoch": 0.92, "learning_rate": 0.0002358330142994491, "loss": 1.5266, "step": 11670 }, { "epoch": 0.92, "learning_rate": 0.00023582287780370907, "loss": 1.6266, "step": 11671 }, { "epoch": 0.92, "learning_rate": 0.000235812740725279, "loss": 1.6306, "step": 11672 }, { "epoch": 0.92, "learning_rate": 0.00023580260306422783, "loss": 1.6312, "step": 11673 }, { "epoch": 0.92, "learning_rate": 0.00023579246482062431, "loss": 1.6195, "step": 11674 }, { "epoch": 0.92, "learning_rate": 0.0002357823259945373, "loss": 1.5751, "step": 11675 }, { "epoch": 0.92, "learning_rate": 0.0002357721865860357, "loss": 1.5981, "step": 11676 }, { "epoch": 0.92, "learning_rate": 0.00023576204659518817, "loss": 1.6082, "step": 11677 }, { "epoch": 0.92, "learning_rate": 0.00023575190602206377, "loss": 1.6097, "step": 11678 }, { "epoch": 0.92, "learning_rate": 0.0002357417648667312, "loss": 1.6055, "step": 11679 }, { "epoch": 0.92, "learning_rate": 0.00023573162312925938, "loss": 1.599, "step": 11680 }, { "epoch": 0.92, "learning_rate": 0.00023572148080971714, "loss": 1.6285, "step": 11681 }, { "epoch": 0.92, "learning_rate": 0.0002357113379081734, "loss": 1.5977, "step": 11682 }, { "epoch": 0.92, "learning_rate": 0.00023570119442469688, "loss": 1.6359, "step": 11683 }, { "epoch": 0.92, "learning_rate": 0.00023569105035935664, "loss": 1.5805, "step": 11684 }, { "epoch": 0.92, "learning_rate": 0.0002356809057122214, "loss": 1.5849, "step": 11685 }, { "epoch": 0.92, "learning_rate": 0.0002356707604833601, "loss": 1.5446, "step": 11686 }, { "epoch": 0.92, "learning_rate": 0.00023566061467284163, "loss": 1.6111, "step": 11687 }, { "epoch": 0.92, "learning_rate": 0.00023565046828073484, "loss": 1.6375, "step": 11688 }, { "epoch": 0.92, "learning_rate": 0.00023564032130710862, "loss": 1.5672, "step": 11689 }, { "epoch": 0.92, "learning_rate": 0.0002356301737520319, "loss": 1.6115, "step": 11690 }, { "epoch": 0.92, "learning_rate": 0.00023562002561557354, "loss": 1.5747, "step": 11691 }, { "epoch": 0.92, "learning_rate": 0.0002356098768978025, "loss": 1.6111, "step": 11692 }, { "epoch": 0.92, "learning_rate": 0.00023559972759878764, "loss": 1.6245, "step": 11693 }, { "epoch": 0.92, "learning_rate": 0.0002355895777185978, "loss": 1.5746, "step": 11694 }, { "epoch": 0.92, "learning_rate": 0.00023557942725730202, "loss": 1.608, "step": 11695 }, { "epoch": 0.92, "learning_rate": 0.00023556927621496912, "loss": 1.6194, "step": 11696 }, { "epoch": 0.92, "learning_rate": 0.00023555912459166805, "loss": 1.5804, "step": 11697 }, { "epoch": 0.92, "learning_rate": 0.00023554897238746775, "loss": 1.61, "step": 11698 }, { "epoch": 0.92, "learning_rate": 0.00023553881960243717, "loss": 1.5545, "step": 11699 }, { "epoch": 0.92, "learning_rate": 0.00023552866623664516, "loss": 1.5947, "step": 11700 }, { "epoch": 0.92, "learning_rate": 0.00023551851229016072, "loss": 1.6171, "step": 11701 }, { "epoch": 0.92, "learning_rate": 0.0002355083577630528, "loss": 1.5477, "step": 11702 }, { "epoch": 0.92, "learning_rate": 0.0002354982026553903, "loss": 1.5781, "step": 11703 }, { "epoch": 0.92, "learning_rate": 0.00023548804696724217, "loss": 1.5994, "step": 11704 }, { "epoch": 0.92, "learning_rate": 0.0002354778906986774, "loss": 1.6066, "step": 11705 }, { "epoch": 0.92, "learning_rate": 0.0002354677338497649, "loss": 1.5794, "step": 11706 }, { "epoch": 0.92, "learning_rate": 0.00023545757642057369, "loss": 1.6542, "step": 11707 }, { "epoch": 0.92, "learning_rate": 0.0002354474184111727, "loss": 1.5594, "step": 11708 }, { "epoch": 0.92, "learning_rate": 0.00023543725982163086, "loss": 1.5952, "step": 11709 }, { "epoch": 0.92, "learning_rate": 0.00023542710065201715, "loss": 1.6267, "step": 11710 }, { "epoch": 0.92, "learning_rate": 0.00023541694090240063, "loss": 1.5831, "step": 11711 }, { "epoch": 0.92, "learning_rate": 0.0002354067805728502, "loss": 1.6368, "step": 11712 }, { "epoch": 0.92, "learning_rate": 0.00023539661966343484, "loss": 1.6043, "step": 11713 }, { "epoch": 0.92, "learning_rate": 0.00023538645817422358, "loss": 1.6464, "step": 11714 }, { "epoch": 0.92, "learning_rate": 0.00023537629610528537, "loss": 1.6353, "step": 11715 }, { "epoch": 0.92, "learning_rate": 0.00023536613345668923, "loss": 1.6063, "step": 11716 }, { "epoch": 0.92, "learning_rate": 0.00023535597022850414, "loss": 1.6345, "step": 11717 }, { "epoch": 0.92, "learning_rate": 0.00023534580642079915, "loss": 1.6128, "step": 11718 }, { "epoch": 0.92, "learning_rate": 0.0002353356420336432, "loss": 1.5719, "step": 11719 }, { "epoch": 0.92, "learning_rate": 0.00023532547706710537, "loss": 1.5849, "step": 11720 }, { "epoch": 0.92, "learning_rate": 0.00023531531152125456, "loss": 1.5889, "step": 11721 }, { "epoch": 0.92, "learning_rate": 0.00023530514539615993, "loss": 1.6154, "step": 11722 }, { "epoch": 0.92, "learning_rate": 0.0002352949786918904, "loss": 1.5177, "step": 11723 }, { "epoch": 0.92, "learning_rate": 0.00023528481140851508, "loss": 1.6136, "step": 11724 }, { "epoch": 0.92, "learning_rate": 0.00023527464354610296, "loss": 1.5577, "step": 11725 }, { "epoch": 0.92, "learning_rate": 0.00023526447510472304, "loss": 1.5549, "step": 11726 }, { "epoch": 0.92, "learning_rate": 0.00023525430608444436, "loss": 1.6567, "step": 11727 }, { "epoch": 0.92, "learning_rate": 0.00023524413648533604, "loss": 1.5567, "step": 11728 }, { "epoch": 0.92, "learning_rate": 0.00023523396630746704, "loss": 1.5812, "step": 11729 }, { "epoch": 0.92, "learning_rate": 0.00023522379555090646, "loss": 1.5311, "step": 11730 }, { "epoch": 0.92, "learning_rate": 0.0002352136242157233, "loss": 1.6268, "step": 11731 }, { "epoch": 0.92, "learning_rate": 0.00023520345230198674, "loss": 1.5619, "step": 11732 }, { "epoch": 0.92, "learning_rate": 0.0002351932798097657, "loss": 1.6235, "step": 11733 }, { "epoch": 0.92, "learning_rate": 0.0002351831067391293, "loss": 1.5728, "step": 11734 }, { "epoch": 0.92, "learning_rate": 0.00023517293309014664, "loss": 1.5843, "step": 11735 }, { "epoch": 0.92, "learning_rate": 0.00023516275886288672, "loss": 1.5437, "step": 11736 }, { "epoch": 0.92, "learning_rate": 0.00023515258405741875, "loss": 1.5365, "step": 11737 }, { "epoch": 0.92, "learning_rate": 0.00023514240867381168, "loss": 1.6155, "step": 11738 }, { "epoch": 0.92, "learning_rate": 0.0002351322327121346, "loss": 1.6356, "step": 11739 }, { "epoch": 0.92, "learning_rate": 0.0002351220561724567, "loss": 1.5482, "step": 11740 }, { "epoch": 0.92, "learning_rate": 0.00023511187905484699, "loss": 1.6199, "step": 11741 }, { "epoch": 0.92, "learning_rate": 0.0002351017013593746, "loss": 1.5994, "step": 11742 }, { "epoch": 0.92, "learning_rate": 0.0002350915230861086, "loss": 1.673, "step": 11743 }, { "epoch": 0.92, "learning_rate": 0.00023508134423511808, "loss": 1.6264, "step": 11744 }, { "epoch": 0.92, "learning_rate": 0.00023507116480647223, "loss": 1.6198, "step": 11745 }, { "epoch": 0.92, "learning_rate": 0.00023506098480024012, "loss": 1.5559, "step": 11746 }, { "epoch": 0.92, "learning_rate": 0.00023505080421649087, "loss": 1.5963, "step": 11747 }, { "epoch": 0.92, "learning_rate": 0.0002350406230552936, "loss": 1.5472, "step": 11748 }, { "epoch": 0.92, "learning_rate": 0.00023503044131671741, "loss": 1.6148, "step": 11749 }, { "epoch": 0.92, "learning_rate": 0.00023502025900083145, "loss": 1.6263, "step": 11750 }, { "epoch": 0.92, "learning_rate": 0.00023501007610770484, "loss": 1.5985, "step": 11751 }, { "epoch": 0.92, "learning_rate": 0.00023499989263740673, "loss": 1.5899, "step": 11752 }, { "epoch": 0.92, "learning_rate": 0.0002349897085900063, "loss": 1.5628, "step": 11753 }, { "epoch": 0.92, "learning_rate": 0.00023497952396557258, "loss": 1.6147, "step": 11754 }, { "epoch": 0.92, "learning_rate": 0.00023496933876417483, "loss": 1.5549, "step": 11755 }, { "epoch": 0.92, "learning_rate": 0.0002349591529858821, "loss": 1.6594, "step": 11756 }, { "epoch": 0.93, "learning_rate": 0.0002349489666307637, "loss": 1.5941, "step": 11757 }, { "epoch": 0.93, "learning_rate": 0.00023493877969888867, "loss": 1.5904, "step": 11758 }, { "epoch": 0.93, "learning_rate": 0.00023492859219032615, "loss": 1.6314, "step": 11759 }, { "epoch": 0.93, "learning_rate": 0.00023491840410514535, "loss": 1.6003, "step": 11760 }, { "epoch": 0.93, "learning_rate": 0.0002349082154434155, "loss": 1.519, "step": 11761 }, { "epoch": 0.93, "learning_rate": 0.0002348980262052057, "loss": 1.6089, "step": 11762 }, { "epoch": 0.93, "learning_rate": 0.00023488783639058516, "loss": 1.573, "step": 11763 }, { "epoch": 0.93, "learning_rate": 0.00023487764599962308, "loss": 1.6487, "step": 11764 }, { "epoch": 0.93, "learning_rate": 0.00023486745503238857, "loss": 1.5818, "step": 11765 }, { "epoch": 0.93, "learning_rate": 0.0002348572634889509, "loss": 1.5879, "step": 11766 }, { "epoch": 0.93, "learning_rate": 0.00023484707136937923, "loss": 1.6077, "step": 11767 }, { "epoch": 0.93, "learning_rate": 0.00023483687867374277, "loss": 1.6012, "step": 11768 }, { "epoch": 0.93, "learning_rate": 0.00023482668540211074, "loss": 1.5668, "step": 11769 }, { "epoch": 0.93, "learning_rate": 0.00023481649155455232, "loss": 1.5786, "step": 11770 }, { "epoch": 0.93, "learning_rate": 0.0002348062971311367, "loss": 1.6017, "step": 11771 }, { "epoch": 0.93, "learning_rate": 0.00023479610213193318, "loss": 1.5873, "step": 11772 }, { "epoch": 0.93, "learning_rate": 0.00023478590655701085, "loss": 1.5605, "step": 11773 }, { "epoch": 0.93, "learning_rate": 0.00023477571040643908, "loss": 1.601, "step": 11774 }, { "epoch": 0.93, "learning_rate": 0.00023476551368028698, "loss": 1.606, "step": 11775 }, { "epoch": 0.93, "learning_rate": 0.00023475531637862378, "loss": 1.6631, "step": 11776 }, { "epoch": 0.93, "learning_rate": 0.0002347451185015188, "loss": 1.6055, "step": 11777 }, { "epoch": 0.93, "learning_rate": 0.00023473492004904122, "loss": 1.5506, "step": 11778 }, { "epoch": 0.93, "learning_rate": 0.00023472472102126029, "loss": 1.5802, "step": 11779 }, { "epoch": 0.93, "learning_rate": 0.00023471452141824532, "loss": 1.6272, "step": 11780 }, { "epoch": 0.93, "learning_rate": 0.0002347043212400654, "loss": 1.6161, "step": 11781 }, { "epoch": 0.93, "learning_rate": 0.00023469412048678995, "loss": 1.5724, "step": 11782 }, { "epoch": 0.93, "learning_rate": 0.0002346839191584881, "loss": 1.593, "step": 11783 }, { "epoch": 0.93, "learning_rate": 0.00023467371725522924, "loss": 1.6126, "step": 11784 }, { "epoch": 0.93, "learning_rate": 0.00023466351477708253, "loss": 1.6372, "step": 11785 }, { "epoch": 0.93, "learning_rate": 0.00023465331172411728, "loss": 1.5723, "step": 11786 }, { "epoch": 0.93, "learning_rate": 0.00023464310809640277, "loss": 1.5968, "step": 11787 }, { "epoch": 0.93, "learning_rate": 0.00023463290389400828, "loss": 1.6556, "step": 11788 }, { "epoch": 0.93, "learning_rate": 0.000234622699117003, "loss": 1.5736, "step": 11789 }, { "epoch": 0.93, "learning_rate": 0.0002346124937654564, "loss": 1.6134, "step": 11790 }, { "epoch": 0.93, "learning_rate": 0.00023460228783943755, "loss": 1.6356, "step": 11791 }, { "epoch": 0.93, "learning_rate": 0.00023459208133901592, "loss": 1.6317, "step": 11792 }, { "epoch": 0.93, "learning_rate": 0.00023458187426426074, "loss": 1.6355, "step": 11793 }, { "epoch": 0.93, "learning_rate": 0.0002345716666152413, "loss": 1.6237, "step": 11794 }, { "epoch": 0.93, "learning_rate": 0.00023456145839202694, "loss": 1.625, "step": 11795 }, { "epoch": 0.93, "learning_rate": 0.00023455124959468693, "loss": 1.5573, "step": 11796 }, { "epoch": 0.93, "learning_rate": 0.00023454104022329058, "loss": 1.5876, "step": 11797 }, { "epoch": 0.93, "learning_rate": 0.0002345308302779072, "loss": 1.623, "step": 11798 }, { "epoch": 0.93, "learning_rate": 0.00023452061975860614, "loss": 1.6419, "step": 11799 }, { "epoch": 0.93, "learning_rate": 0.00023451040866545673, "loss": 1.5952, "step": 11800 }, { "epoch": 0.93, "learning_rate": 0.00023450019699852826, "loss": 1.6572, "step": 11801 }, { "epoch": 0.93, "learning_rate": 0.00023448998475789008, "loss": 1.6161, "step": 11802 }, { "epoch": 0.93, "learning_rate": 0.00023447977194361155, "loss": 1.558, "step": 11803 }, { "epoch": 0.93, "learning_rate": 0.00023446955855576203, "loss": 1.5848, "step": 11804 }, { "epoch": 0.93, "learning_rate": 0.00023445934459441077, "loss": 1.6554, "step": 11805 }, { "epoch": 0.93, "learning_rate": 0.00023444913005962718, "loss": 1.5816, "step": 11806 }, { "epoch": 0.93, "learning_rate": 0.00023443891495148058, "loss": 1.6105, "step": 11807 }, { "epoch": 0.93, "learning_rate": 0.00023442869927004032, "loss": 1.6236, "step": 11808 }, { "epoch": 0.93, "learning_rate": 0.00023441848301537587, "loss": 1.5724, "step": 11809 }, { "epoch": 0.93, "learning_rate": 0.00023440826618755645, "loss": 1.5733, "step": 11810 }, { "epoch": 0.93, "learning_rate": 0.0002343980487866515, "loss": 1.6671, "step": 11811 }, { "epoch": 0.93, "learning_rate": 0.00023438783081273037, "loss": 1.5864, "step": 11812 }, { "epoch": 0.93, "learning_rate": 0.00023437761226586244, "loss": 1.568, "step": 11813 }, { "epoch": 0.93, "learning_rate": 0.0002343673931461171, "loss": 1.6219, "step": 11814 }, { "epoch": 0.93, "learning_rate": 0.00023435717345356367, "loss": 1.6193, "step": 11815 }, { "epoch": 0.93, "learning_rate": 0.00023434695318827164, "loss": 1.6087, "step": 11816 }, { "epoch": 0.93, "learning_rate": 0.0002343367323503103, "loss": 1.5785, "step": 11817 }, { "epoch": 0.93, "learning_rate": 0.0002343265109397491, "loss": 1.6371, "step": 11818 }, { "epoch": 0.93, "learning_rate": 0.00023431628895665747, "loss": 1.6078, "step": 11819 }, { "epoch": 0.93, "learning_rate": 0.0002343060664011047, "loss": 1.6491, "step": 11820 }, { "epoch": 0.93, "learning_rate": 0.0002342958432731603, "loss": 1.5982, "step": 11821 }, { "epoch": 0.93, "learning_rate": 0.00023428561957289365, "loss": 1.5763, "step": 11822 }, { "epoch": 0.93, "learning_rate": 0.00023427539530037413, "loss": 1.6113, "step": 11823 }, { "epoch": 0.93, "learning_rate": 0.00023426517045567116, "loss": 1.5718, "step": 11824 }, { "epoch": 0.93, "learning_rate": 0.00023425494503885423, "loss": 1.6198, "step": 11825 }, { "epoch": 0.93, "learning_rate": 0.00023424471904999274, "loss": 1.6334, "step": 11826 }, { "epoch": 0.93, "learning_rate": 0.00023423449248915603, "loss": 1.5946, "step": 11827 }, { "epoch": 0.93, "learning_rate": 0.00023422426535641365, "loss": 1.5889, "step": 11828 }, { "epoch": 0.93, "learning_rate": 0.00023421403765183497, "loss": 1.628, "step": 11829 }, { "epoch": 0.93, "learning_rate": 0.00023420380937548948, "loss": 1.5813, "step": 11830 }, { "epoch": 0.93, "learning_rate": 0.00023419358052744653, "loss": 1.5912, "step": 11831 }, { "epoch": 0.93, "learning_rate": 0.00023418335110777567, "loss": 1.5792, "step": 11832 }, { "epoch": 0.93, "learning_rate": 0.00023417312111654633, "loss": 1.6303, "step": 11833 }, { "epoch": 0.93, "learning_rate": 0.00023416289055382792, "loss": 1.6035, "step": 11834 }, { "epoch": 0.93, "learning_rate": 0.0002341526594196899, "loss": 1.5835, "step": 11835 }, { "epoch": 0.93, "learning_rate": 0.00023414242771420182, "loss": 1.6372, "step": 11836 }, { "epoch": 0.93, "learning_rate": 0.00023413219543743307, "loss": 1.6387, "step": 11837 }, { "epoch": 0.93, "learning_rate": 0.00023412196258945314, "loss": 1.5888, "step": 11838 }, { "epoch": 0.93, "learning_rate": 0.00023411172917033146, "loss": 1.6075, "step": 11839 }, { "epoch": 0.93, "learning_rate": 0.0002341014951801376, "loss": 1.6289, "step": 11840 }, { "epoch": 0.93, "learning_rate": 0.00023409126061894103, "loss": 1.5279, "step": 11841 }, { "epoch": 0.93, "learning_rate": 0.00023408102548681112, "loss": 1.6228, "step": 11842 }, { "epoch": 0.93, "learning_rate": 0.00023407078978381751, "loss": 1.5872, "step": 11843 }, { "epoch": 0.93, "learning_rate": 0.00023406055351002963, "loss": 1.5919, "step": 11844 }, { "epoch": 0.93, "learning_rate": 0.00023405031666551697, "loss": 1.6256, "step": 11845 }, { "epoch": 0.93, "learning_rate": 0.000234040079250349, "loss": 1.5778, "step": 11846 }, { "epoch": 0.93, "learning_rate": 0.00023402984126459533, "loss": 1.6115, "step": 11847 }, { "epoch": 0.93, "learning_rate": 0.00023401960270832538, "loss": 1.5896, "step": 11848 }, { "epoch": 0.93, "learning_rate": 0.00023400936358160872, "loss": 1.5463, "step": 11849 }, { "epoch": 0.93, "learning_rate": 0.00023399912388451482, "loss": 1.644, "step": 11850 }, { "epoch": 0.93, "learning_rate": 0.00023398888361711323, "loss": 1.6021, "step": 11851 }, { "epoch": 0.93, "learning_rate": 0.0002339786427794735, "loss": 1.6217, "step": 11852 }, { "epoch": 0.93, "learning_rate": 0.00023396840137166508, "loss": 1.6156, "step": 11853 }, { "epoch": 0.93, "learning_rate": 0.00023395815939375754, "loss": 1.6228, "step": 11854 }, { "epoch": 0.93, "learning_rate": 0.00023394791684582043, "loss": 1.5812, "step": 11855 }, { "epoch": 0.93, "learning_rate": 0.00023393767372792336, "loss": 1.681, "step": 11856 }, { "epoch": 0.93, "learning_rate": 0.00023392743004013576, "loss": 1.5439, "step": 11857 }, { "epoch": 0.93, "learning_rate": 0.0002339171857825272, "loss": 1.6097, "step": 11858 }, { "epoch": 0.93, "learning_rate": 0.00023390694095516733, "loss": 1.5747, "step": 11859 }, { "epoch": 0.93, "learning_rate": 0.0002338966955581256, "loss": 1.6451, "step": 11860 }, { "epoch": 0.93, "learning_rate": 0.0002338864495914716, "loss": 1.646, "step": 11861 }, { "epoch": 0.93, "learning_rate": 0.00023387620305527485, "loss": 1.5969, "step": 11862 }, { "epoch": 0.93, "learning_rate": 0.00023386595594960505, "loss": 1.5837, "step": 11863 }, { "epoch": 0.93, "learning_rate": 0.00023385570827453162, "loss": 1.5959, "step": 11864 }, { "epoch": 0.93, "learning_rate": 0.00023384546003012423, "loss": 1.5389, "step": 11865 }, { "epoch": 0.93, "learning_rate": 0.00023383521121645248, "loss": 1.5974, "step": 11866 }, { "epoch": 0.93, "learning_rate": 0.00023382496183358588, "loss": 1.5836, "step": 11867 }, { "epoch": 0.93, "learning_rate": 0.00023381471188159403, "loss": 1.5477, "step": 11868 }, { "epoch": 0.93, "learning_rate": 0.00023380446136054658, "loss": 1.5741, "step": 11869 }, { "epoch": 0.93, "learning_rate": 0.00023379421027051303, "loss": 1.6234, "step": 11870 }, { "epoch": 0.93, "learning_rate": 0.00023378395861156306, "loss": 1.605, "step": 11871 }, { "epoch": 0.93, "learning_rate": 0.00023377370638376626, "loss": 1.5719, "step": 11872 }, { "epoch": 0.93, "learning_rate": 0.0002337634535871922, "loss": 1.5769, "step": 11873 }, { "epoch": 0.93, "learning_rate": 0.0002337532002219105, "loss": 1.5633, "step": 11874 }, { "epoch": 0.93, "learning_rate": 0.00023374294628799086, "loss": 1.5658, "step": 11875 }, { "epoch": 0.93, "learning_rate": 0.00023373269178550277, "loss": 1.5937, "step": 11876 }, { "epoch": 0.93, "learning_rate": 0.0002337224367145159, "loss": 1.5378, "step": 11877 }, { "epoch": 0.93, "learning_rate": 0.00023371218107509994, "loss": 1.6127, "step": 11878 }, { "epoch": 0.93, "learning_rate": 0.0002337019248673244, "loss": 1.5804, "step": 11879 }, { "epoch": 0.93, "learning_rate": 0.00023369166809125906, "loss": 1.5737, "step": 11880 }, { "epoch": 0.93, "learning_rate": 0.00023368141074697342, "loss": 1.5825, "step": 11881 }, { "epoch": 0.93, "learning_rate": 0.0002336711528345372, "loss": 1.5394, "step": 11882 }, { "epoch": 0.93, "learning_rate": 0.00023366089435402002, "loss": 1.6509, "step": 11883 }, { "epoch": 0.94, "learning_rate": 0.00023365063530549155, "loss": 1.6047, "step": 11884 }, { "epoch": 0.94, "learning_rate": 0.00023364037568902142, "loss": 1.536, "step": 11885 }, { "epoch": 0.94, "learning_rate": 0.00023363011550467925, "loss": 1.5978, "step": 11886 }, { "epoch": 0.94, "learning_rate": 0.0002336198547525348, "loss": 1.6574, "step": 11887 }, { "epoch": 0.94, "learning_rate": 0.00023360959343265772, "loss": 1.621, "step": 11888 }, { "epoch": 0.94, "learning_rate": 0.00023359933154511758, "loss": 1.5853, "step": 11889 }, { "epoch": 0.94, "learning_rate": 0.0002335890690899841, "loss": 1.6128, "step": 11890 }, { "epoch": 0.94, "learning_rate": 0.000233578806067327, "loss": 1.609, "step": 11891 }, { "epoch": 0.94, "learning_rate": 0.00023356854247721592, "loss": 1.569, "step": 11892 }, { "epoch": 0.94, "learning_rate": 0.00023355827831972057, "loss": 1.6178, "step": 11893 }, { "epoch": 0.94, "learning_rate": 0.00023354801359491058, "loss": 1.6383, "step": 11894 }, { "epoch": 0.94, "learning_rate": 0.00023353774830285568, "loss": 1.5824, "step": 11895 }, { "epoch": 0.94, "learning_rate": 0.00023352748244362566, "loss": 1.6016, "step": 11896 }, { "epoch": 0.94, "learning_rate": 0.00023351721601729005, "loss": 1.6047, "step": 11897 }, { "epoch": 0.94, "learning_rate": 0.00023350694902391866, "loss": 1.5829, "step": 11898 }, { "epoch": 0.94, "learning_rate": 0.00023349668146358115, "loss": 1.6077, "step": 11899 }, { "epoch": 0.94, "learning_rate": 0.00023348641333634728, "loss": 1.5625, "step": 11900 }, { "epoch": 0.94, "learning_rate": 0.0002334761446422867, "loss": 1.5767, "step": 11901 }, { "epoch": 0.94, "learning_rate": 0.00023346587538146916, "loss": 1.6118, "step": 11902 }, { "epoch": 0.94, "learning_rate": 0.00023345560555396437, "loss": 1.5809, "step": 11903 }, { "epoch": 0.94, "learning_rate": 0.00023344533515984217, "loss": 1.5834, "step": 11904 }, { "epoch": 0.94, "learning_rate": 0.00023343506419917212, "loss": 1.656, "step": 11905 }, { "epoch": 0.94, "learning_rate": 0.00023342479267202403, "loss": 1.6175, "step": 11906 }, { "epoch": 0.94, "learning_rate": 0.00023341452057846763, "loss": 1.5987, "step": 11907 }, { "epoch": 0.94, "learning_rate": 0.00023340424791857268, "loss": 1.5948, "step": 11908 }, { "epoch": 0.94, "learning_rate": 0.00023339397469240893, "loss": 1.596, "step": 11909 }, { "epoch": 0.94, "learning_rate": 0.00023338370090004608, "loss": 1.5781, "step": 11910 }, { "epoch": 0.94, "learning_rate": 0.00023337342654155397, "loss": 1.6096, "step": 11911 }, { "epoch": 0.94, "learning_rate": 0.00023336315161700223, "loss": 1.5663, "step": 11912 }, { "epoch": 0.94, "learning_rate": 0.00023335287612646073, "loss": 1.6633, "step": 11913 }, { "epoch": 0.94, "learning_rate": 0.0002333426000699992, "loss": 1.6674, "step": 11914 }, { "epoch": 0.94, "learning_rate": 0.0002333323234476874, "loss": 1.5718, "step": 11915 }, { "epoch": 0.94, "learning_rate": 0.00023332204625959514, "loss": 1.5708, "step": 11916 }, { "epoch": 0.94, "learning_rate": 0.00023331176850579211, "loss": 1.5891, "step": 11917 }, { "epoch": 0.94, "learning_rate": 0.00023330149018634819, "loss": 1.569, "step": 11918 }, { "epoch": 0.94, "learning_rate": 0.0002332912113013331, "loss": 1.5957, "step": 11919 }, { "epoch": 0.94, "learning_rate": 0.00023328093185081663, "loss": 1.6236, "step": 11920 }, { "epoch": 0.94, "learning_rate": 0.00023327065183486868, "loss": 1.5761, "step": 11921 }, { "epoch": 0.94, "learning_rate": 0.0002332603712535589, "loss": 1.607, "step": 11922 }, { "epoch": 0.94, "learning_rate": 0.00023325009010695714, "loss": 1.5809, "step": 11923 }, { "epoch": 0.94, "learning_rate": 0.0002332398083951332, "loss": 1.5768, "step": 11924 }, { "epoch": 0.94, "learning_rate": 0.0002332295261181569, "loss": 1.6197, "step": 11925 }, { "epoch": 0.94, "learning_rate": 0.00023321924327609806, "loss": 1.6097, "step": 11926 }, { "epoch": 0.94, "learning_rate": 0.00023320895986902646, "loss": 1.5361, "step": 11927 }, { "epoch": 0.94, "learning_rate": 0.00023319867589701194, "loss": 1.5523, "step": 11928 }, { "epoch": 0.94, "learning_rate": 0.00023318839136012438, "loss": 1.574, "step": 11929 }, { "epoch": 0.94, "learning_rate": 0.0002331781062584335, "loss": 1.5838, "step": 11930 }, { "epoch": 0.94, "learning_rate": 0.0002331678205920092, "loss": 1.5897, "step": 11931 }, { "epoch": 0.94, "learning_rate": 0.0002331575343609213, "loss": 1.5942, "step": 11932 }, { "epoch": 0.94, "learning_rate": 0.0002331472475652396, "loss": 1.6013, "step": 11933 }, { "epoch": 0.94, "learning_rate": 0.000233136960205034, "loss": 1.6216, "step": 11934 }, { "epoch": 0.94, "learning_rate": 0.00023312667228037433, "loss": 1.5956, "step": 11935 }, { "epoch": 0.94, "learning_rate": 0.00023311638379133038, "loss": 1.6379, "step": 11936 }, { "epoch": 0.94, "learning_rate": 0.0002331060947379721, "loss": 1.6597, "step": 11937 }, { "epoch": 0.94, "learning_rate": 0.0002330958051203693, "loss": 1.5619, "step": 11938 }, { "epoch": 0.94, "learning_rate": 0.00023308551493859183, "loss": 1.5832, "step": 11939 }, { "epoch": 0.94, "learning_rate": 0.00023307522419270952, "loss": 1.6468, "step": 11940 }, { "epoch": 0.94, "learning_rate": 0.00023306493288279234, "loss": 1.5585, "step": 11941 }, { "epoch": 0.94, "learning_rate": 0.00023305464100891005, "loss": 1.5834, "step": 11942 }, { "epoch": 0.94, "learning_rate": 0.0002330443485711326, "loss": 1.5315, "step": 11943 }, { "epoch": 0.94, "learning_rate": 0.0002330340555695299, "loss": 1.552, "step": 11944 }, { "epoch": 0.94, "learning_rate": 0.00023302376200417174, "loss": 1.6029, "step": 11945 }, { "epoch": 0.94, "learning_rate": 0.00023301346787512806, "loss": 1.5584, "step": 11946 }, { "epoch": 0.94, "learning_rate": 0.00023300317318246874, "loss": 1.5691, "step": 11947 }, { "epoch": 0.94, "learning_rate": 0.00023299287792626368, "loss": 1.6016, "step": 11948 }, { "epoch": 0.94, "learning_rate": 0.00023298258210658276, "loss": 1.596, "step": 11949 }, { "epoch": 0.94, "learning_rate": 0.0002329722857234959, "loss": 1.5492, "step": 11950 }, { "epoch": 0.94, "learning_rate": 0.00023296198877707306, "loss": 1.5938, "step": 11951 }, { "epoch": 0.94, "learning_rate": 0.00023295169126738409, "loss": 1.6049, "step": 11952 }, { "epoch": 0.94, "learning_rate": 0.00023294139319449887, "loss": 1.6011, "step": 11953 }, { "epoch": 0.94, "learning_rate": 0.0002329310945584874, "loss": 1.6509, "step": 11954 }, { "epoch": 0.94, "learning_rate": 0.00023292079535941953, "loss": 1.6095, "step": 11955 }, { "epoch": 0.94, "learning_rate": 0.0002329104955973652, "loss": 1.6162, "step": 11956 }, { "epoch": 0.94, "learning_rate": 0.00023290019527239444, "loss": 1.6465, "step": 11957 }, { "epoch": 0.94, "learning_rate": 0.00023288989438457705, "loss": 1.5498, "step": 11958 }, { "epoch": 0.94, "learning_rate": 0.00023287959293398302, "loss": 1.5884, "step": 11959 }, { "epoch": 0.94, "learning_rate": 0.0002328692909206823, "loss": 1.5542, "step": 11960 }, { "epoch": 0.94, "learning_rate": 0.00023285898834474482, "loss": 1.6394, "step": 11961 }, { "epoch": 0.94, "learning_rate": 0.0002328486852062405, "loss": 1.6069, "step": 11962 }, { "epoch": 0.94, "learning_rate": 0.00023283838150523937, "loss": 1.5836, "step": 11963 }, { "epoch": 0.94, "learning_rate": 0.0002328280772418113, "loss": 1.6012, "step": 11964 }, { "epoch": 0.94, "learning_rate": 0.00023281777241602637, "loss": 1.6207, "step": 11965 }, { "epoch": 0.94, "learning_rate": 0.00023280746702795442, "loss": 1.5681, "step": 11966 }, { "epoch": 0.94, "learning_rate": 0.00023279716107766548, "loss": 1.5826, "step": 11967 }, { "epoch": 0.94, "learning_rate": 0.0002327868545652295, "loss": 1.5936, "step": 11968 }, { "epoch": 0.94, "learning_rate": 0.00023277654749071647, "loss": 1.5819, "step": 11969 }, { "epoch": 0.94, "learning_rate": 0.00023276623985419635, "loss": 1.5534, "step": 11970 }, { "epoch": 0.94, "learning_rate": 0.00023275593165573915, "loss": 1.5524, "step": 11971 }, { "epoch": 0.94, "learning_rate": 0.0002327456228954148, "loss": 1.6547, "step": 11972 }, { "epoch": 0.94, "learning_rate": 0.00023273531357329336, "loss": 1.6, "step": 11973 }, { "epoch": 0.94, "learning_rate": 0.00023272500368944483, "loss": 1.582, "step": 11974 }, { "epoch": 0.94, "learning_rate": 0.00023271469324393914, "loss": 1.5801, "step": 11975 }, { "epoch": 0.94, "learning_rate": 0.00023270438223684634, "loss": 1.624, "step": 11976 }, { "epoch": 0.94, "learning_rate": 0.00023269407066823643, "loss": 1.5835, "step": 11977 }, { "epoch": 0.94, "learning_rate": 0.00023268375853817942, "loss": 1.5658, "step": 11978 }, { "epoch": 0.94, "learning_rate": 0.00023267344584674535, "loss": 1.5644, "step": 11979 }, { "epoch": 0.94, "learning_rate": 0.00023266313259400414, "loss": 1.5869, "step": 11980 }, { "epoch": 0.94, "learning_rate": 0.00023265281878002587, "loss": 1.5442, "step": 11981 }, { "epoch": 0.94, "learning_rate": 0.0002326425044048806, "loss": 1.5913, "step": 11982 }, { "epoch": 0.94, "learning_rate": 0.00023263218946863832, "loss": 1.6146, "step": 11983 }, { "epoch": 0.94, "learning_rate": 0.00023262187397136912, "loss": 1.5938, "step": 11984 }, { "epoch": 0.94, "learning_rate": 0.00023261155791314296, "loss": 1.6108, "step": 11985 }, { "epoch": 0.94, "learning_rate": 0.0002326012412940299, "loss": 1.6597, "step": 11986 }, { "epoch": 0.94, "learning_rate": 0.0002325909241141, "loss": 1.667, "step": 11987 }, { "epoch": 0.94, "learning_rate": 0.0002325806063734233, "loss": 1.5553, "step": 11988 }, { "epoch": 0.94, "learning_rate": 0.00023257028807206986, "loss": 1.5634, "step": 11989 }, { "epoch": 0.94, "learning_rate": 0.00023255996921010973, "loss": 1.6145, "step": 11990 }, { "epoch": 0.94, "learning_rate": 0.00023254964978761298, "loss": 1.5876, "step": 11991 }, { "epoch": 0.94, "learning_rate": 0.00023253932980464966, "loss": 1.583, "step": 11992 }, { "epoch": 0.94, "learning_rate": 0.00023252900926128982, "loss": 1.5935, "step": 11993 }, { "epoch": 0.94, "learning_rate": 0.00023251868815760357, "loss": 1.6404, "step": 11994 }, { "epoch": 0.94, "learning_rate": 0.00023250836649366097, "loss": 1.5727, "step": 11995 }, { "epoch": 0.94, "learning_rate": 0.00023249804426953206, "loss": 1.6222, "step": 11996 }, { "epoch": 0.94, "learning_rate": 0.00023248772148528699, "loss": 1.6212, "step": 11997 }, { "epoch": 0.94, "learning_rate": 0.00023247739814099576, "loss": 1.5705, "step": 11998 }, { "epoch": 0.94, "learning_rate": 0.00023246707423672856, "loss": 1.5762, "step": 11999 }, { "epoch": 0.94, "learning_rate": 0.00023245674977255543, "loss": 1.6297, "step": 12000 }, { "epoch": 0.94, "learning_rate": 0.00023244642474854648, "loss": 1.5446, "step": 12001 }, { "epoch": 0.94, "learning_rate": 0.0002324360991647718, "loss": 1.6001, "step": 12002 }, { "epoch": 0.94, "learning_rate": 0.0002324257730213015, "loss": 1.597, "step": 12003 }, { "epoch": 0.94, "learning_rate": 0.00023241544631820562, "loss": 1.6072, "step": 12004 }, { "epoch": 0.94, "learning_rate": 0.0002324051190555544, "loss": 1.5339, "step": 12005 }, { "epoch": 0.94, "learning_rate": 0.00023239479123341792, "loss": 1.634, "step": 12006 }, { "epoch": 0.94, "learning_rate": 0.00023238446285186624, "loss": 1.6459, "step": 12007 }, { "epoch": 0.94, "learning_rate": 0.00023237413391096953, "loss": 1.5499, "step": 12008 }, { "epoch": 0.94, "learning_rate": 0.0002323638044107979, "loss": 1.5893, "step": 12009 }, { "epoch": 0.94, "learning_rate": 0.00023235347435142153, "loss": 1.6417, "step": 12010 }, { "epoch": 0.95, "learning_rate": 0.00023234314373291043, "loss": 1.6003, "step": 12011 }, { "epoch": 0.95, "learning_rate": 0.0002323328125553349, "loss": 1.5961, "step": 12012 }, { "epoch": 0.95, "learning_rate": 0.000232322480818765, "loss": 1.5622, "step": 12013 }, { "epoch": 0.95, "learning_rate": 0.00023231214852327087, "loss": 1.5473, "step": 12014 }, { "epoch": 0.95, "learning_rate": 0.00023230181566892265, "loss": 1.6196, "step": 12015 }, { "epoch": 0.95, "learning_rate": 0.0002322914822557906, "loss": 1.59, "step": 12016 }, { "epoch": 0.95, "learning_rate": 0.0002322811482839447, "loss": 1.5966, "step": 12017 }, { "epoch": 0.95, "learning_rate": 0.00023227081375345527, "loss": 1.5676, "step": 12018 }, { "epoch": 0.95, "learning_rate": 0.0002322604786643924, "loss": 1.5831, "step": 12019 }, { "epoch": 0.95, "learning_rate": 0.0002322501430168263, "loss": 1.5835, "step": 12020 }, { "epoch": 0.95, "learning_rate": 0.00023223980681082705, "loss": 1.5548, "step": 12021 }, { "epoch": 0.95, "learning_rate": 0.00023222947004646497, "loss": 1.6072, "step": 12022 }, { "epoch": 0.95, "learning_rate": 0.0002322191327238101, "loss": 1.6321, "step": 12023 }, { "epoch": 0.95, "learning_rate": 0.0002322087948429328, "loss": 1.6059, "step": 12024 }, { "epoch": 0.95, "learning_rate": 0.00023219845640390304, "loss": 1.6409, "step": 12025 }, { "epoch": 0.95, "learning_rate": 0.00023218811740679114, "loss": 1.6039, "step": 12026 }, { "epoch": 0.95, "learning_rate": 0.00023217777785166727, "loss": 1.5901, "step": 12027 }, { "epoch": 0.95, "learning_rate": 0.00023216743773860166, "loss": 1.6537, "step": 12028 }, { "epoch": 0.95, "learning_rate": 0.00023215709706766451, "loss": 1.5828, "step": 12029 }, { "epoch": 0.95, "learning_rate": 0.000232146755838926, "loss": 1.5581, "step": 12030 }, { "epoch": 0.95, "learning_rate": 0.00023213641405245636, "loss": 1.6129, "step": 12031 }, { "epoch": 0.95, "learning_rate": 0.00023212607170832578, "loss": 1.6401, "step": 12032 }, { "epoch": 0.95, "learning_rate": 0.0002321157288066045, "loss": 1.5846, "step": 12033 }, { "epoch": 0.95, "learning_rate": 0.00023210538534736272, "loss": 1.6186, "step": 12034 }, { "epoch": 0.95, "learning_rate": 0.00023209504133067066, "loss": 1.6279, "step": 12035 }, { "epoch": 0.95, "learning_rate": 0.00023208469675659862, "loss": 1.6113, "step": 12036 }, { "epoch": 0.95, "learning_rate": 0.00023207435162521676, "loss": 1.6306, "step": 12037 }, { "epoch": 0.95, "learning_rate": 0.00023206400593659538, "loss": 1.6242, "step": 12038 }, { "epoch": 0.95, "learning_rate": 0.00023205365969080466, "loss": 1.6149, "step": 12039 }, { "epoch": 0.95, "learning_rate": 0.00023204331288791488, "loss": 1.6101, "step": 12040 }, { "epoch": 0.95, "learning_rate": 0.00023203296552799628, "loss": 1.5289, "step": 12041 }, { "epoch": 0.95, "learning_rate": 0.0002320226176111191, "loss": 1.5669, "step": 12042 }, { "epoch": 0.95, "learning_rate": 0.00023201226913735363, "loss": 1.5557, "step": 12043 }, { "epoch": 0.95, "learning_rate": 0.00023200192010677006, "loss": 1.5804, "step": 12044 }, { "epoch": 0.95, "learning_rate": 0.00023199157051943876, "loss": 1.5223, "step": 12045 }, { "epoch": 0.95, "learning_rate": 0.00023198122037542993, "loss": 1.613, "step": 12046 }, { "epoch": 0.95, "learning_rate": 0.00023197086967481384, "loss": 1.639, "step": 12047 }, { "epoch": 0.95, "learning_rate": 0.00023196051841766082, "loss": 1.5396, "step": 12048 }, { "epoch": 0.95, "learning_rate": 0.00023195016660404108, "loss": 1.5394, "step": 12049 }, { "epoch": 0.95, "learning_rate": 0.00023193981423402495, "loss": 1.656, "step": 12050 }, { "epoch": 0.95, "learning_rate": 0.00023192946130768267, "loss": 1.6499, "step": 12051 }, { "epoch": 0.95, "learning_rate": 0.00023191910782508453, "loss": 1.5852, "step": 12052 }, { "epoch": 0.95, "learning_rate": 0.00023190875378630092, "loss": 1.6913, "step": 12053 }, { "epoch": 0.95, "learning_rate": 0.00023189839919140207, "loss": 1.5358, "step": 12054 }, { "epoch": 0.95, "learning_rate": 0.00023188804404045826, "loss": 1.5415, "step": 12055 }, { "epoch": 0.95, "learning_rate": 0.00023187768833353984, "loss": 1.6041, "step": 12056 }, { "epoch": 0.95, "learning_rate": 0.00023186733207071708, "loss": 1.6272, "step": 12057 }, { "epoch": 0.95, "learning_rate": 0.00023185697525206033, "loss": 1.646, "step": 12058 }, { "epoch": 0.95, "learning_rate": 0.00023184661787763986, "loss": 1.5499, "step": 12059 }, { "epoch": 0.95, "learning_rate": 0.00023183625994752604, "loss": 1.5582, "step": 12060 }, { "epoch": 0.95, "learning_rate": 0.00023182590146178918, "loss": 1.6022, "step": 12061 }, { "epoch": 0.95, "learning_rate": 0.00023181554242049962, "loss": 1.5718, "step": 12062 }, { "epoch": 0.95, "learning_rate": 0.00023180518282372764, "loss": 1.5859, "step": 12063 }, { "epoch": 0.95, "learning_rate": 0.00023179482267154364, "loss": 1.5955, "step": 12064 }, { "epoch": 0.95, "learning_rate": 0.00023178446196401794, "loss": 1.6684, "step": 12065 }, { "epoch": 0.95, "learning_rate": 0.00023177410070122082, "loss": 1.6504, "step": 12066 }, { "epoch": 0.95, "learning_rate": 0.00023176373888322274, "loss": 1.5966, "step": 12067 }, { "epoch": 0.95, "learning_rate": 0.00023175337651009395, "loss": 1.6034, "step": 12068 }, { "epoch": 0.95, "learning_rate": 0.00023174301358190494, "loss": 1.5718, "step": 12069 }, { "epoch": 0.95, "learning_rate": 0.0002317326500987259, "loss": 1.5695, "step": 12070 }, { "epoch": 0.95, "learning_rate": 0.00023172228606062724, "loss": 1.579, "step": 12071 }, { "epoch": 0.95, "learning_rate": 0.0002317119214676794, "loss": 1.6085, "step": 12072 }, { "epoch": 0.95, "learning_rate": 0.00023170155631995276, "loss": 1.6487, "step": 12073 }, { "epoch": 0.95, "learning_rate": 0.00023169119061751755, "loss": 1.6387, "step": 12074 }, { "epoch": 0.95, "learning_rate": 0.00023168082436044425, "loss": 1.6107, "step": 12075 }, { "epoch": 0.95, "learning_rate": 0.00023167045754880324, "loss": 1.5734, "step": 12076 }, { "epoch": 0.95, "learning_rate": 0.00023166009018266493, "loss": 1.6318, "step": 12077 }, { "epoch": 0.95, "learning_rate": 0.00023164972226209963, "loss": 1.5961, "step": 12078 }, { "epoch": 0.95, "learning_rate": 0.00023163935378717779, "loss": 1.546, "step": 12079 }, { "epoch": 0.95, "learning_rate": 0.0002316289847579698, "loss": 1.5752, "step": 12080 }, { "epoch": 0.95, "learning_rate": 0.00023161861517454602, "loss": 1.5578, "step": 12081 }, { "epoch": 0.95, "learning_rate": 0.00023160824503697688, "loss": 1.6314, "step": 12082 }, { "epoch": 0.95, "learning_rate": 0.00023159787434533281, "loss": 1.6238, "step": 12083 }, { "epoch": 0.95, "learning_rate": 0.0002315875030996842, "loss": 1.6207, "step": 12084 }, { "epoch": 0.95, "learning_rate": 0.0002315771313001015, "loss": 1.5959, "step": 12085 }, { "epoch": 0.95, "learning_rate": 0.00023156675894665506, "loss": 1.6171, "step": 12086 }, { "epoch": 0.95, "learning_rate": 0.00023155638603941534, "loss": 1.58, "step": 12087 }, { "epoch": 0.95, "learning_rate": 0.00023154601257845277, "loss": 1.5805, "step": 12088 }, { "epoch": 0.95, "learning_rate": 0.00023153563856383776, "loss": 1.6134, "step": 12089 }, { "epoch": 0.95, "learning_rate": 0.00023152526399564078, "loss": 1.5749, "step": 12090 }, { "epoch": 0.95, "learning_rate": 0.00023151488887393224, "loss": 1.5557, "step": 12091 }, { "epoch": 0.95, "learning_rate": 0.00023150451319878262, "loss": 1.6285, "step": 12092 }, { "epoch": 0.95, "learning_rate": 0.00023149413697026228, "loss": 1.4656, "step": 12093 }, { "epoch": 0.95, "learning_rate": 0.00023148376018844176, "loss": 1.5341, "step": 12094 }, { "epoch": 0.95, "learning_rate": 0.00023147338285339148, "loss": 1.6022, "step": 12095 }, { "epoch": 0.95, "learning_rate": 0.00023146300496518186, "loss": 1.5813, "step": 12096 }, { "epoch": 0.95, "learning_rate": 0.00023145262652388338, "loss": 1.6149, "step": 12097 }, { "epoch": 0.95, "learning_rate": 0.00023144224752956653, "loss": 1.6205, "step": 12098 }, { "epoch": 0.95, "learning_rate": 0.00023143186798230177, "loss": 1.6214, "step": 12099 }, { "epoch": 0.95, "learning_rate": 0.00023142148788215958, "loss": 1.6025, "step": 12100 }, { "epoch": 0.95, "learning_rate": 0.0002314111072292104, "loss": 1.5774, "step": 12101 }, { "epoch": 0.95, "learning_rate": 0.00023140072602352476, "loss": 1.5734, "step": 12102 }, { "epoch": 0.95, "learning_rate": 0.00023139034426517308, "loss": 1.6139, "step": 12103 }, { "epoch": 0.95, "learning_rate": 0.0002313799619542259, "loss": 1.5944, "step": 12104 }, { "epoch": 0.95, "learning_rate": 0.00023136957909075366, "loss": 1.5838, "step": 12105 }, { "epoch": 0.95, "learning_rate": 0.0002313591956748269, "loss": 1.5964, "step": 12106 }, { "epoch": 0.95, "learning_rate": 0.00023134881170651606, "loss": 1.5841, "step": 12107 }, { "epoch": 0.95, "learning_rate": 0.00023133842718589174, "loss": 1.6049, "step": 12108 }, { "epoch": 0.95, "learning_rate": 0.00023132804211302435, "loss": 1.5895, "step": 12109 }, { "epoch": 0.95, "learning_rate": 0.00023131765648798442, "loss": 1.6146, "step": 12110 }, { "epoch": 0.95, "learning_rate": 0.00023130727031084252, "loss": 1.5607, "step": 12111 }, { "epoch": 0.95, "learning_rate": 0.0002312968835816691, "loss": 1.6033, "step": 12112 }, { "epoch": 0.95, "learning_rate": 0.0002312864963005347, "loss": 1.6044, "step": 12113 }, { "epoch": 0.95, "learning_rate": 0.00023127610846750984, "loss": 1.5643, "step": 12114 }, { "epoch": 0.95, "learning_rate": 0.00023126572008266507, "loss": 1.5714, "step": 12115 }, { "epoch": 0.95, "learning_rate": 0.00023125533114607089, "loss": 1.5884, "step": 12116 }, { "epoch": 0.95, "learning_rate": 0.00023124494165779785, "loss": 1.5174, "step": 12117 }, { "epoch": 0.95, "learning_rate": 0.00023123455161791652, "loss": 1.6119, "step": 12118 }, { "epoch": 0.95, "learning_rate": 0.00023122416102649743, "loss": 1.6462, "step": 12119 }, { "epoch": 0.95, "learning_rate": 0.00023121376988361107, "loss": 1.5557, "step": 12120 }, { "epoch": 0.95, "learning_rate": 0.00023120337818932803, "loss": 1.5445, "step": 12121 }, { "epoch": 0.95, "learning_rate": 0.00023119298594371888, "loss": 1.5355, "step": 12122 }, { "epoch": 0.95, "learning_rate": 0.00023118259314685414, "loss": 1.6143, "step": 12123 }, { "epoch": 0.95, "learning_rate": 0.0002311721997988044, "loss": 1.6105, "step": 12124 }, { "epoch": 0.95, "learning_rate": 0.00023116180589964025, "loss": 1.5687, "step": 12125 }, { "epoch": 0.95, "learning_rate": 0.00023115141144943222, "loss": 1.5966, "step": 12126 }, { "epoch": 0.95, "learning_rate": 0.00023114101644825086, "loss": 1.5868, "step": 12127 }, { "epoch": 0.95, "learning_rate": 0.00023113062089616677, "loss": 1.614, "step": 12128 }, { "epoch": 0.95, "learning_rate": 0.00023112022479325058, "loss": 1.6039, "step": 12129 }, { "epoch": 0.95, "learning_rate": 0.00023110982813957283, "loss": 1.6429, "step": 12130 }, { "epoch": 0.95, "learning_rate": 0.00023109943093520404, "loss": 1.5768, "step": 12131 }, { "epoch": 0.95, "learning_rate": 0.00023108903318021495, "loss": 1.6336, "step": 12132 }, { "epoch": 0.95, "learning_rate": 0.00023107863487467598, "loss": 1.6002, "step": 12133 }, { "epoch": 0.95, "learning_rate": 0.00023106823601865792, "loss": 1.5778, "step": 12134 }, { "epoch": 0.95, "learning_rate": 0.00023105783661223121, "loss": 1.5862, "step": 12135 }, { "epoch": 0.95, "learning_rate": 0.00023104743665546654, "loss": 1.648, "step": 12136 }, { "epoch": 0.95, "learning_rate": 0.00023103703614843447, "loss": 1.628, "step": 12137 }, { "epoch": 0.96, "learning_rate": 0.00023102663509120568, "loss": 1.6201, "step": 12138 }, { "epoch": 0.96, "learning_rate": 0.00023101623348385078, "loss": 1.6382, "step": 12139 }, { "epoch": 0.96, "learning_rate": 0.0002310058313264403, "loss": 1.5956, "step": 12140 }, { "epoch": 0.96, "learning_rate": 0.00023099542861904497, "loss": 1.5882, "step": 12141 }, { "epoch": 0.96, "learning_rate": 0.0002309850253617354, "loss": 1.5881, "step": 12142 }, { "epoch": 0.96, "learning_rate": 0.00023097462155458216, "loss": 1.6091, "step": 12143 }, { "epoch": 0.96, "learning_rate": 0.00023096421719765594, "loss": 1.6096, "step": 12144 }, { "epoch": 0.96, "learning_rate": 0.00023095381229102732, "loss": 1.5869, "step": 12145 }, { "epoch": 0.96, "learning_rate": 0.00023094340683476702, "loss": 1.5454, "step": 12146 }, { "epoch": 0.96, "learning_rate": 0.00023093300082894567, "loss": 1.6077, "step": 12147 }, { "epoch": 0.96, "learning_rate": 0.00023092259427363388, "loss": 1.6052, "step": 12148 }, { "epoch": 0.96, "learning_rate": 0.0002309121871689024, "loss": 1.5389, "step": 12149 }, { "epoch": 0.96, "learning_rate": 0.00023090177951482171, "loss": 1.5861, "step": 12150 }, { "epoch": 0.96, "learning_rate": 0.0002308913713114627, "loss": 1.5633, "step": 12151 }, { "epoch": 0.96, "learning_rate": 0.00023088096255889583, "loss": 1.5407, "step": 12152 }, { "epoch": 0.96, "learning_rate": 0.00023087055325719187, "loss": 1.5893, "step": 12153 }, { "epoch": 0.96, "learning_rate": 0.00023086014340642147, "loss": 1.5975, "step": 12154 }, { "epoch": 0.96, "learning_rate": 0.00023084973300665536, "loss": 1.6251, "step": 12155 }, { "epoch": 0.96, "learning_rate": 0.0002308393220579642, "loss": 1.6288, "step": 12156 }, { "epoch": 0.96, "learning_rate": 0.0002308289105604186, "loss": 1.5156, "step": 12157 }, { "epoch": 0.96, "learning_rate": 0.00023081849851408934, "loss": 1.5859, "step": 12158 }, { "epoch": 0.96, "learning_rate": 0.00023080808591904707, "loss": 1.5252, "step": 12159 }, { "epoch": 0.96, "learning_rate": 0.00023079767277536244, "loss": 1.5974, "step": 12160 }, { "epoch": 0.96, "learning_rate": 0.00023078725908310622, "loss": 1.5866, "step": 12161 }, { "epoch": 0.96, "learning_rate": 0.00023077684484234913, "loss": 1.6197, "step": 12162 }, { "epoch": 0.96, "learning_rate": 0.00023076643005316184, "loss": 1.6371, "step": 12163 }, { "epoch": 0.96, "learning_rate": 0.00023075601471561502, "loss": 1.6013, "step": 12164 }, { "epoch": 0.96, "learning_rate": 0.0002307455988297794, "loss": 1.5409, "step": 12165 }, { "epoch": 0.96, "learning_rate": 0.00023073518239572583, "loss": 1.5646, "step": 12166 }, { "epoch": 0.96, "learning_rate": 0.00023072476541352485, "loss": 1.6417, "step": 12167 }, { "epoch": 0.96, "learning_rate": 0.00023071434788324725, "loss": 1.5874, "step": 12168 }, { "epoch": 0.96, "learning_rate": 0.0002307039298049638, "loss": 1.5952, "step": 12169 }, { "epoch": 0.96, "learning_rate": 0.00023069351117874516, "loss": 1.6136, "step": 12170 }, { "epoch": 0.96, "learning_rate": 0.0002306830920046622, "loss": 1.6201, "step": 12171 }, { "epoch": 0.96, "learning_rate": 0.00023067267228278547, "loss": 1.5919, "step": 12172 }, { "epoch": 0.96, "learning_rate": 0.0002306622520131859, "loss": 1.652, "step": 12173 }, { "epoch": 0.96, "learning_rate": 0.00023065183119593411, "loss": 1.584, "step": 12174 }, { "epoch": 0.96, "learning_rate": 0.00023064140983110088, "loss": 1.5859, "step": 12175 }, { "epoch": 0.96, "learning_rate": 0.000230630987918757, "loss": 1.5582, "step": 12176 }, { "epoch": 0.96, "learning_rate": 0.00023062056545897317, "loss": 1.5923, "step": 12177 }, { "epoch": 0.96, "learning_rate": 0.00023061014245182024, "loss": 1.5859, "step": 12178 }, { "epoch": 0.96, "learning_rate": 0.0002305997188973689, "loss": 1.6573, "step": 12179 }, { "epoch": 0.96, "learning_rate": 0.00023058929479568999, "loss": 1.6167, "step": 12180 }, { "epoch": 0.96, "learning_rate": 0.0002305788701468542, "loss": 1.5987, "step": 12181 }, { "epoch": 0.96, "learning_rate": 0.00023056844495093236, "loss": 1.5961, "step": 12182 }, { "epoch": 0.96, "learning_rate": 0.00023055801920799526, "loss": 1.6451, "step": 12183 }, { "epoch": 0.96, "learning_rate": 0.0002305475929181136, "loss": 1.6015, "step": 12184 }, { "epoch": 0.96, "learning_rate": 0.00023053716608135828, "loss": 1.5855, "step": 12185 }, { "epoch": 0.96, "learning_rate": 0.00023052673869780003, "loss": 1.5673, "step": 12186 }, { "epoch": 0.96, "learning_rate": 0.00023051631076750968, "loss": 1.5618, "step": 12187 }, { "epoch": 0.96, "learning_rate": 0.000230505882290558, "loss": 1.522, "step": 12188 }, { "epoch": 0.96, "learning_rate": 0.00023049545326701582, "loss": 1.5648, "step": 12189 }, { "epoch": 0.96, "learning_rate": 0.00023048502369695393, "loss": 1.6331, "step": 12190 }, { "epoch": 0.96, "learning_rate": 0.00023047459358044314, "loss": 1.5742, "step": 12191 }, { "epoch": 0.96, "learning_rate": 0.00023046416291755425, "loss": 1.6055, "step": 12192 }, { "epoch": 0.96, "learning_rate": 0.00023045373170835814, "loss": 1.6248, "step": 12193 }, { "epoch": 0.96, "learning_rate": 0.00023044329995292555, "loss": 1.5577, "step": 12194 }, { "epoch": 0.96, "learning_rate": 0.0002304328676513274, "loss": 1.6179, "step": 12195 }, { "epoch": 0.96, "learning_rate": 0.00023042243480363443, "loss": 1.628, "step": 12196 }, { "epoch": 0.96, "learning_rate": 0.00023041200140991747, "loss": 1.6048, "step": 12197 }, { "epoch": 0.96, "learning_rate": 0.00023040156747024745, "loss": 1.5902, "step": 12198 }, { "epoch": 0.96, "learning_rate": 0.00023039113298469513, "loss": 1.5838, "step": 12199 }, { "epoch": 0.96, "learning_rate": 0.0002303806979533314, "loss": 1.6123, "step": 12200 }, { "epoch": 0.96, "learning_rate": 0.00023037026237622706, "loss": 1.5689, "step": 12201 }, { "epoch": 0.96, "learning_rate": 0.00023035982625345305, "loss": 1.6482, "step": 12202 }, { "epoch": 0.96, "learning_rate": 0.00023034938958508012, "loss": 1.6459, "step": 12203 }, { "epoch": 0.96, "learning_rate": 0.00023033895237117914, "loss": 1.6465, "step": 12204 }, { "epoch": 0.96, "learning_rate": 0.00023032851461182106, "loss": 1.5552, "step": 12205 }, { "epoch": 0.96, "learning_rate": 0.00023031807630707668, "loss": 1.6254, "step": 12206 }, { "epoch": 0.96, "learning_rate": 0.0002303076374570169, "loss": 1.5904, "step": 12207 }, { "epoch": 0.96, "learning_rate": 0.00023029719806171253, "loss": 1.6086, "step": 12208 }, { "epoch": 0.96, "learning_rate": 0.00023028675812123456, "loss": 1.5872, "step": 12209 }, { "epoch": 0.96, "learning_rate": 0.00023027631763565374, "loss": 1.6249, "step": 12210 }, { "epoch": 0.96, "learning_rate": 0.00023026587660504108, "loss": 1.5873, "step": 12211 }, { "epoch": 0.96, "learning_rate": 0.00023025543502946743, "loss": 1.5635, "step": 12212 }, { "epoch": 0.96, "learning_rate": 0.0002302449929090036, "loss": 1.5799, "step": 12213 }, { "epoch": 0.96, "learning_rate": 0.00023023455024372057, "loss": 1.5841, "step": 12214 }, { "epoch": 0.96, "learning_rate": 0.00023022410703368927, "loss": 1.5993, "step": 12215 }, { "epoch": 0.96, "learning_rate": 0.00023021366327898049, "loss": 1.5913, "step": 12216 }, { "epoch": 0.96, "learning_rate": 0.00023020321897966522, "loss": 1.5697, "step": 12217 }, { "epoch": 0.96, "learning_rate": 0.00023019277413581437, "loss": 1.5986, "step": 12218 }, { "epoch": 0.96, "learning_rate": 0.00023018232874749884, "loss": 1.6199, "step": 12219 }, { "epoch": 0.96, "learning_rate": 0.00023017188281478955, "loss": 1.6052, "step": 12220 }, { "epoch": 0.96, "learning_rate": 0.0002301614363377574, "loss": 1.5676, "step": 12221 }, { "epoch": 0.96, "learning_rate": 0.00023015098931647334, "loss": 1.5651, "step": 12222 }, { "epoch": 0.96, "learning_rate": 0.0002301405417510083, "loss": 1.5805, "step": 12223 }, { "epoch": 0.96, "learning_rate": 0.0002301300936414332, "loss": 1.6393, "step": 12224 }, { "epoch": 0.96, "learning_rate": 0.00023011964498781897, "loss": 1.6018, "step": 12225 }, { "epoch": 0.96, "learning_rate": 0.00023010919579023658, "loss": 1.6329, "step": 12226 }, { "epoch": 0.96, "learning_rate": 0.00023009874604875696, "loss": 1.5669, "step": 12227 }, { "epoch": 0.96, "learning_rate": 0.00023008829576345104, "loss": 1.5599, "step": 12228 }, { "epoch": 0.96, "learning_rate": 0.00023007784493438981, "loss": 1.641, "step": 12229 }, { "epoch": 0.96, "learning_rate": 0.00023006739356164422, "loss": 1.5706, "step": 12230 }, { "epoch": 0.96, "learning_rate": 0.00023005694164528515, "loss": 1.5978, "step": 12231 }, { "epoch": 0.96, "learning_rate": 0.00023004648918538366, "loss": 1.5916, "step": 12232 }, { "epoch": 0.96, "learning_rate": 0.00023003603618201065, "loss": 1.6839, "step": 12233 }, { "epoch": 0.96, "learning_rate": 0.00023002558263523717, "loss": 1.5917, "step": 12234 }, { "epoch": 0.96, "learning_rate": 0.00023001512854513412, "loss": 1.6006, "step": 12235 }, { "epoch": 0.96, "learning_rate": 0.00023000467391177257, "loss": 1.5934, "step": 12236 }, { "epoch": 0.96, "learning_rate": 0.00022999421873522337, "loss": 1.6619, "step": 12237 }, { "epoch": 0.96, "learning_rate": 0.00022998376301555757, "loss": 1.6727, "step": 12238 }, { "epoch": 0.96, "learning_rate": 0.00022997330675284615, "loss": 1.5839, "step": 12239 }, { "epoch": 0.96, "learning_rate": 0.0002299628499471601, "loss": 1.5293, "step": 12240 }, { "epoch": 0.96, "learning_rate": 0.0002299523925985705, "loss": 1.627, "step": 12241 }, { "epoch": 0.96, "learning_rate": 0.0002299419347071482, "loss": 1.664, "step": 12242 }, { "epoch": 0.96, "learning_rate": 0.00022993147627296432, "loss": 1.5309, "step": 12243 }, { "epoch": 0.96, "learning_rate": 0.0002299210172960898, "loss": 1.6219, "step": 12244 }, { "epoch": 0.96, "learning_rate": 0.0002299105577765957, "loss": 1.6225, "step": 12245 }, { "epoch": 0.96, "learning_rate": 0.00022990009771455303, "loss": 1.6082, "step": 12246 }, { "epoch": 0.96, "learning_rate": 0.0002298896371100327, "loss": 1.5736, "step": 12247 }, { "epoch": 0.96, "learning_rate": 0.0002298791759631059, "loss": 1.565, "step": 12248 }, { "epoch": 0.96, "learning_rate": 0.00022986871427384354, "loss": 1.6264, "step": 12249 }, { "epoch": 0.96, "learning_rate": 0.00022985825204231673, "loss": 1.5974, "step": 12250 }, { "epoch": 0.96, "learning_rate": 0.0002298477892685964, "loss": 1.628, "step": 12251 }, { "epoch": 0.96, "learning_rate": 0.00022983732595275368, "loss": 1.6045, "step": 12252 }, { "epoch": 0.96, "learning_rate": 0.00022982686209485956, "loss": 1.6021, "step": 12253 }, { "epoch": 0.96, "learning_rate": 0.0002298163976949851, "loss": 1.6189, "step": 12254 }, { "epoch": 0.96, "learning_rate": 0.00022980593275320134, "loss": 1.6163, "step": 12255 }, { "epoch": 0.96, "learning_rate": 0.00022979546726957937, "loss": 1.5956, "step": 12256 }, { "epoch": 0.96, "learning_rate": 0.00022978500124419017, "loss": 1.6163, "step": 12257 }, { "epoch": 0.96, "learning_rate": 0.00022977453467710486, "loss": 1.5697, "step": 12258 }, { "epoch": 0.96, "learning_rate": 0.0002297640675683945, "loss": 1.5704, "step": 12259 }, { "epoch": 0.96, "learning_rate": 0.00022975359991813011, "loss": 1.574, "step": 12260 }, { "epoch": 0.96, "learning_rate": 0.0002297431317263828, "loss": 1.5508, "step": 12261 }, { "epoch": 0.96, "learning_rate": 0.00022973266299322365, "loss": 1.5525, "step": 12262 }, { "epoch": 0.96, "learning_rate": 0.0002297221937187237, "loss": 1.5637, "step": 12263 }, { "epoch": 0.96, "learning_rate": 0.00022971172390295406, "loss": 1.5917, "step": 12264 }, { "epoch": 0.97, "learning_rate": 0.00022970125354598576, "loss": 1.5813, "step": 12265 }, { "epoch": 0.97, "learning_rate": 0.00022969078264789, "loss": 1.6486, "step": 12266 }, { "epoch": 0.97, "learning_rate": 0.00022968031120873775, "loss": 1.6006, "step": 12267 }, { "epoch": 0.97, "learning_rate": 0.00022966983922860021, "loss": 1.6177, "step": 12268 }, { "epoch": 0.97, "learning_rate": 0.0002296593667075484, "loss": 1.5336, "step": 12269 }, { "epoch": 0.97, "learning_rate": 0.0002296488936456534, "loss": 1.6373, "step": 12270 }, { "epoch": 0.97, "learning_rate": 0.0002296384200429864, "loss": 1.5723, "step": 12271 }, { "epoch": 0.97, "learning_rate": 0.0002296279458996185, "loss": 1.5537, "step": 12272 }, { "epoch": 0.97, "learning_rate": 0.00022961747121562077, "loss": 1.589, "step": 12273 }, { "epoch": 0.97, "learning_rate": 0.00022960699599106435, "loss": 1.6058, "step": 12274 }, { "epoch": 0.97, "learning_rate": 0.00022959652022602037, "loss": 1.5777, "step": 12275 }, { "epoch": 0.97, "learning_rate": 0.00022958604392055995, "loss": 1.57, "step": 12276 }, { "epoch": 0.97, "learning_rate": 0.00022957556707475416, "loss": 1.6111, "step": 12277 }, { "epoch": 0.97, "learning_rate": 0.00022956508968867425, "loss": 1.6056, "step": 12278 }, { "epoch": 0.97, "learning_rate": 0.0002295546117623912, "loss": 1.5518, "step": 12279 }, { "epoch": 0.97, "learning_rate": 0.00022954413329597632, "loss": 1.5646, "step": 12280 }, { "epoch": 0.97, "learning_rate": 0.00022953365428950064, "loss": 1.5744, "step": 12281 }, { "epoch": 0.97, "learning_rate": 0.00022952317474303534, "loss": 1.5838, "step": 12282 }, { "epoch": 0.97, "learning_rate": 0.00022951269465665156, "loss": 1.583, "step": 12283 }, { "epoch": 0.97, "learning_rate": 0.00022950221403042047, "loss": 1.586, "step": 12284 }, { "epoch": 0.97, "learning_rate": 0.00022949173286441324, "loss": 1.6242, "step": 12285 }, { "epoch": 0.97, "learning_rate": 0.000229481251158701, "loss": 1.596, "step": 12286 }, { "epoch": 0.97, "learning_rate": 0.0002294707689133549, "loss": 1.6291, "step": 12287 }, { "epoch": 0.97, "learning_rate": 0.00022946028612844615, "loss": 1.5801, "step": 12288 }, { "epoch": 0.97, "learning_rate": 0.00022944980280404593, "loss": 1.6093, "step": 12289 }, { "epoch": 0.97, "learning_rate": 0.00022943931894022537, "loss": 1.6817, "step": 12290 }, { "epoch": 0.97, "learning_rate": 0.00022942883453705567, "loss": 1.6039, "step": 12291 }, { "epoch": 0.97, "learning_rate": 0.00022941834959460804, "loss": 1.58, "step": 12292 }, { "epoch": 0.97, "learning_rate": 0.0002294078641129536, "loss": 1.5915, "step": 12293 }, { "epoch": 0.97, "learning_rate": 0.0002293973780921636, "loss": 1.5297, "step": 12294 }, { "epoch": 0.97, "learning_rate": 0.00022938689153230926, "loss": 1.5302, "step": 12295 }, { "epoch": 0.97, "learning_rate": 0.00022937640443346165, "loss": 1.6028, "step": 12296 }, { "epoch": 0.97, "learning_rate": 0.00022936591679569216, "loss": 1.5989, "step": 12297 }, { "epoch": 0.97, "learning_rate": 0.00022935542861907184, "loss": 1.637, "step": 12298 }, { "epoch": 0.97, "learning_rate": 0.00022934493990367193, "loss": 1.5556, "step": 12299 }, { "epoch": 0.97, "learning_rate": 0.00022933445064956368, "loss": 1.5738, "step": 12300 }, { "epoch": 0.97, "learning_rate": 0.0002293239608568183, "loss": 1.6255, "step": 12301 }, { "epoch": 0.97, "learning_rate": 0.00022931347052550702, "loss": 1.5935, "step": 12302 }, { "epoch": 0.97, "learning_rate": 0.000229302979655701, "loss": 1.6499, "step": 12303 }, { "epoch": 0.97, "learning_rate": 0.00022929248824747153, "loss": 1.604, "step": 12304 }, { "epoch": 0.97, "learning_rate": 0.00022928199630088984, "loss": 1.6174, "step": 12305 }, { "epoch": 0.97, "learning_rate": 0.0002292715038160271, "loss": 1.6406, "step": 12306 }, { "epoch": 0.97, "learning_rate": 0.00022926101079295464, "loss": 1.636, "step": 12307 }, { "epoch": 0.97, "learning_rate": 0.00022925051723174364, "loss": 1.6114, "step": 12308 }, { "epoch": 0.97, "learning_rate": 0.0002292400231324654, "loss": 1.6177, "step": 12309 }, { "epoch": 0.97, "learning_rate": 0.00022922952849519106, "loss": 1.6022, "step": 12310 }, { "epoch": 0.97, "learning_rate": 0.00022921903331999196, "loss": 1.6178, "step": 12311 }, { "epoch": 0.97, "learning_rate": 0.0002292085376069394, "loss": 1.5214, "step": 12312 }, { "epoch": 0.97, "learning_rate": 0.0002291980413561045, "loss": 1.5548, "step": 12313 }, { "epoch": 0.97, "learning_rate": 0.0002291875445675587, "loss": 1.6072, "step": 12314 }, { "epoch": 0.97, "learning_rate": 0.00022917704724137312, "loss": 1.6181, "step": 12315 }, { "epoch": 0.97, "learning_rate": 0.00022916654937761905, "loss": 1.6327, "step": 12316 }, { "epoch": 0.97, "learning_rate": 0.00022915605097636785, "loss": 1.5766, "step": 12317 }, { "epoch": 0.97, "learning_rate": 0.0002291455520376907, "loss": 1.6649, "step": 12318 }, { "epoch": 0.97, "learning_rate": 0.00022913505256165896, "loss": 1.5681, "step": 12319 }, { "epoch": 0.97, "learning_rate": 0.00022912455254834387, "loss": 1.5744, "step": 12320 }, { "epoch": 0.97, "learning_rate": 0.00022911405199781674, "loss": 1.5638, "step": 12321 }, { "epoch": 0.97, "learning_rate": 0.00022910355091014886, "loss": 1.5952, "step": 12322 }, { "epoch": 0.97, "learning_rate": 0.0002290930492854115, "loss": 1.5577, "step": 12323 }, { "epoch": 0.97, "learning_rate": 0.00022908254712367604, "loss": 1.6067, "step": 12324 }, { "epoch": 0.97, "learning_rate": 0.00022907204442501367, "loss": 1.5507, "step": 12325 }, { "epoch": 0.97, "learning_rate": 0.00022906154118949575, "loss": 1.5255, "step": 12326 }, { "epoch": 0.97, "learning_rate": 0.0002290510374171936, "loss": 1.6081, "step": 12327 }, { "epoch": 0.97, "learning_rate": 0.00022904053310817855, "loss": 1.5772, "step": 12328 }, { "epoch": 0.97, "learning_rate": 0.0002290300282625219, "loss": 1.5816, "step": 12329 }, { "epoch": 0.97, "learning_rate": 0.00022901952288029493, "loss": 1.5791, "step": 12330 }, { "epoch": 0.97, "learning_rate": 0.00022900901696156907, "loss": 1.5436, "step": 12331 }, { "epoch": 0.97, "learning_rate": 0.00022899851050641552, "loss": 1.6774, "step": 12332 }, { "epoch": 0.97, "learning_rate": 0.00022898800351490572, "loss": 1.5933, "step": 12333 }, { "epoch": 0.97, "learning_rate": 0.00022897749598711097, "loss": 1.641, "step": 12334 }, { "epoch": 0.97, "learning_rate": 0.00022896698792310258, "loss": 1.6051, "step": 12335 }, { "epoch": 0.97, "learning_rate": 0.00022895647932295196, "loss": 1.6288, "step": 12336 }, { "epoch": 0.97, "learning_rate": 0.0002289459701867304, "loss": 1.5421, "step": 12337 }, { "epoch": 0.97, "learning_rate": 0.00022893546051450925, "loss": 1.564, "step": 12338 }, { "epoch": 0.97, "learning_rate": 0.00022892495030635987, "loss": 1.6064, "step": 12339 }, { "epoch": 0.97, "learning_rate": 0.00022891443956235365, "loss": 1.5668, "step": 12340 }, { "epoch": 0.97, "learning_rate": 0.00022890392828256193, "loss": 1.576, "step": 12341 }, { "epoch": 0.97, "learning_rate": 0.00022889341646705608, "loss": 1.5654, "step": 12342 }, { "epoch": 0.97, "learning_rate": 0.00022888290411590752, "loss": 1.578, "step": 12343 }, { "epoch": 0.97, "learning_rate": 0.0002288723912291875, "loss": 1.5837, "step": 12344 }, { "epoch": 0.97, "learning_rate": 0.00022886187780696748, "loss": 1.5782, "step": 12345 }, { "epoch": 0.97, "learning_rate": 0.00022885136384931891, "loss": 1.553, "step": 12346 }, { "epoch": 0.97, "learning_rate": 0.00022884084935631297, "loss": 1.5655, "step": 12347 }, { "epoch": 0.97, "learning_rate": 0.00022883033432802123, "loss": 1.593, "step": 12348 }, { "epoch": 0.97, "learning_rate": 0.00022881981876451501, "loss": 1.5853, "step": 12349 }, { "epoch": 0.97, "learning_rate": 0.00022880930266586572, "loss": 1.6328, "step": 12350 }, { "epoch": 0.97, "learning_rate": 0.00022879878603214478, "loss": 1.5501, "step": 12351 }, { "epoch": 0.97, "learning_rate": 0.00022878826886342358, "loss": 1.6271, "step": 12352 }, { "epoch": 0.97, "learning_rate": 0.00022877775115977348, "loss": 1.5767, "step": 12353 }, { "epoch": 0.97, "learning_rate": 0.00022876723292126596, "loss": 1.5972, "step": 12354 }, { "epoch": 0.97, "learning_rate": 0.00022875671414797233, "loss": 1.577, "step": 12355 }, { "epoch": 0.97, "learning_rate": 0.00022874619483996414, "loss": 1.5697, "step": 12356 }, { "epoch": 0.97, "learning_rate": 0.00022873567499731264, "loss": 1.5977, "step": 12357 }, { "epoch": 0.97, "learning_rate": 0.00022872515462008948, "loss": 1.5528, "step": 12358 }, { "epoch": 0.97, "learning_rate": 0.00022871463370836593, "loss": 1.5531, "step": 12359 }, { "epoch": 0.97, "learning_rate": 0.00022870411226221343, "loss": 1.5556, "step": 12360 }, { "epoch": 0.97, "learning_rate": 0.00022869359028170345, "loss": 1.5978, "step": 12361 }, { "epoch": 0.97, "learning_rate": 0.0002286830677669074, "loss": 1.6069, "step": 12362 }, { "epoch": 0.97, "learning_rate": 0.0002286725447178968, "loss": 1.5883, "step": 12363 }, { "epoch": 0.97, "learning_rate": 0.00022866202113474294, "loss": 1.5243, "step": 12364 }, { "epoch": 0.97, "learning_rate": 0.00022865149701751744, "loss": 1.5684, "step": 12365 }, { "epoch": 0.97, "learning_rate": 0.00022864097236629163, "loss": 1.6339, "step": 12366 }, { "epoch": 0.97, "learning_rate": 0.00022863044718113702, "loss": 1.614, "step": 12367 }, { "epoch": 0.97, "learning_rate": 0.0002286199214621251, "loss": 1.6113, "step": 12368 }, { "epoch": 0.97, "learning_rate": 0.0002286093952093273, "loss": 1.5998, "step": 12369 }, { "epoch": 0.97, "learning_rate": 0.0002285988684228151, "loss": 1.6124, "step": 12370 }, { "epoch": 0.97, "learning_rate": 0.00022858834110265993, "loss": 1.6505, "step": 12371 }, { "epoch": 0.97, "learning_rate": 0.0002285778132489333, "loss": 1.5944, "step": 12372 }, { "epoch": 0.97, "learning_rate": 0.00022856728486170665, "loss": 1.592, "step": 12373 }, { "epoch": 0.97, "learning_rate": 0.00022855675594105152, "loss": 1.5867, "step": 12374 }, { "epoch": 0.97, "learning_rate": 0.00022854622648703935, "loss": 1.5714, "step": 12375 }, { "epoch": 0.97, "learning_rate": 0.00022853569649974168, "loss": 1.585, "step": 12376 }, { "epoch": 0.97, "learning_rate": 0.00022852516597922997, "loss": 1.5492, "step": 12377 }, { "epoch": 0.97, "learning_rate": 0.0002285146349255757, "loss": 1.5897, "step": 12378 }, { "epoch": 0.97, "learning_rate": 0.00022850410333885037, "loss": 1.648, "step": 12379 }, { "epoch": 0.97, "learning_rate": 0.00022849357121912554, "loss": 1.5934, "step": 12380 }, { "epoch": 0.97, "learning_rate": 0.00022848303856647263, "loss": 1.5661, "step": 12381 }, { "epoch": 0.97, "learning_rate": 0.00022847250538096322, "loss": 1.6381, "step": 12382 }, { "epoch": 0.97, "learning_rate": 0.0002284619716626688, "loss": 1.6273, "step": 12383 }, { "epoch": 0.97, "learning_rate": 0.00022845143741166089, "loss": 1.5604, "step": 12384 }, { "epoch": 0.97, "learning_rate": 0.00022844090262801107, "loss": 1.5559, "step": 12385 }, { "epoch": 0.97, "learning_rate": 0.00022843036731179074, "loss": 1.5588, "step": 12386 }, { "epoch": 0.97, "learning_rate": 0.0002284198314630715, "loss": 1.575, "step": 12387 }, { "epoch": 0.97, "learning_rate": 0.00022840929508192496, "loss": 1.6581, "step": 12388 }, { "epoch": 0.97, "learning_rate": 0.0002283987581684225, "loss": 1.6517, "step": 12389 }, { "epoch": 0.97, "learning_rate": 0.00022838822072263572, "loss": 1.5884, "step": 12390 }, { "epoch": 0.97, "learning_rate": 0.0002283776827446362, "loss": 1.5738, "step": 12391 }, { "epoch": 0.98, "learning_rate": 0.0002283671442344955, "loss": 1.5593, "step": 12392 }, { "epoch": 0.98, "learning_rate": 0.0002283566051922851, "loss": 1.6052, "step": 12393 }, { "epoch": 0.98, "learning_rate": 0.00022834606561807663, "loss": 1.5977, "step": 12394 }, { "epoch": 0.98, "learning_rate": 0.00022833552551194158, "loss": 1.5864, "step": 12395 }, { "epoch": 0.98, "learning_rate": 0.0002283249848739515, "loss": 1.5958, "step": 12396 }, { "epoch": 0.98, "learning_rate": 0.00022831444370417808, "loss": 1.5817, "step": 12397 }, { "epoch": 0.98, "learning_rate": 0.00022830390200269277, "loss": 1.5966, "step": 12398 }, { "epoch": 0.98, "learning_rate": 0.00022829335976956718, "loss": 1.597, "step": 12399 }, { "epoch": 0.98, "learning_rate": 0.00022828281700487286, "loss": 1.6187, "step": 12400 }, { "epoch": 0.98, "learning_rate": 0.0002282722737086814, "loss": 1.573, "step": 12401 }, { "epoch": 0.98, "learning_rate": 0.00022826172988106447, "loss": 1.5948, "step": 12402 }, { "epoch": 0.98, "learning_rate": 0.00022825118552209352, "loss": 1.6082, "step": 12403 }, { "epoch": 0.98, "learning_rate": 0.0002282406406318402, "loss": 1.601, "step": 12404 }, { "epoch": 0.98, "learning_rate": 0.00022823009521037615, "loss": 1.5791, "step": 12405 }, { "epoch": 0.98, "learning_rate": 0.00022821954925777288, "loss": 1.5669, "step": 12406 }, { "epoch": 0.98, "learning_rate": 0.0002282090027741021, "loss": 1.5354, "step": 12407 }, { "epoch": 0.98, "learning_rate": 0.00022819845575943528, "loss": 1.6254, "step": 12408 }, { "epoch": 0.98, "learning_rate": 0.00022818790821384414, "loss": 1.6127, "step": 12409 }, { "epoch": 0.98, "learning_rate": 0.00022817736013740024, "loss": 1.5615, "step": 12410 }, { "epoch": 0.98, "learning_rate": 0.0002281668115301752, "loss": 1.5787, "step": 12411 }, { "epoch": 0.98, "learning_rate": 0.00022815626239224061, "loss": 1.5614, "step": 12412 }, { "epoch": 0.98, "learning_rate": 0.0002281457127236682, "loss": 1.5551, "step": 12413 }, { "epoch": 0.98, "learning_rate": 0.0002281351625245295, "loss": 1.5652, "step": 12414 }, { "epoch": 0.98, "learning_rate": 0.00022812461179489614, "loss": 1.5817, "step": 12415 }, { "epoch": 0.98, "learning_rate": 0.0002281140605348398, "loss": 1.5836, "step": 12416 }, { "epoch": 0.98, "learning_rate": 0.00022810350874443211, "loss": 1.6376, "step": 12417 }, { "epoch": 0.98, "learning_rate": 0.00022809295642374464, "loss": 1.6469, "step": 12418 }, { "epoch": 0.98, "learning_rate": 0.0002280824035728492, "loss": 1.6602, "step": 12419 }, { "epoch": 0.98, "learning_rate": 0.0002280718501918172, "loss": 1.6022, "step": 12420 }, { "epoch": 0.98, "learning_rate": 0.0002280612962807205, "loss": 1.5787, "step": 12421 }, { "epoch": 0.98, "learning_rate": 0.00022805074183963065, "loss": 1.6219, "step": 12422 }, { "epoch": 0.98, "learning_rate": 0.00022804018686861937, "loss": 1.5957, "step": 12423 }, { "epoch": 0.98, "learning_rate": 0.00022802963136775824, "loss": 1.5596, "step": 12424 }, { "epoch": 0.98, "learning_rate": 0.000228019075337119, "loss": 1.5419, "step": 12425 }, { "epoch": 0.98, "learning_rate": 0.0002280085187767733, "loss": 1.6158, "step": 12426 }, { "epoch": 0.98, "learning_rate": 0.00022799796168679277, "loss": 1.5837, "step": 12427 }, { "epoch": 0.98, "learning_rate": 0.00022798740406724917, "loss": 1.5915, "step": 12428 }, { "epoch": 0.98, "learning_rate": 0.00022797684591821407, "loss": 1.6172, "step": 12429 }, { "epoch": 0.98, "learning_rate": 0.00022796628723975926, "loss": 1.5887, "step": 12430 }, { "epoch": 0.98, "learning_rate": 0.0002279557280319564, "loss": 1.6068, "step": 12431 }, { "epoch": 0.98, "learning_rate": 0.00022794516829487713, "loss": 1.5897, "step": 12432 }, { "epoch": 0.98, "learning_rate": 0.0002279346080285932, "loss": 1.6628, "step": 12433 }, { "epoch": 0.98, "learning_rate": 0.00022792404723317628, "loss": 1.5889, "step": 12434 }, { "epoch": 0.98, "learning_rate": 0.0002279134859086981, "loss": 1.5493, "step": 12435 }, { "epoch": 0.98, "learning_rate": 0.00022790292405523035, "loss": 1.5733, "step": 12436 }, { "epoch": 0.98, "learning_rate": 0.0002278923616728447, "loss": 1.6007, "step": 12437 }, { "epoch": 0.98, "learning_rate": 0.00022788179876161293, "loss": 1.5947, "step": 12438 }, { "epoch": 0.98, "learning_rate": 0.00022787123532160667, "loss": 1.5944, "step": 12439 }, { "epoch": 0.98, "learning_rate": 0.00022786067135289773, "loss": 1.6136, "step": 12440 }, { "epoch": 0.98, "learning_rate": 0.00022785010685555786, "loss": 1.6007, "step": 12441 }, { "epoch": 0.98, "learning_rate": 0.00022783954182965867, "loss": 1.6805, "step": 12442 }, { "epoch": 0.98, "learning_rate": 0.00022782897627527196, "loss": 1.5473, "step": 12443 }, { "epoch": 0.98, "learning_rate": 0.0002278184101924694, "loss": 1.6305, "step": 12444 }, { "epoch": 0.98, "learning_rate": 0.00022780784358132283, "loss": 1.5752, "step": 12445 }, { "epoch": 0.98, "learning_rate": 0.00022779727644190394, "loss": 1.5621, "step": 12446 }, { "epoch": 0.98, "learning_rate": 0.00022778670877428444, "loss": 1.5999, "step": 12447 }, { "epoch": 0.98, "learning_rate": 0.00022777614057853618, "loss": 1.5815, "step": 12448 }, { "epoch": 0.98, "learning_rate": 0.0002277655718547308, "loss": 1.6327, "step": 12449 }, { "epoch": 0.98, "learning_rate": 0.0002277550026029401, "loss": 1.555, "step": 12450 }, { "epoch": 0.98, "learning_rate": 0.00022774443282323582, "loss": 1.5437, "step": 12451 }, { "epoch": 0.98, "learning_rate": 0.00022773386251568977, "loss": 1.6098, "step": 12452 }, { "epoch": 0.98, "learning_rate": 0.0002277232916803737, "loss": 1.5907, "step": 12453 }, { "epoch": 0.98, "learning_rate": 0.0002277127203173594, "loss": 1.6053, "step": 12454 }, { "epoch": 0.98, "learning_rate": 0.00022770214842671854, "loss": 1.6188, "step": 12455 }, { "epoch": 0.98, "learning_rate": 0.00022769157600852302, "loss": 1.6011, "step": 12456 }, { "epoch": 0.98, "learning_rate": 0.00022768100306284452, "loss": 1.5606, "step": 12457 }, { "epoch": 0.98, "learning_rate": 0.00022767042958975498, "loss": 1.5999, "step": 12458 }, { "epoch": 0.98, "learning_rate": 0.00022765985558932601, "loss": 1.531, "step": 12459 }, { "epoch": 0.98, "learning_rate": 0.0002276492810616295, "loss": 1.602, "step": 12460 }, { "epoch": 0.98, "learning_rate": 0.00022763870600673718, "loss": 1.5669, "step": 12461 }, { "epoch": 0.98, "learning_rate": 0.0002276281304247209, "loss": 1.5491, "step": 12462 }, { "epoch": 0.98, "learning_rate": 0.00022761755431565251, "loss": 1.5682, "step": 12463 }, { "epoch": 0.98, "learning_rate": 0.00022760697767960374, "loss": 1.5657, "step": 12464 }, { "epoch": 0.98, "learning_rate": 0.00022759640051664637, "loss": 1.6032, "step": 12465 }, { "epoch": 0.98, "learning_rate": 0.00022758582282685232, "loss": 1.6213, "step": 12466 }, { "epoch": 0.98, "learning_rate": 0.00022757524461029333, "loss": 1.6192, "step": 12467 }, { "epoch": 0.98, "learning_rate": 0.00022756466586704123, "loss": 1.5315, "step": 12468 }, { "epoch": 0.98, "learning_rate": 0.00022755408659716782, "loss": 1.541, "step": 12469 }, { "epoch": 0.98, "learning_rate": 0.00022754350680074503, "loss": 1.5598, "step": 12470 }, { "epoch": 0.98, "learning_rate": 0.00022753292647784455, "loss": 1.5769, "step": 12471 }, { "epoch": 0.98, "learning_rate": 0.00022752234562853837, "loss": 1.579, "step": 12472 }, { "epoch": 0.98, "learning_rate": 0.00022751176425289817, "loss": 1.6202, "step": 12473 }, { "epoch": 0.98, "learning_rate": 0.0002275011823509959, "loss": 1.5865, "step": 12474 }, { "epoch": 0.98, "learning_rate": 0.00022749059992290333, "loss": 1.5761, "step": 12475 }, { "epoch": 0.98, "learning_rate": 0.00022748001696869239, "loss": 1.5751, "step": 12476 }, { "epoch": 0.98, "learning_rate": 0.00022746943348843493, "loss": 1.5715, "step": 12477 }, { "epoch": 0.98, "learning_rate": 0.00022745884948220267, "loss": 1.5933, "step": 12478 }, { "epoch": 0.98, "learning_rate": 0.00022744826495006766, "loss": 1.5797, "step": 12479 }, { "epoch": 0.98, "learning_rate": 0.00022743767989210161, "loss": 1.6091, "step": 12480 }, { "epoch": 0.98, "learning_rate": 0.00022742709430837647, "loss": 1.5522, "step": 12481 }, { "epoch": 0.98, "learning_rate": 0.0002274165081989641, "loss": 1.5935, "step": 12482 }, { "epoch": 0.98, "learning_rate": 0.00022740592156393632, "loss": 1.5957, "step": 12483 }, { "epoch": 0.98, "learning_rate": 0.00022739533440336508, "loss": 1.579, "step": 12484 }, { "epoch": 0.98, "learning_rate": 0.0002273847467173222, "loss": 1.6389, "step": 12485 }, { "epoch": 0.98, "learning_rate": 0.00022737415850587964, "loss": 1.6025, "step": 12486 }, { "epoch": 0.98, "learning_rate": 0.00022736356976910924, "loss": 1.6102, "step": 12487 }, { "epoch": 0.98, "learning_rate": 0.00022735298050708284, "loss": 1.6008, "step": 12488 }, { "epoch": 0.98, "learning_rate": 0.0002273423907198724, "loss": 1.5583, "step": 12489 }, { "epoch": 0.98, "learning_rate": 0.00022733180040754983, "loss": 1.6031, "step": 12490 }, { "epoch": 0.98, "learning_rate": 0.000227321209570187, "loss": 1.5508, "step": 12491 }, { "epoch": 0.98, "learning_rate": 0.00022731061820785586, "loss": 1.6445, "step": 12492 }, { "epoch": 0.98, "learning_rate": 0.00022730002632062826, "loss": 1.5815, "step": 12493 }, { "epoch": 0.98, "learning_rate": 0.00022728943390857616, "loss": 1.5966, "step": 12494 }, { "epoch": 0.98, "learning_rate": 0.00022727884097177142, "loss": 1.5887, "step": 12495 }, { "epoch": 0.98, "learning_rate": 0.000227268247510286, "loss": 1.5751, "step": 12496 }, { "epoch": 0.98, "learning_rate": 0.00022725765352419187, "loss": 1.6288, "step": 12497 }, { "epoch": 0.98, "learning_rate": 0.00022724705901356086, "loss": 1.5305, "step": 12498 }, { "epoch": 0.98, "learning_rate": 0.00022723646397846496, "loss": 1.6169, "step": 12499 }, { "epoch": 0.98, "learning_rate": 0.00022722586841897606, "loss": 1.5722, "step": 12500 }, { "epoch": 0.98, "learning_rate": 0.00022721527233516618, "loss": 1.5924, "step": 12501 }, { "epoch": 0.98, "learning_rate": 0.00022720467572710716, "loss": 1.5829, "step": 12502 }, { "epoch": 0.98, "learning_rate": 0.00022719407859487104, "loss": 1.5912, "step": 12503 }, { "epoch": 0.98, "learning_rate": 0.00022718348093852975, "loss": 1.5803, "step": 12504 }, { "epoch": 0.98, "learning_rate": 0.00022717288275815516, "loss": 1.6048, "step": 12505 }, { "epoch": 0.98, "learning_rate": 0.00022716228405381928, "loss": 1.5759, "step": 12506 }, { "epoch": 0.98, "learning_rate": 0.0002271516848255941, "loss": 1.5827, "step": 12507 }, { "epoch": 0.98, "learning_rate": 0.00022714108507355154, "loss": 1.6094, "step": 12508 }, { "epoch": 0.98, "learning_rate": 0.00022713048479776362, "loss": 1.6211, "step": 12509 }, { "epoch": 0.98, "learning_rate": 0.00022711988399830223, "loss": 1.5627, "step": 12510 }, { "epoch": 0.98, "learning_rate": 0.00022710928267523941, "loss": 1.6087, "step": 12511 }, { "epoch": 0.98, "learning_rate": 0.00022709868082864713, "loss": 1.5885, "step": 12512 }, { "epoch": 0.98, "learning_rate": 0.00022708807845859733, "loss": 1.5696, "step": 12513 }, { "epoch": 0.98, "learning_rate": 0.00022707747556516202, "loss": 1.5652, "step": 12514 }, { "epoch": 0.98, "learning_rate": 0.00022706687214841314, "loss": 1.6078, "step": 12515 }, { "epoch": 0.98, "learning_rate": 0.00022705626820842279, "loss": 1.5382, "step": 12516 }, { "epoch": 0.98, "learning_rate": 0.0002270456637452629, "loss": 1.6627, "step": 12517 }, { "epoch": 0.98, "learning_rate": 0.00022703505875900544, "loss": 1.6019, "step": 12518 }, { "epoch": 0.99, "learning_rate": 0.00022702445324972246, "loss": 1.614, "step": 12519 }, { "epoch": 0.99, "learning_rate": 0.00022701384721748595, "loss": 1.559, "step": 12520 }, { "epoch": 0.99, "learning_rate": 0.00022700324066236795, "loss": 1.5435, "step": 12521 }, { "epoch": 0.99, "learning_rate": 0.00022699263358444036, "loss": 1.6076, "step": 12522 }, { "epoch": 0.99, "learning_rate": 0.00022698202598377533, "loss": 1.5997, "step": 12523 }, { "epoch": 0.99, "learning_rate": 0.0002269714178604448, "loss": 1.5586, "step": 12524 }, { "epoch": 0.99, "learning_rate": 0.0002269608092145208, "loss": 1.6355, "step": 12525 }, { "epoch": 0.99, "learning_rate": 0.00022695020004607548, "loss": 1.5779, "step": 12526 }, { "epoch": 0.99, "learning_rate": 0.0002269395903551807, "loss": 1.6294, "step": 12527 }, { "epoch": 0.99, "learning_rate": 0.00022692898014190855, "loss": 1.599, "step": 12528 }, { "epoch": 0.99, "learning_rate": 0.00022691836940633107, "loss": 1.535, "step": 12529 }, { "epoch": 0.99, "learning_rate": 0.00022690775814852032, "loss": 1.5794, "step": 12530 }, { "epoch": 0.99, "learning_rate": 0.00022689714636854832, "loss": 1.5763, "step": 12531 }, { "epoch": 0.99, "learning_rate": 0.00022688653406648714, "loss": 1.6237, "step": 12532 }, { "epoch": 0.99, "learning_rate": 0.00022687592124240885, "loss": 1.5676, "step": 12533 }, { "epoch": 0.99, "learning_rate": 0.00022686530789638547, "loss": 1.6662, "step": 12534 }, { "epoch": 0.99, "learning_rate": 0.00022685469402848902, "loss": 1.5755, "step": 12535 }, { "epoch": 0.99, "learning_rate": 0.0002268440796387917, "loss": 1.6288, "step": 12536 }, { "epoch": 0.99, "learning_rate": 0.00022683346472736538, "loss": 1.5502, "step": 12537 }, { "epoch": 0.99, "learning_rate": 0.00022682284929428229, "loss": 1.5816, "step": 12538 }, { "epoch": 0.99, "learning_rate": 0.00022681223333961443, "loss": 1.5686, "step": 12539 }, { "epoch": 0.99, "learning_rate": 0.00022680161686343392, "loss": 1.5742, "step": 12540 }, { "epoch": 0.99, "learning_rate": 0.0002267909998658128, "loss": 1.6289, "step": 12541 }, { "epoch": 0.99, "learning_rate": 0.0002267803823468232, "loss": 1.6127, "step": 12542 }, { "epoch": 0.99, "learning_rate": 0.00022676976430653715, "loss": 1.5777, "step": 12543 }, { "epoch": 0.99, "learning_rate": 0.00022675914574502677, "loss": 1.5505, "step": 12544 }, { "epoch": 0.99, "learning_rate": 0.0002267485266623641, "loss": 1.5362, "step": 12545 }, { "epoch": 0.99, "learning_rate": 0.00022673790705862132, "loss": 1.5517, "step": 12546 }, { "epoch": 0.99, "learning_rate": 0.0002267272869338705, "loss": 1.5796, "step": 12547 }, { "epoch": 0.99, "learning_rate": 0.00022671666628818377, "loss": 1.5527, "step": 12548 }, { "epoch": 0.99, "learning_rate": 0.0002267060451216332, "loss": 1.5487, "step": 12549 }, { "epoch": 0.99, "learning_rate": 0.00022669542343429092, "loss": 1.5547, "step": 12550 }, { "epoch": 0.99, "learning_rate": 0.00022668480122622897, "loss": 1.6274, "step": 12551 }, { "epoch": 0.99, "learning_rate": 0.00022667417849751959, "loss": 1.6069, "step": 12552 }, { "epoch": 0.99, "learning_rate": 0.00022666355524823486, "loss": 1.6267, "step": 12553 }, { "epoch": 0.99, "learning_rate": 0.00022665293147844685, "loss": 1.5486, "step": 12554 }, { "epoch": 0.99, "learning_rate": 0.0002266423071882278, "loss": 1.5662, "step": 12555 }, { "epoch": 0.99, "learning_rate": 0.00022663168237764975, "loss": 1.6135, "step": 12556 }, { "epoch": 0.99, "learning_rate": 0.0002266210570467849, "loss": 1.5489, "step": 12557 }, { "epoch": 0.99, "learning_rate": 0.0002266104311957053, "loss": 1.5926, "step": 12558 }, { "epoch": 0.99, "learning_rate": 0.0002265998048244832, "loss": 1.6073, "step": 12559 }, { "epoch": 0.99, "learning_rate": 0.00022658917793319064, "loss": 1.5501, "step": 12560 }, { "epoch": 0.99, "learning_rate": 0.00022657855052189986, "loss": 1.6009, "step": 12561 }, { "epoch": 0.99, "learning_rate": 0.00022656792259068297, "loss": 1.557, "step": 12562 }, { "epoch": 0.99, "learning_rate": 0.00022655729413961211, "loss": 1.6037, "step": 12563 }, { "epoch": 0.99, "learning_rate": 0.00022654666516875953, "loss": 1.5963, "step": 12564 }, { "epoch": 0.99, "learning_rate": 0.00022653603567819732, "loss": 1.6278, "step": 12565 }, { "epoch": 0.99, "learning_rate": 0.00022652540566799764, "loss": 1.6209, "step": 12566 }, { "epoch": 0.99, "learning_rate": 0.00022651477513823274, "loss": 1.6265, "step": 12567 }, { "epoch": 0.99, "learning_rate": 0.0002265041440889747, "loss": 1.5955, "step": 12568 }, { "epoch": 0.99, "learning_rate": 0.00022649351252029574, "loss": 1.5794, "step": 12569 }, { "epoch": 0.99, "learning_rate": 0.00022648288043226804, "loss": 1.5962, "step": 12570 }, { "epoch": 0.99, "learning_rate": 0.00022647224782496378, "loss": 1.5634, "step": 12571 }, { "epoch": 0.99, "learning_rate": 0.0002264616146984552, "loss": 1.5974, "step": 12572 }, { "epoch": 0.99, "learning_rate": 0.0002264509810528144, "loss": 1.5984, "step": 12573 }, { "epoch": 0.99, "learning_rate": 0.00022644034688811365, "loss": 1.5789, "step": 12574 }, { "epoch": 0.99, "learning_rate": 0.00022642971220442515, "loss": 1.5912, "step": 12575 }, { "epoch": 0.99, "learning_rate": 0.00022641907700182107, "loss": 1.6386, "step": 12576 }, { "epoch": 0.99, "learning_rate": 0.0002264084412803736, "loss": 1.6094, "step": 12577 }, { "epoch": 0.99, "learning_rate": 0.000226397805040155, "loss": 1.5724, "step": 12578 }, { "epoch": 0.99, "learning_rate": 0.00022638716828123748, "loss": 1.63, "step": 12579 }, { "epoch": 0.99, "learning_rate": 0.00022637653100369322, "loss": 1.5805, "step": 12580 }, { "epoch": 0.99, "learning_rate": 0.00022636589320759441, "loss": 1.6087, "step": 12581 }, { "epoch": 0.99, "learning_rate": 0.00022635525489301343, "loss": 1.542, "step": 12582 }, { "epoch": 0.99, "learning_rate": 0.00022634461606002235, "loss": 1.5816, "step": 12583 }, { "epoch": 0.99, "learning_rate": 0.0002263339767086935, "loss": 1.5448, "step": 12584 }, { "epoch": 0.99, "learning_rate": 0.000226323336839099, "loss": 1.5721, "step": 12585 }, { "epoch": 0.99, "learning_rate": 0.0002263126964513112, "loss": 1.5623, "step": 12586 }, { "epoch": 0.99, "learning_rate": 0.00022630205554540232, "loss": 1.5507, "step": 12587 }, { "epoch": 0.99, "learning_rate": 0.0002262914141214446, "loss": 1.5447, "step": 12588 }, { "epoch": 0.99, "learning_rate": 0.00022628077217951023, "loss": 1.5488, "step": 12589 }, { "epoch": 0.99, "learning_rate": 0.00022627012971967151, "loss": 1.6483, "step": 12590 }, { "epoch": 0.99, "learning_rate": 0.00022625948674200074, "loss": 1.6106, "step": 12591 }, { "epoch": 0.99, "learning_rate": 0.00022624884324657014, "loss": 1.6406, "step": 12592 }, { "epoch": 0.99, "learning_rate": 0.0002262381992334519, "loss": 1.5604, "step": 12593 }, { "epoch": 0.99, "learning_rate": 0.00022622755470271845, "loss": 1.6044, "step": 12594 }, { "epoch": 0.99, "learning_rate": 0.00022621690965444192, "loss": 1.6073, "step": 12595 }, { "epoch": 0.99, "learning_rate": 0.00022620626408869466, "loss": 1.5937, "step": 12596 }, { "epoch": 0.99, "learning_rate": 0.00022619561800554892, "loss": 1.6161, "step": 12597 }, { "epoch": 0.99, "learning_rate": 0.00022618497140507694, "loss": 1.6275, "step": 12598 }, { "epoch": 0.99, "learning_rate": 0.00022617432428735112, "loss": 1.5848, "step": 12599 }, { "epoch": 0.99, "learning_rate": 0.0002261636766524436, "loss": 1.5441, "step": 12600 }, { "epoch": 0.99, "learning_rate": 0.00022615302850042675, "loss": 1.5455, "step": 12601 }, { "epoch": 0.99, "learning_rate": 0.0002261423798313729, "loss": 1.566, "step": 12602 }, { "epoch": 0.99, "learning_rate": 0.00022613173064535427, "loss": 1.5974, "step": 12603 }, { "epoch": 0.99, "learning_rate": 0.00022612108094244328, "loss": 1.6307, "step": 12604 }, { "epoch": 0.99, "learning_rate": 0.0002261104307227121, "loss": 1.5782, "step": 12605 }, { "epoch": 0.99, "learning_rate": 0.00022609977998623313, "loss": 1.592, "step": 12606 }, { "epoch": 0.99, "learning_rate": 0.0002260891287330786, "loss": 1.6166, "step": 12607 }, { "epoch": 0.99, "learning_rate": 0.0002260784769633209, "loss": 1.6064, "step": 12608 }, { "epoch": 0.99, "learning_rate": 0.0002260678246770323, "loss": 1.5772, "step": 12609 }, { "epoch": 0.99, "learning_rate": 0.00022605717187428517, "loss": 1.5655, "step": 12610 }, { "epoch": 0.99, "learning_rate": 0.00022604651855515185, "loss": 1.5842, "step": 12611 }, { "epoch": 0.99, "learning_rate": 0.0002260358647197046, "loss": 1.5485, "step": 12612 }, { "epoch": 0.99, "learning_rate": 0.00022602521036801576, "loss": 1.6106, "step": 12613 }, { "epoch": 0.99, "learning_rate": 0.00022601455550015778, "loss": 1.5921, "step": 12614 }, { "epoch": 0.99, "learning_rate": 0.00022600390011620283, "loss": 1.5755, "step": 12615 }, { "epoch": 0.99, "learning_rate": 0.0002259932442162234, "loss": 1.551, "step": 12616 }, { "epoch": 0.99, "learning_rate": 0.00022598258780029168, "loss": 1.5531, "step": 12617 }, { "epoch": 0.99, "learning_rate": 0.00022597193086848025, "loss": 1.5933, "step": 12618 }, { "epoch": 0.99, "learning_rate": 0.00022596127342086123, "loss": 1.5883, "step": 12619 }, { "epoch": 0.99, "learning_rate": 0.00022595061545750713, "loss": 1.6076, "step": 12620 }, { "epoch": 0.99, "learning_rate": 0.0002259399569784903, "loss": 1.5924, "step": 12621 }, { "epoch": 0.99, "learning_rate": 0.000225929297983883, "loss": 1.5831, "step": 12622 }, { "epoch": 0.99, "learning_rate": 0.00022591863847375772, "loss": 1.647, "step": 12623 }, { "epoch": 0.99, "learning_rate": 0.00022590797844818672, "loss": 1.6436, "step": 12624 }, { "epoch": 0.99, "learning_rate": 0.00022589731790724252, "loss": 1.5894, "step": 12625 }, { "epoch": 0.99, "learning_rate": 0.00022588665685099735, "loss": 1.6032, "step": 12626 }, { "epoch": 0.99, "learning_rate": 0.00022587599527952365, "loss": 1.5954, "step": 12627 }, { "epoch": 0.99, "learning_rate": 0.00022586533319289386, "loss": 1.6194, "step": 12628 }, { "epoch": 0.99, "learning_rate": 0.0002258546705911803, "loss": 1.5773, "step": 12629 }, { "epoch": 0.99, "learning_rate": 0.00022584400747445536, "loss": 1.5993, "step": 12630 }, { "epoch": 0.99, "learning_rate": 0.00022583334384279155, "loss": 1.6108, "step": 12631 }, { "epoch": 0.99, "learning_rate": 0.00022582267969626111, "loss": 1.5828, "step": 12632 }, { "epoch": 0.99, "learning_rate": 0.00022581201503493652, "loss": 1.5952, "step": 12633 }, { "epoch": 0.99, "learning_rate": 0.00022580134985889023, "loss": 1.5659, "step": 12634 }, { "epoch": 0.99, "learning_rate": 0.00022579068416819458, "loss": 1.5873, "step": 12635 }, { "epoch": 0.99, "learning_rate": 0.00022578001796292197, "loss": 1.5775, "step": 12636 }, { "epoch": 0.99, "learning_rate": 0.00022576935124314488, "loss": 1.549, "step": 12637 }, { "epoch": 0.99, "learning_rate": 0.00022575868400893578, "loss": 1.6088, "step": 12638 }, { "epoch": 0.99, "learning_rate": 0.00022574801626036695, "loss": 1.5899, "step": 12639 }, { "epoch": 0.99, "learning_rate": 0.00022573734799751088, "loss": 1.6224, "step": 12640 }, { "epoch": 0.99, "learning_rate": 0.00022572667922044002, "loss": 1.6124, "step": 12641 }, { "epoch": 0.99, "learning_rate": 0.00022571600992922678, "loss": 1.5923, "step": 12642 }, { "epoch": 0.99, "learning_rate": 0.00022570534012394367, "loss": 1.5509, "step": 12643 }, { "epoch": 0.99, "learning_rate": 0.00022569466980466307, "loss": 1.5504, "step": 12644 }, { "epoch": 0.99, "learning_rate": 0.00022568399897145744, "loss": 1.5701, "step": 12645 }, { "epoch": 1.0, "learning_rate": 0.0002256733276243992, "loss": 1.5698, "step": 12646 }, { "epoch": 1.0, "learning_rate": 0.00022566265576356084, "loss": 1.6058, "step": 12647 }, { "epoch": 1.0, "learning_rate": 0.00022565198338901478, "loss": 1.5262, "step": 12648 }, { "epoch": 1.0, "learning_rate": 0.0002256413105008335, "loss": 1.6294, "step": 12649 }, { "epoch": 1.0, "learning_rate": 0.00022563063709908946, "loss": 1.5668, "step": 12650 }, { "epoch": 1.0, "learning_rate": 0.00022561996318385517, "loss": 1.6042, "step": 12651 }, { "epoch": 1.0, "learning_rate": 0.00022560928875520306, "loss": 1.583, "step": 12652 }, { "epoch": 1.0, "learning_rate": 0.00022559861381320556, "loss": 1.5638, "step": 12653 }, { "epoch": 1.0, "learning_rate": 0.00022558793835793518, "loss": 1.6016, "step": 12654 }, { "epoch": 1.0, "learning_rate": 0.00022557726238946448, "loss": 1.6071, "step": 12655 }, { "epoch": 1.0, "learning_rate": 0.00022556658590786578, "loss": 1.5974, "step": 12656 }, { "epoch": 1.0, "learning_rate": 0.0002255559089132118, "loss": 1.5929, "step": 12657 }, { "epoch": 1.0, "learning_rate": 0.00022554523140557478, "loss": 1.6263, "step": 12658 }, { "epoch": 1.0, "learning_rate": 0.00022553455338502736, "loss": 1.6059, "step": 12659 }, { "epoch": 1.0, "learning_rate": 0.00022552387485164202, "loss": 1.5304, "step": 12660 }, { "epoch": 1.0, "learning_rate": 0.00022551319580549123, "loss": 1.593, "step": 12661 }, { "epoch": 1.0, "learning_rate": 0.00022550251624664755, "loss": 1.5504, "step": 12662 }, { "epoch": 1.0, "learning_rate": 0.0002254918361751834, "loss": 1.5655, "step": 12663 }, { "epoch": 1.0, "learning_rate": 0.00022548115559117135, "loss": 1.5817, "step": 12664 }, { "epoch": 1.0, "learning_rate": 0.0002254704744946839, "loss": 1.5986, "step": 12665 }, { "epoch": 1.0, "learning_rate": 0.0002254597928857936, "loss": 1.6303, "step": 12666 }, { "epoch": 1.0, "learning_rate": 0.00022544911076457296, "loss": 1.6426, "step": 12667 }, { "epoch": 1.0, "learning_rate": 0.00022543842813109447, "loss": 1.5656, "step": 12668 }, { "epoch": 1.0, "learning_rate": 0.00022542774498543073, "loss": 1.6326, "step": 12669 }, { "epoch": 1.0, "learning_rate": 0.00022541706132765414, "loss": 1.5846, "step": 12670 }, { "epoch": 1.0, "learning_rate": 0.00022540637715783737, "loss": 1.6251, "step": 12671 }, { "epoch": 1.0, "learning_rate": 0.0002253956924760529, "loss": 1.5935, "step": 12672 }, { "epoch": 1.0, "learning_rate": 0.00022538500728237328, "loss": 1.6438, "step": 12673 }, { "epoch": 1.0, "learning_rate": 0.0002253743215768711, "loss": 1.603, "step": 12674 }, { "epoch": 1.0, "learning_rate": 0.00022536363535961886, "loss": 1.5739, "step": 12675 }, { "epoch": 1.0, "learning_rate": 0.0002253529486306891, "loss": 1.6244, "step": 12676 }, { "epoch": 1.0, "learning_rate": 0.0002253422613901544, "loss": 1.5618, "step": 12677 }, { "epoch": 1.0, "learning_rate": 0.0002253315736380874, "loss": 1.5876, "step": 12678 }, { "epoch": 1.0, "learning_rate": 0.00022532088537456047, "loss": 1.5571, "step": 12679 }, { "epoch": 1.0, "learning_rate": 0.00022531019659964634, "loss": 1.5593, "step": 12680 }, { "epoch": 1.0, "learning_rate": 0.00022529950731341755, "loss": 1.586, "step": 12681 }, { "epoch": 1.0, "learning_rate": 0.00022528881751594668, "loss": 1.5566, "step": 12682 }, { "epoch": 1.0, "learning_rate": 0.00022527812720730622, "loss": 1.5613, "step": 12683 }, { "epoch": 1.0, "learning_rate": 0.00022526743638756887, "loss": 1.5695, "step": 12684 }, { "epoch": 1.0, "learning_rate": 0.00022525674505680717, "loss": 1.6052, "step": 12685 }, { "epoch": 1.0, "learning_rate": 0.00022524605321509365, "loss": 1.5881, "step": 12686 }, { "epoch": 1.0, "learning_rate": 0.000225235360862501, "loss": 1.6302, "step": 12687 }, { "epoch": 1.0, "learning_rate": 0.00022522466799910175, "loss": 1.5983, "step": 12688 }, { "epoch": 1.0, "learning_rate": 0.0002252139746249685, "loss": 1.5641, "step": 12689 }, { "epoch": 1.0, "learning_rate": 0.00022520328074017388, "loss": 1.591, "step": 12690 }, { "epoch": 1.0, "learning_rate": 0.00022519258634479052, "loss": 1.6098, "step": 12691 }, { "epoch": 1.0, "learning_rate": 0.00022518189143889096, "loss": 1.6391, "step": 12692 }, { "epoch": 1.0, "learning_rate": 0.00022517119602254783, "loss": 1.5737, "step": 12693 }, { "epoch": 1.0, "learning_rate": 0.00022516050009583385, "loss": 1.6284, "step": 12694 }, { "epoch": 1.0, "learning_rate": 0.0002251498036588214, "loss": 1.5684, "step": 12695 }, { "epoch": 1.0, "learning_rate": 0.0002251391067115834, "loss": 1.5697, "step": 12696 }, { "epoch": 1.0, "learning_rate": 0.00022512840925419222, "loss": 1.5683, "step": 12697 }, { "epoch": 1.0, "learning_rate": 0.00022511771128672068, "loss": 1.5834, "step": 12698 }, { "epoch": 1.0, "learning_rate": 0.0002251070128092413, "loss": 1.6082, "step": 12699 }, { "epoch": 1.0, "learning_rate": 0.00022509631382182675, "loss": 1.5829, "step": 12700 }, { "epoch": 1.0, "learning_rate": 0.0002250856143245497, "loss": 1.5954, "step": 12701 }, { "epoch": 1.0, "learning_rate": 0.00022507491431748272, "loss": 1.5967, "step": 12702 }, { "epoch": 1.0, "learning_rate": 0.00022506421380069853, "loss": 1.5937, "step": 12703 }, { "epoch": 1.0, "learning_rate": 0.0002250535127742697, "loss": 1.5679, "step": 12704 }, { "epoch": 1.0, "learning_rate": 0.00022504281123826903, "loss": 1.5984, "step": 12705 }, { "epoch": 1.0, "learning_rate": 0.000225032109192769, "loss": 1.5512, "step": 12706 }, { "epoch": 1.0, "learning_rate": 0.00022502140663784238, "loss": 1.5817, "step": 12707 }, { "epoch": 1.0, "learning_rate": 0.00022501070357356187, "loss": 1.6012, "step": 12708 }, { "epoch": 1.0, "learning_rate": 0.000225, "loss": 1.5703, "step": 12709 }, { "epoch": 1.0, "learning_rate": 0.00022498929591722953, "loss": 1.6076, "step": 12710 }, { "epoch": 1.0, "learning_rate": 0.00022497859132532315, "loss": 1.5634, "step": 12711 }, { "epoch": 1.0, "learning_rate": 0.00022496788622435347, "loss": 1.5549, "step": 12712 }, { "epoch": 1.0, "learning_rate": 0.00022495718061439328, "loss": 1.5171, "step": 12713 }, { "epoch": 1.0, "learning_rate": 0.0002249464744955151, "loss": 1.5547, "step": 12714 }, { "epoch": 1.0, "learning_rate": 0.00022493576786779179, "loss": 1.5623, "step": 12715 }, { "epoch": 1.0, "learning_rate": 0.00022492506073129597, "loss": 1.5476, "step": 12716 }, { "epoch": 1.0, "learning_rate": 0.0002249143530861003, "loss": 1.5405, "step": 12717 }, { "epoch": 1.0, "learning_rate": 0.00022490364493227757, "loss": 1.5766, "step": 12718 }, { "epoch": 1.0, "learning_rate": 0.00022489293626990034, "loss": 1.5565, "step": 12719 }, { "epoch": 1.0, "learning_rate": 0.00022488222709904148, "loss": 1.5565, "step": 12720 }, { "epoch": 1.0, "learning_rate": 0.0002248715174197736, "loss": 1.5791, "step": 12721 }, { "epoch": 1.0, "learning_rate": 0.0002248608072321694, "loss": 1.5086, "step": 12722 }, { "epoch": 1.0, "learning_rate": 0.00022485009653630167, "loss": 1.609, "step": 12723 }, { "epoch": 1.0, "learning_rate": 0.00022483938533224306, "loss": 1.6191, "step": 12724 }, { "epoch": 1.0, "learning_rate": 0.00022482867362006635, "loss": 1.5766, "step": 12725 }, { "epoch": 1.0, "learning_rate": 0.00022481796139984424, "loss": 1.5776, "step": 12726 }, { "epoch": 1.0, "learning_rate": 0.00022480724867164942, "loss": 1.5708, "step": 12727 }, { "epoch": 1.0, "learning_rate": 0.00022479653543555473, "loss": 1.6023, "step": 12728 }, { "epoch": 1.0, "learning_rate": 0.00022478582169163278, "loss": 1.5851, "step": 12729 }, { "epoch": 1.0, "learning_rate": 0.00022477510743995643, "loss": 1.5701, "step": 12730 }, { "epoch": 1.0, "learning_rate": 0.00022476439268059834, "loss": 1.5311, "step": 12731 }, { "epoch": 1.0, "learning_rate": 0.00022475367741363125, "loss": 1.5708, "step": 12732 }, { "epoch": 1.0, "learning_rate": 0.00022474296163912797, "loss": 1.5256, "step": 12733 }, { "epoch": 1.0, "learning_rate": 0.0002247322453571612, "loss": 1.5429, "step": 12734 }, { "epoch": 1.0, "learning_rate": 0.00022472152856780378, "loss": 1.5558, "step": 12735 }, { "epoch": 1.0, "learning_rate": 0.00022471081127112836, "loss": 1.5746, "step": 12736 }, { "epoch": 1.0, "learning_rate": 0.00022470009346720778, "loss": 1.566, "step": 12737 }, { "epoch": 1.0, "learning_rate": 0.0002246893751561148, "loss": 1.5642, "step": 12738 }, { "epoch": 1.0, "learning_rate": 0.00022467865633792218, "loss": 1.5734, "step": 12739 }, { "epoch": 1.0, "learning_rate": 0.00022466793701270268, "loss": 1.5814, "step": 12740 }, { "epoch": 1.0, "learning_rate": 0.00022465721718052908, "loss": 1.5865, "step": 12741 }, { "epoch": 1.0, "learning_rate": 0.00022464649684147422, "loss": 1.611, "step": 12742 }, { "epoch": 1.0, "learning_rate": 0.00022463577599561078, "loss": 1.5309, "step": 12743 }, { "epoch": 1.0, "learning_rate": 0.00022462505464301163, "loss": 1.5629, "step": 12744 }, { "epoch": 1.0, "learning_rate": 0.0002246143327837496, "loss": 1.5453, "step": 12745 }, { "epoch": 1.0, "learning_rate": 0.00022460361041789739, "loss": 1.5616, "step": 12746 }, { "epoch": 1.0, "learning_rate": 0.00022459288754552782, "loss": 1.5717, "step": 12747 }, { "epoch": 1.0, "learning_rate": 0.0002245821641667137, "loss": 1.565, "step": 12748 }, { "epoch": 1.0, "learning_rate": 0.00022457144028152783, "loss": 1.5945, "step": 12749 }, { "epoch": 1.0, "learning_rate": 0.00022456071589004308, "loss": 1.5355, "step": 12750 }, { "epoch": 1.0, "learning_rate": 0.00022454999099233216, "loss": 1.5215, "step": 12751 }, { "epoch": 1.0, "learning_rate": 0.00022453926558846802, "loss": 1.5736, "step": 12752 }, { "epoch": 1.0, "learning_rate": 0.00022452853967852332, "loss": 1.5793, "step": 12753 }, { "epoch": 1.0, "learning_rate": 0.000224517813262571, "loss": 1.5752, "step": 12754 }, { "epoch": 1.0, "learning_rate": 0.00022450708634068385, "loss": 1.5909, "step": 12755 }, { "epoch": 1.0, "learning_rate": 0.00022449635891293472, "loss": 1.5237, "step": 12756 }, { "epoch": 1.0, "learning_rate": 0.0002244856309793964, "loss": 1.5917, "step": 12757 }, { "epoch": 1.0, "learning_rate": 0.00022447490254014172, "loss": 1.5519, "step": 12758 }, { "epoch": 1.0, "learning_rate": 0.00022446417359524358, "loss": 1.5484, "step": 12759 }, { "epoch": 1.0, "learning_rate": 0.0002244534441447748, "loss": 1.5631, "step": 12760 }, { "epoch": 1.0, "learning_rate": 0.0002244427141888082, "loss": 1.6429, "step": 12761 }, { "epoch": 1.0, "learning_rate": 0.0002244319837274167, "loss": 1.6174, "step": 12762 }, { "epoch": 1.0, "learning_rate": 0.00022442125276067308, "loss": 1.5602, "step": 12763 }, { "epoch": 1.0, "learning_rate": 0.00022441052128865021, "loss": 1.5686, "step": 12764 }, { "epoch": 1.0, "learning_rate": 0.00022439978931142096, "loss": 1.5839, "step": 12765 }, { "epoch": 1.0, "learning_rate": 0.00022438905682905825, "loss": 1.595, "step": 12766 }, { "epoch": 1.0, "learning_rate": 0.0002243783238416348, "loss": 1.5596, "step": 12767 }, { "epoch": 1.0, "learning_rate": 0.00022436759034922364, "loss": 1.5859, "step": 12768 }, { "epoch": 1.0, "learning_rate": 0.0002243568563518976, "loss": 1.5822, "step": 12769 }, { "epoch": 1.0, "learning_rate": 0.00022434612184972947, "loss": 1.5838, "step": 12770 }, { "epoch": 1.0, "learning_rate": 0.00022433538684279224, "loss": 1.5921, "step": 12771 }, { "epoch": 1.0, "learning_rate": 0.0002243246513311588, "loss": 1.5726, "step": 12772 }, { "epoch": 1.0, "learning_rate": 0.0002243139153149019, "loss": 1.6001, "step": 12773 }, { "epoch": 1.01, "learning_rate": 0.00022430317879409457, "loss": 1.5696, "step": 12774 }, { "epoch": 1.01, "learning_rate": 0.00022429244176880967, "loss": 1.5999, "step": 12775 }, { "epoch": 1.01, "learning_rate": 0.0002242817042391201, "loss": 1.5566, "step": 12776 }, { "epoch": 1.01, "learning_rate": 0.00022427096620509872, "loss": 1.5675, "step": 12777 }, { "epoch": 1.01, "learning_rate": 0.00022426022766681845, "loss": 1.6168, "step": 12778 }, { "epoch": 1.01, "learning_rate": 0.00022424948862435226, "loss": 1.6123, "step": 12779 }, { "epoch": 1.01, "learning_rate": 0.00022423874907777299, "loss": 1.5662, "step": 12780 }, { "epoch": 1.01, "learning_rate": 0.0002242280090271536, "loss": 1.5403, "step": 12781 }, { "epoch": 1.01, "learning_rate": 0.00022421726847256696, "loss": 1.4945, "step": 12782 }, { "epoch": 1.01, "learning_rate": 0.00022420652741408605, "loss": 1.611, "step": 12783 }, { "epoch": 1.01, "learning_rate": 0.00022419578585178377, "loss": 1.5785, "step": 12784 }, { "epoch": 1.01, "learning_rate": 0.00022418504378573305, "loss": 1.5752, "step": 12785 }, { "epoch": 1.01, "learning_rate": 0.00022417430121600683, "loss": 1.5389, "step": 12786 }, { "epoch": 1.01, "learning_rate": 0.00022416355814267803, "loss": 1.5723, "step": 12787 }, { "epoch": 1.01, "learning_rate": 0.00022415281456581956, "loss": 1.6173, "step": 12788 }, { "epoch": 1.01, "learning_rate": 0.00022414207048550443, "loss": 1.5503, "step": 12789 }, { "epoch": 1.01, "learning_rate": 0.00022413132590180557, "loss": 1.5905, "step": 12790 }, { "epoch": 1.01, "learning_rate": 0.0002241205808147959, "loss": 1.5662, "step": 12791 }, { "epoch": 1.01, "learning_rate": 0.00022410983522454838, "loss": 1.5507, "step": 12792 }, { "epoch": 1.01, "learning_rate": 0.00022409908913113602, "loss": 1.5314, "step": 12793 }, { "epoch": 1.01, "learning_rate": 0.00022408834253463165, "loss": 1.5925, "step": 12794 }, { "epoch": 1.01, "learning_rate": 0.00022407759543510838, "loss": 1.5844, "step": 12795 }, { "epoch": 1.01, "learning_rate": 0.00022406684783263914, "loss": 1.5908, "step": 12796 }, { "epoch": 1.01, "learning_rate": 0.0002240560997272968, "loss": 1.6089, "step": 12797 }, { "epoch": 1.01, "learning_rate": 0.00022404535111915448, "loss": 1.5557, "step": 12798 }, { "epoch": 1.01, "learning_rate": 0.00022403460200828506, "loss": 1.5585, "step": 12799 }, { "epoch": 1.01, "learning_rate": 0.00022402385239476155, "loss": 1.5847, "step": 12800 }, { "epoch": 1.01, "learning_rate": 0.00022401310227865696, "loss": 1.5673, "step": 12801 }, { "epoch": 1.01, "learning_rate": 0.00022400235166004418, "loss": 1.5216, "step": 12802 }, { "epoch": 1.01, "learning_rate": 0.00022399160053899637, "loss": 1.6005, "step": 12803 }, { "epoch": 1.01, "learning_rate": 0.00022398084891558633, "loss": 1.5364, "step": 12804 }, { "epoch": 1.01, "learning_rate": 0.0002239700967898872, "loss": 1.5447, "step": 12805 }, { "epoch": 1.01, "learning_rate": 0.0002239593441619719, "loss": 1.5333, "step": 12806 }, { "epoch": 1.01, "learning_rate": 0.0002239485910319135, "loss": 1.5439, "step": 12807 }, { "epoch": 1.01, "learning_rate": 0.00022393783739978497, "loss": 1.5849, "step": 12808 }, { "epoch": 1.01, "learning_rate": 0.0002239270832656593, "loss": 1.553, "step": 12809 }, { "epoch": 1.01, "learning_rate": 0.00022391632862960953, "loss": 1.5324, "step": 12810 }, { "epoch": 1.01, "learning_rate": 0.00022390557349170873, "loss": 1.6348, "step": 12811 }, { "epoch": 1.01, "learning_rate": 0.00022389481785202984, "loss": 1.5242, "step": 12812 }, { "epoch": 1.01, "learning_rate": 0.0002238840617106459, "loss": 1.5984, "step": 12813 }, { "epoch": 1.01, "learning_rate": 0.00022387330506763, "loss": 1.5729, "step": 12814 }, { "epoch": 1.01, "learning_rate": 0.0002238625479230551, "loss": 1.5439, "step": 12815 }, { "epoch": 1.01, "learning_rate": 0.00022385179027699422, "loss": 1.5362, "step": 12816 }, { "epoch": 1.01, "learning_rate": 0.0002238410321295205, "loss": 1.5656, "step": 12817 }, { "epoch": 1.01, "learning_rate": 0.0002238302734807069, "loss": 1.5915, "step": 12818 }, { "epoch": 1.01, "learning_rate": 0.00022381951433062645, "loss": 1.5599, "step": 12819 }, { "epoch": 1.01, "learning_rate": 0.0002238087546793523, "loss": 1.5692, "step": 12820 }, { "epoch": 1.01, "learning_rate": 0.00022379799452695734, "loss": 1.5669, "step": 12821 }, { "epoch": 1.01, "learning_rate": 0.00022378723387351485, "loss": 1.5768, "step": 12822 }, { "epoch": 1.01, "learning_rate": 0.0002237764727190977, "loss": 1.5931, "step": 12823 }, { "epoch": 1.01, "learning_rate": 0.00022376571106377897, "loss": 1.5853, "step": 12824 }, { "epoch": 1.01, "learning_rate": 0.0002237549489076318, "loss": 1.5369, "step": 12825 }, { "epoch": 1.01, "learning_rate": 0.00022374418625072925, "loss": 1.616, "step": 12826 }, { "epoch": 1.01, "learning_rate": 0.00022373342309314436, "loss": 1.5545, "step": 12827 }, { "epoch": 1.01, "learning_rate": 0.00022372265943495026, "loss": 1.5766, "step": 12828 }, { "epoch": 1.01, "learning_rate": 0.00022371189527621989, "loss": 1.5599, "step": 12829 }, { "epoch": 1.01, "learning_rate": 0.00022370113061702645, "loss": 1.5616, "step": 12830 }, { "epoch": 1.01, "learning_rate": 0.00022369036545744303, "loss": 1.5843, "step": 12831 }, { "epoch": 1.01, "learning_rate": 0.00022367959979754275, "loss": 1.5699, "step": 12832 }, { "epoch": 1.01, "learning_rate": 0.00022366883363739856, "loss": 1.5194, "step": 12833 }, { "epoch": 1.01, "learning_rate": 0.0002236580669770837, "loss": 1.5358, "step": 12834 }, { "epoch": 1.01, "learning_rate": 0.0002236472998166712, "loss": 1.5797, "step": 12835 }, { "epoch": 1.01, "learning_rate": 0.00022363653215623416, "loss": 1.5229, "step": 12836 }, { "epoch": 1.01, "learning_rate": 0.00022362576399584567, "loss": 1.582, "step": 12837 }, { "epoch": 1.01, "learning_rate": 0.00022361499533557892, "loss": 1.5767, "step": 12838 }, { "epoch": 1.01, "learning_rate": 0.00022360422617550695, "loss": 1.5873, "step": 12839 }, { "epoch": 1.01, "learning_rate": 0.00022359345651570297, "loss": 1.5708, "step": 12840 }, { "epoch": 1.01, "learning_rate": 0.00022358268635623997, "loss": 1.5444, "step": 12841 }, { "epoch": 1.01, "learning_rate": 0.00022357191569719116, "loss": 1.5909, "step": 12842 }, { "epoch": 1.01, "learning_rate": 0.00022356114453862962, "loss": 1.5707, "step": 12843 }, { "epoch": 1.01, "learning_rate": 0.00022355037288062851, "loss": 1.5262, "step": 12844 }, { "epoch": 1.01, "learning_rate": 0.00022353960072326096, "loss": 1.5964, "step": 12845 }, { "epoch": 1.01, "learning_rate": 0.0002235288280666001, "loss": 1.6067, "step": 12846 }, { "epoch": 1.01, "learning_rate": 0.0002235180549107191, "loss": 1.6097, "step": 12847 }, { "epoch": 1.01, "learning_rate": 0.00022350728125569106, "loss": 1.5079, "step": 12848 }, { "epoch": 1.01, "learning_rate": 0.00022349650710158913, "loss": 1.5432, "step": 12849 }, { "epoch": 1.01, "learning_rate": 0.0002234857324484865, "loss": 1.5512, "step": 12850 }, { "epoch": 1.01, "learning_rate": 0.00022347495729645628, "loss": 1.5179, "step": 12851 }, { "epoch": 1.01, "learning_rate": 0.00022346418164557162, "loss": 1.5642, "step": 12852 }, { "epoch": 1.01, "learning_rate": 0.00022345340549590576, "loss": 1.6375, "step": 12853 }, { "epoch": 1.01, "learning_rate": 0.00022344262884753182, "loss": 1.5717, "step": 12854 }, { "epoch": 1.01, "learning_rate": 0.0002234318517005229, "loss": 1.5243, "step": 12855 }, { "epoch": 1.01, "learning_rate": 0.00022342107405495226, "loss": 1.5669, "step": 12856 }, { "epoch": 1.01, "learning_rate": 0.00022341029591089307, "loss": 1.553, "step": 12857 }, { "epoch": 1.01, "learning_rate": 0.00022339951726841844, "loss": 1.6142, "step": 12858 }, { "epoch": 1.01, "learning_rate": 0.00022338873812760164, "loss": 1.5519, "step": 12859 }, { "epoch": 1.01, "learning_rate": 0.00022337795848851574, "loss": 1.5165, "step": 12860 }, { "epoch": 1.01, "learning_rate": 0.00022336717835123407, "loss": 1.5779, "step": 12861 }, { "epoch": 1.01, "learning_rate": 0.00022335639771582966, "loss": 1.6213, "step": 12862 }, { "epoch": 1.01, "learning_rate": 0.00022334561658237585, "loss": 1.6038, "step": 12863 }, { "epoch": 1.01, "learning_rate": 0.0002233348349509458, "loss": 1.5734, "step": 12864 }, { "epoch": 1.01, "learning_rate": 0.00022332405282161265, "loss": 1.5347, "step": 12865 }, { "epoch": 1.01, "learning_rate": 0.00022331327019444963, "loss": 1.5676, "step": 12866 }, { "epoch": 1.01, "learning_rate": 0.00022330248706953, "loss": 1.606, "step": 12867 }, { "epoch": 1.01, "learning_rate": 0.00022329170344692688, "loss": 1.5473, "step": 12868 }, { "epoch": 1.01, "learning_rate": 0.00022328091932671362, "loss": 1.5691, "step": 12869 }, { "epoch": 1.01, "learning_rate": 0.00022327013470896333, "loss": 1.6428, "step": 12870 }, { "epoch": 1.01, "learning_rate": 0.00022325934959374925, "loss": 1.5478, "step": 12871 }, { "epoch": 1.01, "learning_rate": 0.0002232485639811446, "loss": 1.5801, "step": 12872 }, { "epoch": 1.01, "learning_rate": 0.0002232377778712226, "loss": 1.5864, "step": 12873 }, { "epoch": 1.01, "learning_rate": 0.00022322699126405658, "loss": 1.5576, "step": 12874 }, { "epoch": 1.01, "learning_rate": 0.0002232162041597197, "loss": 1.5487, "step": 12875 }, { "epoch": 1.01, "learning_rate": 0.0002232054165582851, "loss": 1.5291, "step": 12876 }, { "epoch": 1.01, "learning_rate": 0.0002231946284598262, "loss": 1.5736, "step": 12877 }, { "epoch": 1.01, "learning_rate": 0.00022318383986441614, "loss": 1.5259, "step": 12878 }, { "epoch": 1.01, "learning_rate": 0.00022317305077212816, "loss": 1.5355, "step": 12879 }, { "epoch": 1.01, "learning_rate": 0.0002231622611830356, "loss": 1.5456, "step": 12880 }, { "epoch": 1.01, "learning_rate": 0.00022315147109721166, "loss": 1.5803, "step": 12881 }, { "epoch": 1.01, "learning_rate": 0.00022314068051472956, "loss": 1.5745, "step": 12882 }, { "epoch": 1.01, "learning_rate": 0.00022312988943566262, "loss": 1.6124, "step": 12883 }, { "epoch": 1.01, "learning_rate": 0.00022311909786008408, "loss": 1.6066, "step": 12884 }, { "epoch": 1.01, "learning_rate": 0.00022310830578806722, "loss": 1.5796, "step": 12885 }, { "epoch": 1.01, "learning_rate": 0.00022309751321968532, "loss": 1.6492, "step": 12886 }, { "epoch": 1.01, "learning_rate": 0.00022308672015501166, "loss": 1.5245, "step": 12887 }, { "epoch": 1.01, "learning_rate": 0.00022307592659411945, "loss": 1.532, "step": 12888 }, { "epoch": 1.01, "learning_rate": 0.00022306513253708208, "loss": 1.5152, "step": 12889 }, { "epoch": 1.01, "learning_rate": 0.00022305433798397274, "loss": 1.6107, "step": 12890 }, { "epoch": 1.01, "learning_rate": 0.00022304354293486482, "loss": 1.5952, "step": 12891 }, { "epoch": 1.01, "learning_rate": 0.00022303274738983144, "loss": 1.5696, "step": 12892 }, { "epoch": 1.01, "learning_rate": 0.0002230219513489461, "loss": 1.5699, "step": 12893 }, { "epoch": 1.01, "learning_rate": 0.00022301115481228195, "loss": 1.5138, "step": 12894 }, { "epoch": 1.01, "learning_rate": 0.00022300035777991239, "loss": 1.5703, "step": 12895 }, { "epoch": 1.01, "learning_rate": 0.00022298956025191072, "loss": 1.6115, "step": 12896 }, { "epoch": 1.01, "learning_rate": 0.00022297876222835016, "loss": 1.5839, "step": 12897 }, { "epoch": 1.01, "learning_rate": 0.0002229679637093041, "loss": 1.5145, "step": 12898 }, { "epoch": 1.01, "learning_rate": 0.0002229571646948458, "loss": 1.5895, "step": 12899 }, { "epoch": 1.01, "learning_rate": 0.00022294636518504864, "loss": 1.5815, "step": 12900 }, { "epoch": 1.02, "learning_rate": 0.0002229355651799859, "loss": 1.5524, "step": 12901 }, { "epoch": 1.02, "learning_rate": 0.00022292476467973094, "loss": 1.6086, "step": 12902 }, { "epoch": 1.02, "learning_rate": 0.00022291396368435707, "loss": 1.614, "step": 12903 }, { "epoch": 1.02, "learning_rate": 0.0002229031621939376, "loss": 1.5722, "step": 12904 }, { "epoch": 1.02, "learning_rate": 0.00022289236020854594, "loss": 1.5736, "step": 12905 }, { "epoch": 1.02, "learning_rate": 0.00022288155772825534, "loss": 1.5372, "step": 12906 }, { "epoch": 1.02, "learning_rate": 0.0002228707547531392, "loss": 1.5627, "step": 12907 }, { "epoch": 1.02, "learning_rate": 0.00022285995128327083, "loss": 1.5067, "step": 12908 }, { "epoch": 1.02, "learning_rate": 0.0002228491473187236, "loss": 1.6282, "step": 12909 }, { "epoch": 1.02, "learning_rate": 0.00022283834285957086, "loss": 1.5346, "step": 12910 }, { "epoch": 1.02, "learning_rate": 0.00022282753790588597, "loss": 1.6062, "step": 12911 }, { "epoch": 1.02, "learning_rate": 0.00022281673245774227, "loss": 1.5768, "step": 12912 }, { "epoch": 1.02, "learning_rate": 0.0002228059265152132, "loss": 1.5961, "step": 12913 }, { "epoch": 1.02, "learning_rate": 0.00022279512007837205, "loss": 1.6004, "step": 12914 }, { "epoch": 1.02, "learning_rate": 0.00022278431314729215, "loss": 1.6025, "step": 12915 }, { "epoch": 1.02, "learning_rate": 0.00022277350572204695, "loss": 1.5462, "step": 12916 }, { "epoch": 1.02, "learning_rate": 0.00022276269780270987, "loss": 1.5645, "step": 12917 }, { "epoch": 1.02, "learning_rate": 0.00022275188938935417, "loss": 1.5028, "step": 12918 }, { "epoch": 1.02, "learning_rate": 0.00022274108048205325, "loss": 1.5501, "step": 12919 }, { "epoch": 1.02, "learning_rate": 0.00022273027108088065, "loss": 1.5388, "step": 12920 }, { "epoch": 1.02, "learning_rate": 0.00022271946118590955, "loss": 1.5813, "step": 12921 }, { "epoch": 1.02, "learning_rate": 0.00022270865079721344, "loss": 1.6022, "step": 12922 }, { "epoch": 1.02, "learning_rate": 0.00022269783991486574, "loss": 1.6066, "step": 12923 }, { "epoch": 1.02, "learning_rate": 0.00022268702853893982, "loss": 1.5844, "step": 12924 }, { "epoch": 1.02, "learning_rate": 0.00022267621666950912, "loss": 1.5676, "step": 12925 }, { "epoch": 1.02, "learning_rate": 0.00022266540430664696, "loss": 1.5804, "step": 12926 }, { "epoch": 1.02, "learning_rate": 0.00022265459145042686, "loss": 1.5435, "step": 12927 }, { "epoch": 1.02, "learning_rate": 0.00022264377810092214, "loss": 1.5871, "step": 12928 }, { "epoch": 1.02, "learning_rate": 0.00022263296425820627, "loss": 1.5755, "step": 12929 }, { "epoch": 1.02, "learning_rate": 0.00022262214992235265, "loss": 1.5691, "step": 12930 }, { "epoch": 1.02, "learning_rate": 0.0002226113350934347, "loss": 1.5873, "step": 12931 }, { "epoch": 1.02, "learning_rate": 0.00022260051977152586, "loss": 1.5803, "step": 12932 }, { "epoch": 1.02, "learning_rate": 0.00022258970395669958, "loss": 1.6099, "step": 12933 }, { "epoch": 1.02, "learning_rate": 0.00022257888764902925, "loss": 1.6084, "step": 12934 }, { "epoch": 1.02, "learning_rate": 0.0002225680708485883, "loss": 1.573, "step": 12935 }, { "epoch": 1.02, "learning_rate": 0.00022255725355545023, "loss": 1.5501, "step": 12936 }, { "epoch": 1.02, "learning_rate": 0.00022254643576968846, "loss": 1.589, "step": 12937 }, { "epoch": 1.02, "learning_rate": 0.0002225356174913764, "loss": 1.557, "step": 12938 }, { "epoch": 1.02, "learning_rate": 0.0002225247987205875, "loss": 1.6282, "step": 12939 }, { "epoch": 1.02, "learning_rate": 0.00022251397945739526, "loss": 1.5555, "step": 12940 }, { "epoch": 1.02, "learning_rate": 0.00022250315970187313, "loss": 1.5573, "step": 12941 }, { "epoch": 1.02, "learning_rate": 0.00022249233945409458, "loss": 1.5591, "step": 12942 }, { "epoch": 1.02, "learning_rate": 0.00022248151871413297, "loss": 1.5818, "step": 12943 }, { "epoch": 1.02, "learning_rate": 0.00022247069748206194, "loss": 1.5731, "step": 12944 }, { "epoch": 1.02, "learning_rate": 0.0002224598757579548, "loss": 1.5645, "step": 12945 }, { "epoch": 1.02, "learning_rate": 0.00022244905354188512, "loss": 1.6237, "step": 12946 }, { "epoch": 1.02, "learning_rate": 0.00022243823083392631, "loss": 1.569, "step": 12947 }, { "epoch": 1.02, "learning_rate": 0.00022242740763415194, "loss": 1.5595, "step": 12948 }, { "epoch": 1.02, "learning_rate": 0.00022241658394263542, "loss": 1.555, "step": 12949 }, { "epoch": 1.02, "learning_rate": 0.00022240575975945024, "loss": 1.5565, "step": 12950 }, { "epoch": 1.02, "learning_rate": 0.00022239493508466993, "loss": 1.6198, "step": 12951 }, { "epoch": 1.02, "learning_rate": 0.00022238410991836798, "loss": 1.6036, "step": 12952 }, { "epoch": 1.02, "learning_rate": 0.00022237328426061783, "loss": 1.5187, "step": 12953 }, { "epoch": 1.02, "learning_rate": 0.00022236245811149303, "loss": 1.5594, "step": 12954 }, { "epoch": 1.02, "learning_rate": 0.00022235163147106706, "loss": 1.5909, "step": 12955 }, { "epoch": 1.02, "learning_rate": 0.00022234080433941348, "loss": 1.5982, "step": 12956 }, { "epoch": 1.02, "learning_rate": 0.00022232997671660574, "loss": 1.584, "step": 12957 }, { "epoch": 1.02, "learning_rate": 0.00022231914860271733, "loss": 1.542, "step": 12958 }, { "epoch": 1.02, "learning_rate": 0.00022230831999782186, "loss": 1.6387, "step": 12959 }, { "epoch": 1.02, "learning_rate": 0.0002222974909019928, "loss": 1.6186, "step": 12960 }, { "epoch": 1.02, "learning_rate": 0.00022228666131530366, "loss": 1.5631, "step": 12961 }, { "epoch": 1.02, "learning_rate": 0.00022227583123782794, "loss": 1.5677, "step": 12962 }, { "epoch": 1.02, "learning_rate": 0.00022226500066963926, "loss": 1.5856, "step": 12963 }, { "epoch": 1.02, "learning_rate": 0.00022225416961081112, "loss": 1.5581, "step": 12964 }, { "epoch": 1.02, "learning_rate": 0.00022224333806141703, "loss": 1.5023, "step": 12965 }, { "epoch": 1.02, "learning_rate": 0.00022223250602153055, "loss": 1.5463, "step": 12966 }, { "epoch": 1.02, "learning_rate": 0.00022222167349122518, "loss": 1.5329, "step": 12967 }, { "epoch": 1.02, "learning_rate": 0.0002222108404705745, "loss": 1.5496, "step": 12968 }, { "epoch": 1.02, "learning_rate": 0.0002222000069596521, "loss": 1.5387, "step": 12969 }, { "epoch": 1.02, "learning_rate": 0.00022218917295853145, "loss": 1.5037, "step": 12970 }, { "epoch": 1.02, "learning_rate": 0.00022217833846728622, "loss": 1.5783, "step": 12971 }, { "epoch": 1.02, "learning_rate": 0.00022216750348598983, "loss": 1.65, "step": 12972 }, { "epoch": 1.02, "learning_rate": 0.000222156668014716, "loss": 1.6246, "step": 12973 }, { "epoch": 1.02, "learning_rate": 0.00022214583205353814, "loss": 1.5719, "step": 12974 }, { "epoch": 1.02, "learning_rate": 0.0002221349956025299, "loss": 1.5717, "step": 12975 }, { "epoch": 1.02, "learning_rate": 0.00022212415866176488, "loss": 1.5632, "step": 12976 }, { "epoch": 1.02, "learning_rate": 0.0002221133212313166, "loss": 1.5807, "step": 12977 }, { "epoch": 1.02, "learning_rate": 0.00022210248331125867, "loss": 1.5827, "step": 12978 }, { "epoch": 1.02, "learning_rate": 0.00022209164490166465, "loss": 1.5819, "step": 12979 }, { "epoch": 1.02, "learning_rate": 0.00022208080600260815, "loss": 1.5274, "step": 12980 }, { "epoch": 1.02, "learning_rate": 0.00022206996661416282, "loss": 1.5935, "step": 12981 }, { "epoch": 1.02, "learning_rate": 0.00022205912673640212, "loss": 1.5686, "step": 12982 }, { "epoch": 1.02, "learning_rate": 0.00022204828636939976, "loss": 1.5366, "step": 12983 }, { "epoch": 1.02, "learning_rate": 0.00022203744551322922, "loss": 1.5499, "step": 12984 }, { "epoch": 1.02, "learning_rate": 0.00022202660416796425, "loss": 1.5735, "step": 12985 }, { "epoch": 1.02, "learning_rate": 0.00022201576233367833, "loss": 1.5675, "step": 12986 }, { "epoch": 1.02, "learning_rate": 0.00022200492001044517, "loss": 1.5769, "step": 12987 }, { "epoch": 1.02, "learning_rate": 0.00022199407719833831, "loss": 1.6106, "step": 12988 }, { "epoch": 1.02, "learning_rate": 0.00022198323389743143, "loss": 1.6385, "step": 12989 }, { "epoch": 1.02, "learning_rate": 0.00022197239010779808, "loss": 1.6015, "step": 12990 }, { "epoch": 1.02, "learning_rate": 0.00022196154582951194, "loss": 1.5195, "step": 12991 }, { "epoch": 1.02, "learning_rate": 0.00022195070106264663, "loss": 1.5573, "step": 12992 }, { "epoch": 1.02, "learning_rate": 0.00022193985580727576, "loss": 1.6263, "step": 12993 }, { "epoch": 1.02, "learning_rate": 0.0002219290100634729, "loss": 1.5938, "step": 12994 }, { "epoch": 1.02, "learning_rate": 0.0002219181638313118, "loss": 1.5931, "step": 12995 }, { "epoch": 1.02, "learning_rate": 0.0002219073171108661, "loss": 1.5371, "step": 12996 }, { "epoch": 1.02, "learning_rate": 0.00022189646990220934, "loss": 1.625, "step": 12997 }, { "epoch": 1.02, "learning_rate": 0.0002218856222054153, "loss": 1.5833, "step": 12998 }, { "epoch": 1.02, "learning_rate": 0.00022187477402055747, "loss": 1.594, "step": 12999 }, { "epoch": 1.02, "learning_rate": 0.00022186392534770963, "loss": 1.6006, "step": 13000 }, { "epoch": 1.02, "learning_rate": 0.0002218530761869454, "loss": 1.6179, "step": 13001 }, { "epoch": 1.02, "learning_rate": 0.0002218422265383384, "loss": 1.5422, "step": 13002 }, { "epoch": 1.02, "learning_rate": 0.00022183137640196233, "loss": 1.5836, "step": 13003 }, { "epoch": 1.02, "learning_rate": 0.00022182052577789088, "loss": 1.5648, "step": 13004 }, { "epoch": 1.02, "learning_rate": 0.0002218096746661977, "loss": 1.6029, "step": 13005 }, { "epoch": 1.02, "learning_rate": 0.00022179882306695643, "loss": 1.57, "step": 13006 }, { "epoch": 1.02, "learning_rate": 0.0002217879709802408, "loss": 1.5806, "step": 13007 }, { "epoch": 1.02, "learning_rate": 0.00022177711840612447, "loss": 1.585, "step": 13008 }, { "epoch": 1.02, "learning_rate": 0.00022176626534468107, "loss": 1.5812, "step": 13009 }, { "epoch": 1.02, "learning_rate": 0.00022175541179598435, "loss": 1.5386, "step": 13010 }, { "epoch": 1.02, "learning_rate": 0.000221744557760108, "loss": 1.5731, "step": 13011 }, { "epoch": 1.02, "learning_rate": 0.0002217337032371257, "loss": 1.563, "step": 13012 }, { "epoch": 1.02, "learning_rate": 0.0002217228482271111, "loss": 1.5541, "step": 13013 }, { "epoch": 1.02, "learning_rate": 0.00022171199273013798, "loss": 1.5158, "step": 13014 }, { "epoch": 1.02, "learning_rate": 0.00022170113674627997, "loss": 1.5674, "step": 13015 }, { "epoch": 1.02, "learning_rate": 0.00022169028027561085, "loss": 1.5621, "step": 13016 }, { "epoch": 1.02, "learning_rate": 0.00022167942331820426, "loss": 1.5241, "step": 13017 }, { "epoch": 1.02, "learning_rate": 0.00022166856587413396, "loss": 1.558, "step": 13018 }, { "epoch": 1.02, "learning_rate": 0.00022165770794347361, "loss": 1.5289, "step": 13019 }, { "epoch": 1.02, "learning_rate": 0.00022164684952629703, "loss": 1.5952, "step": 13020 }, { "epoch": 1.02, "learning_rate": 0.0002216359906226778, "loss": 1.5298, "step": 13021 }, { "epoch": 1.02, "learning_rate": 0.0002216251312326898, "loss": 1.6042, "step": 13022 }, { "epoch": 1.02, "learning_rate": 0.00022161427135640666, "loss": 1.5422, "step": 13023 }, { "epoch": 1.02, "learning_rate": 0.00022160341099390212, "loss": 1.5521, "step": 13024 }, { "epoch": 1.02, "learning_rate": 0.00022159255014524991, "loss": 1.6151, "step": 13025 }, { "epoch": 1.02, "learning_rate": 0.00022158168881052386, "loss": 1.5719, "step": 13026 }, { "epoch": 1.02, "learning_rate": 0.00022157082698979761, "loss": 1.5696, "step": 13027 }, { "epoch": 1.03, "learning_rate": 0.00022155996468314494, "loss": 1.5272, "step": 13028 }, { "epoch": 1.03, "learning_rate": 0.00022154910189063962, "loss": 1.5539, "step": 13029 }, { "epoch": 1.03, "learning_rate": 0.00022153823861235534, "loss": 1.5456, "step": 13030 }, { "epoch": 1.03, "learning_rate": 0.00022152737484836595, "loss": 1.5787, "step": 13031 }, { "epoch": 1.03, "learning_rate": 0.00022151651059874517, "loss": 1.5683, "step": 13032 }, { "epoch": 1.03, "learning_rate": 0.00022150564586356664, "loss": 1.55, "step": 13033 }, { "epoch": 1.03, "learning_rate": 0.0002214947806429043, "loss": 1.5298, "step": 13034 }, { "epoch": 1.03, "learning_rate": 0.00022148391493683188, "loss": 1.5785, "step": 13035 }, { "epoch": 1.03, "learning_rate": 0.0002214730487454231, "loss": 1.6301, "step": 13036 }, { "epoch": 1.03, "learning_rate": 0.0002214621820687518, "loss": 1.5962, "step": 13037 }, { "epoch": 1.03, "learning_rate": 0.00022145131490689164, "loss": 1.5122, "step": 13038 }, { "epoch": 1.03, "learning_rate": 0.00022144044725991654, "loss": 1.5746, "step": 13039 }, { "epoch": 1.03, "learning_rate": 0.00022142957912790021, "loss": 1.6018, "step": 13040 }, { "epoch": 1.03, "learning_rate": 0.00022141871051091646, "loss": 1.5769, "step": 13041 }, { "epoch": 1.03, "learning_rate": 0.00022140784140903906, "loss": 1.6113, "step": 13042 }, { "epoch": 1.03, "learning_rate": 0.00022139697182234184, "loss": 1.5662, "step": 13043 }, { "epoch": 1.03, "learning_rate": 0.0002213861017508986, "loss": 1.5961, "step": 13044 }, { "epoch": 1.03, "learning_rate": 0.0002213752311947831, "loss": 1.5725, "step": 13045 }, { "epoch": 1.03, "learning_rate": 0.00022136436015406918, "loss": 1.5518, "step": 13046 }, { "epoch": 1.03, "learning_rate": 0.00022135348862883063, "loss": 1.5165, "step": 13047 }, { "epoch": 1.03, "learning_rate": 0.00022134261661914127, "loss": 1.6185, "step": 13048 }, { "epoch": 1.03, "learning_rate": 0.00022133174412507488, "loss": 1.5526, "step": 13049 }, { "epoch": 1.03, "learning_rate": 0.00022132087114670537, "loss": 1.5696, "step": 13050 }, { "epoch": 1.03, "learning_rate": 0.00022130999768410646, "loss": 1.5924, "step": 13051 }, { "epoch": 1.03, "learning_rate": 0.00022129912373735204, "loss": 1.5269, "step": 13052 }, { "epoch": 1.03, "learning_rate": 0.0002212882493065159, "loss": 1.6137, "step": 13053 }, { "epoch": 1.03, "learning_rate": 0.0002212773743916719, "loss": 1.5659, "step": 13054 }, { "epoch": 1.03, "learning_rate": 0.00022126649899289387, "loss": 1.555, "step": 13055 }, { "epoch": 1.03, "learning_rate": 0.00022125562311025565, "loss": 1.5826, "step": 13056 }, { "epoch": 1.03, "learning_rate": 0.00022124474674383102, "loss": 1.5928, "step": 13057 }, { "epoch": 1.03, "learning_rate": 0.00022123386989369393, "loss": 1.5164, "step": 13058 }, { "epoch": 1.03, "learning_rate": 0.00022122299255991813, "loss": 1.5189, "step": 13059 }, { "epoch": 1.03, "learning_rate": 0.0002212121147425775, "loss": 1.4595, "step": 13060 }, { "epoch": 1.03, "learning_rate": 0.00022120123644174598, "loss": 1.5635, "step": 13061 }, { "epoch": 1.03, "learning_rate": 0.00022119035765749733, "loss": 1.6173, "step": 13062 }, { "epoch": 1.03, "learning_rate": 0.0002211794783899054, "loss": 1.5862, "step": 13063 }, { "epoch": 1.03, "learning_rate": 0.00022116859863904412, "loss": 1.5988, "step": 13064 }, { "epoch": 1.03, "learning_rate": 0.0002211577184049873, "loss": 1.5771, "step": 13065 }, { "epoch": 1.03, "learning_rate": 0.0002211468376878089, "loss": 1.5188, "step": 13066 }, { "epoch": 1.03, "learning_rate": 0.0002211359564875827, "loss": 1.5221, "step": 13067 }, { "epoch": 1.03, "learning_rate": 0.00022112507480438263, "loss": 1.5356, "step": 13068 }, { "epoch": 1.03, "learning_rate": 0.00022111419263828253, "loss": 1.6176, "step": 13069 }, { "epoch": 1.03, "learning_rate": 0.00022110330998935631, "loss": 1.5327, "step": 13070 }, { "epoch": 1.03, "learning_rate": 0.00022109242685767786, "loss": 1.6169, "step": 13071 }, { "epoch": 1.03, "learning_rate": 0.00022108154324332102, "loss": 1.5447, "step": 13072 }, { "epoch": 1.03, "learning_rate": 0.0002210706591463598, "loss": 1.5192, "step": 13073 }, { "epoch": 1.03, "learning_rate": 0.000221059774566868, "loss": 1.556, "step": 13074 }, { "epoch": 1.03, "learning_rate": 0.0002210488895049195, "loss": 1.5468, "step": 13075 }, { "epoch": 1.03, "learning_rate": 0.00022103800396058832, "loss": 1.5532, "step": 13076 }, { "epoch": 1.03, "learning_rate": 0.00022102711793394825, "loss": 1.5709, "step": 13077 }, { "epoch": 1.03, "learning_rate": 0.00022101623142507326, "loss": 1.5237, "step": 13078 }, { "epoch": 1.03, "learning_rate": 0.00022100534443403726, "loss": 1.5336, "step": 13079 }, { "epoch": 1.03, "learning_rate": 0.00022099445696091411, "loss": 1.6235, "step": 13080 }, { "epoch": 1.03, "learning_rate": 0.0002209835690057778, "loss": 1.6045, "step": 13081 }, { "epoch": 1.03, "learning_rate": 0.00022097268056870222, "loss": 1.6023, "step": 13082 }, { "epoch": 1.03, "learning_rate": 0.00022096179164976136, "loss": 1.5852, "step": 13083 }, { "epoch": 1.03, "learning_rate": 0.00022095090224902902, "loss": 1.5824, "step": 13084 }, { "epoch": 1.03, "learning_rate": 0.00022094001236657926, "loss": 1.6005, "step": 13085 }, { "epoch": 1.03, "learning_rate": 0.00022092912200248594, "loss": 1.5858, "step": 13086 }, { "epoch": 1.03, "learning_rate": 0.000220918231156823, "loss": 1.5629, "step": 13087 }, { "epoch": 1.03, "learning_rate": 0.0002209073398296644, "loss": 1.6149, "step": 13088 }, { "epoch": 1.03, "learning_rate": 0.00022089644802108417, "loss": 1.5474, "step": 13089 }, { "epoch": 1.03, "learning_rate": 0.00022088555573115612, "loss": 1.6006, "step": 13090 }, { "epoch": 1.03, "learning_rate": 0.0002208746629599543, "loss": 1.548, "step": 13091 }, { "epoch": 1.03, "learning_rate": 0.0002208637697075526, "loss": 1.5448, "step": 13092 }, { "epoch": 1.03, "learning_rate": 0.00022085287597402504, "loss": 1.6067, "step": 13093 }, { "epoch": 1.03, "learning_rate": 0.00022084198175944552, "loss": 1.5731, "step": 13094 }, { "epoch": 1.03, "learning_rate": 0.00022083108706388808, "loss": 1.5673, "step": 13095 }, { "epoch": 1.03, "learning_rate": 0.0002208201918874266, "loss": 1.5787, "step": 13096 }, { "epoch": 1.03, "learning_rate": 0.00022080929623013513, "loss": 1.5829, "step": 13097 }, { "epoch": 1.03, "learning_rate": 0.00022079840009208755, "loss": 1.5479, "step": 13098 }, { "epoch": 1.03, "learning_rate": 0.00022078750347335796, "loss": 1.5671, "step": 13099 }, { "epoch": 1.03, "learning_rate": 0.0002207766063740203, "loss": 1.5946, "step": 13100 }, { "epoch": 1.03, "learning_rate": 0.00022076570879414853, "loss": 1.5336, "step": 13101 }, { "epoch": 1.03, "learning_rate": 0.00022075481073381662, "loss": 1.5719, "step": 13102 }, { "epoch": 1.03, "learning_rate": 0.00022074391219309861, "loss": 1.6146, "step": 13103 }, { "epoch": 1.03, "learning_rate": 0.00022073301317206845, "loss": 1.5436, "step": 13104 }, { "epoch": 1.03, "learning_rate": 0.00022072211367080025, "loss": 1.5821, "step": 13105 }, { "epoch": 1.03, "learning_rate": 0.00022071121368936783, "loss": 1.5666, "step": 13106 }, { "epoch": 1.03, "learning_rate": 0.00022070031322784535, "loss": 1.5747, "step": 13107 }, { "epoch": 1.03, "learning_rate": 0.00022068941228630675, "loss": 1.6303, "step": 13108 }, { "epoch": 1.03, "learning_rate": 0.00022067851086482603, "loss": 1.5886, "step": 13109 }, { "epoch": 1.03, "learning_rate": 0.0002206676089634772, "loss": 1.5317, "step": 13110 }, { "epoch": 1.03, "learning_rate": 0.00022065670658233435, "loss": 1.5128, "step": 13111 }, { "epoch": 1.03, "learning_rate": 0.00022064580372147143, "loss": 1.5206, "step": 13112 }, { "epoch": 1.03, "learning_rate": 0.00022063490038096248, "loss": 1.5921, "step": 13113 }, { "epoch": 1.03, "learning_rate": 0.00022062399656088156, "loss": 1.6043, "step": 13114 }, { "epoch": 1.03, "learning_rate": 0.0002206130922613027, "loss": 1.5227, "step": 13115 }, { "epoch": 1.03, "learning_rate": 0.00022060218748229984, "loss": 1.5594, "step": 13116 }, { "epoch": 1.03, "learning_rate": 0.00022059128222394716, "loss": 1.5875, "step": 13117 }, { "epoch": 1.03, "learning_rate": 0.00022058037648631858, "loss": 1.5, "step": 13118 }, { "epoch": 1.03, "learning_rate": 0.00022056947026948822, "loss": 1.5429, "step": 13119 }, { "epoch": 1.03, "learning_rate": 0.00022055856357353006, "loss": 1.5512, "step": 13120 }, { "epoch": 1.03, "learning_rate": 0.00022054765639851822, "loss": 1.5143, "step": 13121 }, { "epoch": 1.03, "learning_rate": 0.00022053674874452677, "loss": 1.5462, "step": 13122 }, { "epoch": 1.03, "learning_rate": 0.00022052584061162966, "loss": 1.5916, "step": 13123 }, { "epoch": 1.03, "learning_rate": 0.00022051493199990103, "loss": 1.543, "step": 13124 }, { "epoch": 1.03, "learning_rate": 0.00022050402290941493, "loss": 1.6087, "step": 13125 }, { "epoch": 1.03, "learning_rate": 0.00022049311334024538, "loss": 1.5231, "step": 13126 }, { "epoch": 1.03, "learning_rate": 0.00022048220329246655, "loss": 1.6186, "step": 13127 }, { "epoch": 1.03, "learning_rate": 0.0002204712927661524, "loss": 1.5477, "step": 13128 }, { "epoch": 1.03, "learning_rate": 0.00022046038176137714, "loss": 1.6007, "step": 13129 }, { "epoch": 1.03, "learning_rate": 0.0002204494702782147, "loss": 1.5725, "step": 13130 }, { "epoch": 1.03, "learning_rate": 0.00022043855831673924, "loss": 1.6043, "step": 13131 }, { "epoch": 1.03, "learning_rate": 0.00022042764587702489, "loss": 1.5431, "step": 13132 }, { "epoch": 1.03, "learning_rate": 0.00022041673295914563, "loss": 1.5494, "step": 13133 }, { "epoch": 1.03, "learning_rate": 0.00022040581956317567, "loss": 1.5427, "step": 13134 }, { "epoch": 1.03, "learning_rate": 0.000220394905689189, "loss": 1.5869, "step": 13135 }, { "epoch": 1.03, "learning_rate": 0.00022038399133725978, "loss": 1.5472, "step": 13136 }, { "epoch": 1.03, "learning_rate": 0.00022037307650746212, "loss": 1.5744, "step": 13137 }, { "epoch": 1.03, "learning_rate": 0.0002203621611998701, "loss": 1.5365, "step": 13138 }, { "epoch": 1.03, "learning_rate": 0.00022035124541455785, "loss": 1.5206, "step": 13139 }, { "epoch": 1.03, "learning_rate": 0.00022034032915159942, "loss": 1.5656, "step": 13140 }, { "epoch": 1.03, "learning_rate": 0.000220329412411069, "loss": 1.5653, "step": 13141 }, { "epoch": 1.03, "learning_rate": 0.00022031849519304068, "loss": 1.5356, "step": 13142 }, { "epoch": 1.03, "learning_rate": 0.00022030757749758856, "loss": 1.5565, "step": 13143 }, { "epoch": 1.03, "learning_rate": 0.0002202966593247868, "loss": 1.6126, "step": 13144 }, { "epoch": 1.03, "learning_rate": 0.00022028574067470952, "loss": 1.5567, "step": 13145 }, { "epoch": 1.03, "learning_rate": 0.00022027482154743087, "loss": 1.5106, "step": 13146 }, { "epoch": 1.03, "learning_rate": 0.00022026390194302493, "loss": 1.5435, "step": 13147 }, { "epoch": 1.03, "learning_rate": 0.0002202529818615659, "loss": 1.5571, "step": 13148 }, { "epoch": 1.03, "learning_rate": 0.00022024206130312788, "loss": 1.5958, "step": 13149 }, { "epoch": 1.03, "learning_rate": 0.00022023114026778503, "loss": 1.5903, "step": 13150 }, { "epoch": 1.03, "learning_rate": 0.00022022021875561147, "loss": 1.5188, "step": 13151 }, { "epoch": 1.03, "learning_rate": 0.00022020929676668137, "loss": 1.5837, "step": 13152 }, { "epoch": 1.03, "learning_rate": 0.00022019837430106893, "loss": 1.5436, "step": 13153 }, { "epoch": 1.03, "learning_rate": 0.00022018745135884824, "loss": 1.6005, "step": 13154 }, { "epoch": 1.04, "learning_rate": 0.00022017652794009348, "loss": 1.5811, "step": 13155 }, { "epoch": 1.04, "learning_rate": 0.00022016560404487887, "loss": 1.5656, "step": 13156 }, { "epoch": 1.04, "learning_rate": 0.0002201546796732785, "loss": 1.5265, "step": 13157 }, { "epoch": 1.04, "learning_rate": 0.00022014375482536655, "loss": 1.5292, "step": 13158 }, { "epoch": 1.04, "learning_rate": 0.0002201328295012172, "loss": 1.5694, "step": 13159 }, { "epoch": 1.04, "learning_rate": 0.0002201219037009047, "loss": 1.555, "step": 13160 }, { "epoch": 1.04, "learning_rate": 0.00022011097742450316, "loss": 1.5903, "step": 13161 }, { "epoch": 1.04, "learning_rate": 0.0002201000506720867, "loss": 1.5731, "step": 13162 }, { "epoch": 1.04, "learning_rate": 0.00022008912344372968, "loss": 1.6098, "step": 13163 }, { "epoch": 1.04, "learning_rate": 0.00022007819573950614, "loss": 1.5223, "step": 13164 }, { "epoch": 1.04, "learning_rate": 0.00022006726755949033, "loss": 1.5604, "step": 13165 }, { "epoch": 1.04, "learning_rate": 0.00022005633890375645, "loss": 1.4896, "step": 13166 }, { "epoch": 1.04, "learning_rate": 0.00022004540977237867, "loss": 1.5852, "step": 13167 }, { "epoch": 1.04, "learning_rate": 0.0002200344801654312, "loss": 1.5973, "step": 13168 }, { "epoch": 1.04, "learning_rate": 0.00022002355008298826, "loss": 1.517, "step": 13169 }, { "epoch": 1.04, "learning_rate": 0.0002200126195251241, "loss": 1.5914, "step": 13170 }, { "epoch": 1.04, "learning_rate": 0.0002200016884919129, "loss": 1.5571, "step": 13171 }, { "epoch": 1.04, "learning_rate": 0.0002199907569834288, "loss": 1.6102, "step": 13172 }, { "epoch": 1.04, "learning_rate": 0.00021997982499974612, "loss": 1.5174, "step": 13173 }, { "epoch": 1.04, "learning_rate": 0.00021996889254093902, "loss": 1.5694, "step": 13174 }, { "epoch": 1.04, "learning_rate": 0.0002199579596070818, "loss": 1.5672, "step": 13175 }, { "epoch": 1.04, "learning_rate": 0.00021994702619824858, "loss": 1.6213, "step": 13176 }, { "epoch": 1.04, "learning_rate": 0.00021993609231451368, "loss": 1.5697, "step": 13177 }, { "epoch": 1.04, "learning_rate": 0.00021992515795595132, "loss": 1.5594, "step": 13178 }, { "epoch": 1.04, "learning_rate": 0.00021991422312263575, "loss": 1.6254, "step": 13179 }, { "epoch": 1.04, "learning_rate": 0.00021990328781464115, "loss": 1.6169, "step": 13180 }, { "epoch": 1.04, "learning_rate": 0.0002198923520320418, "loss": 1.5538, "step": 13181 }, { "epoch": 1.04, "learning_rate": 0.00021988141577491193, "loss": 1.558, "step": 13182 }, { "epoch": 1.04, "learning_rate": 0.0002198704790433258, "loss": 1.6071, "step": 13183 }, { "epoch": 1.04, "learning_rate": 0.00021985954183735773, "loss": 1.5684, "step": 13184 }, { "epoch": 1.04, "learning_rate": 0.00021984860415708192, "loss": 1.5828, "step": 13185 }, { "epoch": 1.04, "learning_rate": 0.00021983766600257263, "loss": 1.6016, "step": 13186 }, { "epoch": 1.04, "learning_rate": 0.0002198267273739041, "loss": 1.6679, "step": 13187 }, { "epoch": 1.04, "learning_rate": 0.00021981578827115063, "loss": 1.6116, "step": 13188 }, { "epoch": 1.04, "learning_rate": 0.00021980484869438648, "loss": 1.6306, "step": 13189 }, { "epoch": 1.04, "learning_rate": 0.00021979390864368593, "loss": 1.5847, "step": 13190 }, { "epoch": 1.04, "learning_rate": 0.00021978296811912327, "loss": 1.5809, "step": 13191 }, { "epoch": 1.04, "learning_rate": 0.0002197720271207728, "loss": 1.5469, "step": 13192 }, { "epoch": 1.04, "learning_rate": 0.00021976108564870873, "loss": 1.5419, "step": 13193 }, { "epoch": 1.04, "learning_rate": 0.0002197501437030054, "loss": 1.5784, "step": 13194 }, { "epoch": 1.04, "learning_rate": 0.00021973920128373706, "loss": 1.5654, "step": 13195 }, { "epoch": 1.04, "learning_rate": 0.00021972825839097803, "loss": 1.625, "step": 13196 }, { "epoch": 1.04, "learning_rate": 0.00021971731502480265, "loss": 1.5625, "step": 13197 }, { "epoch": 1.04, "learning_rate": 0.0002197063711852851, "loss": 1.5649, "step": 13198 }, { "epoch": 1.04, "learning_rate": 0.0002196954268724998, "loss": 1.5251, "step": 13199 }, { "epoch": 1.04, "learning_rate": 0.00021968448208652103, "loss": 1.6216, "step": 13200 }, { "epoch": 1.04, "learning_rate": 0.00021967353682742305, "loss": 1.5568, "step": 13201 }, { "epoch": 1.04, "learning_rate": 0.00021966259109528025, "loss": 1.5873, "step": 13202 }, { "epoch": 1.04, "learning_rate": 0.00021965164489016684, "loss": 1.5478, "step": 13203 }, { "epoch": 1.04, "learning_rate": 0.0002196406982121572, "loss": 1.567, "step": 13204 }, { "epoch": 1.04, "learning_rate": 0.0002196297510613257, "loss": 1.5459, "step": 13205 }, { "epoch": 1.04, "learning_rate": 0.00021961880343774657, "loss": 1.5921, "step": 13206 }, { "epoch": 1.04, "learning_rate": 0.00021960785534149422, "loss": 1.513, "step": 13207 }, { "epoch": 1.04, "learning_rate": 0.0002195969067726429, "loss": 1.5519, "step": 13208 }, { "epoch": 1.04, "learning_rate": 0.00021958595773126705, "loss": 1.5647, "step": 13209 }, { "epoch": 1.04, "learning_rate": 0.0002195750082174409, "loss": 1.586, "step": 13210 }, { "epoch": 1.04, "learning_rate": 0.00021956405823123884, "loss": 1.6158, "step": 13211 }, { "epoch": 1.04, "learning_rate": 0.00021955310777273528, "loss": 1.5901, "step": 13212 }, { "epoch": 1.04, "learning_rate": 0.00021954215684200442, "loss": 1.5541, "step": 13213 }, { "epoch": 1.04, "learning_rate": 0.0002195312054391207, "loss": 1.5339, "step": 13214 }, { "epoch": 1.04, "learning_rate": 0.00021952025356415848, "loss": 1.6325, "step": 13215 }, { "epoch": 1.04, "learning_rate": 0.00021950930121719211, "loss": 1.593, "step": 13216 }, { "epoch": 1.04, "learning_rate": 0.00021949834839829596, "loss": 1.5262, "step": 13217 }, { "epoch": 1.04, "learning_rate": 0.00021948739510754435, "loss": 1.5632, "step": 13218 }, { "epoch": 1.04, "learning_rate": 0.0002194764413450117, "loss": 1.5556, "step": 13219 }, { "epoch": 1.04, "learning_rate": 0.00021946548711077233, "loss": 1.6297, "step": 13220 }, { "epoch": 1.04, "learning_rate": 0.00021945453240490066, "loss": 1.5822, "step": 13221 }, { "epoch": 1.04, "learning_rate": 0.000219443577227471, "loss": 1.5225, "step": 13222 }, { "epoch": 1.04, "learning_rate": 0.00021943262157855776, "loss": 1.5889, "step": 13223 }, { "epoch": 1.04, "learning_rate": 0.00021942166545823542, "loss": 1.5825, "step": 13224 }, { "epoch": 1.04, "learning_rate": 0.00021941070886657824, "loss": 1.591, "step": 13225 }, { "epoch": 1.04, "learning_rate": 0.00021939975180366064, "loss": 1.572, "step": 13226 }, { "epoch": 1.04, "learning_rate": 0.00021938879426955705, "loss": 1.5793, "step": 13227 }, { "epoch": 1.04, "learning_rate": 0.00021937783626434178, "loss": 1.4996, "step": 13228 }, { "epoch": 1.04, "learning_rate": 0.0002193668777880893, "loss": 1.5794, "step": 13229 }, { "epoch": 1.04, "learning_rate": 0.00021935591884087404, "loss": 1.5321, "step": 13230 }, { "epoch": 1.04, "learning_rate": 0.0002193449594227704, "loss": 1.5565, "step": 13231 }, { "epoch": 1.04, "learning_rate": 0.00021933399953385268, "loss": 1.5516, "step": 13232 }, { "epoch": 1.04, "learning_rate": 0.00021932303917419538, "loss": 1.5769, "step": 13233 }, { "epoch": 1.04, "learning_rate": 0.0002193120783438729, "loss": 1.5985, "step": 13234 }, { "epoch": 1.04, "learning_rate": 0.00021930111704295967, "loss": 1.6331, "step": 13235 }, { "epoch": 1.04, "learning_rate": 0.0002192901552715301, "loss": 1.5775, "step": 13236 }, { "epoch": 1.04, "learning_rate": 0.0002192791930296586, "loss": 1.6029, "step": 13237 }, { "epoch": 1.04, "learning_rate": 0.00021926823031741962, "loss": 1.5746, "step": 13238 }, { "epoch": 1.04, "learning_rate": 0.00021925726713488758, "loss": 1.5051, "step": 13239 }, { "epoch": 1.04, "learning_rate": 0.00021924630348213692, "loss": 1.5342, "step": 13240 }, { "epoch": 1.04, "learning_rate": 0.0002192353393592421, "loss": 1.5725, "step": 13241 }, { "epoch": 1.04, "learning_rate": 0.00021922437476627746, "loss": 1.5601, "step": 13242 }, { "epoch": 1.04, "learning_rate": 0.00021921340970331755, "loss": 1.5324, "step": 13243 }, { "epoch": 1.04, "learning_rate": 0.0002192024441704368, "loss": 1.5432, "step": 13244 }, { "epoch": 1.04, "learning_rate": 0.0002191914781677096, "loss": 1.6287, "step": 13245 }, { "epoch": 1.04, "learning_rate": 0.00021918051169521048, "loss": 1.5272, "step": 13246 }, { "epoch": 1.04, "learning_rate": 0.00021916954475301387, "loss": 1.6059, "step": 13247 }, { "epoch": 1.04, "learning_rate": 0.00021915857734119425, "loss": 1.5795, "step": 13248 }, { "epoch": 1.04, "learning_rate": 0.00021914760945982603, "loss": 1.6461, "step": 13249 }, { "epoch": 1.04, "learning_rate": 0.00021913664110898367, "loss": 1.5372, "step": 13250 }, { "epoch": 1.04, "learning_rate": 0.0002191256722887417, "loss": 1.5909, "step": 13251 }, { "epoch": 1.04, "learning_rate": 0.00021911470299917454, "loss": 1.6018, "step": 13252 }, { "epoch": 1.04, "learning_rate": 0.00021910373324035668, "loss": 1.5998, "step": 13253 }, { "epoch": 1.04, "learning_rate": 0.00021909276301236262, "loss": 1.5836, "step": 13254 }, { "epoch": 1.04, "learning_rate": 0.00021908179231526687, "loss": 1.5514, "step": 13255 }, { "epoch": 1.04, "learning_rate": 0.00021907082114914383, "loss": 1.541, "step": 13256 }, { "epoch": 1.04, "learning_rate": 0.00021905984951406802, "loss": 1.5866, "step": 13257 }, { "epoch": 1.04, "learning_rate": 0.000219048877410114, "loss": 1.5844, "step": 13258 }, { "epoch": 1.04, "learning_rate": 0.00021903790483735613, "loss": 1.5698, "step": 13259 }, { "epoch": 1.04, "learning_rate": 0.00021902693179586902, "loss": 1.5387, "step": 13260 }, { "epoch": 1.04, "learning_rate": 0.00021901595828572711, "loss": 1.5642, "step": 13261 }, { "epoch": 1.04, "learning_rate": 0.00021900498430700493, "loss": 1.5829, "step": 13262 }, { "epoch": 1.04, "learning_rate": 0.00021899400985977705, "loss": 1.5685, "step": 13263 }, { "epoch": 1.04, "learning_rate": 0.00021898303494411787, "loss": 1.545, "step": 13264 }, { "epoch": 1.04, "learning_rate": 0.00021897205956010197, "loss": 1.5406, "step": 13265 }, { "epoch": 1.04, "learning_rate": 0.00021896108370780384, "loss": 1.5716, "step": 13266 }, { "epoch": 1.04, "learning_rate": 0.00021895010738729796, "loss": 1.6312, "step": 13267 }, { "epoch": 1.04, "learning_rate": 0.000218939130598659, "loss": 1.5768, "step": 13268 }, { "epoch": 1.04, "learning_rate": 0.0002189281533419613, "loss": 1.5928, "step": 13269 }, { "epoch": 1.04, "learning_rate": 0.0002189171756172795, "loss": 1.5745, "step": 13270 }, { "epoch": 1.04, "learning_rate": 0.00021890619742468814, "loss": 1.5196, "step": 13271 }, { "epoch": 1.04, "learning_rate": 0.00021889521876426165, "loss": 1.6021, "step": 13272 }, { "epoch": 1.04, "learning_rate": 0.00021888423963607474, "loss": 1.5822, "step": 13273 }, { "epoch": 1.04, "learning_rate": 0.0002188732600402018, "loss": 1.4956, "step": 13274 }, { "epoch": 1.04, "learning_rate": 0.0002188622799767175, "loss": 1.5373, "step": 13275 }, { "epoch": 1.04, "learning_rate": 0.00021885129944569623, "loss": 1.5832, "step": 13276 }, { "epoch": 1.04, "learning_rate": 0.00021884031844721265, "loss": 1.554, "step": 13277 }, { "epoch": 1.04, "learning_rate": 0.0002188293369813413, "loss": 1.5884, "step": 13278 }, { "epoch": 1.04, "learning_rate": 0.00021881835504815672, "loss": 1.5647, "step": 13279 }, { "epoch": 1.04, "learning_rate": 0.00021880737264773356, "loss": 1.5707, "step": 13280 }, { "epoch": 1.04, "learning_rate": 0.00021879638978014625, "loss": 1.5864, "step": 13281 }, { "epoch": 1.05, "learning_rate": 0.00021878540644546944, "loss": 1.6006, "step": 13282 }, { "epoch": 1.05, "learning_rate": 0.00021877442264377767, "loss": 1.5641, "step": 13283 }, { "epoch": 1.05, "learning_rate": 0.00021876343837514553, "loss": 1.5283, "step": 13284 }, { "epoch": 1.05, "learning_rate": 0.00021875245363964758, "loss": 1.5792, "step": 13285 }, { "epoch": 1.05, "learning_rate": 0.00021874146843735843, "loss": 1.556, "step": 13286 }, { "epoch": 1.05, "learning_rate": 0.00021873048276835263, "loss": 1.5541, "step": 13287 }, { "epoch": 1.05, "learning_rate": 0.00021871949663270477, "loss": 1.6204, "step": 13288 }, { "epoch": 1.05, "learning_rate": 0.00021870851003048943, "loss": 1.5504, "step": 13289 }, { "epoch": 1.05, "learning_rate": 0.0002186975229617813, "loss": 1.5363, "step": 13290 }, { "epoch": 1.05, "learning_rate": 0.00021868653542665484, "loss": 1.6054, "step": 13291 }, { "epoch": 1.05, "learning_rate": 0.00021867554742518473, "loss": 1.5454, "step": 13292 }, { "epoch": 1.05, "learning_rate": 0.0002186645589574455, "loss": 1.6188, "step": 13293 }, { "epoch": 1.05, "learning_rate": 0.0002186535700235119, "loss": 1.4926, "step": 13294 }, { "epoch": 1.05, "learning_rate": 0.00021864258062345837, "loss": 1.5286, "step": 13295 }, { "epoch": 1.05, "learning_rate": 0.00021863159075735962, "loss": 1.5761, "step": 13296 }, { "epoch": 1.05, "learning_rate": 0.00021862060042529026, "loss": 1.5768, "step": 13297 }, { "epoch": 1.05, "learning_rate": 0.0002186096096273249, "loss": 1.5876, "step": 13298 }, { "epoch": 1.05, "learning_rate": 0.0002185986183635381, "loss": 1.5256, "step": 13299 }, { "epoch": 1.05, "learning_rate": 0.00021858762663400455, "loss": 1.5221, "step": 13300 }, { "epoch": 1.05, "learning_rate": 0.0002185766344387989, "loss": 1.5777, "step": 13301 }, { "epoch": 1.05, "learning_rate": 0.00021856564177799573, "loss": 1.5656, "step": 13302 }, { "epoch": 1.05, "learning_rate": 0.00021855464865166968, "loss": 1.5568, "step": 13303 }, { "epoch": 1.05, "learning_rate": 0.00021854365505989543, "loss": 1.58, "step": 13304 }, { "epoch": 1.05, "learning_rate": 0.0002185326610027476, "loss": 1.5449, "step": 13305 }, { "epoch": 1.05, "learning_rate": 0.00021852166648030075, "loss": 1.5926, "step": 13306 }, { "epoch": 1.05, "learning_rate": 0.00021851067149262967, "loss": 1.5555, "step": 13307 }, { "epoch": 1.05, "learning_rate": 0.00021849967603980883, "loss": 1.5567, "step": 13308 }, { "epoch": 1.05, "learning_rate": 0.0002184886801219131, "loss": 1.5339, "step": 13309 }, { "epoch": 1.05, "learning_rate": 0.00021847768373901697, "loss": 1.5611, "step": 13310 }, { "epoch": 1.05, "learning_rate": 0.0002184666868911952, "loss": 1.5655, "step": 13311 }, { "epoch": 1.05, "learning_rate": 0.0002184556895785224, "loss": 1.5727, "step": 13312 }, { "epoch": 1.05, "learning_rate": 0.0002184446918010732, "loss": 1.5384, "step": 13313 }, { "epoch": 1.05, "learning_rate": 0.00021843369355892234, "loss": 1.5824, "step": 13314 }, { "epoch": 1.05, "learning_rate": 0.00021842269485214448, "loss": 1.5781, "step": 13315 }, { "epoch": 1.05, "learning_rate": 0.00021841169568081426, "loss": 1.5765, "step": 13316 }, { "epoch": 1.05, "learning_rate": 0.00021840069604500638, "loss": 1.5588, "step": 13317 }, { "epoch": 1.05, "learning_rate": 0.00021838969594479554, "loss": 1.5729, "step": 13318 }, { "epoch": 1.05, "learning_rate": 0.00021837869538025642, "loss": 1.544, "step": 13319 }, { "epoch": 1.05, "learning_rate": 0.0002183676943514636, "loss": 1.5441, "step": 13320 }, { "epoch": 1.05, "learning_rate": 0.000218356692858492, "loss": 1.5514, "step": 13321 }, { "epoch": 1.05, "learning_rate": 0.0002183456909014161, "loss": 1.5609, "step": 13322 }, { "epoch": 1.05, "learning_rate": 0.00021833468848031067, "loss": 1.6014, "step": 13323 }, { "epoch": 1.05, "learning_rate": 0.00021832368559525042, "loss": 1.5917, "step": 13324 }, { "epoch": 1.05, "learning_rate": 0.00021831268224631006, "loss": 1.6101, "step": 13325 }, { "epoch": 1.05, "learning_rate": 0.00021830167843356427, "loss": 1.565, "step": 13326 }, { "epoch": 1.05, "learning_rate": 0.00021829067415708782, "loss": 1.5762, "step": 13327 }, { "epoch": 1.05, "learning_rate": 0.00021827966941695531, "loss": 1.614, "step": 13328 }, { "epoch": 1.05, "learning_rate": 0.0002182686642132416, "loss": 1.5847, "step": 13329 }, { "epoch": 1.05, "learning_rate": 0.00021825765854602128, "loss": 1.5806, "step": 13330 }, { "epoch": 1.05, "learning_rate": 0.00021824665241536916, "loss": 1.572, "step": 13331 }, { "epoch": 1.05, "learning_rate": 0.00021823564582135988, "loss": 1.5846, "step": 13332 }, { "epoch": 1.05, "learning_rate": 0.00021822463876406827, "loss": 1.5611, "step": 13333 }, { "epoch": 1.05, "learning_rate": 0.000218213631243569, "loss": 1.5591, "step": 13334 }, { "epoch": 1.05, "learning_rate": 0.0002182026232599368, "loss": 1.5637, "step": 13335 }, { "epoch": 1.05, "learning_rate": 0.00021819161481324644, "loss": 1.5427, "step": 13336 }, { "epoch": 1.05, "learning_rate": 0.00021818060590357265, "loss": 1.5351, "step": 13337 }, { "epoch": 1.05, "learning_rate": 0.0002181695965309902, "loss": 1.5392, "step": 13338 }, { "epoch": 1.05, "learning_rate": 0.00021815858669557372, "loss": 1.5487, "step": 13339 }, { "epoch": 1.05, "learning_rate": 0.0002181475763973981, "loss": 1.5874, "step": 13340 }, { "epoch": 1.05, "learning_rate": 0.00021813656563653806, "loss": 1.5303, "step": 13341 }, { "epoch": 1.05, "learning_rate": 0.00021812555441306833, "loss": 1.5851, "step": 13342 }, { "epoch": 1.05, "learning_rate": 0.0002181145427270637, "loss": 1.5053, "step": 13343 }, { "epoch": 1.05, "learning_rate": 0.0002181035305785989, "loss": 1.553, "step": 13344 }, { "epoch": 1.05, "learning_rate": 0.0002180925179677487, "loss": 1.5625, "step": 13345 }, { "epoch": 1.05, "learning_rate": 0.00021808150489458788, "loss": 1.5712, "step": 13346 }, { "epoch": 1.05, "learning_rate": 0.00021807049135919119, "loss": 1.524, "step": 13347 }, { "epoch": 1.05, "learning_rate": 0.00021805947736163345, "loss": 1.6045, "step": 13348 }, { "epoch": 1.05, "learning_rate": 0.0002180484629019894, "loss": 1.5201, "step": 13349 }, { "epoch": 1.05, "learning_rate": 0.0002180374479803339, "loss": 1.5794, "step": 13350 }, { "epoch": 1.05, "learning_rate": 0.00021802643259674162, "loss": 1.5595, "step": 13351 }, { "epoch": 1.05, "learning_rate": 0.0002180154167512874, "loss": 1.5889, "step": 13352 }, { "epoch": 1.05, "learning_rate": 0.00021800440044404605, "loss": 1.5374, "step": 13353 }, { "epoch": 1.05, "learning_rate": 0.00021799338367509236, "loss": 1.564, "step": 13354 }, { "epoch": 1.05, "learning_rate": 0.0002179823664445011, "loss": 1.572, "step": 13355 }, { "epoch": 1.05, "learning_rate": 0.0002179713487523471, "loss": 1.5162, "step": 13356 }, { "epoch": 1.05, "learning_rate": 0.0002179603305987051, "loss": 1.5835, "step": 13357 }, { "epoch": 1.05, "learning_rate": 0.00021794931198365004, "loss": 1.5896, "step": 13358 }, { "epoch": 1.05, "learning_rate": 0.0002179382929072566, "loss": 1.5905, "step": 13359 }, { "epoch": 1.05, "learning_rate": 0.0002179272733695997, "loss": 1.5631, "step": 13360 }, { "epoch": 1.05, "learning_rate": 0.000217916253370754, "loss": 1.5282, "step": 13361 }, { "epoch": 1.05, "learning_rate": 0.00021790523291079447, "loss": 1.5595, "step": 13362 }, { "epoch": 1.05, "learning_rate": 0.00021789421198979591, "loss": 1.5691, "step": 13363 }, { "epoch": 1.05, "learning_rate": 0.00021788319060783308, "loss": 1.5781, "step": 13364 }, { "epoch": 1.05, "learning_rate": 0.00021787216876498086, "loss": 1.592, "step": 13365 }, { "epoch": 1.05, "learning_rate": 0.00021786114646131404, "loss": 1.6039, "step": 13366 }, { "epoch": 1.05, "learning_rate": 0.00021785012369690754, "loss": 1.566, "step": 13367 }, { "epoch": 1.05, "learning_rate": 0.00021783910047183612, "loss": 1.6002, "step": 13368 }, { "epoch": 1.05, "learning_rate": 0.00021782807678617466, "loss": 1.5302, "step": 13369 }, { "epoch": 1.05, "learning_rate": 0.00021781705263999797, "loss": 1.5444, "step": 13370 }, { "epoch": 1.05, "learning_rate": 0.0002178060280333809, "loss": 1.612, "step": 13371 }, { "epoch": 1.05, "learning_rate": 0.00021779500296639832, "loss": 1.5042, "step": 13372 }, { "epoch": 1.05, "learning_rate": 0.0002177839774391251, "loss": 1.5382, "step": 13373 }, { "epoch": 1.05, "learning_rate": 0.00021777295145163607, "loss": 1.5949, "step": 13374 }, { "epoch": 1.05, "learning_rate": 0.0002177619250040061, "loss": 1.6194, "step": 13375 }, { "epoch": 1.05, "learning_rate": 0.00021775089809631006, "loss": 1.5711, "step": 13376 }, { "epoch": 1.05, "learning_rate": 0.00021773987072862285, "loss": 1.5354, "step": 13377 }, { "epoch": 1.05, "learning_rate": 0.00021772884290101926, "loss": 1.5308, "step": 13378 }, { "epoch": 1.05, "learning_rate": 0.00021771781461357416, "loss": 1.5679, "step": 13379 }, { "epoch": 1.05, "learning_rate": 0.0002177067858663625, "loss": 1.5861, "step": 13380 }, { "epoch": 1.05, "learning_rate": 0.00021769575665945914, "loss": 1.5861, "step": 13381 }, { "epoch": 1.05, "learning_rate": 0.000217684726992939, "loss": 1.5523, "step": 13382 }, { "epoch": 1.05, "learning_rate": 0.0002176736968668768, "loss": 1.5399, "step": 13383 }, { "epoch": 1.05, "learning_rate": 0.00021766266628134764, "loss": 1.5932, "step": 13384 }, { "epoch": 1.05, "learning_rate": 0.00021765163523642628, "loss": 1.5614, "step": 13385 }, { "epoch": 1.05, "learning_rate": 0.00021764060373218768, "loss": 1.5585, "step": 13386 }, { "epoch": 1.05, "learning_rate": 0.00021762957176870663, "loss": 1.5957, "step": 13387 }, { "epoch": 1.05, "learning_rate": 0.00021761853934605817, "loss": 1.5572, "step": 13388 }, { "epoch": 1.05, "learning_rate": 0.00021760750646431716, "loss": 1.5519, "step": 13389 }, { "epoch": 1.05, "learning_rate": 0.00021759647312355845, "loss": 1.5961, "step": 13390 }, { "epoch": 1.05, "learning_rate": 0.00021758543932385698, "loss": 1.4874, "step": 13391 }, { "epoch": 1.05, "learning_rate": 0.00021757440506528774, "loss": 1.5365, "step": 13392 }, { "epoch": 1.05, "learning_rate": 0.00021756337034792552, "loss": 1.5491, "step": 13393 }, { "epoch": 1.05, "learning_rate": 0.00021755233517184528, "loss": 1.5697, "step": 13394 }, { "epoch": 1.05, "learning_rate": 0.00021754129953712202, "loss": 1.585, "step": 13395 }, { "epoch": 1.05, "learning_rate": 0.00021753026344383057, "loss": 1.5524, "step": 13396 }, { "epoch": 1.05, "learning_rate": 0.00021751922689204593, "loss": 1.6348, "step": 13397 }, { "epoch": 1.05, "learning_rate": 0.000217508189881843, "loss": 1.5511, "step": 13398 }, { "epoch": 1.05, "learning_rate": 0.0002174971524132967, "loss": 1.544, "step": 13399 }, { "epoch": 1.05, "learning_rate": 0.00021748611448648198, "loss": 1.5862, "step": 13400 }, { "epoch": 1.05, "learning_rate": 0.00021747507610147377, "loss": 1.5559, "step": 13401 }, { "epoch": 1.05, "learning_rate": 0.00021746403725834705, "loss": 1.5442, "step": 13402 }, { "epoch": 1.05, "learning_rate": 0.00021745299795717673, "loss": 1.5757, "step": 13403 }, { "epoch": 1.05, "learning_rate": 0.0002174419581980378, "loss": 1.5337, "step": 13404 }, { "epoch": 1.05, "learning_rate": 0.00021743091798100516, "loss": 1.562, "step": 13405 }, { "epoch": 1.05, "learning_rate": 0.00021741987730615386, "loss": 1.5961, "step": 13406 }, { "epoch": 1.05, "learning_rate": 0.00021740883617355874, "loss": 1.5624, "step": 13407 }, { "epoch": 1.05, "learning_rate": 0.00021739779458329484, "loss": 1.5305, "step": 13408 }, { "epoch": 1.06, "learning_rate": 0.00021738675253543712, "loss": 1.6133, "step": 13409 }, { "epoch": 1.06, "learning_rate": 0.00021737571003006047, "loss": 1.5707, "step": 13410 }, { "epoch": 1.06, "learning_rate": 0.00021736466706724002, "loss": 1.5798, "step": 13411 }, { "epoch": 1.06, "learning_rate": 0.0002173536236470506, "loss": 1.5143, "step": 13412 }, { "epoch": 1.06, "learning_rate": 0.00021734257976956727, "loss": 1.5801, "step": 13413 }, { "epoch": 1.06, "learning_rate": 0.000217331535434865, "loss": 1.5763, "step": 13414 }, { "epoch": 1.06, "learning_rate": 0.00021732049064301874, "loss": 1.547, "step": 13415 }, { "epoch": 1.06, "learning_rate": 0.00021730944539410352, "loss": 1.5452, "step": 13416 }, { "epoch": 1.06, "learning_rate": 0.0002172983996881943, "loss": 1.5773, "step": 13417 }, { "epoch": 1.06, "learning_rate": 0.00021728735352536605, "loss": 1.5881, "step": 13418 }, { "epoch": 1.06, "learning_rate": 0.0002172763069056938, "loss": 1.576, "step": 13419 }, { "epoch": 1.06, "learning_rate": 0.00021726525982925258, "loss": 1.555, "step": 13420 }, { "epoch": 1.06, "learning_rate": 0.00021725421229611738, "loss": 1.5712, "step": 13421 }, { "epoch": 1.06, "learning_rate": 0.00021724316430636316, "loss": 1.5317, "step": 13422 }, { "epoch": 1.06, "learning_rate": 0.00021723211586006501, "loss": 1.5569, "step": 13423 }, { "epoch": 1.06, "learning_rate": 0.00021722106695729786, "loss": 1.5439, "step": 13424 }, { "epoch": 1.06, "learning_rate": 0.00021721001759813675, "loss": 1.5908, "step": 13425 }, { "epoch": 1.06, "learning_rate": 0.0002171989677826567, "loss": 1.5467, "step": 13426 }, { "epoch": 1.06, "learning_rate": 0.0002171879175109328, "loss": 1.5516, "step": 13427 }, { "epoch": 1.06, "learning_rate": 0.00021717686678304, "loss": 1.5923, "step": 13428 }, { "epoch": 1.06, "learning_rate": 0.0002171658155990533, "loss": 1.5506, "step": 13429 }, { "epoch": 1.06, "learning_rate": 0.00021715476395904783, "loss": 1.5773, "step": 13430 }, { "epoch": 1.06, "learning_rate": 0.00021714371186309857, "loss": 1.5598, "step": 13431 }, { "epoch": 1.06, "learning_rate": 0.0002171326593112805, "loss": 1.5634, "step": 13432 }, { "epoch": 1.06, "learning_rate": 0.00021712160630366878, "loss": 1.4876, "step": 13433 }, { "epoch": 1.06, "learning_rate": 0.00021711055284033835, "loss": 1.5538, "step": 13434 }, { "epoch": 1.06, "learning_rate": 0.00021709949892136432, "loss": 1.5383, "step": 13435 }, { "epoch": 1.06, "learning_rate": 0.00021708844454682174, "loss": 1.5631, "step": 13436 }, { "epoch": 1.06, "learning_rate": 0.0002170773897167856, "loss": 1.6015, "step": 13437 }, { "epoch": 1.06, "learning_rate": 0.0002170663344313311, "loss": 1.5734, "step": 13438 }, { "epoch": 1.06, "learning_rate": 0.0002170552786905331, "loss": 1.5585, "step": 13439 }, { "epoch": 1.06, "learning_rate": 0.0002170442224944668, "loss": 1.5027, "step": 13440 }, { "epoch": 1.06, "learning_rate": 0.00021703316584320722, "loss": 1.5386, "step": 13441 }, { "epoch": 1.06, "learning_rate": 0.00021702210873682942, "loss": 1.588, "step": 13442 }, { "epoch": 1.06, "learning_rate": 0.0002170110511754085, "loss": 1.5593, "step": 13443 }, { "epoch": 1.06, "learning_rate": 0.00021699999315901952, "loss": 1.4894, "step": 13444 }, { "epoch": 1.06, "learning_rate": 0.0002169889346877376, "loss": 1.6082, "step": 13445 }, { "epoch": 1.06, "learning_rate": 0.00021697787576163772, "loss": 1.5714, "step": 13446 }, { "epoch": 1.06, "learning_rate": 0.00021696681638079505, "loss": 1.6282, "step": 13447 }, { "epoch": 1.06, "learning_rate": 0.00021695575654528466, "loss": 1.5871, "step": 13448 }, { "epoch": 1.06, "learning_rate": 0.0002169446962551816, "loss": 1.5966, "step": 13449 }, { "epoch": 1.06, "learning_rate": 0.00021693363551056102, "loss": 1.6374, "step": 13450 }, { "epoch": 1.06, "learning_rate": 0.00021692257431149797, "loss": 1.5588, "step": 13451 }, { "epoch": 1.06, "learning_rate": 0.0002169115126580676, "loss": 1.57, "step": 13452 }, { "epoch": 1.06, "learning_rate": 0.000216900450550345, "loss": 1.5624, "step": 13453 }, { "epoch": 1.06, "learning_rate": 0.00021688938798840524, "loss": 1.5738, "step": 13454 }, { "epoch": 1.06, "learning_rate": 0.00021687832497232346, "loss": 1.5316, "step": 13455 }, { "epoch": 1.06, "learning_rate": 0.00021686726150217474, "loss": 1.5383, "step": 13456 }, { "epoch": 1.06, "learning_rate": 0.00021685619757803423, "loss": 1.5823, "step": 13457 }, { "epoch": 1.06, "learning_rate": 0.000216845133199977, "loss": 1.5235, "step": 13458 }, { "epoch": 1.06, "learning_rate": 0.0002168340683680782, "loss": 1.5068, "step": 13459 }, { "epoch": 1.06, "learning_rate": 0.00021682300308241304, "loss": 1.5826, "step": 13460 }, { "epoch": 1.06, "learning_rate": 0.00021681193734305647, "loss": 1.5906, "step": 13461 }, { "epoch": 1.06, "learning_rate": 0.00021680087115008378, "loss": 1.4911, "step": 13462 }, { "epoch": 1.06, "learning_rate": 0.00021678980450357002, "loss": 1.4993, "step": 13463 }, { "epoch": 1.06, "learning_rate": 0.00021677873740359033, "loss": 1.5869, "step": 13464 }, { "epoch": 1.06, "learning_rate": 0.00021676766985021987, "loss": 1.5511, "step": 13465 }, { "epoch": 1.06, "learning_rate": 0.00021675660184353375, "loss": 1.5967, "step": 13466 }, { "epoch": 1.06, "learning_rate": 0.0002167455333836072, "loss": 1.5375, "step": 13467 }, { "epoch": 1.06, "learning_rate": 0.00021673446447051527, "loss": 1.5719, "step": 13468 }, { "epoch": 1.06, "learning_rate": 0.00021672339510433317, "loss": 1.6014, "step": 13469 }, { "epoch": 1.06, "learning_rate": 0.00021671232528513607, "loss": 1.5249, "step": 13470 }, { "epoch": 1.06, "learning_rate": 0.00021670125501299902, "loss": 1.5504, "step": 13471 }, { "epoch": 1.06, "learning_rate": 0.00021669018428799734, "loss": 1.5619, "step": 13472 }, { "epoch": 1.06, "learning_rate": 0.00021667911311020602, "loss": 1.5998, "step": 13473 }, { "epoch": 1.06, "learning_rate": 0.0002166680414797004, "loss": 1.582, "step": 13474 }, { "epoch": 1.06, "learning_rate": 0.00021665696939655553, "loss": 1.5754, "step": 13475 }, { "epoch": 1.06, "learning_rate": 0.0002166458968608466, "loss": 1.5622, "step": 13476 }, { "epoch": 1.06, "learning_rate": 0.0002166348238726489, "loss": 1.555, "step": 13477 }, { "epoch": 1.06, "learning_rate": 0.00021662375043203744, "loss": 1.6117, "step": 13478 }, { "epoch": 1.06, "learning_rate": 0.00021661267653908748, "loss": 1.558, "step": 13479 }, { "epoch": 1.06, "learning_rate": 0.00021660160219387424, "loss": 1.5635, "step": 13480 }, { "epoch": 1.06, "learning_rate": 0.00021659052739647283, "loss": 1.5426, "step": 13481 }, { "epoch": 1.06, "learning_rate": 0.00021657945214695852, "loss": 1.4794, "step": 13482 }, { "epoch": 1.06, "learning_rate": 0.00021656837644540647, "loss": 1.5531, "step": 13483 }, { "epoch": 1.06, "learning_rate": 0.00021655730029189192, "loss": 1.556, "step": 13484 }, { "epoch": 1.06, "learning_rate": 0.00021654622368648995, "loss": 1.544, "step": 13485 }, { "epoch": 1.06, "learning_rate": 0.00021653514662927587, "loss": 1.5406, "step": 13486 }, { "epoch": 1.06, "learning_rate": 0.00021652406912032492, "loss": 1.6195, "step": 13487 }, { "epoch": 1.06, "learning_rate": 0.00021651299115971217, "loss": 1.5094, "step": 13488 }, { "epoch": 1.06, "learning_rate": 0.00021650191274751295, "loss": 1.6377, "step": 13489 }, { "epoch": 1.06, "learning_rate": 0.00021649083388380243, "loss": 1.5773, "step": 13490 }, { "epoch": 1.06, "learning_rate": 0.00021647975456865588, "loss": 1.5862, "step": 13491 }, { "epoch": 1.06, "learning_rate": 0.00021646867480214845, "loss": 1.5992, "step": 13492 }, { "epoch": 1.06, "learning_rate": 0.0002164575945843554, "loss": 1.5655, "step": 13493 }, { "epoch": 1.06, "learning_rate": 0.00021644651391535197, "loss": 1.6099, "step": 13494 }, { "epoch": 1.06, "learning_rate": 0.00021643543279521336, "loss": 1.5384, "step": 13495 }, { "epoch": 1.06, "learning_rate": 0.00021642435122401482, "loss": 1.5684, "step": 13496 }, { "epoch": 1.06, "learning_rate": 0.00021641326920183158, "loss": 1.531, "step": 13497 }, { "epoch": 1.06, "learning_rate": 0.00021640218672873892, "loss": 1.5498, "step": 13498 }, { "epoch": 1.06, "learning_rate": 0.00021639110380481207, "loss": 1.5835, "step": 13499 }, { "epoch": 1.06, "learning_rate": 0.00021638002043012622, "loss": 1.5331, "step": 13500 }, { "epoch": 1.06, "learning_rate": 0.00021636893660475674, "loss": 1.5658, "step": 13501 }, { "epoch": 1.06, "learning_rate": 0.00021635785232877874, "loss": 1.5123, "step": 13502 }, { "epoch": 1.06, "learning_rate": 0.00021634676760226752, "loss": 1.5602, "step": 13503 }, { "epoch": 1.06, "learning_rate": 0.0002163356824252984, "loss": 1.589, "step": 13504 }, { "epoch": 1.06, "learning_rate": 0.0002163245967979466, "loss": 1.5982, "step": 13505 }, { "epoch": 1.06, "learning_rate": 0.0002163135107202874, "loss": 1.5877, "step": 13506 }, { "epoch": 1.06, "learning_rate": 0.00021630242419239603, "loss": 1.5279, "step": 13507 }, { "epoch": 1.06, "learning_rate": 0.0002162913372143478, "loss": 1.5544, "step": 13508 }, { "epoch": 1.06, "learning_rate": 0.00021628024978621798, "loss": 1.5629, "step": 13509 }, { "epoch": 1.06, "learning_rate": 0.00021626916190808186, "loss": 1.5647, "step": 13510 }, { "epoch": 1.06, "learning_rate": 0.00021625807358001468, "loss": 1.5456, "step": 13511 }, { "epoch": 1.06, "learning_rate": 0.0002162469848020917, "loss": 1.5871, "step": 13512 }, { "epoch": 1.06, "learning_rate": 0.00021623589557438834, "loss": 1.5973, "step": 13513 }, { "epoch": 1.06, "learning_rate": 0.00021622480589697973, "loss": 1.5785, "step": 13514 }, { "epoch": 1.06, "learning_rate": 0.00021621371576994124, "loss": 1.5033, "step": 13515 }, { "epoch": 1.06, "learning_rate": 0.00021620262519334818, "loss": 1.5628, "step": 13516 }, { "epoch": 1.06, "learning_rate": 0.00021619153416727583, "loss": 1.6004, "step": 13517 }, { "epoch": 1.06, "learning_rate": 0.0002161804426917995, "loss": 1.5369, "step": 13518 }, { "epoch": 1.06, "learning_rate": 0.00021616935076699447, "loss": 1.5904, "step": 13519 }, { "epoch": 1.06, "learning_rate": 0.00021615825839293605, "loss": 1.5283, "step": 13520 }, { "epoch": 1.06, "learning_rate": 0.00021614716556969958, "loss": 1.5917, "step": 13521 }, { "epoch": 1.06, "learning_rate": 0.00021613607229736036, "loss": 1.6127, "step": 13522 }, { "epoch": 1.06, "learning_rate": 0.00021612497857599372, "loss": 1.571, "step": 13523 }, { "epoch": 1.06, "learning_rate": 0.00021611388440567495, "loss": 1.5297, "step": 13524 }, { "epoch": 1.06, "learning_rate": 0.00021610278978647938, "loss": 1.5308, "step": 13525 }, { "epoch": 1.06, "learning_rate": 0.00021609169471848238, "loss": 1.5928, "step": 13526 }, { "epoch": 1.06, "learning_rate": 0.0002160805992017592, "loss": 1.5682, "step": 13527 }, { "epoch": 1.06, "learning_rate": 0.00021606950323638526, "loss": 1.5742, "step": 13528 }, { "epoch": 1.06, "learning_rate": 0.00021605840682243583, "loss": 1.5596, "step": 13529 }, { "epoch": 1.06, "learning_rate": 0.00021604730995998628, "loss": 1.5287, "step": 13530 }, { "epoch": 1.06, "learning_rate": 0.00021603621264911193, "loss": 1.5751, "step": 13531 }, { "epoch": 1.06, "learning_rate": 0.00021602511488988814, "loss": 1.5343, "step": 13532 }, { "epoch": 1.06, "learning_rate": 0.00021601401668239027, "loss": 1.5977, "step": 13533 }, { "epoch": 1.06, "learning_rate": 0.00021600291802669364, "loss": 1.6154, "step": 13534 }, { "epoch": 1.06, "learning_rate": 0.00021599181892287362, "loss": 1.555, "step": 13535 }, { "epoch": 1.07, "learning_rate": 0.00021598071937100558, "loss": 1.5636, "step": 13536 }, { "epoch": 1.07, "learning_rate": 0.00021596961937116486, "loss": 1.5717, "step": 13537 }, { "epoch": 1.07, "learning_rate": 0.00021595851892342686, "loss": 1.5739, "step": 13538 }, { "epoch": 1.07, "learning_rate": 0.00021594741802786685, "loss": 1.5599, "step": 13539 }, { "epoch": 1.07, "learning_rate": 0.00021593631668456032, "loss": 1.5987, "step": 13540 }, { "epoch": 1.07, "learning_rate": 0.0002159252148935826, "loss": 1.5399, "step": 13541 }, { "epoch": 1.07, "learning_rate": 0.00021591411265500899, "loss": 1.564, "step": 13542 }, { "epoch": 1.07, "learning_rate": 0.00021590300996891497, "loss": 1.5214, "step": 13543 }, { "epoch": 1.07, "learning_rate": 0.00021589190683537584, "loss": 1.5477, "step": 13544 }, { "epoch": 1.07, "learning_rate": 0.00021588080325446706, "loss": 1.5356, "step": 13545 }, { "epoch": 1.07, "learning_rate": 0.00021586969922626398, "loss": 1.5882, "step": 13546 }, { "epoch": 1.07, "learning_rate": 0.000215858594750842, "loss": 1.6175, "step": 13547 }, { "epoch": 1.07, "learning_rate": 0.0002158474898282765, "loss": 1.5434, "step": 13548 }, { "epoch": 1.07, "learning_rate": 0.00021583638445864286, "loss": 1.5902, "step": 13549 }, { "epoch": 1.07, "learning_rate": 0.00021582527864201653, "loss": 1.5542, "step": 13550 }, { "epoch": 1.07, "learning_rate": 0.00021581417237847284, "loss": 1.6015, "step": 13551 }, { "epoch": 1.07, "learning_rate": 0.0002158030656680873, "loss": 1.536, "step": 13552 }, { "epoch": 1.07, "learning_rate": 0.00021579195851093518, "loss": 1.5795, "step": 13553 }, { "epoch": 1.07, "learning_rate": 0.00021578085090709202, "loss": 1.6138, "step": 13554 }, { "epoch": 1.07, "learning_rate": 0.0002157697428566332, "loss": 1.663, "step": 13555 }, { "epoch": 1.07, "learning_rate": 0.00021575863435963408, "loss": 1.5657, "step": 13556 }, { "epoch": 1.07, "learning_rate": 0.00021574752541617015, "loss": 1.5395, "step": 13557 }, { "epoch": 1.07, "learning_rate": 0.0002157364160263168, "loss": 1.5864, "step": 13558 }, { "epoch": 1.07, "learning_rate": 0.00021572530619014946, "loss": 1.5683, "step": 13559 }, { "epoch": 1.07, "learning_rate": 0.00021571419590774352, "loss": 1.6056, "step": 13560 }, { "epoch": 1.07, "learning_rate": 0.0002157030851791745, "loss": 1.5661, "step": 13561 }, { "epoch": 1.07, "learning_rate": 0.00021569197400451778, "loss": 1.5532, "step": 13562 }, { "epoch": 1.07, "learning_rate": 0.00021568086238384882, "loss": 1.532, "step": 13563 }, { "epoch": 1.07, "learning_rate": 0.00021566975031724303, "loss": 1.5192, "step": 13564 }, { "epoch": 1.07, "learning_rate": 0.00021565863780477593, "loss": 1.5692, "step": 13565 }, { "epoch": 1.07, "learning_rate": 0.00021564752484652284, "loss": 1.5393, "step": 13566 }, { "epoch": 1.07, "learning_rate": 0.0002156364114425593, "loss": 1.5636, "step": 13567 }, { "epoch": 1.07, "learning_rate": 0.00021562529759296077, "loss": 1.5194, "step": 13568 }, { "epoch": 1.07, "learning_rate": 0.00021561418329780268, "loss": 1.5819, "step": 13569 }, { "epoch": 1.07, "learning_rate": 0.00021560306855716044, "loss": 1.5863, "step": 13570 }, { "epoch": 1.07, "learning_rate": 0.00021559195337110963, "loss": 1.5575, "step": 13571 }, { "epoch": 1.07, "learning_rate": 0.00021558083773972567, "loss": 1.5522, "step": 13572 }, { "epoch": 1.07, "learning_rate": 0.00021556972166308398, "loss": 1.5577, "step": 13573 }, { "epoch": 1.07, "learning_rate": 0.00021555860514126007, "loss": 1.5885, "step": 13574 }, { "epoch": 1.07, "learning_rate": 0.00021554748817432937, "loss": 1.5757, "step": 13575 }, { "epoch": 1.07, "learning_rate": 0.00021553637076236743, "loss": 1.5617, "step": 13576 }, { "epoch": 1.07, "learning_rate": 0.0002155252529054497, "loss": 1.5224, "step": 13577 }, { "epoch": 1.07, "learning_rate": 0.00021551413460365164, "loss": 1.5858, "step": 13578 }, { "epoch": 1.07, "learning_rate": 0.00021550301585704883, "loss": 1.5724, "step": 13579 }, { "epoch": 1.07, "learning_rate": 0.0002154918966657166, "loss": 1.5666, "step": 13580 }, { "epoch": 1.07, "learning_rate": 0.0002154807770297306, "loss": 1.6197, "step": 13581 }, { "epoch": 1.07, "learning_rate": 0.00021546965694916622, "loss": 1.5932, "step": 13582 }, { "epoch": 1.07, "learning_rate": 0.00021545853642409898, "loss": 1.5456, "step": 13583 }, { "epoch": 1.07, "learning_rate": 0.00021544741545460446, "loss": 1.6024, "step": 13584 }, { "epoch": 1.07, "learning_rate": 0.00021543629404075808, "loss": 1.5765, "step": 13585 }, { "epoch": 1.07, "learning_rate": 0.00021542517218263538, "loss": 1.5975, "step": 13586 }, { "epoch": 1.07, "learning_rate": 0.00021541404988031186, "loss": 1.5559, "step": 13587 }, { "epoch": 1.07, "learning_rate": 0.00021540292713386305, "loss": 1.5685, "step": 13588 }, { "epoch": 1.07, "learning_rate": 0.00021539180394336446, "loss": 1.5679, "step": 13589 }, { "epoch": 1.07, "learning_rate": 0.00021538068030889157, "loss": 1.5979, "step": 13590 }, { "epoch": 1.07, "learning_rate": 0.00021536955623051995, "loss": 1.5585, "step": 13591 }, { "epoch": 1.07, "learning_rate": 0.00021535843170832511, "loss": 1.591, "step": 13592 }, { "epoch": 1.07, "learning_rate": 0.0002153473067423826, "loss": 1.5245, "step": 13593 }, { "epoch": 1.07, "learning_rate": 0.00021533618133276795, "loss": 1.6036, "step": 13594 }, { "epoch": 1.07, "learning_rate": 0.0002153250554795567, "loss": 1.5567, "step": 13595 }, { "epoch": 1.07, "learning_rate": 0.00021531392918282434, "loss": 1.5703, "step": 13596 }, { "epoch": 1.07, "learning_rate": 0.00021530280244264646, "loss": 1.5635, "step": 13597 }, { "epoch": 1.07, "learning_rate": 0.0002152916752590986, "loss": 1.5332, "step": 13598 }, { "epoch": 1.07, "learning_rate": 0.00021528054763225626, "loss": 1.5939, "step": 13599 }, { "epoch": 1.07, "learning_rate": 0.00021526941956219505, "loss": 1.5698, "step": 13600 }, { "epoch": 1.07, "learning_rate": 0.0002152582910489905, "loss": 1.56, "step": 13601 }, { "epoch": 1.07, "learning_rate": 0.00021524716209271816, "loss": 1.5505, "step": 13602 }, { "epoch": 1.07, "learning_rate": 0.00021523603269345365, "loss": 1.5326, "step": 13603 }, { "epoch": 1.07, "learning_rate": 0.0002152249028512724, "loss": 1.5725, "step": 13604 }, { "epoch": 1.07, "learning_rate": 0.00021521377256625006, "loss": 1.5391, "step": 13605 }, { "epoch": 1.07, "learning_rate": 0.00021520264183846227, "loss": 1.5635, "step": 13606 }, { "epoch": 1.07, "learning_rate": 0.0002151915106679844, "loss": 1.5572, "step": 13607 }, { "epoch": 1.07, "learning_rate": 0.00021518037905489225, "loss": 1.5579, "step": 13608 }, { "epoch": 1.07, "learning_rate": 0.00021516924699926124, "loss": 1.5992, "step": 13609 }, { "epoch": 1.07, "learning_rate": 0.000215158114501167, "loss": 1.5697, "step": 13610 }, { "epoch": 1.07, "learning_rate": 0.00021514698156068518, "loss": 1.5652, "step": 13611 }, { "epoch": 1.07, "learning_rate": 0.00021513584817789126, "loss": 1.5474, "step": 13612 }, { "epoch": 1.07, "learning_rate": 0.0002151247143528609, "loss": 1.5957, "step": 13613 }, { "epoch": 1.07, "learning_rate": 0.00021511358008566962, "loss": 1.6077, "step": 13614 }, { "epoch": 1.07, "learning_rate": 0.00021510244537639313, "loss": 1.5703, "step": 13615 }, { "epoch": 1.07, "learning_rate": 0.0002150913102251069, "loss": 1.5638, "step": 13616 }, { "epoch": 1.07, "learning_rate": 0.00021508017463188662, "loss": 1.5838, "step": 13617 }, { "epoch": 1.07, "learning_rate": 0.00021506903859680793, "loss": 1.5684, "step": 13618 }, { "epoch": 1.07, "learning_rate": 0.00021505790211994631, "loss": 1.5954, "step": 13619 }, { "epoch": 1.07, "learning_rate": 0.00021504676520137746, "loss": 1.4958, "step": 13620 }, { "epoch": 1.07, "learning_rate": 0.00021503562784117697, "loss": 1.6329, "step": 13621 }, { "epoch": 1.07, "learning_rate": 0.00021502449003942039, "loss": 1.5669, "step": 13622 }, { "epoch": 1.07, "learning_rate": 0.00021501335179618348, "loss": 1.55, "step": 13623 }, { "epoch": 1.07, "learning_rate": 0.00021500221311154179, "loss": 1.5926, "step": 13624 }, { "epoch": 1.07, "learning_rate": 0.00021499107398557094, "loss": 1.5325, "step": 13625 }, { "epoch": 1.07, "learning_rate": 0.0002149799344183465, "loss": 1.6094, "step": 13626 }, { "epoch": 1.07, "learning_rate": 0.00021496879440994425, "loss": 1.5272, "step": 13627 }, { "epoch": 1.07, "learning_rate": 0.00021495765396043967, "loss": 1.617, "step": 13628 }, { "epoch": 1.07, "learning_rate": 0.00021494651306990848, "loss": 1.5665, "step": 13629 }, { "epoch": 1.07, "learning_rate": 0.00021493537173842634, "loss": 1.5169, "step": 13630 }, { "epoch": 1.07, "learning_rate": 0.00021492422996606883, "loss": 1.5593, "step": 13631 }, { "epoch": 1.07, "learning_rate": 0.00021491308775291166, "loss": 1.5681, "step": 13632 }, { "epoch": 1.07, "learning_rate": 0.0002149019450990304, "loss": 1.6085, "step": 13633 }, { "epoch": 1.07, "learning_rate": 0.00021489080200450079, "loss": 1.5672, "step": 13634 }, { "epoch": 1.07, "learning_rate": 0.00021487965846939843, "loss": 1.6229, "step": 13635 }, { "epoch": 1.07, "learning_rate": 0.000214868514493799, "loss": 1.6037, "step": 13636 }, { "epoch": 1.07, "learning_rate": 0.00021485737007777815, "loss": 1.6078, "step": 13637 }, { "epoch": 1.07, "learning_rate": 0.00021484622522141152, "loss": 1.5564, "step": 13638 }, { "epoch": 1.07, "learning_rate": 0.0002148350799247748, "loss": 1.5393, "step": 13639 }, { "epoch": 1.07, "learning_rate": 0.00021482393418794372, "loss": 1.5516, "step": 13640 }, { "epoch": 1.07, "learning_rate": 0.00021481278801099388, "loss": 1.5633, "step": 13641 }, { "epoch": 1.07, "learning_rate": 0.00021480164139400099, "loss": 1.5463, "step": 13642 }, { "epoch": 1.07, "learning_rate": 0.00021479049433704067, "loss": 1.5657, "step": 13643 }, { "epoch": 1.07, "learning_rate": 0.00021477934684018866, "loss": 1.544, "step": 13644 }, { "epoch": 1.07, "learning_rate": 0.0002147681989035207, "loss": 1.5763, "step": 13645 }, { "epoch": 1.07, "learning_rate": 0.00021475705052711232, "loss": 1.5053, "step": 13646 }, { "epoch": 1.07, "learning_rate": 0.00021474590171103935, "loss": 1.5659, "step": 13647 }, { "epoch": 1.07, "learning_rate": 0.00021473475245537742, "loss": 1.5452, "step": 13648 }, { "epoch": 1.07, "learning_rate": 0.00021472360276020226, "loss": 1.6075, "step": 13649 }, { "epoch": 1.07, "learning_rate": 0.00021471245262558953, "loss": 1.5396, "step": 13650 }, { "epoch": 1.07, "learning_rate": 0.00021470130205161498, "loss": 1.5804, "step": 13651 }, { "epoch": 1.07, "learning_rate": 0.00021469015103835434, "loss": 1.5491, "step": 13652 }, { "epoch": 1.07, "learning_rate": 0.00021467899958588322, "loss": 1.6211, "step": 13653 }, { "epoch": 1.07, "learning_rate": 0.00021466784769427733, "loss": 1.5605, "step": 13654 }, { "epoch": 1.07, "learning_rate": 0.00021465669536361253, "loss": 1.6249, "step": 13655 }, { "epoch": 1.07, "learning_rate": 0.00021464554259396438, "loss": 1.5329, "step": 13656 }, { "epoch": 1.07, "learning_rate": 0.00021463438938540874, "loss": 1.6086, "step": 13657 }, { "epoch": 1.07, "learning_rate": 0.00021462323573802125, "loss": 1.5538, "step": 13658 }, { "epoch": 1.07, "learning_rate": 0.00021461208165187763, "loss": 1.5266, "step": 13659 }, { "epoch": 1.07, "learning_rate": 0.00021460092712705366, "loss": 1.5925, "step": 13660 }, { "epoch": 1.07, "learning_rate": 0.000214589772163625, "loss": 1.6184, "step": 13661 }, { "epoch": 1.07, "learning_rate": 0.00021457861676166742, "loss": 1.5373, "step": 13662 }, { "epoch": 1.08, "learning_rate": 0.0002145674609212567, "loss": 1.5784, "step": 13663 }, { "epoch": 1.08, "learning_rate": 0.00021455630464246856, "loss": 1.588, "step": 13664 }, { "epoch": 1.08, "learning_rate": 0.00021454514792537875, "loss": 1.5689, "step": 13665 }, { "epoch": 1.08, "learning_rate": 0.00021453399077006296, "loss": 1.5336, "step": 13666 }, { "epoch": 1.08, "learning_rate": 0.00021452283317659703, "loss": 1.5689, "step": 13667 }, { "epoch": 1.08, "learning_rate": 0.00021451167514505663, "loss": 1.5837, "step": 13668 }, { "epoch": 1.08, "learning_rate": 0.00021450051667551757, "loss": 1.5869, "step": 13669 }, { "epoch": 1.08, "learning_rate": 0.00021448935776805558, "loss": 1.5962, "step": 13670 }, { "epoch": 1.08, "learning_rate": 0.00021447819842274648, "loss": 1.6095, "step": 13671 }, { "epoch": 1.08, "learning_rate": 0.000214467038639666, "loss": 1.5895, "step": 13672 }, { "epoch": 1.08, "learning_rate": 0.00021445587841888988, "loss": 1.5934, "step": 13673 }, { "epoch": 1.08, "learning_rate": 0.0002144447177604939, "loss": 1.564, "step": 13674 }, { "epoch": 1.08, "learning_rate": 0.00021443355666455387, "loss": 1.5369, "step": 13675 }, { "epoch": 1.08, "learning_rate": 0.00021442239513114552, "loss": 1.5239, "step": 13676 }, { "epoch": 1.08, "learning_rate": 0.00021441123316034467, "loss": 1.5475, "step": 13677 }, { "epoch": 1.08, "learning_rate": 0.00021440007075222708, "loss": 1.5008, "step": 13678 }, { "epoch": 1.08, "learning_rate": 0.00021438890790686862, "loss": 1.5663, "step": 13679 }, { "epoch": 1.08, "learning_rate": 0.00021437774462434496, "loss": 1.5748, "step": 13680 }, { "epoch": 1.08, "learning_rate": 0.00021436658090473194, "loss": 1.5864, "step": 13681 }, { "epoch": 1.08, "learning_rate": 0.00021435541674810535, "loss": 1.5801, "step": 13682 }, { "epoch": 1.08, "learning_rate": 0.00021434425215454097, "loss": 1.5184, "step": 13683 }, { "epoch": 1.08, "learning_rate": 0.0002143330871241147, "loss": 1.5668, "step": 13684 }, { "epoch": 1.08, "learning_rate": 0.00021432192165690217, "loss": 1.5414, "step": 13685 }, { "epoch": 1.08, "learning_rate": 0.00021431075575297935, "loss": 1.5696, "step": 13686 }, { "epoch": 1.08, "learning_rate": 0.000214299589412422, "loss": 1.6006, "step": 13687 }, { "epoch": 1.08, "learning_rate": 0.0002142884226353059, "loss": 1.5411, "step": 13688 }, { "epoch": 1.08, "learning_rate": 0.0002142772554217069, "loss": 1.569, "step": 13689 }, { "epoch": 1.08, "learning_rate": 0.00021426608777170078, "loss": 1.576, "step": 13690 }, { "epoch": 1.08, "learning_rate": 0.00021425491968536341, "loss": 1.558, "step": 13691 }, { "epoch": 1.08, "learning_rate": 0.0002142437511627706, "loss": 1.54, "step": 13692 }, { "epoch": 1.08, "learning_rate": 0.00021423258220399816, "loss": 1.5963, "step": 13693 }, { "epoch": 1.08, "learning_rate": 0.00021422141280912194, "loss": 1.6287, "step": 13694 }, { "epoch": 1.08, "learning_rate": 0.00021421024297821773, "loss": 1.5534, "step": 13695 }, { "epoch": 1.08, "learning_rate": 0.00021419907271136147, "loss": 1.5886, "step": 13696 }, { "epoch": 1.08, "learning_rate": 0.00021418790200862888, "loss": 1.5539, "step": 13697 }, { "epoch": 1.08, "learning_rate": 0.0002141767308700959, "loss": 1.5612, "step": 13698 }, { "epoch": 1.08, "learning_rate": 0.00021416555929583831, "loss": 1.5863, "step": 13699 }, { "epoch": 1.08, "learning_rate": 0.00021415438728593196, "loss": 1.6106, "step": 13700 }, { "epoch": 1.08, "learning_rate": 0.00021414321484045275, "loss": 1.5618, "step": 13701 }, { "epoch": 1.08, "learning_rate": 0.0002141320419594765, "loss": 1.5289, "step": 13702 }, { "epoch": 1.08, "learning_rate": 0.00021412086864307911, "loss": 1.513, "step": 13703 }, { "epoch": 1.08, "learning_rate": 0.00021410969489133635, "loss": 1.5279, "step": 13704 }, { "epoch": 1.08, "learning_rate": 0.00021409852070432416, "loss": 1.5774, "step": 13705 }, { "epoch": 1.08, "learning_rate": 0.00021408734608211843, "loss": 1.5874, "step": 13706 }, { "epoch": 1.08, "learning_rate": 0.00021407617102479494, "loss": 1.6025, "step": 13707 }, { "epoch": 1.08, "learning_rate": 0.00021406499553242963, "loss": 1.5554, "step": 13708 }, { "epoch": 1.08, "learning_rate": 0.00021405381960509833, "loss": 1.5917, "step": 13709 }, { "epoch": 1.08, "learning_rate": 0.00021404264324287697, "loss": 1.5381, "step": 13710 }, { "epoch": 1.08, "learning_rate": 0.0002140314664458414, "loss": 1.5163, "step": 13711 }, { "epoch": 1.08, "learning_rate": 0.00021402028921406745, "loss": 1.5724, "step": 13712 }, { "epoch": 1.08, "learning_rate": 0.00021400911154763116, "loss": 1.5897, "step": 13713 }, { "epoch": 1.08, "learning_rate": 0.00021399793344660826, "loss": 1.5977, "step": 13714 }, { "epoch": 1.08, "learning_rate": 0.00021398675491107475, "loss": 1.5494, "step": 13715 }, { "epoch": 1.08, "learning_rate": 0.00021397557594110648, "loss": 1.5493, "step": 13716 }, { "epoch": 1.08, "learning_rate": 0.00021396439653677927, "loss": 1.5714, "step": 13717 }, { "epoch": 1.08, "learning_rate": 0.00021395321669816922, "loss": 1.5732, "step": 13718 }, { "epoch": 1.08, "learning_rate": 0.00021394203642535205, "loss": 1.5318, "step": 13719 }, { "epoch": 1.08, "learning_rate": 0.0002139308557184038, "loss": 1.629, "step": 13720 }, { "epoch": 1.08, "learning_rate": 0.00021391967457740026, "loss": 1.5534, "step": 13721 }, { "epoch": 1.08, "learning_rate": 0.0002139084930024174, "loss": 1.5681, "step": 13722 }, { "epoch": 1.08, "learning_rate": 0.00021389731099353122, "loss": 1.5454, "step": 13723 }, { "epoch": 1.08, "learning_rate": 0.00021388612855081747, "loss": 1.5267, "step": 13724 }, { "epoch": 1.08, "learning_rate": 0.00021387494567435221, "loss": 1.616, "step": 13725 }, { "epoch": 1.08, "learning_rate": 0.00021386376236421132, "loss": 1.5868, "step": 13726 }, { "epoch": 1.08, "learning_rate": 0.00021385257862047074, "loss": 1.573, "step": 13727 }, { "epoch": 1.08, "learning_rate": 0.0002138413944432063, "loss": 1.5653, "step": 13728 }, { "epoch": 1.08, "learning_rate": 0.00021383020983249413, "loss": 1.5359, "step": 13729 }, { "epoch": 1.08, "learning_rate": 0.00021381902478841, "loss": 1.5714, "step": 13730 }, { "epoch": 1.08, "learning_rate": 0.00021380783931102993, "loss": 1.6057, "step": 13731 }, { "epoch": 1.08, "learning_rate": 0.00021379665340042983, "loss": 1.56, "step": 13732 }, { "epoch": 1.08, "learning_rate": 0.00021378546705668564, "loss": 1.621, "step": 13733 }, { "epoch": 1.08, "learning_rate": 0.00021377428027987336, "loss": 1.5337, "step": 13734 }, { "epoch": 1.08, "learning_rate": 0.00021376309307006894, "loss": 1.5875, "step": 13735 }, { "epoch": 1.08, "learning_rate": 0.00021375190542734826, "loss": 1.5301, "step": 13736 }, { "epoch": 1.08, "learning_rate": 0.00021374071735178737, "loss": 1.6265, "step": 13737 }, { "epoch": 1.08, "learning_rate": 0.00021372952884346212, "loss": 1.5243, "step": 13738 }, { "epoch": 1.08, "learning_rate": 0.00021371833990244856, "loss": 1.5229, "step": 13739 }, { "epoch": 1.08, "learning_rate": 0.0002137071505288226, "loss": 1.5682, "step": 13740 }, { "epoch": 1.08, "learning_rate": 0.00021369596072266033, "loss": 1.5871, "step": 13741 }, { "epoch": 1.08, "learning_rate": 0.00021368477048403758, "loss": 1.5526, "step": 13742 }, { "epoch": 1.08, "learning_rate": 0.0002136735798130304, "loss": 1.5245, "step": 13743 }, { "epoch": 1.08, "learning_rate": 0.00021366238870971477, "loss": 1.5797, "step": 13744 }, { "epoch": 1.08, "learning_rate": 0.00021365119717416662, "loss": 1.541, "step": 13745 }, { "epoch": 1.08, "learning_rate": 0.00021364000520646196, "loss": 1.5175, "step": 13746 }, { "epoch": 1.08, "learning_rate": 0.00021362881280667683, "loss": 1.5445, "step": 13747 }, { "epoch": 1.08, "learning_rate": 0.00021361761997488711, "loss": 1.6199, "step": 13748 }, { "epoch": 1.08, "learning_rate": 0.00021360642671116892, "loss": 1.6328, "step": 13749 }, { "epoch": 1.08, "learning_rate": 0.00021359523301559815, "loss": 1.5415, "step": 13750 }, { "epoch": 1.08, "learning_rate": 0.00021358403888825086, "loss": 1.567, "step": 13751 }, { "epoch": 1.08, "learning_rate": 0.00021357284432920305, "loss": 1.58, "step": 13752 }, { "epoch": 1.08, "learning_rate": 0.00021356164933853067, "loss": 1.4754, "step": 13753 }, { "epoch": 1.08, "learning_rate": 0.00021355045391630983, "loss": 1.5454, "step": 13754 }, { "epoch": 1.08, "learning_rate": 0.00021353925806261642, "loss": 1.5632, "step": 13755 }, { "epoch": 1.08, "learning_rate": 0.00021352806177752653, "loss": 1.5678, "step": 13756 }, { "epoch": 1.08, "learning_rate": 0.00021351686506111613, "loss": 1.5549, "step": 13757 }, { "epoch": 1.08, "learning_rate": 0.00021350566791346128, "loss": 1.5182, "step": 13758 }, { "epoch": 1.08, "learning_rate": 0.00021349447033463804, "loss": 1.5279, "step": 13759 }, { "epoch": 1.08, "learning_rate": 0.00021348327232472233, "loss": 1.5534, "step": 13760 }, { "epoch": 1.08, "learning_rate": 0.00021347207388379026, "loss": 1.5814, "step": 13761 }, { "epoch": 1.08, "learning_rate": 0.00021346087501191785, "loss": 1.5881, "step": 13762 }, { "epoch": 1.08, "learning_rate": 0.0002134496757091811, "loss": 1.6034, "step": 13763 }, { "epoch": 1.08, "learning_rate": 0.00021343847597565604, "loss": 1.5585, "step": 13764 }, { "epoch": 1.08, "learning_rate": 0.00021342727581141874, "loss": 1.5602, "step": 13765 }, { "epoch": 1.08, "learning_rate": 0.00021341607521654528, "loss": 1.5517, "step": 13766 }, { "epoch": 1.08, "learning_rate": 0.00021340487419111166, "loss": 1.5326, "step": 13767 }, { "epoch": 1.08, "learning_rate": 0.0002133936727351939, "loss": 1.6128, "step": 13768 }, { "epoch": 1.08, "learning_rate": 0.0002133824708488681, "loss": 1.5648, "step": 13769 }, { "epoch": 1.08, "learning_rate": 0.00021337126853221034, "loss": 1.5633, "step": 13770 }, { "epoch": 1.08, "learning_rate": 0.00021336006578529662, "loss": 1.5098, "step": 13771 }, { "epoch": 1.08, "learning_rate": 0.00021334886260820294, "loss": 1.5765, "step": 13772 }, { "epoch": 1.08, "learning_rate": 0.0002133376590010055, "loss": 1.5852, "step": 13773 }, { "epoch": 1.08, "learning_rate": 0.00021332645496378034, "loss": 1.534, "step": 13774 }, { "epoch": 1.08, "learning_rate": 0.00021331525049660347, "loss": 1.562, "step": 13775 }, { "epoch": 1.08, "learning_rate": 0.000213304045599551, "loss": 1.5563, "step": 13776 }, { "epoch": 1.08, "learning_rate": 0.00021329284027269899, "loss": 1.5877, "step": 13777 }, { "epoch": 1.08, "learning_rate": 0.0002132816345161235, "loss": 1.5688, "step": 13778 }, { "epoch": 1.08, "learning_rate": 0.00021327042832990062, "loss": 1.5748, "step": 13779 }, { "epoch": 1.08, "learning_rate": 0.00021325922171410648, "loss": 1.558, "step": 13780 }, { "epoch": 1.08, "learning_rate": 0.00021324801466881716, "loss": 1.5238, "step": 13781 }, { "epoch": 1.08, "learning_rate": 0.00021323680719410868, "loss": 1.5598, "step": 13782 }, { "epoch": 1.08, "learning_rate": 0.0002132255992900572, "loss": 1.5432, "step": 13783 }, { "epoch": 1.08, "learning_rate": 0.00021321439095673875, "loss": 1.5414, "step": 13784 }, { "epoch": 1.08, "learning_rate": 0.0002132031821942295, "loss": 1.5405, "step": 13785 }, { "epoch": 1.08, "learning_rate": 0.00021319197300260554, "loss": 1.5485, "step": 13786 }, { "epoch": 1.08, "learning_rate": 0.0002131807633819429, "loss": 1.5231, "step": 13787 }, { "epoch": 1.08, "learning_rate": 0.00021316955333231782, "loss": 1.5259, "step": 13788 }, { "epoch": 1.08, "learning_rate": 0.0002131583428538063, "loss": 1.5796, "step": 13789 }, { "epoch": 1.09, "learning_rate": 0.00021314713194648443, "loss": 1.5942, "step": 13790 }, { "epoch": 1.09, "learning_rate": 0.00021313592061042848, "loss": 1.5776, "step": 13791 }, { "epoch": 1.09, "learning_rate": 0.0002131247088457144, "loss": 1.5367, "step": 13792 }, { "epoch": 1.09, "learning_rate": 0.00021311349665241843, "loss": 1.5359, "step": 13793 }, { "epoch": 1.09, "learning_rate": 0.0002131022840306166, "loss": 1.6022, "step": 13794 }, { "epoch": 1.09, "learning_rate": 0.0002130910709803851, "loss": 1.5774, "step": 13795 }, { "epoch": 1.09, "learning_rate": 0.00021307985750180006, "loss": 1.5854, "step": 13796 }, { "epoch": 1.09, "learning_rate": 0.00021306864359493756, "loss": 1.5436, "step": 13797 }, { "epoch": 1.09, "learning_rate": 0.00021305742925987382, "loss": 1.5997, "step": 13798 }, { "epoch": 1.09, "learning_rate": 0.0002130462144966849, "loss": 1.5488, "step": 13799 }, { "epoch": 1.09, "learning_rate": 0.000213034999305447, "loss": 1.5624, "step": 13800 }, { "epoch": 1.09, "learning_rate": 0.00021302378368623622, "loss": 1.5119, "step": 13801 }, { "epoch": 1.09, "learning_rate": 0.00021301256763912876, "loss": 1.5029, "step": 13802 }, { "epoch": 1.09, "learning_rate": 0.0002130013511642007, "loss": 1.5923, "step": 13803 }, { "epoch": 1.09, "learning_rate": 0.00021299013426152822, "loss": 1.5796, "step": 13804 }, { "epoch": 1.09, "learning_rate": 0.00021297891693118753, "loss": 1.5327, "step": 13805 }, { "epoch": 1.09, "learning_rate": 0.00021296769917325474, "loss": 1.5372, "step": 13806 }, { "epoch": 1.09, "learning_rate": 0.000212956480987806, "loss": 1.5349, "step": 13807 }, { "epoch": 1.09, "learning_rate": 0.00021294526237491753, "loss": 1.5378, "step": 13808 }, { "epoch": 1.09, "learning_rate": 0.00021293404333466546, "loss": 1.5757, "step": 13809 }, { "epoch": 1.09, "learning_rate": 0.000212922823867126, "loss": 1.6138, "step": 13810 }, { "epoch": 1.09, "learning_rate": 0.00021291160397237516, "loss": 1.5499, "step": 13811 }, { "epoch": 1.09, "learning_rate": 0.00021290038365048936, "loss": 1.5468, "step": 13812 }, { "epoch": 1.09, "learning_rate": 0.00021288916290154462, "loss": 1.5764, "step": 13813 }, { "epoch": 1.09, "learning_rate": 0.00021287794172561718, "loss": 1.5457, "step": 13814 }, { "epoch": 1.09, "learning_rate": 0.00021286672012278327, "loss": 1.5613, "step": 13815 }, { "epoch": 1.09, "learning_rate": 0.00021285549809311894, "loss": 1.5826, "step": 13816 }, { "epoch": 1.09, "learning_rate": 0.0002128442756367005, "loss": 1.5504, "step": 13817 }, { "epoch": 1.09, "learning_rate": 0.00021283305275360414, "loss": 1.5389, "step": 13818 }, { "epoch": 1.09, "learning_rate": 0.00021282182944390595, "loss": 1.5738, "step": 13819 }, { "epoch": 1.09, "learning_rate": 0.00021281060570768227, "loss": 1.547, "step": 13820 }, { "epoch": 1.09, "learning_rate": 0.00021279938154500922, "loss": 1.5189, "step": 13821 }, { "epoch": 1.09, "learning_rate": 0.000212788156955963, "loss": 1.5524, "step": 13822 }, { "epoch": 1.09, "learning_rate": 0.0002127769319406199, "loss": 1.5781, "step": 13823 }, { "epoch": 1.09, "learning_rate": 0.00021276570649905602, "loss": 1.5751, "step": 13824 }, { "epoch": 1.09, "learning_rate": 0.00021275448063134769, "loss": 1.5833, "step": 13825 }, { "epoch": 1.09, "learning_rate": 0.000212743254337571, "loss": 1.4912, "step": 13826 }, { "epoch": 1.09, "learning_rate": 0.00021273202761780226, "loss": 1.5541, "step": 13827 }, { "epoch": 1.09, "learning_rate": 0.00021272080047211766, "loss": 1.5889, "step": 13828 }, { "epoch": 1.09, "learning_rate": 0.00021270957290059342, "loss": 1.5226, "step": 13829 }, { "epoch": 1.09, "learning_rate": 0.00021269834490330588, "loss": 1.6056, "step": 13830 }, { "epoch": 1.09, "learning_rate": 0.0002126871164803311, "loss": 1.6168, "step": 13831 }, { "epoch": 1.09, "learning_rate": 0.0002126758876317454, "loss": 1.5931, "step": 13832 }, { "epoch": 1.09, "learning_rate": 0.00021266465835762506, "loss": 1.6113, "step": 13833 }, { "epoch": 1.09, "learning_rate": 0.0002126534286580462, "loss": 1.5632, "step": 13834 }, { "epoch": 1.09, "learning_rate": 0.00021264219853308516, "loss": 1.5415, "step": 13835 }, { "epoch": 1.09, "learning_rate": 0.00021263096798281814, "loss": 1.5912, "step": 13836 }, { "epoch": 1.09, "learning_rate": 0.00021261973700732148, "loss": 1.4958, "step": 13837 }, { "epoch": 1.09, "learning_rate": 0.00021260850560667128, "loss": 1.6392, "step": 13838 }, { "epoch": 1.09, "learning_rate": 0.00021259727378094399, "loss": 1.5886, "step": 13839 }, { "epoch": 1.09, "learning_rate": 0.00021258604153021567, "loss": 1.5307, "step": 13840 }, { "epoch": 1.09, "learning_rate": 0.00021257480885456263, "loss": 1.5303, "step": 13841 }, { "epoch": 1.09, "learning_rate": 0.0002125635757540612, "loss": 1.5402, "step": 13842 }, { "epoch": 1.09, "learning_rate": 0.00021255234222878765, "loss": 1.6114, "step": 13843 }, { "epoch": 1.09, "learning_rate": 0.00021254110827881821, "loss": 1.5783, "step": 13844 }, { "epoch": 1.09, "learning_rate": 0.00021252987390422913, "loss": 1.5468, "step": 13845 }, { "epoch": 1.09, "learning_rate": 0.00021251863910509673, "loss": 1.514, "step": 13846 }, { "epoch": 1.09, "learning_rate": 0.00021250740388149727, "loss": 1.5657, "step": 13847 }, { "epoch": 1.09, "learning_rate": 0.00021249616823350705, "loss": 1.5558, "step": 13848 }, { "epoch": 1.09, "learning_rate": 0.00021248493216120235, "loss": 1.5708, "step": 13849 }, { "epoch": 1.09, "learning_rate": 0.00021247369566465937, "loss": 1.575, "step": 13850 }, { "epoch": 1.09, "learning_rate": 0.00021246245874395454, "loss": 1.5768, "step": 13851 }, { "epoch": 1.09, "learning_rate": 0.00021245122139916403, "loss": 1.5978, "step": 13852 }, { "epoch": 1.09, "learning_rate": 0.00021243998363036423, "loss": 1.5075, "step": 13853 }, { "epoch": 1.09, "learning_rate": 0.00021242874543763137, "loss": 1.5598, "step": 13854 }, { "epoch": 1.09, "learning_rate": 0.00021241750682104182, "loss": 1.557, "step": 13855 }, { "epoch": 1.09, "learning_rate": 0.00021240626778067177, "loss": 1.5863, "step": 13856 }, { "epoch": 1.09, "learning_rate": 0.0002123950283165977, "loss": 1.6094, "step": 13857 }, { "epoch": 1.09, "learning_rate": 0.00021238378842889573, "loss": 1.4625, "step": 13858 }, { "epoch": 1.09, "learning_rate": 0.00021237254811764232, "loss": 1.5202, "step": 13859 }, { "epoch": 1.09, "learning_rate": 0.00021236130738291371, "loss": 1.5625, "step": 13860 }, { "epoch": 1.09, "learning_rate": 0.00021235006622478627, "loss": 1.5865, "step": 13861 }, { "epoch": 1.09, "learning_rate": 0.00021233882464333624, "loss": 1.5648, "step": 13862 }, { "epoch": 1.09, "learning_rate": 0.00021232758263864, "loss": 1.5965, "step": 13863 }, { "epoch": 1.09, "learning_rate": 0.0002123163402107739, "loss": 1.5483, "step": 13864 }, { "epoch": 1.09, "learning_rate": 0.0002123050973598142, "loss": 1.5996, "step": 13865 }, { "epoch": 1.09, "learning_rate": 0.0002122938540858373, "loss": 1.571, "step": 13866 }, { "epoch": 1.09, "learning_rate": 0.00021228261038891947, "loss": 1.5488, "step": 13867 }, { "epoch": 1.09, "learning_rate": 0.00021227136626913713, "loss": 1.5791, "step": 13868 }, { "epoch": 1.09, "learning_rate": 0.00021226012172656655, "loss": 1.5525, "step": 13869 }, { "epoch": 1.09, "learning_rate": 0.00021224887676128408, "loss": 1.576, "step": 13870 }, { "epoch": 1.09, "learning_rate": 0.00021223763137336615, "loss": 1.6368, "step": 13871 }, { "epoch": 1.09, "learning_rate": 0.000212226385562889, "loss": 1.5962, "step": 13872 }, { "epoch": 1.09, "learning_rate": 0.00021221513932992905, "loss": 1.5591, "step": 13873 }, { "epoch": 1.09, "learning_rate": 0.0002122038926745626, "loss": 1.6336, "step": 13874 }, { "epoch": 1.09, "learning_rate": 0.0002121926455968661, "loss": 1.4603, "step": 13875 }, { "epoch": 1.09, "learning_rate": 0.00021218139809691587, "loss": 1.5213, "step": 13876 }, { "epoch": 1.09, "learning_rate": 0.0002121701501747882, "loss": 1.532, "step": 13877 }, { "epoch": 1.09, "learning_rate": 0.00021215890183055958, "loss": 1.5747, "step": 13878 }, { "epoch": 1.09, "learning_rate": 0.0002121476530643063, "loss": 1.5806, "step": 13879 }, { "epoch": 1.09, "learning_rate": 0.0002121364038761047, "loss": 1.5852, "step": 13880 }, { "epoch": 1.09, "learning_rate": 0.00021212515426603128, "loss": 1.5849, "step": 13881 }, { "epoch": 1.09, "learning_rate": 0.00021211390423416226, "loss": 1.5362, "step": 13882 }, { "epoch": 1.09, "learning_rate": 0.0002121026537805742, "loss": 1.6358, "step": 13883 }, { "epoch": 1.09, "learning_rate": 0.00021209140290534334, "loss": 1.5562, "step": 13884 }, { "epoch": 1.09, "learning_rate": 0.00021208015160854613, "loss": 1.5261, "step": 13885 }, { "epoch": 1.09, "learning_rate": 0.00021206889989025898, "loss": 1.6102, "step": 13886 }, { "epoch": 1.09, "learning_rate": 0.00021205764775055817, "loss": 1.5631, "step": 13887 }, { "epoch": 1.09, "learning_rate": 0.00021204639518952026, "loss": 1.5715, "step": 13888 }, { "epoch": 1.09, "learning_rate": 0.00021203514220722154, "loss": 1.5953, "step": 13889 }, { "epoch": 1.09, "learning_rate": 0.00021202388880373844, "loss": 1.5464, "step": 13890 }, { "epoch": 1.09, "learning_rate": 0.00021201263497914734, "loss": 1.5522, "step": 13891 }, { "epoch": 1.09, "learning_rate": 0.00021200138073352467, "loss": 1.5674, "step": 13892 }, { "epoch": 1.09, "learning_rate": 0.0002119901260669469, "loss": 1.5636, "step": 13893 }, { "epoch": 1.09, "learning_rate": 0.0002119788709794903, "loss": 1.5445, "step": 13894 }, { "epoch": 1.09, "learning_rate": 0.00021196761547123143, "loss": 1.5261, "step": 13895 }, { "epoch": 1.09, "learning_rate": 0.00021195635954224663, "loss": 1.5577, "step": 13896 }, { "epoch": 1.09, "learning_rate": 0.0002119451031926123, "loss": 1.5505, "step": 13897 }, { "epoch": 1.09, "learning_rate": 0.00021193384642240494, "loss": 1.5723, "step": 13898 }, { "epoch": 1.09, "learning_rate": 0.00021192258923170094, "loss": 1.4838, "step": 13899 }, { "epoch": 1.09, "learning_rate": 0.00021191133162057677, "loss": 1.5808, "step": 13900 }, { "epoch": 1.09, "learning_rate": 0.00021190007358910877, "loss": 1.5297, "step": 13901 }, { "epoch": 1.09, "learning_rate": 0.0002118888151373734, "loss": 1.5353, "step": 13902 }, { "epoch": 1.09, "learning_rate": 0.00021187755626544722, "loss": 1.5883, "step": 13903 }, { "epoch": 1.09, "learning_rate": 0.00021186629697340654, "loss": 1.5986, "step": 13904 }, { "epoch": 1.09, "learning_rate": 0.0002118550372613278, "loss": 1.5825, "step": 13905 }, { "epoch": 1.09, "learning_rate": 0.00021184377712928754, "loss": 1.6134, "step": 13906 }, { "epoch": 1.09, "learning_rate": 0.00021183251657736217, "loss": 1.5559, "step": 13907 }, { "epoch": 1.09, "learning_rate": 0.0002118212556056281, "loss": 1.5542, "step": 13908 }, { "epoch": 1.09, "learning_rate": 0.00021180999421416182, "loss": 1.5922, "step": 13909 }, { "epoch": 1.09, "learning_rate": 0.00021179873240303985, "loss": 1.5638, "step": 13910 }, { "epoch": 1.09, "learning_rate": 0.00021178747017233852, "loss": 1.6037, "step": 13911 }, { "epoch": 1.09, "learning_rate": 0.00021177620752213435, "loss": 1.5903, "step": 13912 }, { "epoch": 1.09, "learning_rate": 0.00021176494445250386, "loss": 1.5214, "step": 13913 }, { "epoch": 1.09, "learning_rate": 0.0002117536809635235, "loss": 1.5264, "step": 13914 }, { "epoch": 1.09, "learning_rate": 0.00021174241705526972, "loss": 1.541, "step": 13915 }, { "epoch": 1.09, "learning_rate": 0.00021173115272781897, "loss": 1.5394, "step": 13916 }, { "epoch": 1.1, "learning_rate": 0.0002117198879812478, "loss": 1.6199, "step": 13917 }, { "epoch": 1.1, "learning_rate": 0.00021170862281563263, "loss": 1.5475, "step": 13918 }, { "epoch": 1.1, "learning_rate": 0.00021169735723104995, "loss": 1.5519, "step": 13919 }, { "epoch": 1.1, "learning_rate": 0.0002116860912275763, "loss": 1.5394, "step": 13920 }, { "epoch": 1.1, "learning_rate": 0.00021167482480528805, "loss": 1.5534, "step": 13921 }, { "epoch": 1.1, "learning_rate": 0.00021166355796426185, "loss": 1.5479, "step": 13922 }, { "epoch": 1.1, "learning_rate": 0.00021165229070457407, "loss": 1.585, "step": 13923 }, { "epoch": 1.1, "learning_rate": 0.0002116410230263013, "loss": 1.5436, "step": 13924 }, { "epoch": 1.1, "learning_rate": 0.00021162975492952, "loss": 1.5332, "step": 13925 }, { "epoch": 1.1, "learning_rate": 0.00021161848641430668, "loss": 1.5104, "step": 13926 }, { "epoch": 1.1, "learning_rate": 0.00021160721748073781, "loss": 1.5574, "step": 13927 }, { "epoch": 1.1, "learning_rate": 0.00021159594812888996, "loss": 1.5953, "step": 13928 }, { "epoch": 1.1, "learning_rate": 0.0002115846783588396, "loss": 1.5845, "step": 13929 }, { "epoch": 1.1, "learning_rate": 0.0002115734081706632, "loss": 1.5458, "step": 13930 }, { "epoch": 1.1, "learning_rate": 0.00021156213756443743, "loss": 1.5597, "step": 13931 }, { "epoch": 1.1, "learning_rate": 0.0002115508665402387, "loss": 1.5792, "step": 13932 }, { "epoch": 1.1, "learning_rate": 0.00021153959509814351, "loss": 1.5594, "step": 13933 }, { "epoch": 1.1, "learning_rate": 0.0002115283232382285, "loss": 1.5197, "step": 13934 }, { "epoch": 1.1, "learning_rate": 0.0002115170509605701, "loss": 1.5555, "step": 13935 }, { "epoch": 1.1, "learning_rate": 0.00021150577826524483, "loss": 1.588, "step": 13936 }, { "epoch": 1.1, "learning_rate": 0.00021149450515232926, "loss": 1.558, "step": 13937 }, { "epoch": 1.1, "learning_rate": 0.00021148323162189996, "loss": 1.5737, "step": 13938 }, { "epoch": 1.1, "learning_rate": 0.0002114719576740335, "loss": 1.56, "step": 13939 }, { "epoch": 1.1, "learning_rate": 0.0002114606833088063, "loss": 1.5487, "step": 13940 }, { "epoch": 1.1, "learning_rate": 0.000211449408526295, "loss": 1.5598, "step": 13941 }, { "epoch": 1.1, "learning_rate": 0.00021143813332657614, "loss": 1.5791, "step": 13942 }, { "epoch": 1.1, "learning_rate": 0.00021142685770972623, "loss": 1.5914, "step": 13943 }, { "epoch": 1.1, "learning_rate": 0.0002114155816758219, "loss": 1.6038, "step": 13944 }, { "epoch": 1.1, "learning_rate": 0.00021140430522493964, "loss": 1.5565, "step": 13945 }, { "epoch": 1.1, "learning_rate": 0.00021139302835715602, "loss": 1.5584, "step": 13946 }, { "epoch": 1.1, "learning_rate": 0.00021138175107254762, "loss": 1.5309, "step": 13947 }, { "epoch": 1.1, "learning_rate": 0.000211370473371191, "loss": 1.5467, "step": 13948 }, { "epoch": 1.1, "learning_rate": 0.00021135919525316278, "loss": 1.5472, "step": 13949 }, { "epoch": 1.1, "learning_rate": 0.00021134791671853942, "loss": 1.4963, "step": 13950 }, { "epoch": 1.1, "learning_rate": 0.00021133663776739763, "loss": 1.6412, "step": 13951 }, { "epoch": 1.1, "learning_rate": 0.00021132535839981381, "loss": 1.5985, "step": 13952 }, { "epoch": 1.1, "learning_rate": 0.00021131407861586473, "loss": 1.5974, "step": 13953 }, { "epoch": 1.1, "learning_rate": 0.0002113027984156269, "loss": 1.5475, "step": 13954 }, { "epoch": 1.1, "learning_rate": 0.00021129151779917683, "loss": 1.5343, "step": 13955 }, { "epoch": 1.1, "learning_rate": 0.00021128023676659125, "loss": 1.5411, "step": 13956 }, { "epoch": 1.1, "learning_rate": 0.00021126895531794665, "loss": 1.5841, "step": 13957 }, { "epoch": 1.1, "learning_rate": 0.00021125767345331965, "loss": 1.5409, "step": 13958 }, { "epoch": 1.1, "learning_rate": 0.0002112463911727869, "loss": 1.5481, "step": 13959 }, { "epoch": 1.1, "learning_rate": 0.00021123510847642483, "loss": 1.615, "step": 13960 }, { "epoch": 1.1, "learning_rate": 0.00021122382536431028, "loss": 1.582, "step": 13961 }, { "epoch": 1.1, "learning_rate": 0.0002112125418365197, "loss": 1.5786, "step": 13962 }, { "epoch": 1.1, "learning_rate": 0.00021120125789312978, "loss": 1.5595, "step": 13963 }, { "epoch": 1.1, "learning_rate": 0.00021118997353421708, "loss": 1.6043, "step": 13964 }, { "epoch": 1.1, "learning_rate": 0.00021117868875985816, "loss": 1.5613, "step": 13965 }, { "epoch": 1.1, "learning_rate": 0.0002111674035701298, "loss": 1.4604, "step": 13966 }, { "epoch": 1.1, "learning_rate": 0.00021115611796510846, "loss": 1.5411, "step": 13967 }, { "epoch": 1.1, "learning_rate": 0.00021114483194487082, "loss": 1.5268, "step": 13968 }, { "epoch": 1.1, "learning_rate": 0.00021113354550949355, "loss": 1.525, "step": 13969 }, { "epoch": 1.1, "learning_rate": 0.00021112225865905324, "loss": 1.5501, "step": 13970 }, { "epoch": 1.1, "learning_rate": 0.0002111109713936265, "loss": 1.5782, "step": 13971 }, { "epoch": 1.1, "learning_rate": 0.00021109968371329002, "loss": 1.5854, "step": 13972 }, { "epoch": 1.1, "learning_rate": 0.00021108839561812039, "loss": 1.581, "step": 13973 }, { "epoch": 1.1, "learning_rate": 0.00021107710710819427, "loss": 1.5723, "step": 13974 }, { "epoch": 1.1, "learning_rate": 0.0002110658181835883, "loss": 1.5653, "step": 13975 }, { "epoch": 1.1, "learning_rate": 0.0002110545288443791, "loss": 1.571, "step": 13976 }, { "epoch": 1.1, "learning_rate": 0.00021104323909064337, "loss": 1.5209, "step": 13977 }, { "epoch": 1.1, "learning_rate": 0.0002110319489224577, "loss": 1.571, "step": 13978 }, { "epoch": 1.1, "learning_rate": 0.00021102065833989879, "loss": 1.5689, "step": 13979 }, { "epoch": 1.1, "learning_rate": 0.00021100936734304334, "loss": 1.5882, "step": 13980 }, { "epoch": 1.1, "learning_rate": 0.00021099807593196788, "loss": 1.5008, "step": 13981 }, { "epoch": 1.1, "learning_rate": 0.00021098678410674915, "loss": 1.5002, "step": 13982 }, { "epoch": 1.1, "learning_rate": 0.00021097549186746385, "loss": 1.6167, "step": 13983 }, { "epoch": 1.1, "learning_rate": 0.00021096419921418856, "loss": 1.5256, "step": 13984 }, { "epoch": 1.1, "learning_rate": 0.00021095290614700005, "loss": 1.5665, "step": 13985 }, { "epoch": 1.1, "learning_rate": 0.00021094161266597492, "loss": 1.5334, "step": 13986 }, { "epoch": 1.1, "learning_rate": 0.00021093031877118988, "loss": 1.5243, "step": 13987 }, { "epoch": 1.1, "learning_rate": 0.00021091902446272162, "loss": 1.5613, "step": 13988 }, { "epoch": 1.1, "learning_rate": 0.00021090772974064677, "loss": 1.5416, "step": 13989 }, { "epoch": 1.1, "learning_rate": 0.00021089643460504205, "loss": 1.5574, "step": 13990 }, { "epoch": 1.1, "learning_rate": 0.00021088513905598416, "loss": 1.5301, "step": 13991 }, { "epoch": 1.1, "learning_rate": 0.00021087384309354974, "loss": 1.575, "step": 13992 }, { "epoch": 1.1, "learning_rate": 0.00021086254671781555, "loss": 1.5762, "step": 13993 }, { "epoch": 1.1, "learning_rate": 0.00021085124992885823, "loss": 1.5349, "step": 13994 }, { "epoch": 1.1, "learning_rate": 0.00021083995272675452, "loss": 1.4543, "step": 13995 }, { "epoch": 1.1, "learning_rate": 0.00021082865511158112, "loss": 1.5655, "step": 13996 }, { "epoch": 1.1, "learning_rate": 0.0002108173570834147, "loss": 1.5856, "step": 13997 }, { "epoch": 1.1, "learning_rate": 0.000210806058642332, "loss": 1.5953, "step": 13998 }, { "epoch": 1.1, "learning_rate": 0.0002107947597884097, "loss": 1.5683, "step": 13999 }, { "epoch": 1.1, "learning_rate": 0.00021078346052172452, "loss": 1.5182, "step": 14000 }, { "epoch": 1.1, "learning_rate": 0.0002107721608423532, "loss": 1.5809, "step": 14001 }, { "epoch": 1.1, "learning_rate": 0.00021076086075037248, "loss": 1.4959, "step": 14002 }, { "epoch": 1.1, "learning_rate": 0.00021074956024585902, "loss": 1.6144, "step": 14003 }, { "epoch": 1.1, "learning_rate": 0.00021073825932888953, "loss": 1.5414, "step": 14004 }, { "epoch": 1.1, "learning_rate": 0.00021072695799954086, "loss": 1.5278, "step": 14005 }, { "epoch": 1.1, "learning_rate": 0.00021071565625788957, "loss": 1.5965, "step": 14006 }, { "epoch": 1.1, "learning_rate": 0.00021070435410401253, "loss": 1.5578, "step": 14007 }, { "epoch": 1.1, "learning_rate": 0.0002106930515379864, "loss": 1.5797, "step": 14008 }, { "epoch": 1.1, "learning_rate": 0.00021068174855988798, "loss": 1.5231, "step": 14009 }, { "epoch": 1.1, "learning_rate": 0.00021067044516979395, "loss": 1.5467, "step": 14010 }, { "epoch": 1.1, "learning_rate": 0.00021065914136778106, "loss": 1.5759, "step": 14011 }, { "epoch": 1.1, "learning_rate": 0.00021064783715392613, "loss": 1.5199, "step": 14012 }, { "epoch": 1.1, "learning_rate": 0.00021063653252830582, "loss": 1.596, "step": 14013 }, { "epoch": 1.1, "learning_rate": 0.00021062522749099692, "loss": 1.5897, "step": 14014 }, { "epoch": 1.1, "learning_rate": 0.00021061392204207614, "loss": 1.5442, "step": 14015 }, { "epoch": 1.1, "learning_rate": 0.00021060261618162032, "loss": 1.5129, "step": 14016 }, { "epoch": 1.1, "learning_rate": 0.0002105913099097062, "loss": 1.5503, "step": 14017 }, { "epoch": 1.1, "learning_rate": 0.00021058000322641046, "loss": 1.5646, "step": 14018 }, { "epoch": 1.1, "learning_rate": 0.00021056869613181003, "loss": 1.5562, "step": 14019 }, { "epoch": 1.1, "learning_rate": 0.0002105573886259815, "loss": 1.5391, "step": 14020 }, { "epoch": 1.1, "learning_rate": 0.00021054608070900172, "loss": 1.5843, "step": 14021 }, { "epoch": 1.1, "learning_rate": 0.0002105347723809475, "loss": 1.5607, "step": 14022 }, { "epoch": 1.1, "learning_rate": 0.00021052346364189555, "loss": 1.5326, "step": 14023 }, { "epoch": 1.1, "learning_rate": 0.0002105121544919227, "loss": 1.5503, "step": 14024 }, { "epoch": 1.1, "learning_rate": 0.00021050084493110565, "loss": 1.5426, "step": 14025 }, { "epoch": 1.1, "learning_rate": 0.00021048953495952133, "loss": 1.5291, "step": 14026 }, { "epoch": 1.1, "learning_rate": 0.00021047822457724645, "loss": 1.5636, "step": 14027 }, { "epoch": 1.1, "learning_rate": 0.00021046691378435772, "loss": 1.5614, "step": 14028 }, { "epoch": 1.1, "learning_rate": 0.00021045560258093214, "loss": 1.5779, "step": 14029 }, { "epoch": 1.1, "learning_rate": 0.00021044429096704628, "loss": 1.641, "step": 14030 }, { "epoch": 1.1, "learning_rate": 0.00021043297894277708, "loss": 1.5975, "step": 14031 }, { "epoch": 1.1, "learning_rate": 0.00021042166650820125, "loss": 1.5402, "step": 14032 }, { "epoch": 1.1, "learning_rate": 0.0002104103536633957, "loss": 1.5411, "step": 14033 }, { "epoch": 1.1, "learning_rate": 0.00021039904040843718, "loss": 1.5675, "step": 14034 }, { "epoch": 1.1, "learning_rate": 0.0002103877267434025, "loss": 1.5845, "step": 14035 }, { "epoch": 1.1, "learning_rate": 0.00021037641266836852, "loss": 1.5508, "step": 14036 }, { "epoch": 1.1, "learning_rate": 0.00021036509818341196, "loss": 1.5363, "step": 14037 }, { "epoch": 1.1, "learning_rate": 0.0002103537832886097, "loss": 1.5639, "step": 14038 }, { "epoch": 1.1, "learning_rate": 0.00021034246798403857, "loss": 1.5491, "step": 14039 }, { "epoch": 1.1, "learning_rate": 0.0002103311522697754, "loss": 1.5932, "step": 14040 }, { "epoch": 1.1, "learning_rate": 0.00021031983614589698, "loss": 1.5851, "step": 14041 }, { "epoch": 1.1, "learning_rate": 0.00021030851961248017, "loss": 1.5819, "step": 14042 }, { "epoch": 1.1, "learning_rate": 0.00021029720266960175, "loss": 1.4933, "step": 14043 }, { "epoch": 1.11, "learning_rate": 0.00021028588531733867, "loss": 1.5601, "step": 14044 }, { "epoch": 1.11, "learning_rate": 0.00021027456755576764, "loss": 1.5612, "step": 14045 }, { "epoch": 1.11, "learning_rate": 0.00021026324938496562, "loss": 1.5005, "step": 14046 }, { "epoch": 1.11, "learning_rate": 0.00021025193080500933, "loss": 1.5618, "step": 14047 }, { "epoch": 1.11, "learning_rate": 0.0002102406118159757, "loss": 1.5106, "step": 14048 }, { "epoch": 1.11, "learning_rate": 0.00021022929241794154, "loss": 1.5267, "step": 14049 }, { "epoch": 1.11, "learning_rate": 0.00021021797261098373, "loss": 1.5172, "step": 14050 }, { "epoch": 1.11, "learning_rate": 0.00021020665239517917, "loss": 1.5936, "step": 14051 }, { "epoch": 1.11, "learning_rate": 0.0002101953317706046, "loss": 1.5525, "step": 14052 }, { "epoch": 1.11, "learning_rate": 0.000210184010737337, "loss": 1.5053, "step": 14053 }, { "epoch": 1.11, "learning_rate": 0.00021017268929545313, "loss": 1.5676, "step": 14054 }, { "epoch": 1.11, "learning_rate": 0.00021016136744502988, "loss": 1.5684, "step": 14055 }, { "epoch": 1.11, "learning_rate": 0.00021015004518614425, "loss": 1.547, "step": 14056 }, { "epoch": 1.11, "learning_rate": 0.00021013872251887295, "loss": 1.5217, "step": 14057 }, { "epoch": 1.11, "learning_rate": 0.0002101273994432929, "loss": 1.6049, "step": 14058 }, { "epoch": 1.11, "learning_rate": 0.000210116075959481, "loss": 1.5761, "step": 14059 }, { "epoch": 1.11, "learning_rate": 0.0002101047520675141, "loss": 1.6092, "step": 14060 }, { "epoch": 1.11, "learning_rate": 0.00021009342776746916, "loss": 1.5839, "step": 14061 }, { "epoch": 1.11, "learning_rate": 0.0002100821030594229, "loss": 1.5396, "step": 14062 }, { "epoch": 1.11, "learning_rate": 0.00021007077794345241, "loss": 1.6007, "step": 14063 }, { "epoch": 1.11, "learning_rate": 0.00021005945241963443, "loss": 1.6015, "step": 14064 }, { "epoch": 1.11, "learning_rate": 0.00021004812648804598, "loss": 1.5017, "step": 14065 }, { "epoch": 1.11, "learning_rate": 0.00021003680014876385, "loss": 1.5242, "step": 14066 }, { "epoch": 1.11, "learning_rate": 0.000210025473401865, "loss": 1.5939, "step": 14067 }, { "epoch": 1.11, "learning_rate": 0.0002100141462474263, "loss": 1.5711, "step": 14068 }, { "epoch": 1.11, "learning_rate": 0.00021000281868552463, "loss": 1.5783, "step": 14069 }, { "epoch": 1.11, "learning_rate": 0.00020999149071623696, "loss": 1.5689, "step": 14070 }, { "epoch": 1.11, "learning_rate": 0.00020998016233964018, "loss": 1.5515, "step": 14071 }, { "epoch": 1.11, "learning_rate": 0.00020996883355581117, "loss": 1.5521, "step": 14072 }, { "epoch": 1.11, "learning_rate": 0.00020995750436482688, "loss": 1.6229, "step": 14073 }, { "epoch": 1.11, "learning_rate": 0.00020994617476676424, "loss": 1.558, "step": 14074 }, { "epoch": 1.11, "learning_rate": 0.0002099348447617002, "loss": 1.5694, "step": 14075 }, { "epoch": 1.11, "learning_rate": 0.00020992351434971155, "loss": 1.6166, "step": 14076 }, { "epoch": 1.11, "learning_rate": 0.00020991218353087534, "loss": 1.5689, "step": 14077 }, { "epoch": 1.11, "learning_rate": 0.00020990085230526847, "loss": 1.5551, "step": 14078 }, { "epoch": 1.11, "learning_rate": 0.00020988952067296784, "loss": 1.5417, "step": 14079 }, { "epoch": 1.11, "learning_rate": 0.00020987818863405048, "loss": 1.5546, "step": 14080 }, { "epoch": 1.11, "learning_rate": 0.0002098668561885932, "loss": 1.5367, "step": 14081 }, { "epoch": 1.11, "learning_rate": 0.00020985552333667304, "loss": 1.5438, "step": 14082 }, { "epoch": 1.11, "learning_rate": 0.00020984419007836694, "loss": 1.5822, "step": 14083 }, { "epoch": 1.11, "learning_rate": 0.00020983285641375176, "loss": 1.5821, "step": 14084 }, { "epoch": 1.11, "learning_rate": 0.00020982152234290453, "loss": 1.5807, "step": 14085 }, { "epoch": 1.11, "learning_rate": 0.00020981018786590211, "loss": 1.5581, "step": 14086 }, { "epoch": 1.11, "learning_rate": 0.0002097988529828216, "loss": 1.5619, "step": 14087 }, { "epoch": 1.11, "learning_rate": 0.00020978751769373983, "loss": 1.555, "step": 14088 }, { "epoch": 1.11, "learning_rate": 0.00020977618199873385, "loss": 1.5862, "step": 14089 }, { "epoch": 1.11, "learning_rate": 0.00020976484589788056, "loss": 1.5497, "step": 14090 }, { "epoch": 1.11, "learning_rate": 0.00020975350939125695, "loss": 1.6064, "step": 14091 }, { "epoch": 1.11, "learning_rate": 0.00020974217247894, "loss": 1.5764, "step": 14092 }, { "epoch": 1.11, "learning_rate": 0.00020973083516100666, "loss": 1.5851, "step": 14093 }, { "epoch": 1.11, "learning_rate": 0.00020971949743753385, "loss": 1.5234, "step": 14094 }, { "epoch": 1.11, "learning_rate": 0.00020970815930859867, "loss": 1.5808, "step": 14095 }, { "epoch": 1.11, "learning_rate": 0.00020969682077427802, "loss": 1.5662, "step": 14096 }, { "epoch": 1.11, "learning_rate": 0.00020968548183464896, "loss": 1.5689, "step": 14097 }, { "epoch": 1.11, "learning_rate": 0.00020967414248978833, "loss": 1.5077, "step": 14098 }, { "epoch": 1.11, "learning_rate": 0.00020966280273977323, "loss": 1.5671, "step": 14099 }, { "epoch": 1.11, "learning_rate": 0.00020965146258468065, "loss": 1.6022, "step": 14100 }, { "epoch": 1.11, "learning_rate": 0.00020964012202458754, "loss": 1.545, "step": 14101 }, { "epoch": 1.11, "learning_rate": 0.0002096287810595709, "loss": 1.5582, "step": 14102 }, { "epoch": 1.11, "learning_rate": 0.00020961743968970773, "loss": 1.573, "step": 14103 }, { "epoch": 1.11, "learning_rate": 0.0002096060979150751, "loss": 1.524, "step": 14104 }, { "epoch": 1.11, "learning_rate": 0.00020959475573574993, "loss": 1.5784, "step": 14105 }, { "epoch": 1.11, "learning_rate": 0.00020958341315180923, "loss": 1.5673, "step": 14106 }, { "epoch": 1.11, "learning_rate": 0.0002095720701633301, "loss": 1.5608, "step": 14107 }, { "epoch": 1.11, "learning_rate": 0.00020956072677038941, "loss": 1.5375, "step": 14108 }, { "epoch": 1.11, "learning_rate": 0.0002095493829730643, "loss": 1.5894, "step": 14109 }, { "epoch": 1.11, "learning_rate": 0.00020953803877143173, "loss": 1.5543, "step": 14110 }, { "epoch": 1.11, "learning_rate": 0.00020952669416556872, "loss": 1.5085, "step": 14111 }, { "epoch": 1.11, "learning_rate": 0.00020951534915555233, "loss": 1.5625, "step": 14112 }, { "epoch": 1.11, "learning_rate": 0.00020950400374145957, "loss": 1.5538, "step": 14113 }, { "epoch": 1.11, "learning_rate": 0.00020949265792336746, "loss": 1.6039, "step": 14114 }, { "epoch": 1.11, "learning_rate": 0.00020948131170135298, "loss": 1.5406, "step": 14115 }, { "epoch": 1.11, "learning_rate": 0.00020946996507549328, "loss": 1.5875, "step": 14116 }, { "epoch": 1.11, "learning_rate": 0.0002094586180458653, "loss": 1.5798, "step": 14117 }, { "epoch": 1.11, "learning_rate": 0.00020944727061254613, "loss": 1.5826, "step": 14118 }, { "epoch": 1.11, "learning_rate": 0.0002094359227756128, "loss": 1.5351, "step": 14119 }, { "epoch": 1.11, "learning_rate": 0.00020942457453514235, "loss": 1.5593, "step": 14120 }, { "epoch": 1.11, "learning_rate": 0.00020941322589121186, "loss": 1.5655, "step": 14121 }, { "epoch": 1.11, "learning_rate": 0.0002094018768438983, "loss": 1.5599, "step": 14122 }, { "epoch": 1.11, "learning_rate": 0.0002093905273932788, "loss": 1.5984, "step": 14123 }, { "epoch": 1.11, "learning_rate": 0.0002093791775394304, "loss": 1.5573, "step": 14124 }, { "epoch": 1.11, "learning_rate": 0.0002093678272824301, "loss": 1.5151, "step": 14125 }, { "epoch": 1.11, "learning_rate": 0.0002093564766223551, "loss": 1.546, "step": 14126 }, { "epoch": 1.11, "learning_rate": 0.00020934512555928234, "loss": 1.5618, "step": 14127 }, { "epoch": 1.11, "learning_rate": 0.00020933377409328892, "loss": 1.6309, "step": 14128 }, { "epoch": 1.11, "learning_rate": 0.00020932242222445195, "loss": 1.5973, "step": 14129 }, { "epoch": 1.11, "learning_rate": 0.00020931106995284842, "loss": 1.5747, "step": 14130 }, { "epoch": 1.11, "learning_rate": 0.0002092997172785555, "loss": 1.5441, "step": 14131 }, { "epoch": 1.11, "learning_rate": 0.0002092883642016502, "loss": 1.5799, "step": 14132 }, { "epoch": 1.11, "learning_rate": 0.00020927701072220961, "loss": 1.5311, "step": 14133 }, { "epoch": 1.11, "learning_rate": 0.00020926565684031086, "loss": 1.5518, "step": 14134 }, { "epoch": 1.11, "learning_rate": 0.00020925430255603098, "loss": 1.5769, "step": 14135 }, { "epoch": 1.11, "learning_rate": 0.00020924294786944713, "loss": 1.5832, "step": 14136 }, { "epoch": 1.11, "learning_rate": 0.0002092315927806363, "loss": 1.5792, "step": 14137 }, { "epoch": 1.11, "learning_rate": 0.0002092202372896757, "loss": 1.5756, "step": 14138 }, { "epoch": 1.11, "learning_rate": 0.00020920888139664234, "loss": 1.57, "step": 14139 }, { "epoch": 1.11, "learning_rate": 0.00020919752510161334, "loss": 1.5803, "step": 14140 }, { "epoch": 1.11, "learning_rate": 0.00020918616840466582, "loss": 1.5246, "step": 14141 }, { "epoch": 1.11, "learning_rate": 0.00020917481130587682, "loss": 1.5561, "step": 14142 }, { "epoch": 1.11, "learning_rate": 0.0002091634538053236, "loss": 1.5225, "step": 14143 }, { "epoch": 1.11, "learning_rate": 0.00020915209590308316, "loss": 1.5596, "step": 14144 }, { "epoch": 1.11, "learning_rate": 0.00020914073759923258, "loss": 1.526, "step": 14145 }, { "epoch": 1.11, "learning_rate": 0.00020912937889384909, "loss": 1.5868, "step": 14146 }, { "epoch": 1.11, "learning_rate": 0.0002091180197870097, "loss": 1.5535, "step": 14147 }, { "epoch": 1.11, "learning_rate": 0.00020910666027879166, "loss": 1.5867, "step": 14148 }, { "epoch": 1.11, "learning_rate": 0.0002090953003692719, "loss": 1.5907, "step": 14149 }, { "epoch": 1.11, "learning_rate": 0.0002090839400585277, "loss": 1.5322, "step": 14150 }, { "epoch": 1.11, "learning_rate": 0.00020907257934663618, "loss": 1.5537, "step": 14151 }, { "epoch": 1.11, "learning_rate": 0.00020906121823367445, "loss": 1.5624, "step": 14152 }, { "epoch": 1.11, "learning_rate": 0.00020904985671971963, "loss": 1.5604, "step": 14153 }, { "epoch": 1.11, "learning_rate": 0.00020903849480484885, "loss": 1.5446, "step": 14154 }, { "epoch": 1.11, "learning_rate": 0.0002090271324891393, "loss": 1.5466, "step": 14155 }, { "epoch": 1.11, "learning_rate": 0.00020901576977266808, "loss": 1.5699, "step": 14156 }, { "epoch": 1.11, "learning_rate": 0.0002090044066555123, "loss": 1.5679, "step": 14157 }, { "epoch": 1.11, "learning_rate": 0.00020899304313774924, "loss": 1.5274, "step": 14158 }, { "epoch": 1.11, "learning_rate": 0.00020898167921945594, "loss": 1.5488, "step": 14159 }, { "epoch": 1.11, "learning_rate": 0.0002089703149007096, "loss": 1.5401, "step": 14160 }, { "epoch": 1.11, "learning_rate": 0.00020895895018158736, "loss": 1.5092, "step": 14161 }, { "epoch": 1.11, "learning_rate": 0.00020894758506216635, "loss": 1.5412, "step": 14162 }, { "epoch": 1.11, "learning_rate": 0.00020893621954252382, "loss": 1.5187, "step": 14163 }, { "epoch": 1.11, "learning_rate": 0.00020892485362273685, "loss": 1.5455, "step": 14164 }, { "epoch": 1.11, "learning_rate": 0.0002089134873028826, "loss": 1.5305, "step": 14165 }, { "epoch": 1.11, "learning_rate": 0.00020890212058303836, "loss": 1.5918, "step": 14166 }, { "epoch": 1.11, "learning_rate": 0.0002088907534632812, "loss": 1.5512, "step": 14167 }, { "epoch": 1.11, "learning_rate": 0.00020887938594368833, "loss": 1.6142, "step": 14168 }, { "epoch": 1.11, "learning_rate": 0.0002088680180243369, "loss": 1.5171, "step": 14169 }, { "epoch": 1.11, "learning_rate": 0.00020885664970530414, "loss": 1.5836, "step": 14170 }, { "epoch": 1.11, "learning_rate": 0.00020884528098666719, "loss": 1.5951, "step": 14171 }, { "epoch": 1.12, "learning_rate": 0.00020883391186850324, "loss": 1.5551, "step": 14172 }, { "epoch": 1.12, "learning_rate": 0.00020882254235088951, "loss": 1.5678, "step": 14173 }, { "epoch": 1.12, "learning_rate": 0.0002088111724339032, "loss": 1.5216, "step": 14174 }, { "epoch": 1.12, "learning_rate": 0.00020879980211762147, "loss": 1.6171, "step": 14175 }, { "epoch": 1.12, "learning_rate": 0.00020878843140212153, "loss": 1.5851, "step": 14176 }, { "epoch": 1.12, "learning_rate": 0.0002087770602874806, "loss": 1.4874, "step": 14177 }, { "epoch": 1.12, "learning_rate": 0.00020876568877377583, "loss": 1.5775, "step": 14178 }, { "epoch": 1.12, "learning_rate": 0.00020875431686108448, "loss": 1.5532, "step": 14179 }, { "epoch": 1.12, "learning_rate": 0.00020874294454948373, "loss": 1.578, "step": 14180 }, { "epoch": 1.12, "learning_rate": 0.00020873157183905078, "loss": 1.4725, "step": 14181 }, { "epoch": 1.12, "learning_rate": 0.00020872019872986294, "loss": 1.5869, "step": 14182 }, { "epoch": 1.12, "learning_rate": 0.0002087088252219973, "loss": 1.612, "step": 14183 }, { "epoch": 1.12, "learning_rate": 0.00020869745131553118, "loss": 1.5933, "step": 14184 }, { "epoch": 1.12, "learning_rate": 0.00020868607701054174, "loss": 1.5696, "step": 14185 }, { "epoch": 1.12, "learning_rate": 0.00020867470230710622, "loss": 1.6297, "step": 14186 }, { "epoch": 1.12, "learning_rate": 0.00020866332720530185, "loss": 1.5825, "step": 14187 }, { "epoch": 1.12, "learning_rate": 0.00020865195170520585, "loss": 1.5653, "step": 14188 }, { "epoch": 1.12, "learning_rate": 0.00020864057580689544, "loss": 1.552, "step": 14189 }, { "epoch": 1.12, "learning_rate": 0.00020862919951044795, "loss": 1.5456, "step": 14190 }, { "epoch": 1.12, "learning_rate": 0.0002086178228159405, "loss": 1.5655, "step": 14191 }, { "epoch": 1.12, "learning_rate": 0.00020860644572345038, "loss": 1.5712, "step": 14192 }, { "epoch": 1.12, "learning_rate": 0.00020859506823305482, "loss": 1.5846, "step": 14193 }, { "epoch": 1.12, "learning_rate": 0.0002085836903448311, "loss": 1.5467, "step": 14194 }, { "epoch": 1.12, "learning_rate": 0.0002085723120588565, "loss": 1.5991, "step": 14195 }, { "epoch": 1.12, "learning_rate": 0.00020856093337520815, "loss": 1.5762, "step": 14196 }, { "epoch": 1.12, "learning_rate": 0.00020854955429396344, "loss": 1.5453, "step": 14197 }, { "epoch": 1.12, "learning_rate": 0.00020853817481519954, "loss": 1.5632, "step": 14198 }, { "epoch": 1.12, "learning_rate": 0.00020852679493899376, "loss": 1.6024, "step": 14199 }, { "epoch": 1.12, "learning_rate": 0.0002085154146654233, "loss": 1.5557, "step": 14200 }, { "epoch": 1.12, "learning_rate": 0.0002085040339945655, "loss": 1.5576, "step": 14201 }, { "epoch": 1.12, "learning_rate": 0.00020849265292649757, "loss": 1.5882, "step": 14202 }, { "epoch": 1.12, "learning_rate": 0.00020848127146129683, "loss": 1.5929, "step": 14203 }, { "epoch": 1.12, "learning_rate": 0.0002084698895990405, "loss": 1.5091, "step": 14204 }, { "epoch": 1.12, "learning_rate": 0.0002084585073398059, "loss": 1.5361, "step": 14205 }, { "epoch": 1.12, "learning_rate": 0.00020844712468367027, "loss": 1.5679, "step": 14206 }, { "epoch": 1.12, "learning_rate": 0.00020843574163071095, "loss": 1.5711, "step": 14207 }, { "epoch": 1.12, "learning_rate": 0.0002084243581810052, "loss": 1.5248, "step": 14208 }, { "epoch": 1.12, "learning_rate": 0.0002084129743346303, "loss": 1.5382, "step": 14209 }, { "epoch": 1.12, "learning_rate": 0.0002084015900916635, "loss": 1.5548, "step": 14210 }, { "epoch": 1.12, "learning_rate": 0.00020839020545218215, "loss": 1.6118, "step": 14211 }, { "epoch": 1.12, "learning_rate": 0.00020837882041626352, "loss": 1.5438, "step": 14212 }, { "epoch": 1.12, "learning_rate": 0.0002083674349839849, "loss": 1.5891, "step": 14213 }, { "epoch": 1.12, "learning_rate": 0.0002083560491554237, "loss": 1.586, "step": 14214 }, { "epoch": 1.12, "learning_rate": 0.00020834466293065705, "loss": 1.5301, "step": 14215 }, { "epoch": 1.12, "learning_rate": 0.00020833327630976237, "loss": 1.5828, "step": 14216 }, { "epoch": 1.12, "learning_rate": 0.00020832188929281688, "loss": 1.5634, "step": 14217 }, { "epoch": 1.12, "learning_rate": 0.000208310501879898, "loss": 1.5976, "step": 14218 }, { "epoch": 1.12, "learning_rate": 0.000208299114071083, "loss": 1.5612, "step": 14219 }, { "epoch": 1.12, "learning_rate": 0.0002082877258664491, "loss": 1.5702, "step": 14220 }, { "epoch": 1.12, "learning_rate": 0.0002082763372660738, "loss": 1.5349, "step": 14221 }, { "epoch": 1.12, "learning_rate": 0.00020826494827003427, "loss": 1.602, "step": 14222 }, { "epoch": 1.12, "learning_rate": 0.00020825355887840792, "loss": 1.5905, "step": 14223 }, { "epoch": 1.12, "learning_rate": 0.00020824216909127205, "loss": 1.5802, "step": 14224 }, { "epoch": 1.12, "learning_rate": 0.000208230778908704, "loss": 1.5204, "step": 14225 }, { "epoch": 1.12, "learning_rate": 0.00020821938833078113, "loss": 1.5833, "step": 14226 }, { "epoch": 1.12, "learning_rate": 0.00020820799735758066, "loss": 1.5975, "step": 14227 }, { "epoch": 1.12, "learning_rate": 0.00020819660598918004, "loss": 1.5918, "step": 14228 }, { "epoch": 1.12, "learning_rate": 0.0002081852142256566, "loss": 1.5732, "step": 14229 }, { "epoch": 1.12, "learning_rate": 0.00020817382206708766, "loss": 1.58, "step": 14230 }, { "epoch": 1.12, "learning_rate": 0.00020816242951355058, "loss": 1.6128, "step": 14231 }, { "epoch": 1.12, "learning_rate": 0.00020815103656512268, "loss": 1.6127, "step": 14232 }, { "epoch": 1.12, "learning_rate": 0.00020813964322188134, "loss": 1.5895, "step": 14233 }, { "epoch": 1.12, "learning_rate": 0.00020812824948390394, "loss": 1.6027, "step": 14234 }, { "epoch": 1.12, "learning_rate": 0.0002081168553512677, "loss": 1.5199, "step": 14235 }, { "epoch": 1.12, "learning_rate": 0.00020810546082405018, "loss": 1.547, "step": 14236 }, { "epoch": 1.12, "learning_rate": 0.00020809406590232863, "loss": 1.5548, "step": 14237 }, { "epoch": 1.12, "learning_rate": 0.00020808267058618045, "loss": 1.5575, "step": 14238 }, { "epoch": 1.12, "learning_rate": 0.00020807127487568295, "loss": 1.5372, "step": 14239 }, { "epoch": 1.12, "learning_rate": 0.00020805987877091354, "loss": 1.5822, "step": 14240 }, { "epoch": 1.12, "learning_rate": 0.0002080484822719496, "loss": 1.5094, "step": 14241 }, { "epoch": 1.12, "learning_rate": 0.0002080370853788685, "loss": 1.6101, "step": 14242 }, { "epoch": 1.12, "learning_rate": 0.00020802568809174764, "loss": 1.5215, "step": 14243 }, { "epoch": 1.12, "learning_rate": 0.00020801429041066434, "loss": 1.5469, "step": 14244 }, { "epoch": 1.12, "learning_rate": 0.00020800289233569608, "loss": 1.5, "step": 14245 }, { "epoch": 1.12, "learning_rate": 0.00020799149386692013, "loss": 1.5535, "step": 14246 }, { "epoch": 1.12, "learning_rate": 0.00020798009500441395, "loss": 1.5396, "step": 14247 }, { "epoch": 1.12, "learning_rate": 0.00020796869574825496, "loss": 1.5777, "step": 14248 }, { "epoch": 1.12, "learning_rate": 0.00020795729609852047, "loss": 1.5296, "step": 14249 }, { "epoch": 1.12, "learning_rate": 0.00020794589605528793, "loss": 1.5724, "step": 14250 }, { "epoch": 1.12, "learning_rate": 0.00020793449561863476, "loss": 1.5531, "step": 14251 }, { "epoch": 1.12, "learning_rate": 0.00020792309478863828, "loss": 1.4807, "step": 14252 }, { "epoch": 1.12, "learning_rate": 0.00020791169356537602, "loss": 1.5591, "step": 14253 }, { "epoch": 1.12, "learning_rate": 0.0002079002919489253, "loss": 1.5227, "step": 14254 }, { "epoch": 1.12, "learning_rate": 0.00020788888993936356, "loss": 1.5413, "step": 14255 }, { "epoch": 1.12, "learning_rate": 0.00020787748753676817, "loss": 1.5395, "step": 14256 }, { "epoch": 1.12, "learning_rate": 0.00020786608474121659, "loss": 1.5476, "step": 14257 }, { "epoch": 1.12, "learning_rate": 0.00020785468155278623, "loss": 1.5761, "step": 14258 }, { "epoch": 1.12, "learning_rate": 0.0002078432779715545, "loss": 1.575, "step": 14259 }, { "epoch": 1.12, "learning_rate": 0.00020783187399759883, "loss": 1.5238, "step": 14260 }, { "epoch": 1.12, "learning_rate": 0.0002078204696309967, "loss": 1.5769, "step": 14261 }, { "epoch": 1.12, "learning_rate": 0.0002078090648718254, "loss": 1.5676, "step": 14262 }, { "epoch": 1.12, "learning_rate": 0.00020779765972016255, "loss": 1.55, "step": 14263 }, { "epoch": 1.12, "learning_rate": 0.00020778625417608543, "loss": 1.5506, "step": 14264 }, { "epoch": 1.12, "learning_rate": 0.00020777484823967154, "loss": 1.549, "step": 14265 }, { "epoch": 1.12, "learning_rate": 0.00020776344191099832, "loss": 1.5385, "step": 14266 }, { "epoch": 1.12, "learning_rate": 0.00020775203519014318, "loss": 1.6073, "step": 14267 }, { "epoch": 1.12, "learning_rate": 0.00020774062807718362, "loss": 1.6087, "step": 14268 }, { "epoch": 1.12, "learning_rate": 0.00020772922057219707, "loss": 1.5628, "step": 14269 }, { "epoch": 1.12, "learning_rate": 0.00020771781267526097, "loss": 1.5644, "step": 14270 }, { "epoch": 1.12, "learning_rate": 0.00020770640438645273, "loss": 1.565, "step": 14271 }, { "epoch": 1.12, "learning_rate": 0.00020769499570584988, "loss": 1.5743, "step": 14272 }, { "epoch": 1.12, "learning_rate": 0.00020768358663352988, "loss": 1.5265, "step": 14273 }, { "epoch": 1.12, "learning_rate": 0.00020767217716957008, "loss": 1.5092, "step": 14274 }, { "epoch": 1.12, "learning_rate": 0.00020766076731404805, "loss": 1.5631, "step": 14275 }, { "epoch": 1.12, "learning_rate": 0.00020764935706704123, "loss": 1.5967, "step": 14276 }, { "epoch": 1.12, "learning_rate": 0.00020763794642862714, "loss": 1.5578, "step": 14277 }, { "epoch": 1.12, "learning_rate": 0.00020762653539888317, "loss": 1.5124, "step": 14278 }, { "epoch": 1.12, "learning_rate": 0.0002076151239778868, "loss": 1.5642, "step": 14279 }, { "epoch": 1.12, "learning_rate": 0.00020760371216571558, "loss": 1.6092, "step": 14280 }, { "epoch": 1.12, "learning_rate": 0.0002075922999624469, "loss": 1.5421, "step": 14281 }, { "epoch": 1.12, "learning_rate": 0.0002075808873681583, "loss": 1.5477, "step": 14282 }, { "epoch": 1.12, "learning_rate": 0.00020756947438292723, "loss": 1.5358, "step": 14283 }, { "epoch": 1.12, "learning_rate": 0.00020755806100683125, "loss": 1.5136, "step": 14284 }, { "epoch": 1.12, "learning_rate": 0.00020754664723994775, "loss": 1.5384, "step": 14285 }, { "epoch": 1.12, "learning_rate": 0.0002075352330823543, "loss": 1.5564, "step": 14286 }, { "epoch": 1.12, "learning_rate": 0.00020752381853412837, "loss": 1.5123, "step": 14287 }, { "epoch": 1.12, "learning_rate": 0.00020751240359534744, "loss": 1.5553, "step": 14288 }, { "epoch": 1.12, "learning_rate": 0.000207500988266089, "loss": 1.5203, "step": 14289 }, { "epoch": 1.12, "learning_rate": 0.00020748957254643061, "loss": 1.5947, "step": 14290 }, { "epoch": 1.12, "learning_rate": 0.00020747815643644977, "loss": 1.5764, "step": 14291 }, { "epoch": 1.12, "learning_rate": 0.00020746673993622395, "loss": 1.5315, "step": 14292 }, { "epoch": 1.12, "learning_rate": 0.00020745532304583067, "loss": 1.4287, "step": 14293 }, { "epoch": 1.12, "learning_rate": 0.00020744390576534746, "loss": 1.565, "step": 14294 }, { "epoch": 1.12, "learning_rate": 0.00020743248809485182, "loss": 1.5466, "step": 14295 }, { "epoch": 1.12, "learning_rate": 0.00020742107003442133, "loss": 1.5157, "step": 14296 }, { "epoch": 1.12, "learning_rate": 0.00020740965158413344, "loss": 1.5826, "step": 14297 }, { "epoch": 1.12, "learning_rate": 0.0002073982327440656, "loss": 1.5141, "step": 14298 }, { "epoch": 1.13, "learning_rate": 0.00020738681351429556, "loss": 1.5434, "step": 14299 }, { "epoch": 1.13, "learning_rate": 0.00020737539389490065, "loss": 1.6036, "step": 14300 }, { "epoch": 1.13, "learning_rate": 0.00020736397388595854, "loss": 1.6009, "step": 14301 }, { "epoch": 1.13, "learning_rate": 0.00020735255348754668, "loss": 1.5404, "step": 14302 }, { "epoch": 1.13, "learning_rate": 0.0002073411326997426, "loss": 1.5675, "step": 14303 }, { "epoch": 1.13, "learning_rate": 0.0002073297115226239, "loss": 1.5867, "step": 14304 }, { "epoch": 1.13, "learning_rate": 0.00020731828995626807, "loss": 1.5289, "step": 14305 }, { "epoch": 1.13, "learning_rate": 0.00020730686800075272, "loss": 1.5168, "step": 14306 }, { "epoch": 1.13, "learning_rate": 0.00020729544565615534, "loss": 1.533, "step": 14307 }, { "epoch": 1.13, "learning_rate": 0.0002072840229225535, "loss": 1.5603, "step": 14308 }, { "epoch": 1.13, "learning_rate": 0.00020727259980002477, "loss": 1.4877, "step": 14309 }, { "epoch": 1.13, "learning_rate": 0.00020726117628864666, "loss": 1.5948, "step": 14310 }, { "epoch": 1.13, "learning_rate": 0.00020724975238849684, "loss": 1.535, "step": 14311 }, { "epoch": 1.13, "learning_rate": 0.0002072383280996527, "loss": 1.5463, "step": 14312 }, { "epoch": 1.13, "learning_rate": 0.00020722690342219193, "loss": 1.5861, "step": 14313 }, { "epoch": 1.13, "learning_rate": 0.00020721547835619207, "loss": 1.5362, "step": 14314 }, { "epoch": 1.13, "learning_rate": 0.0002072040529017307, "loss": 1.5834, "step": 14315 }, { "epoch": 1.13, "learning_rate": 0.00020719262705888537, "loss": 1.5628, "step": 14316 }, { "epoch": 1.13, "learning_rate": 0.00020718120082773367, "loss": 1.5439, "step": 14317 }, { "epoch": 1.13, "learning_rate": 0.00020716977420835316, "loss": 1.5061, "step": 14318 }, { "epoch": 1.13, "learning_rate": 0.00020715834720082146, "loss": 1.4814, "step": 14319 }, { "epoch": 1.13, "learning_rate": 0.00020714691980521608, "loss": 1.5309, "step": 14320 }, { "epoch": 1.13, "learning_rate": 0.0002071354920216147, "loss": 1.5161, "step": 14321 }, { "epoch": 1.13, "learning_rate": 0.0002071240638500948, "loss": 1.5294, "step": 14322 }, { "epoch": 1.13, "learning_rate": 0.00020711263529073407, "loss": 1.5654, "step": 14323 }, { "epoch": 1.13, "learning_rate": 0.00020710120634361007, "loss": 1.5601, "step": 14324 }, { "epoch": 1.13, "learning_rate": 0.00020708977700880035, "loss": 1.556, "step": 14325 }, { "epoch": 1.13, "learning_rate": 0.0002070783472863826, "loss": 1.557, "step": 14326 }, { "epoch": 1.13, "learning_rate": 0.00020706691717643433, "loss": 1.5257, "step": 14327 }, { "epoch": 1.13, "learning_rate": 0.00020705548667903324, "loss": 1.5382, "step": 14328 }, { "epoch": 1.13, "learning_rate": 0.00020704405579425683, "loss": 1.5226, "step": 14329 }, { "epoch": 1.13, "learning_rate": 0.00020703262452218275, "loss": 1.5727, "step": 14330 }, { "epoch": 1.13, "learning_rate": 0.00020702119286288863, "loss": 1.6115, "step": 14331 }, { "epoch": 1.13, "learning_rate": 0.0002070097608164521, "loss": 1.5604, "step": 14332 }, { "epoch": 1.13, "learning_rate": 0.00020699832838295078, "loss": 1.5373, "step": 14333 }, { "epoch": 1.13, "learning_rate": 0.0002069868955624622, "loss": 1.6019, "step": 14334 }, { "epoch": 1.13, "learning_rate": 0.00020697546235506407, "loss": 1.5751, "step": 14335 }, { "epoch": 1.13, "learning_rate": 0.00020696402876083404, "loss": 1.527, "step": 14336 }, { "epoch": 1.13, "learning_rate": 0.00020695259477984963, "loss": 1.5525, "step": 14337 }, { "epoch": 1.13, "learning_rate": 0.00020694116041218853, "loss": 1.5534, "step": 14338 }, { "epoch": 1.13, "learning_rate": 0.00020692972565792842, "loss": 1.5374, "step": 14339 }, { "epoch": 1.13, "learning_rate": 0.00020691829051714688, "loss": 1.5195, "step": 14340 }, { "epoch": 1.13, "learning_rate": 0.00020690685498992155, "loss": 1.566, "step": 14341 }, { "epoch": 1.13, "learning_rate": 0.00020689541907633005, "loss": 1.5075, "step": 14342 }, { "epoch": 1.13, "learning_rate": 0.00020688398277645008, "loss": 1.5677, "step": 14343 }, { "epoch": 1.13, "learning_rate": 0.00020687254609035925, "loss": 1.5852, "step": 14344 }, { "epoch": 1.13, "learning_rate": 0.0002068611090181352, "loss": 1.5905, "step": 14345 }, { "epoch": 1.13, "learning_rate": 0.0002068496715598556, "loss": 1.6193, "step": 14346 }, { "epoch": 1.13, "learning_rate": 0.0002068382337155981, "loss": 1.5077, "step": 14347 }, { "epoch": 1.13, "learning_rate": 0.00020682679548544042, "loss": 1.5871, "step": 14348 }, { "epoch": 1.13, "learning_rate": 0.0002068153568694601, "loss": 1.5442, "step": 14349 }, { "epoch": 1.13, "learning_rate": 0.0002068039178677349, "loss": 1.5439, "step": 14350 }, { "epoch": 1.13, "learning_rate": 0.00020679247848034242, "loss": 1.55, "step": 14351 }, { "epoch": 1.13, "learning_rate": 0.00020678103870736033, "loss": 1.5095, "step": 14352 }, { "epoch": 1.13, "learning_rate": 0.00020676959854886633, "loss": 1.5191, "step": 14353 }, { "epoch": 1.13, "learning_rate": 0.0002067581580049381, "loss": 1.5933, "step": 14354 }, { "epoch": 1.13, "learning_rate": 0.00020674671707565333, "loss": 1.5696, "step": 14355 }, { "epoch": 1.13, "learning_rate": 0.0002067352757610896, "loss": 1.5431, "step": 14356 }, { "epoch": 1.13, "learning_rate": 0.00020672383406132472, "loss": 1.567, "step": 14357 }, { "epoch": 1.13, "learning_rate": 0.00020671239197643626, "loss": 1.5631, "step": 14358 }, { "epoch": 1.13, "learning_rate": 0.00020670094950650194, "loss": 1.6025, "step": 14359 }, { "epoch": 1.13, "learning_rate": 0.00020668950665159953, "loss": 1.528, "step": 14360 }, { "epoch": 1.13, "learning_rate": 0.00020667806341180658, "loss": 1.5426, "step": 14361 }, { "epoch": 1.13, "learning_rate": 0.00020666661978720093, "loss": 1.5392, "step": 14362 }, { "epoch": 1.13, "learning_rate": 0.00020665517577786018, "loss": 1.5593, "step": 14363 }, { "epoch": 1.13, "learning_rate": 0.00020664373138386204, "loss": 1.5992, "step": 14364 }, { "epoch": 1.13, "learning_rate": 0.00020663228660528423, "loss": 1.5317, "step": 14365 }, { "epoch": 1.13, "learning_rate": 0.00020662084144220443, "loss": 1.6087, "step": 14366 }, { "epoch": 1.13, "learning_rate": 0.0002066093958947004, "loss": 1.5361, "step": 14367 }, { "epoch": 1.13, "learning_rate": 0.00020659794996284977, "loss": 1.5642, "step": 14368 }, { "epoch": 1.13, "learning_rate": 0.0002065865036467303, "loss": 1.5178, "step": 14369 }, { "epoch": 1.13, "learning_rate": 0.0002065750569464197, "loss": 1.5648, "step": 14370 }, { "epoch": 1.13, "learning_rate": 0.00020656360986199567, "loss": 1.5135, "step": 14371 }, { "epoch": 1.13, "learning_rate": 0.000206552162393536, "loss": 1.558, "step": 14372 }, { "epoch": 1.13, "learning_rate": 0.0002065407145411183, "loss": 1.5597, "step": 14373 }, { "epoch": 1.13, "learning_rate": 0.00020652926630482035, "loss": 1.5782, "step": 14374 }, { "epoch": 1.13, "learning_rate": 0.00020651781768471993, "loss": 1.4993, "step": 14375 }, { "epoch": 1.13, "learning_rate": 0.00020650636868089467, "loss": 1.5416, "step": 14376 }, { "epoch": 1.13, "learning_rate": 0.00020649491929342236, "loss": 1.5124, "step": 14377 }, { "epoch": 1.13, "learning_rate": 0.00020648346952238073, "loss": 1.5843, "step": 14378 }, { "epoch": 1.13, "learning_rate": 0.0002064720193678475, "loss": 1.5904, "step": 14379 }, { "epoch": 1.13, "learning_rate": 0.00020646056882990042, "loss": 1.5491, "step": 14380 }, { "epoch": 1.13, "learning_rate": 0.00020644911790861727, "loss": 1.5729, "step": 14381 }, { "epoch": 1.13, "learning_rate": 0.00020643766660407575, "loss": 1.6006, "step": 14382 }, { "epoch": 1.13, "learning_rate": 0.00020642621491635357, "loss": 1.5493, "step": 14383 }, { "epoch": 1.13, "learning_rate": 0.00020641476284552861, "loss": 1.5444, "step": 14384 }, { "epoch": 1.13, "learning_rate": 0.00020640331039167845, "loss": 1.5296, "step": 14385 }, { "epoch": 1.13, "learning_rate": 0.00020639185755488103, "loss": 1.599, "step": 14386 }, { "epoch": 1.13, "learning_rate": 0.00020638040433521395, "loss": 1.559, "step": 14387 }, { "epoch": 1.13, "learning_rate": 0.00020636895073275501, "loss": 1.5453, "step": 14388 }, { "epoch": 1.13, "learning_rate": 0.0002063574967475821, "loss": 1.5668, "step": 14389 }, { "epoch": 1.13, "learning_rate": 0.00020634604237977283, "loss": 1.5308, "step": 14390 }, { "epoch": 1.13, "learning_rate": 0.000206334587629405, "loss": 1.5806, "step": 14391 }, { "epoch": 1.13, "learning_rate": 0.00020632313249655646, "loss": 1.5623, "step": 14392 }, { "epoch": 1.13, "learning_rate": 0.0002063116769813049, "loss": 1.5953, "step": 14393 }, { "epoch": 1.13, "learning_rate": 0.00020630022108372817, "loss": 1.5306, "step": 14394 }, { "epoch": 1.13, "learning_rate": 0.00020628876480390396, "loss": 1.5218, "step": 14395 }, { "epoch": 1.13, "learning_rate": 0.00020627730814191014, "loss": 1.498, "step": 14396 }, { "epoch": 1.13, "learning_rate": 0.00020626585109782442, "loss": 1.5399, "step": 14397 }, { "epoch": 1.13, "learning_rate": 0.00020625439367172465, "loss": 1.6219, "step": 14398 }, { "epoch": 1.13, "learning_rate": 0.0002062429358636886, "loss": 1.5434, "step": 14399 }, { "epoch": 1.13, "learning_rate": 0.00020623147767379396, "loss": 1.5971, "step": 14400 }, { "epoch": 1.13, "learning_rate": 0.00020622001910211875, "loss": 1.5177, "step": 14401 }, { "epoch": 1.13, "learning_rate": 0.00020620856014874056, "loss": 1.5602, "step": 14402 }, { "epoch": 1.13, "learning_rate": 0.00020619710081373727, "loss": 1.5386, "step": 14403 }, { "epoch": 1.13, "learning_rate": 0.00020618564109718668, "loss": 1.5777, "step": 14404 }, { "epoch": 1.13, "learning_rate": 0.0002061741809991666, "loss": 1.5636, "step": 14405 }, { "epoch": 1.13, "learning_rate": 0.00020616272051975486, "loss": 1.5046, "step": 14406 }, { "epoch": 1.13, "learning_rate": 0.0002061512596590292, "loss": 1.5948, "step": 14407 }, { "epoch": 1.13, "learning_rate": 0.00020613979841706747, "loss": 1.5409, "step": 14408 }, { "epoch": 1.13, "learning_rate": 0.00020612833679394752, "loss": 1.4702, "step": 14409 }, { "epoch": 1.13, "learning_rate": 0.00020611687478974707, "loss": 1.5121, "step": 14410 }, { "epoch": 1.13, "learning_rate": 0.0002061054124045441, "loss": 1.5672, "step": 14411 }, { "epoch": 1.13, "learning_rate": 0.0002060939496384163, "loss": 1.5222, "step": 14412 }, { "epoch": 1.13, "learning_rate": 0.00020608248649144154, "loss": 1.5755, "step": 14413 }, { "epoch": 1.13, "learning_rate": 0.00020607102296369765, "loss": 1.536, "step": 14414 }, { "epoch": 1.13, "learning_rate": 0.00020605955905526242, "loss": 1.5129, "step": 14415 }, { "epoch": 1.13, "learning_rate": 0.00020604809476621375, "loss": 1.6037, "step": 14416 }, { "epoch": 1.13, "learning_rate": 0.00020603663009662946, "loss": 1.5333, "step": 14417 }, { "epoch": 1.13, "learning_rate": 0.00020602516504658738, "loss": 1.5609, "step": 14418 }, { "epoch": 1.13, "learning_rate": 0.0002060136996161653, "loss": 1.552, "step": 14419 }, { "epoch": 1.13, "learning_rate": 0.00020600223380544112, "loss": 1.5372, "step": 14420 }, { "epoch": 1.13, "learning_rate": 0.00020599076761449272, "loss": 1.531, "step": 14421 }, { "epoch": 1.13, "learning_rate": 0.00020597930104339788, "loss": 1.5693, "step": 14422 }, { "epoch": 1.13, "learning_rate": 0.0002059678340922345, "loss": 1.515, "step": 14423 }, { "epoch": 1.13, "learning_rate": 0.00020595636676108036, "loss": 1.5519, "step": 14424 }, { "epoch": 1.13, "learning_rate": 0.00020594489905001342, "loss": 1.5639, "step": 14425 }, { "epoch": 1.14, "learning_rate": 0.00020593343095911144, "loss": 1.5585, "step": 14426 }, { "epoch": 1.14, "learning_rate": 0.00020592196248845235, "loss": 1.5275, "step": 14427 }, { "epoch": 1.14, "learning_rate": 0.00020591049363811404, "loss": 1.5384, "step": 14428 }, { "epoch": 1.14, "learning_rate": 0.0002058990244081743, "loss": 1.5446, "step": 14429 }, { "epoch": 1.14, "learning_rate": 0.00020588755479871102, "loss": 1.5573, "step": 14430 }, { "epoch": 1.14, "learning_rate": 0.0002058760848098021, "loss": 1.5607, "step": 14431 }, { "epoch": 1.14, "learning_rate": 0.00020586461444152535, "loss": 1.5961, "step": 14432 }, { "epoch": 1.14, "learning_rate": 0.00020585314369395879, "loss": 1.5117, "step": 14433 }, { "epoch": 1.14, "learning_rate": 0.00020584167256718013, "loss": 1.5166, "step": 14434 }, { "epoch": 1.14, "learning_rate": 0.00020583020106126735, "loss": 1.6384, "step": 14435 }, { "epoch": 1.14, "learning_rate": 0.00020581872917629834, "loss": 1.5829, "step": 14436 }, { "epoch": 1.14, "learning_rate": 0.0002058072569123509, "loss": 1.5924, "step": 14437 }, { "epoch": 1.14, "learning_rate": 0.00020579578426950306, "loss": 1.5681, "step": 14438 }, { "epoch": 1.14, "learning_rate": 0.00020578431124783255, "loss": 1.6036, "step": 14439 }, { "epoch": 1.14, "learning_rate": 0.00020577283784741743, "loss": 1.5142, "step": 14440 }, { "epoch": 1.14, "learning_rate": 0.00020576136406833545, "loss": 1.5, "step": 14441 }, { "epoch": 1.14, "learning_rate": 0.00020574988991066466, "loss": 1.5611, "step": 14442 }, { "epoch": 1.14, "learning_rate": 0.00020573841537448284, "loss": 1.5582, "step": 14443 }, { "epoch": 1.14, "learning_rate": 0.00020572694045986793, "loss": 1.5112, "step": 14444 }, { "epoch": 1.14, "learning_rate": 0.00020571546516689787, "loss": 1.5827, "step": 14445 }, { "epoch": 1.14, "learning_rate": 0.00020570398949565054, "loss": 1.5456, "step": 14446 }, { "epoch": 1.14, "learning_rate": 0.00020569251344620384, "loss": 1.5457, "step": 14447 }, { "epoch": 1.14, "learning_rate": 0.0002056810370186357, "loss": 1.5567, "step": 14448 }, { "epoch": 1.14, "learning_rate": 0.00020566956021302407, "loss": 1.5831, "step": 14449 }, { "epoch": 1.14, "learning_rate": 0.00020565808302944687, "loss": 1.5754, "step": 14450 }, { "epoch": 1.14, "learning_rate": 0.00020564660546798196, "loss": 1.5635, "step": 14451 }, { "epoch": 1.14, "learning_rate": 0.00020563512752870734, "loss": 1.5098, "step": 14452 }, { "epoch": 1.14, "learning_rate": 0.0002056236492117009, "loss": 1.5661, "step": 14453 }, { "epoch": 1.14, "learning_rate": 0.00020561217051704055, "loss": 1.5407, "step": 14454 }, { "epoch": 1.14, "learning_rate": 0.00020560069144480425, "loss": 1.5846, "step": 14455 }, { "epoch": 1.14, "learning_rate": 0.00020558921199506994, "loss": 1.5942, "step": 14456 }, { "epoch": 1.14, "learning_rate": 0.0002055777321679156, "loss": 1.5755, "step": 14457 }, { "epoch": 1.14, "learning_rate": 0.00020556625196341909, "loss": 1.5363, "step": 14458 }, { "epoch": 1.14, "learning_rate": 0.00020555477138165844, "loss": 1.539, "step": 14459 }, { "epoch": 1.14, "learning_rate": 0.00020554329042271152, "loss": 1.5369, "step": 14460 }, { "epoch": 1.14, "learning_rate": 0.0002055318090866563, "loss": 1.5228, "step": 14461 }, { "epoch": 1.14, "learning_rate": 0.00020552032737357077, "loss": 1.6003, "step": 14462 }, { "epoch": 1.14, "learning_rate": 0.00020550884528353278, "loss": 1.5493, "step": 14463 }, { "epoch": 1.14, "learning_rate": 0.00020549736281662046, "loss": 1.5293, "step": 14464 }, { "epoch": 1.14, "learning_rate": 0.0002054858799729116, "loss": 1.5711, "step": 14465 }, { "epoch": 1.14, "learning_rate": 0.00020547439675248425, "loss": 1.5592, "step": 14466 }, { "epoch": 1.14, "learning_rate": 0.0002054629131554164, "loss": 1.5545, "step": 14467 }, { "epoch": 1.14, "learning_rate": 0.00020545142918178594, "loss": 1.5931, "step": 14468 }, { "epoch": 1.14, "learning_rate": 0.0002054399448316709, "loss": 1.5425, "step": 14469 }, { "epoch": 1.14, "learning_rate": 0.0002054284601051492, "loss": 1.5858, "step": 14470 }, { "epoch": 1.14, "learning_rate": 0.00020541697500229885, "loss": 1.5406, "step": 14471 }, { "epoch": 1.14, "learning_rate": 0.00020540548952319783, "loss": 1.5691, "step": 14472 }, { "epoch": 1.14, "learning_rate": 0.0002053940036679241, "loss": 1.5976, "step": 14473 }, { "epoch": 1.14, "learning_rate": 0.0002053825174365557, "loss": 1.5159, "step": 14474 }, { "epoch": 1.14, "learning_rate": 0.0002053710308291705, "loss": 1.5417, "step": 14475 }, { "epoch": 1.14, "learning_rate": 0.0002053595438458466, "loss": 1.5338, "step": 14476 }, { "epoch": 1.14, "learning_rate": 0.00020534805648666195, "loss": 1.5803, "step": 14477 }, { "epoch": 1.14, "learning_rate": 0.00020533656875169453, "loss": 1.5544, "step": 14478 }, { "epoch": 1.14, "learning_rate": 0.00020532508064102233, "loss": 1.5379, "step": 14479 }, { "epoch": 1.14, "learning_rate": 0.00020531359215472336, "loss": 1.6044, "step": 14480 }, { "epoch": 1.14, "learning_rate": 0.0002053021032928757, "loss": 1.5323, "step": 14481 }, { "epoch": 1.14, "learning_rate": 0.0002052906140555572, "loss": 1.5943, "step": 14482 }, { "epoch": 1.14, "learning_rate": 0.00020527912444284595, "loss": 1.5412, "step": 14483 }, { "epoch": 1.14, "learning_rate": 0.00020526763445481998, "loss": 1.5492, "step": 14484 }, { "epoch": 1.14, "learning_rate": 0.00020525614409155722, "loss": 1.5539, "step": 14485 }, { "epoch": 1.14, "learning_rate": 0.00020524465335313577, "loss": 1.5179, "step": 14486 }, { "epoch": 1.14, "learning_rate": 0.0002052331622396336, "loss": 1.5376, "step": 14487 }, { "epoch": 1.14, "learning_rate": 0.00020522167075112874, "loss": 1.6135, "step": 14488 }, { "epoch": 1.14, "learning_rate": 0.00020521017888769922, "loss": 1.5174, "step": 14489 }, { "epoch": 1.14, "learning_rate": 0.00020519868664942308, "loss": 1.5658, "step": 14490 }, { "epoch": 1.14, "learning_rate": 0.00020518719403637829, "loss": 1.5562, "step": 14491 }, { "epoch": 1.14, "learning_rate": 0.00020517570104864287, "loss": 1.5651, "step": 14492 }, { "epoch": 1.14, "learning_rate": 0.00020516420768629492, "loss": 1.5831, "step": 14493 }, { "epoch": 1.14, "learning_rate": 0.00020515271394941248, "loss": 1.5491, "step": 14494 }, { "epoch": 1.14, "learning_rate": 0.00020514121983807347, "loss": 1.5692, "step": 14495 }, { "epoch": 1.14, "learning_rate": 0.00020512972535235608, "loss": 1.5642, "step": 14496 }, { "epoch": 1.14, "learning_rate": 0.00020511823049233825, "loss": 1.5595, "step": 14497 }, { "epoch": 1.14, "learning_rate": 0.00020510673525809804, "loss": 1.5232, "step": 14498 }, { "epoch": 1.14, "learning_rate": 0.0002050952396497135, "loss": 1.5176, "step": 14499 }, { "epoch": 1.14, "learning_rate": 0.0002050837436672627, "loss": 1.5333, "step": 14500 }, { "epoch": 1.14, "learning_rate": 0.00020507224731082372, "loss": 1.5772, "step": 14501 }, { "epoch": 1.14, "learning_rate": 0.00020506075058047447, "loss": 1.5367, "step": 14502 }, { "epoch": 1.14, "learning_rate": 0.00020504925347629319, "loss": 1.5238, "step": 14503 }, { "epoch": 1.14, "learning_rate": 0.00020503775599835784, "loss": 1.5069, "step": 14504 }, { "epoch": 1.14, "learning_rate": 0.0002050262581467465, "loss": 1.53, "step": 14505 }, { "epoch": 1.14, "learning_rate": 0.00020501475992153724, "loss": 1.5734, "step": 14506 }, { "epoch": 1.14, "learning_rate": 0.00020500326132280814, "loss": 1.5378, "step": 14507 }, { "epoch": 1.14, "learning_rate": 0.00020499176235063722, "loss": 1.5709, "step": 14508 }, { "epoch": 1.14, "learning_rate": 0.0002049802630051026, "loss": 1.5305, "step": 14509 }, { "epoch": 1.14, "learning_rate": 0.00020496876328628228, "loss": 1.5341, "step": 14510 }, { "epoch": 1.14, "learning_rate": 0.00020495726319425442, "loss": 1.6043, "step": 14511 }, { "epoch": 1.14, "learning_rate": 0.00020494576272909708, "loss": 1.5114, "step": 14512 }, { "epoch": 1.14, "learning_rate": 0.00020493426189088833, "loss": 1.583, "step": 14513 }, { "epoch": 1.14, "learning_rate": 0.00020492276067970628, "loss": 1.6263, "step": 14514 }, { "epoch": 1.14, "learning_rate": 0.00020491125909562896, "loss": 1.5463, "step": 14515 }, { "epoch": 1.14, "learning_rate": 0.0002048997571387345, "loss": 1.609, "step": 14516 }, { "epoch": 1.14, "learning_rate": 0.000204888254809101, "loss": 1.5287, "step": 14517 }, { "epoch": 1.14, "learning_rate": 0.00020487675210680652, "loss": 1.4799, "step": 14518 }, { "epoch": 1.14, "learning_rate": 0.00020486524903192918, "loss": 1.5688, "step": 14519 }, { "epoch": 1.14, "learning_rate": 0.0002048537455845471, "loss": 1.5571, "step": 14520 }, { "epoch": 1.14, "learning_rate": 0.00020484224176473836, "loss": 1.5463, "step": 14521 }, { "epoch": 1.14, "learning_rate": 0.000204830737572581, "loss": 1.5329, "step": 14522 }, { "epoch": 1.14, "learning_rate": 0.00020481923300815326, "loss": 1.5437, "step": 14523 }, { "epoch": 1.14, "learning_rate": 0.00020480772807153315, "loss": 1.595, "step": 14524 }, { "epoch": 1.14, "learning_rate": 0.00020479622276279886, "loss": 1.5827, "step": 14525 }, { "epoch": 1.14, "learning_rate": 0.00020478471708202837, "loss": 1.5723, "step": 14526 }, { "epoch": 1.14, "learning_rate": 0.0002047732110292999, "loss": 1.5361, "step": 14527 }, { "epoch": 1.14, "learning_rate": 0.00020476170460469162, "loss": 1.5595, "step": 14528 }, { "epoch": 1.14, "learning_rate": 0.0002047501978082815, "loss": 1.5428, "step": 14529 }, { "epoch": 1.14, "learning_rate": 0.00020473869064014784, "loss": 1.5962, "step": 14530 }, { "epoch": 1.14, "learning_rate": 0.00020472718310036864, "loss": 1.568, "step": 14531 }, { "epoch": 1.14, "learning_rate": 0.00020471567518902205, "loss": 1.5679, "step": 14532 }, { "epoch": 1.14, "learning_rate": 0.00020470416690618624, "loss": 1.5544, "step": 14533 }, { "epoch": 1.14, "learning_rate": 0.00020469265825193926, "loss": 1.5487, "step": 14534 }, { "epoch": 1.14, "learning_rate": 0.0002046811492263594, "loss": 1.5238, "step": 14535 }, { "epoch": 1.14, "learning_rate": 0.0002046696398295247, "loss": 1.5682, "step": 14536 }, { "epoch": 1.14, "learning_rate": 0.0002046581300615133, "loss": 1.565, "step": 14537 }, { "epoch": 1.14, "learning_rate": 0.00020464661992240335, "loss": 1.5669, "step": 14538 }, { "epoch": 1.14, "learning_rate": 0.000204635109412273, "loss": 1.5666, "step": 14539 }, { "epoch": 1.14, "learning_rate": 0.00020462359853120045, "loss": 1.5509, "step": 14540 }, { "epoch": 1.14, "learning_rate": 0.00020461208727926377, "loss": 1.5784, "step": 14541 }, { "epoch": 1.14, "learning_rate": 0.00020460057565654114, "loss": 1.5457, "step": 14542 }, { "epoch": 1.14, "learning_rate": 0.00020458906366311073, "loss": 1.5907, "step": 14543 }, { "epoch": 1.14, "learning_rate": 0.00020457755129905077, "loss": 1.5853, "step": 14544 }, { "epoch": 1.14, "learning_rate": 0.00020456603856443931, "loss": 1.547, "step": 14545 }, { "epoch": 1.14, "learning_rate": 0.00020455452545935457, "loss": 1.5661, "step": 14546 }, { "epoch": 1.14, "learning_rate": 0.0002045430119838747, "loss": 1.5135, "step": 14547 }, { "epoch": 1.14, "learning_rate": 0.0002045314981380779, "loss": 1.5719, "step": 14548 }, { "epoch": 1.14, "learning_rate": 0.00020451998392204227, "loss": 1.5167, "step": 14549 }, { "epoch": 1.14, "learning_rate": 0.0002045084693358461, "loss": 1.5946, "step": 14550 }, { "epoch": 1.14, "learning_rate": 0.00020449695437956743, "loss": 1.5479, "step": 14551 }, { "epoch": 1.14, "learning_rate": 0.00020448543905328458, "loss": 1.5284, "step": 14552 }, { "epoch": 1.15, "learning_rate": 0.00020447392335707563, "loss": 1.5441, "step": 14553 }, { "epoch": 1.15, "learning_rate": 0.00020446240729101885, "loss": 1.5141, "step": 14554 }, { "epoch": 1.15, "learning_rate": 0.00020445089085519233, "loss": 1.497, "step": 14555 }, { "epoch": 1.15, "learning_rate": 0.00020443937404967426, "loss": 1.5628, "step": 14556 }, { "epoch": 1.15, "learning_rate": 0.00020442785687454295, "loss": 1.552, "step": 14557 }, { "epoch": 1.15, "learning_rate": 0.00020441633932987652, "loss": 1.499, "step": 14558 }, { "epoch": 1.15, "learning_rate": 0.0002044048214157532, "loss": 1.5853, "step": 14559 }, { "epoch": 1.15, "learning_rate": 0.00020439330313225113, "loss": 1.5032, "step": 14560 }, { "epoch": 1.15, "learning_rate": 0.00020438178447944856, "loss": 1.5757, "step": 14561 }, { "epoch": 1.15, "learning_rate": 0.0002043702654574237, "loss": 1.559, "step": 14562 }, { "epoch": 1.15, "learning_rate": 0.00020435874606625473, "loss": 1.5359, "step": 14563 }, { "epoch": 1.15, "learning_rate": 0.0002043472263060199, "loss": 1.4927, "step": 14564 }, { "epoch": 1.15, "learning_rate": 0.0002043357061767973, "loss": 1.5515, "step": 14565 }, { "epoch": 1.15, "learning_rate": 0.00020432418567866532, "loss": 1.5246, "step": 14566 }, { "epoch": 1.15, "learning_rate": 0.00020431266481170209, "loss": 1.5239, "step": 14567 }, { "epoch": 1.15, "learning_rate": 0.0002043011435759858, "loss": 1.5756, "step": 14568 }, { "epoch": 1.15, "learning_rate": 0.00020428962197159475, "loss": 1.5746, "step": 14569 }, { "epoch": 1.15, "learning_rate": 0.00020427809999860712, "loss": 1.5295, "step": 14570 }, { "epoch": 1.15, "learning_rate": 0.00020426657765710112, "loss": 1.5099, "step": 14571 }, { "epoch": 1.15, "learning_rate": 0.00020425505494715506, "loss": 1.5485, "step": 14572 }, { "epoch": 1.15, "learning_rate": 0.00020424353186884706, "loss": 1.5548, "step": 14573 }, { "epoch": 1.15, "learning_rate": 0.00020423200842225545, "loss": 1.56, "step": 14574 }, { "epoch": 1.15, "learning_rate": 0.0002042204846074584, "loss": 1.5289, "step": 14575 }, { "epoch": 1.15, "learning_rate": 0.00020420896042453422, "loss": 1.5634, "step": 14576 }, { "epoch": 1.15, "learning_rate": 0.00020419743587356108, "loss": 1.4872, "step": 14577 }, { "epoch": 1.15, "learning_rate": 0.00020418591095461725, "loss": 1.5121, "step": 14578 }, { "epoch": 1.15, "learning_rate": 0.00020417438566778102, "loss": 1.5648, "step": 14579 }, { "epoch": 1.15, "learning_rate": 0.0002041628600131306, "loss": 1.5436, "step": 14580 }, { "epoch": 1.15, "learning_rate": 0.0002041513339907442, "loss": 1.526, "step": 14581 }, { "epoch": 1.15, "learning_rate": 0.0002041398076007002, "loss": 1.4753, "step": 14582 }, { "epoch": 1.15, "learning_rate": 0.00020412828084307672, "loss": 1.5619, "step": 14583 }, { "epoch": 1.15, "learning_rate": 0.00020411675371795215, "loss": 1.5424, "step": 14584 }, { "epoch": 1.15, "learning_rate": 0.00020410522622540462, "loss": 1.5148, "step": 14585 }, { "epoch": 1.15, "learning_rate": 0.00020409369836551253, "loss": 1.538, "step": 14586 }, { "epoch": 1.15, "learning_rate": 0.00020408217013835405, "loss": 1.5477, "step": 14587 }, { "epoch": 1.15, "learning_rate": 0.00020407064154400744, "loss": 1.5603, "step": 14588 }, { "epoch": 1.15, "learning_rate": 0.00020405911258255103, "loss": 1.5654, "step": 14589 }, { "epoch": 1.15, "learning_rate": 0.00020404758325406308, "loss": 1.5328, "step": 14590 }, { "epoch": 1.15, "learning_rate": 0.00020403605355862192, "loss": 1.5792, "step": 14591 }, { "epoch": 1.15, "learning_rate": 0.00020402452349630574, "loss": 1.5513, "step": 14592 }, { "epoch": 1.15, "learning_rate": 0.00020401299306719285, "loss": 1.5482, "step": 14593 }, { "epoch": 1.15, "learning_rate": 0.00020400146227136153, "loss": 1.5297, "step": 14594 }, { "epoch": 1.15, "learning_rate": 0.0002039899311088901, "loss": 1.4981, "step": 14595 }, { "epoch": 1.15, "learning_rate": 0.00020397839957985686, "loss": 1.5866, "step": 14596 }, { "epoch": 1.15, "learning_rate": 0.00020396686768434, "loss": 1.534, "step": 14597 }, { "epoch": 1.15, "learning_rate": 0.00020395533542241794, "loss": 1.4891, "step": 14598 }, { "epoch": 1.15, "learning_rate": 0.00020394380279416892, "loss": 1.5765, "step": 14599 }, { "epoch": 1.15, "learning_rate": 0.00020393226979967125, "loss": 1.5165, "step": 14600 }, { "epoch": 1.15, "learning_rate": 0.00020392073643900324, "loss": 1.5136, "step": 14601 }, { "epoch": 1.15, "learning_rate": 0.00020390920271224315, "loss": 1.5723, "step": 14602 }, { "epoch": 1.15, "learning_rate": 0.0002038976686194694, "loss": 1.5471, "step": 14603 }, { "epoch": 1.15, "learning_rate": 0.00020388613416076016, "loss": 1.5292, "step": 14604 }, { "epoch": 1.15, "learning_rate": 0.0002038745993361938, "loss": 1.5924, "step": 14605 }, { "epoch": 1.15, "learning_rate": 0.00020386306414584864, "loss": 1.5856, "step": 14606 }, { "epoch": 1.15, "learning_rate": 0.00020385152858980302, "loss": 1.5533, "step": 14607 }, { "epoch": 1.15, "learning_rate": 0.00020383999266813526, "loss": 1.5577, "step": 14608 }, { "epoch": 1.15, "learning_rate": 0.0002038284563809236, "loss": 1.5818, "step": 14609 }, { "epoch": 1.15, "learning_rate": 0.0002038169197282465, "loss": 1.5683, "step": 14610 }, { "epoch": 1.15, "learning_rate": 0.00020380538271018217, "loss": 1.4751, "step": 14611 }, { "epoch": 1.15, "learning_rate": 0.00020379384532680895, "loss": 1.5719, "step": 14612 }, { "epoch": 1.15, "learning_rate": 0.00020378230757820526, "loss": 1.5951, "step": 14613 }, { "epoch": 1.15, "learning_rate": 0.0002037707694644494, "loss": 1.5342, "step": 14614 }, { "epoch": 1.15, "learning_rate": 0.00020375923098561965, "loss": 1.5825, "step": 14615 }, { "epoch": 1.15, "learning_rate": 0.00020374769214179437, "loss": 1.5924, "step": 14616 }, { "epoch": 1.15, "learning_rate": 0.00020373615293305195, "loss": 1.5866, "step": 14617 }, { "epoch": 1.15, "learning_rate": 0.00020372461335947073, "loss": 1.5842, "step": 14618 }, { "epoch": 1.15, "learning_rate": 0.000203713073421129, "loss": 1.5601, "step": 14619 }, { "epoch": 1.15, "learning_rate": 0.00020370153311810514, "loss": 1.5212, "step": 14620 }, { "epoch": 1.15, "learning_rate": 0.0002036899924504775, "loss": 1.5721, "step": 14621 }, { "epoch": 1.15, "learning_rate": 0.00020367845141832448, "loss": 1.5391, "step": 14622 }, { "epoch": 1.15, "learning_rate": 0.00020366691002172434, "loss": 1.5562, "step": 14623 }, { "epoch": 1.15, "learning_rate": 0.00020365536826075554, "loss": 1.5317, "step": 14624 }, { "epoch": 1.15, "learning_rate": 0.00020364382613549637, "loss": 1.5385, "step": 14625 }, { "epoch": 1.15, "learning_rate": 0.00020363228364602526, "loss": 1.5932, "step": 14626 }, { "epoch": 1.15, "learning_rate": 0.00020362074079242047, "loss": 1.5171, "step": 14627 }, { "epoch": 1.15, "learning_rate": 0.00020360919757476047, "loss": 1.482, "step": 14628 }, { "epoch": 1.15, "learning_rate": 0.00020359765399312365, "loss": 1.5211, "step": 14629 }, { "epoch": 1.15, "learning_rate": 0.00020358611004758832, "loss": 1.5565, "step": 14630 }, { "epoch": 1.15, "learning_rate": 0.00020357456573823286, "loss": 1.5008, "step": 14631 }, { "epoch": 1.15, "learning_rate": 0.00020356302106513567, "loss": 1.5224, "step": 14632 }, { "epoch": 1.15, "learning_rate": 0.00020355147602837514, "loss": 1.5813, "step": 14633 }, { "epoch": 1.15, "learning_rate": 0.0002035399306280296, "loss": 1.5441, "step": 14634 }, { "epoch": 1.15, "learning_rate": 0.00020352838486417752, "loss": 1.5483, "step": 14635 }, { "epoch": 1.15, "learning_rate": 0.0002035168387368972, "loss": 1.574, "step": 14636 }, { "epoch": 1.15, "learning_rate": 0.0002035052922462671, "loss": 1.5228, "step": 14637 }, { "epoch": 1.15, "learning_rate": 0.0002034937453923656, "loss": 1.4952, "step": 14638 }, { "epoch": 1.15, "learning_rate": 0.00020348219817527106, "loss": 1.5558, "step": 14639 }, { "epoch": 1.15, "learning_rate": 0.00020347065059506198, "loss": 1.5652, "step": 14640 }, { "epoch": 1.15, "learning_rate": 0.00020345910265181662, "loss": 1.5505, "step": 14641 }, { "epoch": 1.15, "learning_rate": 0.00020344755434561349, "loss": 1.6149, "step": 14642 }, { "epoch": 1.15, "learning_rate": 0.00020343600567653095, "loss": 1.5319, "step": 14643 }, { "epoch": 1.15, "learning_rate": 0.00020342445664464742, "loss": 1.529, "step": 14644 }, { "epoch": 1.15, "learning_rate": 0.00020341290725004127, "loss": 1.6191, "step": 14645 }, { "epoch": 1.15, "learning_rate": 0.000203401357492791, "loss": 1.5582, "step": 14646 }, { "epoch": 1.15, "learning_rate": 0.000203389807372975, "loss": 1.5517, "step": 14647 }, { "epoch": 1.15, "learning_rate": 0.00020337825689067162, "loss": 1.5506, "step": 14648 }, { "epoch": 1.15, "learning_rate": 0.0002033667060459594, "loss": 1.5928, "step": 14649 }, { "epoch": 1.15, "learning_rate": 0.00020335515483891662, "loss": 1.474, "step": 14650 }, { "epoch": 1.15, "learning_rate": 0.00020334360326962185, "loss": 1.5459, "step": 14651 }, { "epoch": 1.15, "learning_rate": 0.00020333205133815337, "loss": 1.5455, "step": 14652 }, { "epoch": 1.15, "learning_rate": 0.00020332049904458975, "loss": 1.5064, "step": 14653 }, { "epoch": 1.15, "learning_rate": 0.0002033089463890094, "loss": 1.5072, "step": 14654 }, { "epoch": 1.15, "learning_rate": 0.00020329739337149067, "loss": 1.5704, "step": 14655 }, { "epoch": 1.15, "learning_rate": 0.00020328583999211204, "loss": 1.5651, "step": 14656 }, { "epoch": 1.15, "learning_rate": 0.000203274286250952, "loss": 1.5288, "step": 14657 }, { "epoch": 1.15, "learning_rate": 0.00020326273214808893, "loss": 1.6144, "step": 14658 }, { "epoch": 1.15, "learning_rate": 0.00020325117768360136, "loss": 1.5691, "step": 14659 }, { "epoch": 1.15, "learning_rate": 0.00020323962285756758, "loss": 1.5603, "step": 14660 }, { "epoch": 1.15, "learning_rate": 0.00020322806767006618, "loss": 1.5502, "step": 14661 }, { "epoch": 1.15, "learning_rate": 0.00020321651212117559, "loss": 1.5687, "step": 14662 }, { "epoch": 1.15, "learning_rate": 0.00020320495621097424, "loss": 1.4882, "step": 14663 }, { "epoch": 1.15, "learning_rate": 0.00020319339993954064, "loss": 1.5422, "step": 14664 }, { "epoch": 1.15, "learning_rate": 0.00020318184330695314, "loss": 1.5496, "step": 14665 }, { "epoch": 1.15, "learning_rate": 0.0002031702863132903, "loss": 1.5871, "step": 14666 }, { "epoch": 1.15, "learning_rate": 0.00020315872895863057, "loss": 1.5374, "step": 14667 }, { "epoch": 1.15, "learning_rate": 0.00020314717124305238, "loss": 1.5916, "step": 14668 }, { "epoch": 1.15, "learning_rate": 0.00020313561316663426, "loss": 1.5374, "step": 14669 }, { "epoch": 1.15, "learning_rate": 0.0002031240547294546, "loss": 1.5299, "step": 14670 }, { "epoch": 1.15, "learning_rate": 0.000203112495931592, "loss": 1.5709, "step": 14671 }, { "epoch": 1.15, "learning_rate": 0.00020310093677312481, "loss": 1.5724, "step": 14672 }, { "epoch": 1.15, "learning_rate": 0.00020308937725413155, "loss": 1.5585, "step": 14673 }, { "epoch": 1.15, "learning_rate": 0.00020307781737469077, "loss": 1.5137, "step": 14674 }, { "epoch": 1.15, "learning_rate": 0.00020306625713488084, "loss": 1.6098, "step": 14675 }, { "epoch": 1.15, "learning_rate": 0.00020305469653478036, "loss": 1.582, "step": 14676 }, { "epoch": 1.15, "learning_rate": 0.00020304313557446775, "loss": 1.5919, "step": 14677 }, { "epoch": 1.15, "learning_rate": 0.0002030315742540215, "loss": 1.5556, "step": 14678 }, { "epoch": 1.15, "learning_rate": 0.00020302001257352015, "loss": 1.6076, "step": 14679 }, { "epoch": 1.16, "learning_rate": 0.00020300845053304215, "loss": 1.5628, "step": 14680 }, { "epoch": 1.16, "learning_rate": 0.0002029968881326661, "loss": 1.5804, "step": 14681 }, { "epoch": 1.16, "learning_rate": 0.00020298532537247035, "loss": 1.5316, "step": 14682 }, { "epoch": 1.16, "learning_rate": 0.00020297376225253345, "loss": 1.5722, "step": 14683 }, { "epoch": 1.16, "learning_rate": 0.000202962198772934, "loss": 1.6335, "step": 14684 }, { "epoch": 1.16, "learning_rate": 0.00020295063493375043, "loss": 1.5216, "step": 14685 }, { "epoch": 1.16, "learning_rate": 0.00020293907073506127, "loss": 1.6007, "step": 14686 }, { "epoch": 1.16, "learning_rate": 0.00020292750617694502, "loss": 1.5381, "step": 14687 }, { "epoch": 1.16, "learning_rate": 0.00020291594125948026, "loss": 1.5442, "step": 14688 }, { "epoch": 1.16, "learning_rate": 0.0002029043759827454, "loss": 1.5463, "step": 14689 }, { "epoch": 1.16, "learning_rate": 0.0002028928103468191, "loss": 1.5181, "step": 14690 }, { "epoch": 1.16, "learning_rate": 0.0002028812443517797, "loss": 1.5405, "step": 14691 }, { "epoch": 1.16, "learning_rate": 0.00020286967799770588, "loss": 1.5657, "step": 14692 }, { "epoch": 1.16, "learning_rate": 0.00020285811128467615, "loss": 1.5463, "step": 14693 }, { "epoch": 1.16, "learning_rate": 0.00020284654421276897, "loss": 1.5997, "step": 14694 }, { "epoch": 1.16, "learning_rate": 0.00020283497678206297, "loss": 1.5269, "step": 14695 }, { "epoch": 1.16, "learning_rate": 0.0002028234089926366, "loss": 1.5346, "step": 14696 }, { "epoch": 1.16, "learning_rate": 0.00020281184084456843, "loss": 1.5217, "step": 14697 }, { "epoch": 1.16, "learning_rate": 0.00020280027233793706, "loss": 1.5805, "step": 14698 }, { "epoch": 1.16, "learning_rate": 0.00020278870347282087, "loss": 1.5264, "step": 14699 }, { "epoch": 1.16, "learning_rate": 0.00020277713424929862, "loss": 1.5386, "step": 14700 }, { "epoch": 1.16, "learning_rate": 0.0002027655646674487, "loss": 1.6007, "step": 14701 }, { "epoch": 1.16, "learning_rate": 0.0002027539947273497, "loss": 1.5726, "step": 14702 }, { "epoch": 1.16, "learning_rate": 0.00020274242442908026, "loss": 1.4688, "step": 14703 }, { "epoch": 1.16, "learning_rate": 0.0002027308537727188, "loss": 1.5376, "step": 14704 }, { "epoch": 1.16, "learning_rate": 0.00020271928275834397, "loss": 1.5483, "step": 14705 }, { "epoch": 1.16, "learning_rate": 0.0002027077113860343, "loss": 1.5083, "step": 14706 }, { "epoch": 1.16, "learning_rate": 0.00020269613965586832, "loss": 1.5353, "step": 14707 }, { "epoch": 1.16, "learning_rate": 0.00020268456756792466, "loss": 1.5598, "step": 14708 }, { "epoch": 1.16, "learning_rate": 0.00020267299512228185, "loss": 1.5665, "step": 14709 }, { "epoch": 1.16, "learning_rate": 0.00020266142231901852, "loss": 1.5285, "step": 14710 }, { "epoch": 1.16, "learning_rate": 0.00020264984915821312, "loss": 1.5768, "step": 14711 }, { "epoch": 1.16, "learning_rate": 0.00020263827563994435, "loss": 1.5236, "step": 14712 }, { "epoch": 1.16, "learning_rate": 0.00020262670176429074, "loss": 1.5497, "step": 14713 }, { "epoch": 1.16, "learning_rate": 0.0002026151275313308, "loss": 1.5252, "step": 14714 }, { "epoch": 1.16, "learning_rate": 0.00020260355294114324, "loss": 1.5874, "step": 14715 }, { "epoch": 1.16, "learning_rate": 0.00020259197799380656, "loss": 1.5845, "step": 14716 }, { "epoch": 1.16, "learning_rate": 0.0002025804026893994, "loss": 1.4976, "step": 14717 }, { "epoch": 1.16, "learning_rate": 0.00020256882702800028, "loss": 1.5212, "step": 14718 }, { "epoch": 1.16, "learning_rate": 0.00020255725100968788, "loss": 1.5178, "step": 14719 }, { "epoch": 1.16, "learning_rate": 0.00020254567463454072, "loss": 1.5556, "step": 14720 }, { "epoch": 1.16, "learning_rate": 0.00020253409790263745, "loss": 1.5565, "step": 14721 }, { "epoch": 1.16, "learning_rate": 0.00020252252081405663, "loss": 1.6056, "step": 14722 }, { "epoch": 1.16, "learning_rate": 0.00020251094336887684, "loss": 1.5879, "step": 14723 }, { "epoch": 1.16, "learning_rate": 0.00020249936556717676, "loss": 1.5907, "step": 14724 }, { "epoch": 1.16, "learning_rate": 0.00020248778740903498, "loss": 1.516, "step": 14725 }, { "epoch": 1.16, "learning_rate": 0.00020247620889453006, "loss": 1.5659, "step": 14726 }, { "epoch": 1.16, "learning_rate": 0.00020246463002374066, "loss": 1.5869, "step": 14727 }, { "epoch": 1.16, "learning_rate": 0.00020245305079674537, "loss": 1.5381, "step": 14728 }, { "epoch": 1.16, "learning_rate": 0.0002024414712136228, "loss": 1.5659, "step": 14729 }, { "epoch": 1.16, "learning_rate": 0.00020242989127445158, "loss": 1.5798, "step": 14730 }, { "epoch": 1.16, "learning_rate": 0.00020241831097931028, "loss": 1.5154, "step": 14731 }, { "epoch": 1.16, "learning_rate": 0.0002024067303282777, "loss": 1.5378, "step": 14732 }, { "epoch": 1.16, "learning_rate": 0.00020239514932143227, "loss": 1.5464, "step": 14733 }, { "epoch": 1.16, "learning_rate": 0.0002023835679588527, "loss": 1.567, "step": 14734 }, { "epoch": 1.16, "learning_rate": 0.0002023719862406176, "loss": 1.5498, "step": 14735 }, { "epoch": 1.16, "learning_rate": 0.0002023604041668056, "loss": 1.5794, "step": 14736 }, { "epoch": 1.16, "learning_rate": 0.00020234882173749539, "loss": 1.5393, "step": 14737 }, { "epoch": 1.16, "learning_rate": 0.0002023372389527655, "loss": 1.5395, "step": 14738 }, { "epoch": 1.16, "learning_rate": 0.00020232565581269473, "loss": 1.5525, "step": 14739 }, { "epoch": 1.16, "learning_rate": 0.0002023140723173616, "loss": 1.5826, "step": 14740 }, { "epoch": 1.16, "learning_rate": 0.00020230248846684473, "loss": 1.5497, "step": 14741 }, { "epoch": 1.16, "learning_rate": 0.0002022909042612229, "loss": 1.5407, "step": 14742 }, { "epoch": 1.16, "learning_rate": 0.00020227931970057467, "loss": 1.5309, "step": 14743 }, { "epoch": 1.16, "learning_rate": 0.00020226773478497872, "loss": 1.5075, "step": 14744 }, { "epoch": 1.16, "learning_rate": 0.00020225614951451367, "loss": 1.5777, "step": 14745 }, { "epoch": 1.16, "learning_rate": 0.0002022445638892582, "loss": 1.5025, "step": 14746 }, { "epoch": 1.16, "learning_rate": 0.00020223297790929095, "loss": 1.5504, "step": 14747 }, { "epoch": 1.16, "learning_rate": 0.00020222139157469063, "loss": 1.5517, "step": 14748 }, { "epoch": 1.16, "learning_rate": 0.00020220980488553592, "loss": 1.581, "step": 14749 }, { "epoch": 1.16, "learning_rate": 0.0002021982178419054, "loss": 1.5754, "step": 14750 }, { "epoch": 1.16, "learning_rate": 0.00020218663044387777, "loss": 1.5564, "step": 14751 }, { "epoch": 1.16, "learning_rate": 0.00020217504269153178, "loss": 1.5642, "step": 14752 }, { "epoch": 1.16, "learning_rate": 0.00020216345458494602, "loss": 1.5638, "step": 14753 }, { "epoch": 1.16, "learning_rate": 0.00020215186612419913, "loss": 1.5371, "step": 14754 }, { "epoch": 1.16, "learning_rate": 0.0002021402773093699, "loss": 1.527, "step": 14755 }, { "epoch": 1.16, "learning_rate": 0.00020212868814053697, "loss": 1.6033, "step": 14756 }, { "epoch": 1.16, "learning_rate": 0.00020211709861777899, "loss": 1.5139, "step": 14757 }, { "epoch": 1.16, "learning_rate": 0.00020210550874117465, "loss": 1.5785, "step": 14758 }, { "epoch": 1.16, "learning_rate": 0.00020209391851080274, "loss": 1.5443, "step": 14759 }, { "epoch": 1.16, "learning_rate": 0.00020208232792674183, "loss": 1.5456, "step": 14760 }, { "epoch": 1.16, "learning_rate": 0.00020207073698907065, "loss": 1.5755, "step": 14761 }, { "epoch": 1.16, "learning_rate": 0.00020205914569786787, "loss": 1.5339, "step": 14762 }, { "epoch": 1.16, "learning_rate": 0.00020204755405321226, "loss": 1.5351, "step": 14763 }, { "epoch": 1.16, "learning_rate": 0.00020203596205518247, "loss": 1.5919, "step": 14764 }, { "epoch": 1.16, "learning_rate": 0.0002020243697038572, "loss": 1.5963, "step": 14765 }, { "epoch": 1.16, "learning_rate": 0.00020201277699931518, "loss": 1.536, "step": 14766 }, { "epoch": 1.16, "learning_rate": 0.0002020011839416351, "loss": 1.5433, "step": 14767 }, { "epoch": 1.16, "learning_rate": 0.0002019895905308957, "loss": 1.5868, "step": 14768 }, { "epoch": 1.16, "learning_rate": 0.00020197799676717566, "loss": 1.5595, "step": 14769 }, { "epoch": 1.16, "learning_rate": 0.00020196640265055367, "loss": 1.5617, "step": 14770 }, { "epoch": 1.16, "learning_rate": 0.00020195480818110853, "loss": 1.5395, "step": 14771 }, { "epoch": 1.16, "learning_rate": 0.00020194321335891889, "loss": 1.5928, "step": 14772 }, { "epoch": 1.16, "learning_rate": 0.00020193161818406354, "loss": 1.5845, "step": 14773 }, { "epoch": 1.16, "learning_rate": 0.00020192002265662112, "loss": 1.549, "step": 14774 }, { "epoch": 1.16, "learning_rate": 0.0002019084267766704, "loss": 1.5151, "step": 14775 }, { "epoch": 1.16, "learning_rate": 0.0002018968305442901, "loss": 1.5163, "step": 14776 }, { "epoch": 1.16, "learning_rate": 0.00020188523395955896, "loss": 1.5491, "step": 14777 }, { "epoch": 1.16, "learning_rate": 0.00020187363702255573, "loss": 1.5473, "step": 14778 }, { "epoch": 1.16, "learning_rate": 0.00020186203973335913, "loss": 1.5338, "step": 14779 }, { "epoch": 1.16, "learning_rate": 0.00020185044209204787, "loss": 1.5385, "step": 14780 }, { "epoch": 1.16, "learning_rate": 0.00020183884409870077, "loss": 1.5487, "step": 14781 }, { "epoch": 1.16, "learning_rate": 0.0002018272457533965, "loss": 1.5084, "step": 14782 }, { "epoch": 1.16, "learning_rate": 0.00020181564705621386, "loss": 1.5114, "step": 14783 }, { "epoch": 1.16, "learning_rate": 0.00020180404800723153, "loss": 1.4976, "step": 14784 }, { "epoch": 1.16, "learning_rate": 0.0002017924486065283, "loss": 1.5851, "step": 14785 }, { "epoch": 1.16, "learning_rate": 0.00020178084885418292, "loss": 1.5363, "step": 14786 }, { "epoch": 1.16, "learning_rate": 0.00020176924875027418, "loss": 1.5774, "step": 14787 }, { "epoch": 1.16, "learning_rate": 0.00020175764829488083, "loss": 1.5812, "step": 14788 }, { "epoch": 1.16, "learning_rate": 0.00020174604748808154, "loss": 1.5417, "step": 14789 }, { "epoch": 1.16, "learning_rate": 0.00020173444632995524, "loss": 1.5528, "step": 14790 }, { "epoch": 1.16, "learning_rate": 0.0002017228448205805, "loss": 1.5234, "step": 14791 }, { "epoch": 1.16, "learning_rate": 0.00020171124296003624, "loss": 1.5112, "step": 14792 }, { "epoch": 1.16, "learning_rate": 0.00020169964074840118, "loss": 1.5467, "step": 14793 }, { "epoch": 1.16, "learning_rate": 0.00020168803818575406, "loss": 1.5401, "step": 14794 }, { "epoch": 1.16, "learning_rate": 0.00020167643527217374, "loss": 1.5875, "step": 14795 }, { "epoch": 1.16, "learning_rate": 0.00020166483200773888, "loss": 1.5776, "step": 14796 }, { "epoch": 1.16, "learning_rate": 0.00020165322839252832, "loss": 1.5203, "step": 14797 }, { "epoch": 1.16, "learning_rate": 0.0002016416244266209, "loss": 1.5547, "step": 14798 }, { "epoch": 1.16, "learning_rate": 0.00020163002011009534, "loss": 1.5525, "step": 14799 }, { "epoch": 1.16, "learning_rate": 0.00020161841544303043, "loss": 1.5536, "step": 14800 }, { "epoch": 1.16, "learning_rate": 0.0002016068104255049, "loss": 1.5867, "step": 14801 }, { "epoch": 1.16, "learning_rate": 0.0002015952050575977, "loss": 1.521, "step": 14802 }, { "epoch": 1.16, "learning_rate": 0.00020158359933938744, "loss": 1.5936, "step": 14803 }, { "epoch": 1.16, "learning_rate": 0.00020157199327095306, "loss": 1.5668, "step": 14804 }, { "epoch": 1.16, "learning_rate": 0.0002015603868523733, "loss": 1.5778, "step": 14805 }, { "epoch": 1.16, "learning_rate": 0.00020154878008372696, "loss": 1.6052, "step": 14806 }, { "epoch": 1.17, "learning_rate": 0.00020153717296509286, "loss": 1.5361, "step": 14807 }, { "epoch": 1.17, "learning_rate": 0.00020152556549654982, "loss": 1.549, "step": 14808 }, { "epoch": 1.17, "learning_rate": 0.00020151395767817654, "loss": 1.559, "step": 14809 }, { "epoch": 1.17, "learning_rate": 0.00020150234951005203, "loss": 1.545, "step": 14810 }, { "epoch": 1.17, "learning_rate": 0.00020149074099225488, "loss": 1.5672, "step": 14811 }, { "epoch": 1.17, "learning_rate": 0.0002014791321248641, "loss": 1.5207, "step": 14812 }, { "epoch": 1.17, "learning_rate": 0.00020146752290795835, "loss": 1.5614, "step": 14813 }, { "epoch": 1.17, "learning_rate": 0.00020145591334161655, "loss": 1.5117, "step": 14814 }, { "epoch": 1.17, "learning_rate": 0.00020144430342591753, "loss": 1.5713, "step": 14815 }, { "epoch": 1.17, "learning_rate": 0.00020143269316094003, "loss": 1.5605, "step": 14816 }, { "epoch": 1.17, "learning_rate": 0.00020142108254676296, "loss": 1.5727, "step": 14817 }, { "epoch": 1.17, "learning_rate": 0.0002014094715834651, "loss": 1.5471, "step": 14818 }, { "epoch": 1.17, "learning_rate": 0.0002013978602711253, "loss": 1.5476, "step": 14819 }, { "epoch": 1.17, "learning_rate": 0.00020138624860982238, "loss": 1.4714, "step": 14820 }, { "epoch": 1.17, "learning_rate": 0.0002013746365996352, "loss": 1.5565, "step": 14821 }, { "epoch": 1.17, "learning_rate": 0.0002013630242406426, "loss": 1.5253, "step": 14822 }, { "epoch": 1.17, "learning_rate": 0.0002013514115329234, "loss": 1.5142, "step": 14823 }, { "epoch": 1.17, "learning_rate": 0.00020133979847655642, "loss": 1.5387, "step": 14824 }, { "epoch": 1.17, "learning_rate": 0.00020132818507162057, "loss": 1.5293, "step": 14825 }, { "epoch": 1.17, "learning_rate": 0.00020131657131819465, "loss": 1.513, "step": 14826 }, { "epoch": 1.17, "learning_rate": 0.0002013049572163576, "loss": 1.5747, "step": 14827 }, { "epoch": 1.17, "learning_rate": 0.00020129334276618814, "loss": 1.5856, "step": 14828 }, { "epoch": 1.17, "learning_rate": 0.0002012817279677652, "loss": 1.5796, "step": 14829 }, { "epoch": 1.17, "learning_rate": 0.00020127011282116764, "loss": 1.5458, "step": 14830 }, { "epoch": 1.17, "learning_rate": 0.00020125849732647428, "loss": 1.5454, "step": 14831 }, { "epoch": 1.17, "learning_rate": 0.00020124688148376402, "loss": 1.5315, "step": 14832 }, { "epoch": 1.17, "learning_rate": 0.0002012352652931157, "loss": 1.5269, "step": 14833 }, { "epoch": 1.17, "learning_rate": 0.00020122364875460827, "loss": 1.533, "step": 14834 }, { "epoch": 1.17, "learning_rate": 0.00020121203186832047, "loss": 1.5931, "step": 14835 }, { "epoch": 1.17, "learning_rate": 0.00020120041463433125, "loss": 1.5714, "step": 14836 }, { "epoch": 1.17, "learning_rate": 0.0002011887970527195, "loss": 1.5201, "step": 14837 }, { "epoch": 1.17, "learning_rate": 0.000201177179123564, "loss": 1.5252, "step": 14838 }, { "epoch": 1.17, "learning_rate": 0.00020116556084694376, "loss": 1.5444, "step": 14839 }, { "epoch": 1.17, "learning_rate": 0.00020115394222293753, "loss": 1.6306, "step": 14840 }, { "epoch": 1.17, "learning_rate": 0.00020114232325162433, "loss": 1.5699, "step": 14841 }, { "epoch": 1.17, "learning_rate": 0.00020113070393308293, "loss": 1.5552, "step": 14842 }, { "epoch": 1.17, "learning_rate": 0.00020111908426739228, "loss": 1.5328, "step": 14843 }, { "epoch": 1.17, "learning_rate": 0.00020110746425463128, "loss": 1.5323, "step": 14844 }, { "epoch": 1.17, "learning_rate": 0.00020109584389487877, "loss": 1.5051, "step": 14845 }, { "epoch": 1.17, "learning_rate": 0.00020108422318821373, "loss": 1.5107, "step": 14846 }, { "epoch": 1.17, "learning_rate": 0.00020107260213471495, "loss": 1.5769, "step": 14847 }, { "epoch": 1.17, "learning_rate": 0.00020106098073446136, "loss": 1.5591, "step": 14848 }, { "epoch": 1.17, "learning_rate": 0.00020104935898753194, "loss": 1.5003, "step": 14849 }, { "epoch": 1.17, "learning_rate": 0.00020103773689400555, "loss": 1.5339, "step": 14850 }, { "epoch": 1.17, "learning_rate": 0.00020102611445396108, "loss": 1.5181, "step": 14851 }, { "epoch": 1.17, "learning_rate": 0.00020101449166747744, "loss": 1.5542, "step": 14852 }, { "epoch": 1.17, "learning_rate": 0.00020100286853463355, "loss": 1.5119, "step": 14853 }, { "epoch": 1.17, "learning_rate": 0.00020099124505550836, "loss": 1.5094, "step": 14854 }, { "epoch": 1.17, "learning_rate": 0.00020097962123018072, "loss": 1.5504, "step": 14855 }, { "epoch": 1.17, "learning_rate": 0.00020096799705872958, "loss": 1.5466, "step": 14856 }, { "epoch": 1.17, "learning_rate": 0.0002009563725412339, "loss": 1.5844, "step": 14857 }, { "epoch": 1.17, "learning_rate": 0.00020094474767777255, "loss": 1.529, "step": 14858 }, { "epoch": 1.17, "learning_rate": 0.0002009331224684245, "loss": 1.5405, "step": 14859 }, { "epoch": 1.17, "learning_rate": 0.00020092149691326865, "loss": 1.5552, "step": 14860 }, { "epoch": 1.17, "learning_rate": 0.00020090987101238392, "loss": 1.575, "step": 14861 }, { "epoch": 1.17, "learning_rate": 0.00020089824476584927, "loss": 1.529, "step": 14862 }, { "epoch": 1.17, "learning_rate": 0.0002008866181737436, "loss": 1.5695, "step": 14863 }, { "epoch": 1.17, "learning_rate": 0.0002008749912361459, "loss": 1.5962, "step": 14864 }, { "epoch": 1.17, "learning_rate": 0.00020086336395313506, "loss": 1.525, "step": 14865 }, { "epoch": 1.17, "learning_rate": 0.00020085173632479009, "loss": 1.5515, "step": 14866 }, { "epoch": 1.17, "learning_rate": 0.00020084010835118987, "loss": 1.5824, "step": 14867 }, { "epoch": 1.17, "learning_rate": 0.00020082848003241338, "loss": 1.5512, "step": 14868 }, { "epoch": 1.17, "learning_rate": 0.00020081685136853956, "loss": 1.4863, "step": 14869 }, { "epoch": 1.17, "learning_rate": 0.00020080522235964735, "loss": 1.5709, "step": 14870 }, { "epoch": 1.17, "learning_rate": 0.00020079359300581573, "loss": 1.5397, "step": 14871 }, { "epoch": 1.17, "learning_rate": 0.0002007819633071236, "loss": 1.5804, "step": 14872 }, { "epoch": 1.17, "learning_rate": 0.00020077033326364998, "loss": 1.5459, "step": 14873 }, { "epoch": 1.17, "learning_rate": 0.00020075870287547385, "loss": 1.5148, "step": 14874 }, { "epoch": 1.17, "learning_rate": 0.00020074707214267414, "loss": 1.5637, "step": 14875 }, { "epoch": 1.17, "learning_rate": 0.00020073544106532978, "loss": 1.5873, "step": 14876 }, { "epoch": 1.17, "learning_rate": 0.00020072380964351977, "loss": 1.5166, "step": 14877 }, { "epoch": 1.17, "learning_rate": 0.00020071217787732314, "loss": 1.5387, "step": 14878 }, { "epoch": 1.17, "learning_rate": 0.00020070054576681875, "loss": 1.5389, "step": 14879 }, { "epoch": 1.17, "learning_rate": 0.00020068891331208566, "loss": 1.564, "step": 14880 }, { "epoch": 1.17, "learning_rate": 0.00020067728051320277, "loss": 1.6148, "step": 14881 }, { "epoch": 1.17, "learning_rate": 0.00020066564737024917, "loss": 1.5884, "step": 14882 }, { "epoch": 1.17, "learning_rate": 0.0002006540138833038, "loss": 1.5261, "step": 14883 }, { "epoch": 1.17, "learning_rate": 0.0002006423800524456, "loss": 1.5482, "step": 14884 }, { "epoch": 1.17, "learning_rate": 0.00020063074587775359, "loss": 1.5589, "step": 14885 }, { "epoch": 1.17, "learning_rate": 0.00020061911135930673, "loss": 1.6026, "step": 14886 }, { "epoch": 1.17, "learning_rate": 0.00020060747649718405, "loss": 1.5523, "step": 14887 }, { "epoch": 1.17, "learning_rate": 0.00020059584129146453, "loss": 1.5497, "step": 14888 }, { "epoch": 1.17, "learning_rate": 0.00020058420574222714, "loss": 1.5489, "step": 14889 }, { "epoch": 1.17, "learning_rate": 0.000200572569849551, "loss": 1.5432, "step": 14890 }, { "epoch": 1.17, "learning_rate": 0.00020056093361351497, "loss": 1.5275, "step": 14891 }, { "epoch": 1.17, "learning_rate": 0.00020054929703419808, "loss": 1.5759, "step": 14892 }, { "epoch": 1.17, "learning_rate": 0.00020053766011167938, "loss": 1.5592, "step": 14893 }, { "epoch": 1.17, "learning_rate": 0.00020052602284603786, "loss": 1.5129, "step": 14894 }, { "epoch": 1.17, "learning_rate": 0.00020051438523735251, "loss": 1.5439, "step": 14895 }, { "epoch": 1.17, "learning_rate": 0.00020050274728570234, "loss": 1.6067, "step": 14896 }, { "epoch": 1.17, "learning_rate": 0.00020049110899116645, "loss": 1.5165, "step": 14897 }, { "epoch": 1.17, "learning_rate": 0.00020047947035382378, "loss": 1.5567, "step": 14898 }, { "epoch": 1.17, "learning_rate": 0.0002004678313737533, "loss": 1.5046, "step": 14899 }, { "epoch": 1.17, "learning_rate": 0.00020045619205103418, "loss": 1.5188, "step": 14900 }, { "epoch": 1.17, "learning_rate": 0.0002004445523857453, "loss": 1.4878, "step": 14901 }, { "epoch": 1.17, "learning_rate": 0.00020043291237796578, "loss": 1.5835, "step": 14902 }, { "epoch": 1.17, "learning_rate": 0.00020042127202777457, "loss": 1.5147, "step": 14903 }, { "epoch": 1.17, "learning_rate": 0.00020040963133525076, "loss": 1.5929, "step": 14904 }, { "epoch": 1.17, "learning_rate": 0.00020039799030047343, "loss": 1.5245, "step": 14905 }, { "epoch": 1.17, "learning_rate": 0.00020038634892352152, "loss": 1.557, "step": 14906 }, { "epoch": 1.17, "learning_rate": 0.00020037470720447412, "loss": 1.5266, "step": 14907 }, { "epoch": 1.17, "learning_rate": 0.00020036306514341023, "loss": 1.5465, "step": 14908 }, { "epoch": 1.17, "learning_rate": 0.00020035142274040893, "loss": 1.5323, "step": 14909 }, { "epoch": 1.17, "learning_rate": 0.00020033977999554928, "loss": 1.5395, "step": 14910 }, { "epoch": 1.17, "learning_rate": 0.00020032813690891023, "loss": 1.5867, "step": 14911 }, { "epoch": 1.17, "learning_rate": 0.000200316493480571, "loss": 1.5376, "step": 14912 }, { "epoch": 1.17, "learning_rate": 0.00020030484971061047, "loss": 1.5901, "step": 14913 }, { "epoch": 1.17, "learning_rate": 0.00020029320559910782, "loss": 1.6383, "step": 14914 }, { "epoch": 1.17, "learning_rate": 0.00020028156114614202, "loss": 1.6228, "step": 14915 }, { "epoch": 1.17, "learning_rate": 0.00020026991635179218, "loss": 1.6023, "step": 14916 }, { "epoch": 1.17, "learning_rate": 0.0002002582712161374, "loss": 1.565, "step": 14917 }, { "epoch": 1.17, "learning_rate": 0.00020024662573925664, "loss": 1.5326, "step": 14918 }, { "epoch": 1.17, "learning_rate": 0.00020023497992122902, "loss": 1.5025, "step": 14919 }, { "epoch": 1.17, "learning_rate": 0.0002002233337621336, "loss": 1.5684, "step": 14920 }, { "epoch": 1.17, "learning_rate": 0.00020021168726204946, "loss": 1.5261, "step": 14921 }, { "epoch": 1.17, "learning_rate": 0.00020020004042105573, "loss": 1.5787, "step": 14922 }, { "epoch": 1.17, "learning_rate": 0.0002001883932392314, "loss": 1.5355, "step": 14923 }, { "epoch": 1.17, "learning_rate": 0.00020017674571665554, "loss": 1.5146, "step": 14924 }, { "epoch": 1.17, "learning_rate": 0.0002001650978534073, "loss": 1.5514, "step": 14925 }, { "epoch": 1.17, "learning_rate": 0.00020015344964956572, "loss": 1.5647, "step": 14926 }, { "epoch": 1.17, "learning_rate": 0.0002001418011052099, "loss": 1.5621, "step": 14927 }, { "epoch": 1.17, "learning_rate": 0.00020013015222041888, "loss": 1.5433, "step": 14928 }, { "epoch": 1.17, "learning_rate": 0.00020011850299527184, "loss": 1.5437, "step": 14929 }, { "epoch": 1.17, "learning_rate": 0.0002001068534298478, "loss": 1.6097, "step": 14930 }, { "epoch": 1.17, "learning_rate": 0.0002000952035242259, "loss": 1.5176, "step": 14931 }, { "epoch": 1.17, "learning_rate": 0.00020008355327848522, "loss": 1.5434, "step": 14932 }, { "epoch": 1.17, "learning_rate": 0.00020007190269270478, "loss": 1.499, "step": 14933 }, { "epoch": 1.18, "learning_rate": 0.00020006025176696384, "loss": 1.5835, "step": 14934 }, { "epoch": 1.18, "learning_rate": 0.00020004860050134134, "loss": 1.6121, "step": 14935 }, { "epoch": 1.18, "learning_rate": 0.00020003694889591652, "loss": 1.5574, "step": 14936 }, { "epoch": 1.18, "learning_rate": 0.00020002529695076841, "loss": 1.5755, "step": 14937 }, { "epoch": 1.18, "learning_rate": 0.00020001364466597612, "loss": 1.6119, "step": 14938 }, { "epoch": 1.18, "learning_rate": 0.00020000199204161883, "loss": 1.6063, "step": 14939 }, { "epoch": 1.18, "learning_rate": 0.00019999033907777556, "loss": 1.5351, "step": 14940 }, { "epoch": 1.18, "learning_rate": 0.00019997868577452553, "loss": 1.581, "step": 14941 }, { "epoch": 1.18, "learning_rate": 0.00019996703213194772, "loss": 1.5515, "step": 14942 }, { "epoch": 1.18, "learning_rate": 0.00019995537815012138, "loss": 1.5363, "step": 14943 }, { "epoch": 1.18, "learning_rate": 0.0001999437238291256, "loss": 1.5937, "step": 14944 }, { "epoch": 1.18, "learning_rate": 0.0001999320691690395, "loss": 1.5329, "step": 14945 }, { "epoch": 1.18, "learning_rate": 0.00019992041416994224, "loss": 1.5084, "step": 14946 }, { "epoch": 1.18, "learning_rate": 0.00019990875883191283, "loss": 1.5428, "step": 14947 }, { "epoch": 1.18, "learning_rate": 0.0001998971031550305, "loss": 1.5711, "step": 14948 }, { "epoch": 1.18, "learning_rate": 0.00019988544713937445, "loss": 1.5345, "step": 14949 }, { "epoch": 1.18, "learning_rate": 0.00019987379078502363, "loss": 1.5537, "step": 14950 }, { "epoch": 1.18, "learning_rate": 0.00019986213409205742, "loss": 1.5461, "step": 14951 }, { "epoch": 1.18, "learning_rate": 0.00019985047706055475, "loss": 1.5037, "step": 14952 }, { "epoch": 1.18, "learning_rate": 0.00019983881969059492, "loss": 1.5135, "step": 14953 }, { "epoch": 1.18, "learning_rate": 0.00019982716198225695, "loss": 1.5276, "step": 14954 }, { "epoch": 1.18, "learning_rate": 0.00019981550393562006, "loss": 1.5506, "step": 14955 }, { "epoch": 1.18, "learning_rate": 0.00019980384555076338, "loss": 1.5072, "step": 14956 }, { "epoch": 1.18, "learning_rate": 0.0001997921868277661, "loss": 1.5108, "step": 14957 }, { "epoch": 1.18, "learning_rate": 0.00019978052776670733, "loss": 1.5703, "step": 14958 }, { "epoch": 1.18, "learning_rate": 0.00019976886836766623, "loss": 1.5915, "step": 14959 }, { "epoch": 1.18, "learning_rate": 0.00019975720863072197, "loss": 1.5005, "step": 14960 }, { "epoch": 1.18, "learning_rate": 0.0001997455485559538, "loss": 1.5735, "step": 14961 }, { "epoch": 1.18, "learning_rate": 0.00019973388814344074, "loss": 1.5448, "step": 14962 }, { "epoch": 1.18, "learning_rate": 0.00019972222739326207, "loss": 1.549, "step": 14963 }, { "epoch": 1.18, "learning_rate": 0.00019971056630549688, "loss": 1.5414, "step": 14964 }, { "epoch": 1.18, "learning_rate": 0.00019969890488022438, "loss": 1.5995, "step": 14965 }, { "epoch": 1.18, "learning_rate": 0.00019968724311752374, "loss": 1.5571, "step": 14966 }, { "epoch": 1.18, "learning_rate": 0.00019967558101747414, "loss": 1.5718, "step": 14967 }, { "epoch": 1.18, "learning_rate": 0.00019966391858015477, "loss": 1.5665, "step": 14968 }, { "epoch": 1.18, "learning_rate": 0.0001996522558056448, "loss": 1.5301, "step": 14969 }, { "epoch": 1.18, "learning_rate": 0.00019964059269402345, "loss": 1.5298, "step": 14970 }, { "epoch": 1.18, "learning_rate": 0.00019962892924536979, "loss": 1.5152, "step": 14971 }, { "epoch": 1.18, "learning_rate": 0.00019961726545976314, "loss": 1.5253, "step": 14972 }, { "epoch": 1.18, "learning_rate": 0.00019960560133728262, "loss": 1.5733, "step": 14973 }, { "epoch": 1.18, "learning_rate": 0.0001995939368780074, "loss": 1.5185, "step": 14974 }, { "epoch": 1.18, "learning_rate": 0.0001995822720820168, "loss": 1.5078, "step": 14975 }, { "epoch": 1.18, "learning_rate": 0.00019957060694938988, "loss": 1.548, "step": 14976 }, { "epoch": 1.18, "learning_rate": 0.0001995589414802059, "loss": 1.5486, "step": 14977 }, { "epoch": 1.18, "learning_rate": 0.0001995472756745441, "loss": 1.547, "step": 14978 }, { "epoch": 1.18, "learning_rate": 0.00019953560953248357, "loss": 1.5207, "step": 14979 }, { "epoch": 1.18, "learning_rate": 0.00019952394305410365, "loss": 1.5483, "step": 14980 }, { "epoch": 1.18, "learning_rate": 0.00019951227623948346, "loss": 1.5167, "step": 14981 }, { "epoch": 1.18, "learning_rate": 0.00019950060908870224, "loss": 1.5662, "step": 14982 }, { "epoch": 1.18, "learning_rate": 0.00019948894160183917, "loss": 1.5614, "step": 14983 }, { "epoch": 1.18, "learning_rate": 0.00019947727377897355, "loss": 1.5322, "step": 14984 }, { "epoch": 1.18, "learning_rate": 0.00019946560562018452, "loss": 1.5207, "step": 14985 }, { "epoch": 1.18, "learning_rate": 0.0001994539371255513, "loss": 1.5642, "step": 14986 }, { "epoch": 1.18, "learning_rate": 0.00019944226829515316, "loss": 1.5255, "step": 14987 }, { "epoch": 1.18, "learning_rate": 0.00019943059912906936, "loss": 1.561, "step": 14988 }, { "epoch": 1.18, "learning_rate": 0.000199418929627379, "loss": 1.5568, "step": 14989 }, { "epoch": 1.18, "learning_rate": 0.00019940725979016136, "loss": 1.5306, "step": 14990 }, { "epoch": 1.18, "learning_rate": 0.00019939558961749572, "loss": 1.5937, "step": 14991 }, { "epoch": 1.18, "learning_rate": 0.00019938391910946133, "loss": 1.5663, "step": 14992 }, { "epoch": 1.18, "learning_rate": 0.00019937224826613735, "loss": 1.5663, "step": 14993 }, { "epoch": 1.18, "learning_rate": 0.000199360577087603, "loss": 1.5557, "step": 14994 }, { "epoch": 1.18, "learning_rate": 0.00019934890557393766, "loss": 1.5369, "step": 14995 }, { "epoch": 1.18, "learning_rate": 0.00019933723372522044, "loss": 1.6417, "step": 14996 }, { "epoch": 1.18, "learning_rate": 0.00019932556154153062, "loss": 1.5543, "step": 14997 }, { "epoch": 1.18, "learning_rate": 0.00019931388902294747, "loss": 1.4782, "step": 14998 }, { "epoch": 1.18, "learning_rate": 0.00019930221616955022, "loss": 1.519, "step": 14999 }, { "epoch": 1.18, "learning_rate": 0.0001992905429814181, "loss": 1.5899, "step": 15000 }, { "epoch": 1.18, "learning_rate": 0.00019927886945863044, "loss": 1.5209, "step": 15001 }, { "epoch": 1.18, "learning_rate": 0.00019926719560126645, "loss": 1.5586, "step": 15002 }, { "epoch": 1.18, "learning_rate": 0.00019925552140940536, "loss": 1.512, "step": 15003 }, { "epoch": 1.18, "learning_rate": 0.0001992438468831265, "loss": 1.5065, "step": 15004 }, { "epoch": 1.18, "learning_rate": 0.00019923217202250906, "loss": 1.5733, "step": 15005 }, { "epoch": 1.18, "learning_rate": 0.00019922049682763232, "loss": 1.5378, "step": 15006 }, { "epoch": 1.18, "learning_rate": 0.00019920882129857562, "loss": 1.4742, "step": 15007 }, { "epoch": 1.18, "learning_rate": 0.00019919714543541818, "loss": 1.5635, "step": 15008 }, { "epoch": 1.18, "learning_rate": 0.00019918546923823927, "loss": 1.5344, "step": 15009 }, { "epoch": 1.18, "learning_rate": 0.00019917379270711813, "loss": 1.5229, "step": 15010 }, { "epoch": 1.18, "learning_rate": 0.0001991621158421341, "loss": 1.5355, "step": 15011 }, { "epoch": 1.18, "learning_rate": 0.00019915043864336646, "loss": 1.5502, "step": 15012 }, { "epoch": 1.18, "learning_rate": 0.0001991387611108944, "loss": 1.5902, "step": 15013 }, { "epoch": 1.18, "learning_rate": 0.0001991270832447973, "loss": 1.5504, "step": 15014 }, { "epoch": 1.18, "learning_rate": 0.0001991154050451544, "loss": 1.5747, "step": 15015 }, { "epoch": 1.18, "learning_rate": 0.000199103726512045, "loss": 1.5748, "step": 15016 }, { "epoch": 1.18, "learning_rate": 0.00019909204764554845, "loss": 1.5629, "step": 15017 }, { "epoch": 1.18, "learning_rate": 0.00019908036844574396, "loss": 1.5496, "step": 15018 }, { "epoch": 1.18, "learning_rate": 0.00019906868891271084, "loss": 1.5105, "step": 15019 }, { "epoch": 1.18, "learning_rate": 0.0001990570090465284, "loss": 1.4935, "step": 15020 }, { "epoch": 1.18, "learning_rate": 0.00019904532884727595, "loss": 1.5371, "step": 15021 }, { "epoch": 1.18, "learning_rate": 0.00019903364831503278, "loss": 1.5922, "step": 15022 }, { "epoch": 1.18, "learning_rate": 0.0001990219674498782, "loss": 1.4516, "step": 15023 }, { "epoch": 1.18, "learning_rate": 0.0001990102862518915, "loss": 1.5544, "step": 15024 }, { "epoch": 1.18, "learning_rate": 0.000198998604721152, "loss": 1.4893, "step": 15025 }, { "epoch": 1.18, "learning_rate": 0.00019898692285773905, "loss": 1.5298, "step": 15026 }, { "epoch": 1.18, "learning_rate": 0.0001989752406617319, "loss": 1.5757, "step": 15027 }, { "epoch": 1.18, "learning_rate": 0.0001989635581332099, "loss": 1.5665, "step": 15028 }, { "epoch": 1.18, "learning_rate": 0.00019895187527225233, "loss": 1.5765, "step": 15029 }, { "epoch": 1.18, "learning_rate": 0.00019894019207893857, "loss": 1.5699, "step": 15030 }, { "epoch": 1.18, "learning_rate": 0.00019892850855334794, "loss": 1.6082, "step": 15031 }, { "epoch": 1.18, "learning_rate": 0.00019891682469555966, "loss": 1.5253, "step": 15032 }, { "epoch": 1.18, "learning_rate": 0.0001989051405056532, "loss": 1.5763, "step": 15033 }, { "epoch": 1.18, "learning_rate": 0.00019889345598370783, "loss": 1.5641, "step": 15034 }, { "epoch": 1.18, "learning_rate": 0.00019888177112980284, "loss": 1.5061, "step": 15035 }, { "epoch": 1.18, "learning_rate": 0.00019887008594401763, "loss": 1.5658, "step": 15036 }, { "epoch": 1.18, "learning_rate": 0.00019885840042643146, "loss": 1.5756, "step": 15037 }, { "epoch": 1.18, "learning_rate": 0.0001988467145771238, "loss": 1.5409, "step": 15038 }, { "epoch": 1.18, "learning_rate": 0.00019883502839617378, "loss": 1.5851, "step": 15039 }, { "epoch": 1.18, "learning_rate": 0.00019882334188366094, "loss": 1.6157, "step": 15040 }, { "epoch": 1.18, "learning_rate": 0.00019881165503966456, "loss": 1.5541, "step": 15041 }, { "epoch": 1.18, "learning_rate": 0.00019879996786426393, "loss": 1.5472, "step": 15042 }, { "epoch": 1.18, "learning_rate": 0.00019878828035753852, "loss": 1.5314, "step": 15043 }, { "epoch": 1.18, "learning_rate": 0.00019877659251956755, "loss": 1.5478, "step": 15044 }, { "epoch": 1.18, "learning_rate": 0.00019876490435043043, "loss": 1.5551, "step": 15045 }, { "epoch": 1.18, "learning_rate": 0.00019875321585020658, "loss": 1.5567, "step": 15046 }, { "epoch": 1.18, "learning_rate": 0.00019874152701897525, "loss": 1.5371, "step": 15047 }, { "epoch": 1.18, "learning_rate": 0.00019872983785681586, "loss": 1.5331, "step": 15048 }, { "epoch": 1.18, "learning_rate": 0.00019871814836380777, "loss": 1.5894, "step": 15049 }, { "epoch": 1.18, "learning_rate": 0.00019870645854003035, "loss": 1.5745, "step": 15050 }, { "epoch": 1.18, "learning_rate": 0.00019869476838556293, "loss": 1.4963, "step": 15051 }, { "epoch": 1.18, "learning_rate": 0.00019868307790048487, "loss": 1.517, "step": 15052 }, { "epoch": 1.18, "learning_rate": 0.00019867138708487564, "loss": 1.5409, "step": 15053 }, { "epoch": 1.18, "learning_rate": 0.00019865969593881453, "loss": 1.6157, "step": 15054 }, { "epoch": 1.18, "learning_rate": 0.00019864800446238093, "loss": 1.5531, "step": 15055 }, { "epoch": 1.18, "learning_rate": 0.00019863631265565422, "loss": 1.5469, "step": 15056 }, { "epoch": 1.18, "learning_rate": 0.0001986246205187138, "loss": 1.5551, "step": 15057 }, { "epoch": 1.18, "learning_rate": 0.00019861292805163904, "loss": 1.5804, "step": 15058 }, { "epoch": 1.18, "learning_rate": 0.00019860123525450933, "loss": 1.5921, "step": 15059 }, { "epoch": 1.18, "learning_rate": 0.00019858954212740405, "loss": 1.5331, "step": 15060 }, { "epoch": 1.19, "learning_rate": 0.00019857784867040256, "loss": 1.5383, "step": 15061 }, { "epoch": 1.19, "learning_rate": 0.00019856615488358432, "loss": 1.5467, "step": 15062 }, { "epoch": 1.19, "learning_rate": 0.00019855446076702874, "loss": 1.5368, "step": 15063 }, { "epoch": 1.19, "learning_rate": 0.00019854276632081506, "loss": 1.5759, "step": 15064 }, { "epoch": 1.19, "learning_rate": 0.0001985310715450229, "loss": 1.5764, "step": 15065 }, { "epoch": 1.19, "learning_rate": 0.0001985193764397314, "loss": 1.5182, "step": 15066 }, { "epoch": 1.19, "learning_rate": 0.0001985076810050202, "loss": 1.534, "step": 15067 }, { "epoch": 1.19, "learning_rate": 0.00019849598524096862, "loss": 1.6172, "step": 15068 }, { "epoch": 1.19, "learning_rate": 0.000198484289147656, "loss": 1.5613, "step": 15069 }, { "epoch": 1.19, "learning_rate": 0.00019847259272516191, "loss": 1.596, "step": 15070 }, { "epoch": 1.19, "learning_rate": 0.00019846089597356557, "loss": 1.5526, "step": 15071 }, { "epoch": 1.19, "learning_rate": 0.00019844919889294656, "loss": 1.5339, "step": 15072 }, { "epoch": 1.19, "learning_rate": 0.0001984375014833842, "loss": 1.5204, "step": 15073 }, { "epoch": 1.19, "learning_rate": 0.00019842580374495794, "loss": 1.5384, "step": 15074 }, { "epoch": 1.19, "learning_rate": 0.00019841410567774723, "loss": 1.5563, "step": 15075 }, { "epoch": 1.19, "learning_rate": 0.00019840240728183136, "loss": 1.5664, "step": 15076 }, { "epoch": 1.19, "learning_rate": 0.00019839070855728997, "loss": 1.564, "step": 15077 }, { "epoch": 1.19, "learning_rate": 0.00019837900950420227, "loss": 1.5374, "step": 15078 }, { "epoch": 1.19, "learning_rate": 0.00019836731012264785, "loss": 1.4921, "step": 15079 }, { "epoch": 1.19, "learning_rate": 0.0001983556104127061, "loss": 1.5674, "step": 15080 }, { "epoch": 1.19, "learning_rate": 0.0001983439103744564, "loss": 1.5359, "step": 15081 }, { "epoch": 1.19, "learning_rate": 0.00019833221000797828, "loss": 1.5523, "step": 15082 }, { "epoch": 1.19, "learning_rate": 0.00019832050931335108, "loss": 1.4992, "step": 15083 }, { "epoch": 1.19, "learning_rate": 0.00019830880829065428, "loss": 1.5188, "step": 15084 }, { "epoch": 1.19, "learning_rate": 0.00019829710693996733, "loss": 1.5771, "step": 15085 }, { "epoch": 1.19, "learning_rate": 0.00019828540526136969, "loss": 1.4954, "step": 15086 }, { "epoch": 1.19, "learning_rate": 0.00019827370325494083, "loss": 1.5294, "step": 15087 }, { "epoch": 1.19, "learning_rate": 0.0001982620009207601, "loss": 1.5727, "step": 15088 }, { "epoch": 1.19, "learning_rate": 0.00019825029825890704, "loss": 1.6093, "step": 15089 }, { "epoch": 1.19, "learning_rate": 0.0001982385952694611, "loss": 1.5694, "step": 15090 }, { "epoch": 1.19, "learning_rate": 0.00019822689195250174, "loss": 1.524, "step": 15091 }, { "epoch": 1.19, "learning_rate": 0.00019821518830810835, "loss": 1.5472, "step": 15092 }, { "epoch": 1.19, "learning_rate": 0.00019820348433636045, "loss": 1.5392, "step": 15093 }, { "epoch": 1.19, "learning_rate": 0.00019819178003733752, "loss": 1.5537, "step": 15094 }, { "epoch": 1.19, "learning_rate": 0.00019818007541111895, "loss": 1.6358, "step": 15095 }, { "epoch": 1.19, "learning_rate": 0.00019816837045778427, "loss": 1.5612, "step": 15096 }, { "epoch": 1.19, "learning_rate": 0.000198156665177413, "loss": 1.5207, "step": 15097 }, { "epoch": 1.19, "learning_rate": 0.0001981449595700845, "loss": 1.579, "step": 15098 }, { "epoch": 1.19, "learning_rate": 0.00019813325363587827, "loss": 1.567, "step": 15099 }, { "epoch": 1.19, "learning_rate": 0.0001981215473748738, "loss": 1.571, "step": 15100 }, { "epoch": 1.19, "learning_rate": 0.00019810984078715062, "loss": 1.5666, "step": 15101 }, { "epoch": 1.19, "learning_rate": 0.00019809813387278817, "loss": 1.5528, "step": 15102 }, { "epoch": 1.19, "learning_rate": 0.00019808642663186592, "loss": 1.5673, "step": 15103 }, { "epoch": 1.19, "learning_rate": 0.0001980747190644634, "loss": 1.5609, "step": 15104 }, { "epoch": 1.19, "learning_rate": 0.00019806301117066002, "loss": 1.562, "step": 15105 }, { "epoch": 1.19, "learning_rate": 0.00019805130295053532, "loss": 1.5989, "step": 15106 }, { "epoch": 1.19, "learning_rate": 0.0001980395944041688, "loss": 1.5241, "step": 15107 }, { "epoch": 1.19, "learning_rate": 0.00019802788553163994, "loss": 1.4957, "step": 15108 }, { "epoch": 1.19, "learning_rate": 0.00019801617633302828, "loss": 1.5511, "step": 15109 }, { "epoch": 1.19, "learning_rate": 0.00019800446680841324, "loss": 1.5321, "step": 15110 }, { "epoch": 1.19, "learning_rate": 0.00019799275695787442, "loss": 1.5289, "step": 15111 }, { "epoch": 1.19, "learning_rate": 0.00019798104678149118, "loss": 1.5154, "step": 15112 }, { "epoch": 1.19, "learning_rate": 0.00019796933627934317, "loss": 1.5909, "step": 15113 }, { "epoch": 1.19, "learning_rate": 0.00019795762545150983, "loss": 1.5602, "step": 15114 }, { "epoch": 1.19, "learning_rate": 0.00019794591429807062, "loss": 1.5479, "step": 15115 }, { "epoch": 1.19, "learning_rate": 0.00019793420281910516, "loss": 1.6018, "step": 15116 }, { "epoch": 1.19, "learning_rate": 0.00019792249101469291, "loss": 1.5508, "step": 15117 }, { "epoch": 1.19, "learning_rate": 0.0001979107788849134, "loss": 1.5788, "step": 15118 }, { "epoch": 1.19, "learning_rate": 0.00019789906642984616, "loss": 1.5748, "step": 15119 }, { "epoch": 1.19, "learning_rate": 0.00019788735364957064, "loss": 1.5728, "step": 15120 }, { "epoch": 1.19, "learning_rate": 0.00019787564054416648, "loss": 1.512, "step": 15121 }, { "epoch": 1.19, "learning_rate": 0.00019786392711371308, "loss": 1.4686, "step": 15122 }, { "epoch": 1.19, "learning_rate": 0.00019785221335829006, "loss": 1.5711, "step": 15123 }, { "epoch": 1.19, "learning_rate": 0.00019784049927797686, "loss": 1.5277, "step": 15124 }, { "epoch": 1.19, "learning_rate": 0.00019782878487285314, "loss": 1.56, "step": 15125 }, { "epoch": 1.19, "learning_rate": 0.00019781707014299838, "loss": 1.538, "step": 15126 }, { "epoch": 1.19, "learning_rate": 0.00019780535508849207, "loss": 1.5978, "step": 15127 }, { "epoch": 1.19, "learning_rate": 0.00019779363970941373, "loss": 1.521, "step": 15128 }, { "epoch": 1.19, "learning_rate": 0.00019778192400584304, "loss": 1.5841, "step": 15129 }, { "epoch": 1.19, "learning_rate": 0.00019777020797785938, "loss": 1.6084, "step": 15130 }, { "epoch": 1.19, "learning_rate": 0.0001977584916255424, "loss": 1.5498, "step": 15131 }, { "epoch": 1.19, "learning_rate": 0.0001977467749489716, "loss": 1.5644, "step": 15132 }, { "epoch": 1.19, "learning_rate": 0.0001977350579482266, "loss": 1.5131, "step": 15133 }, { "epoch": 1.19, "learning_rate": 0.00019772334062338683, "loss": 1.5236, "step": 15134 }, { "epoch": 1.19, "learning_rate": 0.00019771162297453195, "loss": 1.5288, "step": 15135 }, { "epoch": 1.19, "learning_rate": 0.00019769990500174153, "loss": 1.5619, "step": 15136 }, { "epoch": 1.19, "learning_rate": 0.000197688186705095, "loss": 1.5319, "step": 15137 }, { "epoch": 1.19, "learning_rate": 0.00019767646808467205, "loss": 1.586, "step": 15138 }, { "epoch": 1.19, "learning_rate": 0.00019766474914055212, "loss": 1.5946, "step": 15139 }, { "epoch": 1.19, "learning_rate": 0.00019765302987281491, "loss": 1.5133, "step": 15140 }, { "epoch": 1.19, "learning_rate": 0.0001976413102815399, "loss": 1.5541, "step": 15141 }, { "epoch": 1.19, "learning_rate": 0.0001976295903668067, "loss": 1.5696, "step": 15142 }, { "epoch": 1.19, "learning_rate": 0.00019761787012869487, "loss": 1.5276, "step": 15143 }, { "epoch": 1.19, "learning_rate": 0.00019760614956728392, "loss": 1.5541, "step": 15144 }, { "epoch": 1.19, "learning_rate": 0.00019759442868265355, "loss": 1.5335, "step": 15145 }, { "epoch": 1.19, "learning_rate": 0.0001975827074748833, "loss": 1.549, "step": 15146 }, { "epoch": 1.19, "learning_rate": 0.0001975709859440526, "loss": 1.5484, "step": 15147 }, { "epoch": 1.19, "learning_rate": 0.00019755926409024128, "loss": 1.5447, "step": 15148 }, { "epoch": 1.19, "learning_rate": 0.00019754754191352874, "loss": 1.5089, "step": 15149 }, { "epoch": 1.19, "learning_rate": 0.00019753581941399468, "loss": 1.5384, "step": 15150 }, { "epoch": 1.19, "learning_rate": 0.0001975240965917186, "loss": 1.5378, "step": 15151 }, { "epoch": 1.19, "learning_rate": 0.00019751237344678012, "loss": 1.5737, "step": 15152 }, { "epoch": 1.19, "learning_rate": 0.0001975006499792589, "loss": 1.5567, "step": 15153 }, { "epoch": 1.19, "learning_rate": 0.00019748892618923441, "loss": 1.5769, "step": 15154 }, { "epoch": 1.19, "learning_rate": 0.00019747720207678634, "loss": 1.5529, "step": 15155 }, { "epoch": 1.19, "learning_rate": 0.00019746547764199428, "loss": 1.5838, "step": 15156 }, { "epoch": 1.19, "learning_rate": 0.0001974537528849378, "loss": 1.5305, "step": 15157 }, { "epoch": 1.19, "learning_rate": 0.00019744202780569659, "loss": 1.596, "step": 15158 }, { "epoch": 1.19, "learning_rate": 0.0001974303024043501, "loss": 1.5574, "step": 15159 }, { "epoch": 1.19, "learning_rate": 0.0001974185766809781, "loss": 1.5411, "step": 15160 }, { "epoch": 1.19, "learning_rate": 0.0001974068506356601, "loss": 1.5515, "step": 15161 }, { "epoch": 1.19, "learning_rate": 0.00019739512426847575, "loss": 1.5751, "step": 15162 }, { "epoch": 1.19, "learning_rate": 0.00019738339757950464, "loss": 1.5805, "step": 15163 }, { "epoch": 1.19, "learning_rate": 0.00019737167056882644, "loss": 1.494, "step": 15164 }, { "epoch": 1.19, "learning_rate": 0.00019735994323652074, "loss": 1.5545, "step": 15165 }, { "epoch": 1.19, "learning_rate": 0.00019734821558266714, "loss": 1.5392, "step": 15166 }, { "epoch": 1.19, "learning_rate": 0.00019733648760734534, "loss": 1.5975, "step": 15167 }, { "epoch": 1.19, "learning_rate": 0.00019732475931063482, "loss": 1.5224, "step": 15168 }, { "epoch": 1.19, "learning_rate": 0.00019731303069261537, "loss": 1.5142, "step": 15169 }, { "epoch": 1.19, "learning_rate": 0.0001973013017533665, "loss": 1.5421, "step": 15170 }, { "epoch": 1.19, "learning_rate": 0.00019728957249296792, "loss": 1.5604, "step": 15171 }, { "epoch": 1.19, "learning_rate": 0.0001972778429114993, "loss": 1.5661, "step": 15172 }, { "epoch": 1.19, "learning_rate": 0.00019726611300904015, "loss": 1.5943, "step": 15173 }, { "epoch": 1.19, "learning_rate": 0.00019725438278567016, "loss": 1.5527, "step": 15174 }, { "epoch": 1.19, "learning_rate": 0.000197242652241469, "loss": 1.5191, "step": 15175 }, { "epoch": 1.19, "learning_rate": 0.00019723092137651632, "loss": 1.5197, "step": 15176 }, { "epoch": 1.19, "learning_rate": 0.0001972191901908918, "loss": 1.5316, "step": 15177 }, { "epoch": 1.19, "learning_rate": 0.00019720745868467493, "loss": 1.6017, "step": 15178 }, { "epoch": 1.19, "learning_rate": 0.00019719572685794552, "loss": 1.5275, "step": 15179 }, { "epoch": 1.19, "learning_rate": 0.00019718399471078317, "loss": 1.5268, "step": 15180 }, { "epoch": 1.19, "learning_rate": 0.0001971722622432675, "loss": 1.5798, "step": 15181 }, { "epoch": 1.19, "learning_rate": 0.00019716052945547828, "loss": 1.5403, "step": 15182 }, { "epoch": 1.19, "learning_rate": 0.00019714879634749502, "loss": 1.5114, "step": 15183 }, { "epoch": 1.19, "learning_rate": 0.00019713706291939745, "loss": 1.563, "step": 15184 }, { "epoch": 1.19, "learning_rate": 0.0001971253291712653, "loss": 1.5692, "step": 15185 }, { "epoch": 1.19, "learning_rate": 0.0001971135951031781, "loss": 1.5871, "step": 15186 }, { "epoch": 1.19, "learning_rate": 0.00019710186071521564, "loss": 1.5301, "step": 15187 }, { "epoch": 1.2, "learning_rate": 0.0001970901260074575, "loss": 1.5887, "step": 15188 }, { "epoch": 1.2, "learning_rate": 0.00019707839097998344, "loss": 1.5233, "step": 15189 }, { "epoch": 1.2, "learning_rate": 0.00019706665563287302, "loss": 1.5296, "step": 15190 }, { "epoch": 1.2, "learning_rate": 0.000197054919966206, "loss": 1.6056, "step": 15191 }, { "epoch": 1.2, "learning_rate": 0.0001970431839800621, "loss": 1.5729, "step": 15192 }, { "epoch": 1.2, "learning_rate": 0.0001970314476745209, "loss": 1.545, "step": 15193 }, { "epoch": 1.2, "learning_rate": 0.00019701971104966207, "loss": 1.5797, "step": 15194 }, { "epoch": 1.2, "learning_rate": 0.00019700797410556544, "loss": 1.5796, "step": 15195 }, { "epoch": 1.2, "learning_rate": 0.00019699623684231058, "loss": 1.5449, "step": 15196 }, { "epoch": 1.2, "learning_rate": 0.00019698449925997715, "loss": 1.5799, "step": 15197 }, { "epoch": 1.2, "learning_rate": 0.00019697276135864495, "loss": 1.5938, "step": 15198 }, { "epoch": 1.2, "learning_rate": 0.00019696102313839365, "loss": 1.5334, "step": 15199 }, { "epoch": 1.2, "learning_rate": 0.00019694928459930287, "loss": 1.5203, "step": 15200 }, { "epoch": 1.2, "learning_rate": 0.00019693754574145236, "loss": 1.6097, "step": 15201 }, { "epoch": 1.2, "learning_rate": 0.0001969258065649218, "loss": 1.5877, "step": 15202 }, { "epoch": 1.2, "learning_rate": 0.00019691406706979093, "loss": 1.5608, "step": 15203 }, { "epoch": 1.2, "learning_rate": 0.00019690232725613947, "loss": 1.6108, "step": 15204 }, { "epoch": 1.2, "learning_rate": 0.00019689058712404707, "loss": 1.5715, "step": 15205 }, { "epoch": 1.2, "learning_rate": 0.00019687884667359343, "loss": 1.5258, "step": 15206 }, { "epoch": 1.2, "learning_rate": 0.00019686710590485833, "loss": 1.553, "step": 15207 }, { "epoch": 1.2, "learning_rate": 0.00019685536481792138, "loss": 1.6206, "step": 15208 }, { "epoch": 1.2, "learning_rate": 0.00019684362341286244, "loss": 1.5893, "step": 15209 }, { "epoch": 1.2, "learning_rate": 0.0001968318816897611, "loss": 1.5555, "step": 15210 }, { "epoch": 1.2, "learning_rate": 0.00019682013964869715, "loss": 1.599, "step": 15211 }, { "epoch": 1.2, "learning_rate": 0.00019680839728975023, "loss": 1.5729, "step": 15212 }, { "epoch": 1.2, "learning_rate": 0.0001967966546130002, "loss": 1.5115, "step": 15213 }, { "epoch": 1.2, "learning_rate": 0.00019678491161852668, "loss": 1.5637, "step": 15214 }, { "epoch": 1.2, "learning_rate": 0.00019677316830640947, "loss": 1.5347, "step": 15215 }, { "epoch": 1.2, "learning_rate": 0.0001967614246767282, "loss": 1.5461, "step": 15216 }, { "epoch": 1.2, "learning_rate": 0.00019674968072956267, "loss": 1.5714, "step": 15217 }, { "epoch": 1.2, "learning_rate": 0.00019673793646499263, "loss": 1.5524, "step": 15218 }, { "epoch": 1.2, "learning_rate": 0.00019672619188309775, "loss": 1.5306, "step": 15219 }, { "epoch": 1.2, "learning_rate": 0.00019671444698395784, "loss": 1.5661, "step": 15220 }, { "epoch": 1.2, "learning_rate": 0.00019670270176765263, "loss": 1.5229, "step": 15221 }, { "epoch": 1.2, "learning_rate": 0.00019669095623426185, "loss": 1.5454, "step": 15222 }, { "epoch": 1.2, "learning_rate": 0.00019667921038386523, "loss": 1.52, "step": 15223 }, { "epoch": 1.2, "learning_rate": 0.00019666746421654252, "loss": 1.5538, "step": 15224 }, { "epoch": 1.2, "learning_rate": 0.0001966557177323735, "loss": 1.5818, "step": 15225 }, { "epoch": 1.2, "learning_rate": 0.00019664397093143788, "loss": 1.5152, "step": 15226 }, { "epoch": 1.2, "learning_rate": 0.00019663222381381543, "loss": 1.5167, "step": 15227 }, { "epoch": 1.2, "learning_rate": 0.00019662047637958595, "loss": 1.5846, "step": 15228 }, { "epoch": 1.2, "learning_rate": 0.00019660872862882917, "loss": 1.625, "step": 15229 }, { "epoch": 1.2, "learning_rate": 0.0001965969805616248, "loss": 1.5358, "step": 15230 }, { "epoch": 1.2, "learning_rate": 0.00019658523217805268, "loss": 1.609, "step": 15231 }, { "epoch": 1.2, "learning_rate": 0.00019657348347819253, "loss": 1.5696, "step": 15232 }, { "epoch": 1.2, "learning_rate": 0.0001965617344621241, "loss": 1.5459, "step": 15233 }, { "epoch": 1.2, "learning_rate": 0.00019654998512992722, "loss": 1.4938, "step": 15234 }, { "epoch": 1.2, "learning_rate": 0.00019653823548168166, "loss": 1.552, "step": 15235 }, { "epoch": 1.2, "learning_rate": 0.0001965264855174671, "loss": 1.5603, "step": 15236 }, { "epoch": 1.2, "learning_rate": 0.0001965147352373634, "loss": 1.6004, "step": 15237 }, { "epoch": 1.2, "learning_rate": 0.00019650298464145033, "loss": 1.523, "step": 15238 }, { "epoch": 1.2, "learning_rate": 0.00019649123372980764, "loss": 1.5003, "step": 15239 }, { "epoch": 1.2, "learning_rate": 0.00019647948250251516, "loss": 1.5329, "step": 15240 }, { "epoch": 1.2, "learning_rate": 0.00019646773095965262, "loss": 1.5782, "step": 15241 }, { "epoch": 1.2, "learning_rate": 0.0001964559791012998, "loss": 1.5479, "step": 15242 }, { "epoch": 1.2, "learning_rate": 0.0001964442269275366, "loss": 1.5469, "step": 15243 }, { "epoch": 1.2, "learning_rate": 0.00019643247443844265, "loss": 1.5494, "step": 15244 }, { "epoch": 1.2, "learning_rate": 0.00019642072163409788, "loss": 1.5568, "step": 15245 }, { "epoch": 1.2, "learning_rate": 0.00019640896851458198, "loss": 1.5387, "step": 15246 }, { "epoch": 1.2, "learning_rate": 0.0001963972150799748, "loss": 1.567, "step": 15247 }, { "epoch": 1.2, "learning_rate": 0.0001963854613303562, "loss": 1.5161, "step": 15248 }, { "epoch": 1.2, "learning_rate": 0.0001963737072658058, "loss": 1.5177, "step": 15249 }, { "epoch": 1.2, "learning_rate": 0.00019636195288640358, "loss": 1.5844, "step": 15250 }, { "epoch": 1.2, "learning_rate": 0.0001963501981922293, "loss": 1.6065, "step": 15251 }, { "epoch": 1.2, "learning_rate": 0.00019633844318336276, "loss": 1.4813, "step": 15252 }, { "epoch": 1.2, "learning_rate": 0.00019632668785988375, "loss": 1.5072, "step": 15253 }, { "epoch": 1.2, "learning_rate": 0.00019631493222187208, "loss": 1.4841, "step": 15254 }, { "epoch": 1.2, "learning_rate": 0.00019630317626940757, "loss": 1.5031, "step": 15255 }, { "epoch": 1.2, "learning_rate": 0.00019629142000257007, "loss": 1.5607, "step": 15256 }, { "epoch": 1.2, "learning_rate": 0.00019627966342143936, "loss": 1.5202, "step": 15257 }, { "epoch": 1.2, "learning_rate": 0.00019626790652609526, "loss": 1.5463, "step": 15258 }, { "epoch": 1.2, "learning_rate": 0.00019625614931661762, "loss": 1.6016, "step": 15259 }, { "epoch": 1.2, "learning_rate": 0.0001962443917930863, "loss": 1.5064, "step": 15260 }, { "epoch": 1.2, "learning_rate": 0.000196232633955581, "loss": 1.5404, "step": 15261 }, { "epoch": 1.2, "learning_rate": 0.0001962208758041817, "loss": 1.5893, "step": 15262 }, { "epoch": 1.2, "learning_rate": 0.00019620911733896808, "loss": 1.549, "step": 15263 }, { "epoch": 1.2, "learning_rate": 0.00019619735856002011, "loss": 1.5038, "step": 15264 }, { "epoch": 1.2, "learning_rate": 0.00019618559946741755, "loss": 1.5584, "step": 15265 }, { "epoch": 1.2, "learning_rate": 0.00019617384006124028, "loss": 1.5426, "step": 15266 }, { "epoch": 1.2, "learning_rate": 0.0001961620803415681, "loss": 1.5896, "step": 15267 }, { "epoch": 1.2, "learning_rate": 0.00019615032030848088, "loss": 1.5494, "step": 15268 }, { "epoch": 1.2, "learning_rate": 0.00019613855996205844, "loss": 1.5028, "step": 15269 }, { "epoch": 1.2, "learning_rate": 0.00019612679930238066, "loss": 1.566, "step": 15270 }, { "epoch": 1.2, "learning_rate": 0.00019611503832952734, "loss": 1.5822, "step": 15271 }, { "epoch": 1.2, "learning_rate": 0.0001961032770435784, "loss": 1.5859, "step": 15272 }, { "epoch": 1.2, "learning_rate": 0.00019609151544461358, "loss": 1.5628, "step": 15273 }, { "epoch": 1.2, "learning_rate": 0.00019607975353271286, "loss": 1.5817, "step": 15274 }, { "epoch": 1.2, "learning_rate": 0.00019606799130795602, "loss": 1.5425, "step": 15275 }, { "epoch": 1.2, "learning_rate": 0.00019605622877042294, "loss": 1.5418, "step": 15276 }, { "epoch": 1.2, "learning_rate": 0.0001960444659201935, "loss": 1.5929, "step": 15277 }, { "epoch": 1.2, "learning_rate": 0.00019603270275734755, "loss": 1.5383, "step": 15278 }, { "epoch": 1.2, "learning_rate": 0.00019602093928196496, "loss": 1.5664, "step": 15279 }, { "epoch": 1.2, "learning_rate": 0.00019600917549412552, "loss": 1.5778, "step": 15280 }, { "epoch": 1.2, "learning_rate": 0.0001959974113939092, "loss": 1.5332, "step": 15281 }, { "epoch": 1.2, "learning_rate": 0.00019598564698139587, "loss": 1.5569, "step": 15282 }, { "epoch": 1.2, "learning_rate": 0.00019597388225666535, "loss": 1.5263, "step": 15283 }, { "epoch": 1.2, "learning_rate": 0.0001959621172197976, "loss": 1.5014, "step": 15284 }, { "epoch": 1.2, "learning_rate": 0.00019595035187087236, "loss": 1.527, "step": 15285 }, { "epoch": 1.2, "learning_rate": 0.0001959385862099696, "loss": 1.4592, "step": 15286 }, { "epoch": 1.2, "learning_rate": 0.00019592682023716925, "loss": 1.5439, "step": 15287 }, { "epoch": 1.2, "learning_rate": 0.00019591505395255104, "loss": 1.5235, "step": 15288 }, { "epoch": 1.2, "learning_rate": 0.00019590328735619506, "loss": 1.5922, "step": 15289 }, { "epoch": 1.2, "learning_rate": 0.000195891520448181, "loss": 1.5579, "step": 15290 }, { "epoch": 1.2, "learning_rate": 0.0001958797532285889, "loss": 1.5121, "step": 15291 }, { "epoch": 1.2, "learning_rate": 0.00019586798569749857, "loss": 1.5483, "step": 15292 }, { "epoch": 1.2, "learning_rate": 0.0001958562178549899, "loss": 1.5441, "step": 15293 }, { "epoch": 1.2, "learning_rate": 0.0001958444497011429, "loss": 1.5593, "step": 15294 }, { "epoch": 1.2, "learning_rate": 0.00019583268123603729, "loss": 1.529, "step": 15295 }, { "epoch": 1.2, "learning_rate": 0.00019582091245975308, "loss": 1.5248, "step": 15296 }, { "epoch": 1.2, "learning_rate": 0.0001958091433723702, "loss": 1.5237, "step": 15297 }, { "epoch": 1.2, "learning_rate": 0.00019579737397396851, "loss": 1.5798, "step": 15298 }, { "epoch": 1.2, "learning_rate": 0.00019578560426462794, "loss": 1.5554, "step": 15299 }, { "epoch": 1.2, "learning_rate": 0.00019577383424442836, "loss": 1.551, "step": 15300 }, { "epoch": 1.2, "learning_rate": 0.00019576206391344971, "loss": 1.4884, "step": 15301 }, { "epoch": 1.2, "learning_rate": 0.00019575029327177187, "loss": 1.5564, "step": 15302 }, { "epoch": 1.2, "learning_rate": 0.00019573852231947482, "loss": 1.5665, "step": 15303 }, { "epoch": 1.2, "learning_rate": 0.00019572675105663842, "loss": 1.5484, "step": 15304 }, { "epoch": 1.2, "learning_rate": 0.00019571497948334265, "loss": 1.5883, "step": 15305 }, { "epoch": 1.2, "learning_rate": 0.0001957032075996674, "loss": 1.624, "step": 15306 }, { "epoch": 1.2, "learning_rate": 0.00019569143540569255, "loss": 1.5579, "step": 15307 }, { "epoch": 1.2, "learning_rate": 0.00019567966290149808, "loss": 1.5526, "step": 15308 }, { "epoch": 1.2, "learning_rate": 0.00019566789008716395, "loss": 1.5976, "step": 15309 }, { "epoch": 1.2, "learning_rate": 0.00019565611696276998, "loss": 1.5371, "step": 15310 }, { "epoch": 1.2, "learning_rate": 0.00019564434352839624, "loss": 1.5677, "step": 15311 }, { "epoch": 1.2, "learning_rate": 0.00019563256978412253, "loss": 1.5502, "step": 15312 }, { "epoch": 1.2, "learning_rate": 0.00019562079573002888, "loss": 1.5279, "step": 15313 }, { "epoch": 1.2, "learning_rate": 0.0001956090213661952, "loss": 1.5123, "step": 15314 }, { "epoch": 1.21, "learning_rate": 0.00019559724669270144, "loss": 1.5086, "step": 15315 }, { "epoch": 1.21, "learning_rate": 0.00019558547170962754, "loss": 1.5283, "step": 15316 }, { "epoch": 1.21, "learning_rate": 0.00019557369641705344, "loss": 1.5322, "step": 15317 }, { "epoch": 1.21, "learning_rate": 0.0001955619208150591, "loss": 1.5441, "step": 15318 }, { "epoch": 1.21, "learning_rate": 0.00019555014490372445, "loss": 1.5533, "step": 15319 }, { "epoch": 1.21, "learning_rate": 0.00019553836868312945, "loss": 1.5209, "step": 15320 }, { "epoch": 1.21, "learning_rate": 0.00019552659215335406, "loss": 1.5492, "step": 15321 }, { "epoch": 1.21, "learning_rate": 0.00019551481531447822, "loss": 1.5816, "step": 15322 }, { "epoch": 1.21, "learning_rate": 0.00019550303816658196, "loss": 1.621, "step": 15323 }, { "epoch": 1.21, "learning_rate": 0.0001954912607097451, "loss": 1.564, "step": 15324 }, { "epoch": 1.21, "learning_rate": 0.0001954794829440477, "loss": 1.5872, "step": 15325 }, { "epoch": 1.21, "learning_rate": 0.0001954677048695698, "loss": 1.5542, "step": 15326 }, { "epoch": 1.21, "learning_rate": 0.0001954559264863912, "loss": 1.4857, "step": 15327 }, { "epoch": 1.21, "learning_rate": 0.0001954441477945919, "loss": 1.5337, "step": 15328 }, { "epoch": 1.21, "learning_rate": 0.000195432368794252, "loss": 1.5127, "step": 15329 }, { "epoch": 1.21, "learning_rate": 0.00019542058948545136, "loss": 1.5694, "step": 15330 }, { "epoch": 1.21, "learning_rate": 0.00019540880986826994, "loss": 1.504, "step": 15331 }, { "epoch": 1.21, "learning_rate": 0.00019539702994278782, "loss": 1.5496, "step": 15332 }, { "epoch": 1.21, "learning_rate": 0.00019538524970908489, "loss": 1.5604, "step": 15333 }, { "epoch": 1.21, "learning_rate": 0.00019537346916724115, "loss": 1.5649, "step": 15334 }, { "epoch": 1.21, "learning_rate": 0.00019536168831733657, "loss": 1.561, "step": 15335 }, { "epoch": 1.21, "learning_rate": 0.0001953499071594512, "loss": 1.5723, "step": 15336 }, { "epoch": 1.21, "learning_rate": 0.00019533812569366498, "loss": 1.5432, "step": 15337 }, { "epoch": 1.21, "learning_rate": 0.00019532634392005794, "loss": 1.5054, "step": 15338 }, { "epoch": 1.21, "learning_rate": 0.00019531456183871, "loss": 1.4959, "step": 15339 }, { "epoch": 1.21, "learning_rate": 0.00019530277944970122, "loss": 1.6402, "step": 15340 }, { "epoch": 1.21, "learning_rate": 0.00019529099675311154, "loss": 1.5067, "step": 15341 }, { "epoch": 1.21, "learning_rate": 0.00019527921374902098, "loss": 1.6224, "step": 15342 }, { "epoch": 1.21, "learning_rate": 0.00019526743043750955, "loss": 1.561, "step": 15343 }, { "epoch": 1.21, "learning_rate": 0.00019525564681865723, "loss": 1.6096, "step": 15344 }, { "epoch": 1.21, "learning_rate": 0.0001952438628925441, "loss": 1.5142, "step": 15345 }, { "epoch": 1.21, "learning_rate": 0.00019523207865925006, "loss": 1.5681, "step": 15346 }, { "epoch": 1.21, "learning_rate": 0.0001952202941188552, "loss": 1.512, "step": 15347 }, { "epoch": 1.21, "learning_rate": 0.00019520850927143946, "loss": 1.5087, "step": 15348 }, { "epoch": 1.21, "learning_rate": 0.0001951967241170829, "loss": 1.4646, "step": 15349 }, { "epoch": 1.21, "learning_rate": 0.00019518493865586557, "loss": 1.5217, "step": 15350 }, { "epoch": 1.21, "learning_rate": 0.00019517315288786736, "loss": 1.5797, "step": 15351 }, { "epoch": 1.21, "learning_rate": 0.00019516136681316845, "loss": 1.561, "step": 15352 }, { "epoch": 1.21, "learning_rate": 0.00019514958043184873, "loss": 1.5186, "step": 15353 }, { "epoch": 1.21, "learning_rate": 0.0001951377937439883, "loss": 1.5146, "step": 15354 }, { "epoch": 1.21, "learning_rate": 0.00019512600674966718, "loss": 1.5034, "step": 15355 }, { "epoch": 1.21, "learning_rate": 0.00019511421944896535, "loss": 1.5641, "step": 15356 }, { "epoch": 1.21, "learning_rate": 0.00019510243184196288, "loss": 1.587, "step": 15357 }, { "epoch": 1.21, "learning_rate": 0.00019509064392873973, "loss": 1.5164, "step": 15358 }, { "epoch": 1.21, "learning_rate": 0.00019507885570937603, "loss": 1.5152, "step": 15359 }, { "epoch": 1.21, "learning_rate": 0.0001950670671839518, "loss": 1.5335, "step": 15360 }, { "epoch": 1.21, "learning_rate": 0.000195055278352547, "loss": 1.5158, "step": 15361 }, { "epoch": 1.21, "learning_rate": 0.0001950434892152418, "loss": 1.5351, "step": 15362 }, { "epoch": 1.21, "learning_rate": 0.0001950316997721161, "loss": 1.5179, "step": 15363 }, { "epoch": 1.21, "learning_rate": 0.00019501991002325003, "loss": 1.5932, "step": 15364 }, { "epoch": 1.21, "learning_rate": 0.00019500811996872364, "loss": 1.569, "step": 15365 }, { "epoch": 1.21, "learning_rate": 0.00019499632960861692, "loss": 1.466, "step": 15366 }, { "epoch": 1.21, "learning_rate": 0.00019498453894300995, "loss": 1.5005, "step": 15367 }, { "epoch": 1.21, "learning_rate": 0.0001949727479719828, "loss": 1.5353, "step": 15368 }, { "epoch": 1.21, "learning_rate": 0.0001949609566956155, "loss": 1.5581, "step": 15369 }, { "epoch": 1.21, "learning_rate": 0.0001949491651139881, "loss": 1.5026, "step": 15370 }, { "epoch": 1.21, "learning_rate": 0.0001949373732271807, "loss": 1.5472, "step": 15371 }, { "epoch": 1.21, "learning_rate": 0.00019492558103527337, "loss": 1.5131, "step": 15372 }, { "epoch": 1.21, "learning_rate": 0.00019491378853834606, "loss": 1.5383, "step": 15373 }, { "epoch": 1.21, "learning_rate": 0.00019490199573647898, "loss": 1.5811, "step": 15374 }, { "epoch": 1.21, "learning_rate": 0.0001948902026297521, "loss": 1.4935, "step": 15375 }, { "epoch": 1.21, "learning_rate": 0.00019487840921824553, "loss": 1.5541, "step": 15376 }, { "epoch": 1.21, "learning_rate": 0.00019486661550203928, "loss": 1.5278, "step": 15377 }, { "epoch": 1.21, "learning_rate": 0.00019485482148121349, "loss": 1.5383, "step": 15378 }, { "epoch": 1.21, "learning_rate": 0.00019484302715584823, "loss": 1.556, "step": 15379 }, { "epoch": 1.21, "learning_rate": 0.00019483123252602355, "loss": 1.5298, "step": 15380 }, { "epoch": 1.21, "learning_rate": 0.00019481943759181954, "loss": 1.5078, "step": 15381 }, { "epoch": 1.21, "learning_rate": 0.00019480764235331634, "loss": 1.5646, "step": 15382 }, { "epoch": 1.21, "learning_rate": 0.00019479584681059386, "loss": 1.5851, "step": 15383 }, { "epoch": 1.21, "learning_rate": 0.0001947840509637324, "loss": 1.5656, "step": 15384 }, { "epoch": 1.21, "learning_rate": 0.00019477225481281192, "loss": 1.573, "step": 15385 }, { "epoch": 1.21, "learning_rate": 0.00019476045835791254, "loss": 1.5577, "step": 15386 }, { "epoch": 1.21, "learning_rate": 0.00019474866159911432, "loss": 1.56, "step": 15387 }, { "epoch": 1.21, "learning_rate": 0.00019473686453649742, "loss": 1.5167, "step": 15388 }, { "epoch": 1.21, "learning_rate": 0.00019472506717014187, "loss": 1.5413, "step": 15389 }, { "epoch": 1.21, "learning_rate": 0.00019471326950012778, "loss": 1.4872, "step": 15390 }, { "epoch": 1.21, "learning_rate": 0.00019470147152653532, "loss": 1.5048, "step": 15391 }, { "epoch": 1.21, "learning_rate": 0.0001946896732494445, "loss": 1.5983, "step": 15392 }, { "epoch": 1.21, "learning_rate": 0.00019467787466893546, "loss": 1.5506, "step": 15393 }, { "epoch": 1.21, "learning_rate": 0.00019466607578508832, "loss": 1.5474, "step": 15394 }, { "epoch": 1.21, "learning_rate": 0.00019465427659798318, "loss": 1.5153, "step": 15395 }, { "epoch": 1.21, "learning_rate": 0.00019464247710770016, "loss": 1.5187, "step": 15396 }, { "epoch": 1.21, "learning_rate": 0.0001946306773143193, "loss": 1.5125, "step": 15397 }, { "epoch": 1.21, "learning_rate": 0.00019461887721792078, "loss": 1.535, "step": 15398 }, { "epoch": 1.21, "learning_rate": 0.00019460707681858474, "loss": 1.5528, "step": 15399 }, { "epoch": 1.21, "learning_rate": 0.00019459527611639122, "loss": 1.527, "step": 15400 }, { "epoch": 1.21, "learning_rate": 0.00019458347511142044, "loss": 1.5514, "step": 15401 }, { "epoch": 1.21, "learning_rate": 0.00019457167380375245, "loss": 1.5756, "step": 15402 }, { "epoch": 1.21, "learning_rate": 0.00019455987219346737, "loss": 1.5663, "step": 15403 }, { "epoch": 1.21, "learning_rate": 0.00019454807028064535, "loss": 1.5862, "step": 15404 }, { "epoch": 1.21, "learning_rate": 0.00019453626806536654, "loss": 1.5417, "step": 15405 }, { "epoch": 1.21, "learning_rate": 0.00019452446554771101, "loss": 1.5267, "step": 15406 }, { "epoch": 1.21, "learning_rate": 0.00019451266272775897, "loss": 1.5467, "step": 15407 }, { "epoch": 1.21, "learning_rate": 0.00019450085960559052, "loss": 1.5474, "step": 15408 }, { "epoch": 1.21, "learning_rate": 0.00019448905618128575, "loss": 1.5198, "step": 15409 }, { "epoch": 1.21, "learning_rate": 0.00019447725245492486, "loss": 1.5624, "step": 15410 }, { "epoch": 1.21, "learning_rate": 0.00019446544842658797, "loss": 1.5558, "step": 15411 }, { "epoch": 1.21, "learning_rate": 0.00019445364409635522, "loss": 1.5581, "step": 15412 }, { "epoch": 1.21, "learning_rate": 0.0001944418394643068, "loss": 1.5441, "step": 15413 }, { "epoch": 1.21, "learning_rate": 0.00019443003453052272, "loss": 1.4992, "step": 15414 }, { "epoch": 1.21, "learning_rate": 0.00019441822929508332, "loss": 1.5455, "step": 15415 }, { "epoch": 1.21, "learning_rate": 0.0001944064237580686, "loss": 1.5698, "step": 15416 }, { "epoch": 1.21, "learning_rate": 0.00019439461791955878, "loss": 1.5467, "step": 15417 }, { "epoch": 1.21, "learning_rate": 0.00019438281177963402, "loss": 1.5746, "step": 15418 }, { "epoch": 1.21, "learning_rate": 0.00019437100533837445, "loss": 1.5828, "step": 15419 }, { "epoch": 1.21, "learning_rate": 0.0001943591985958602, "loss": 1.5081, "step": 15420 }, { "epoch": 1.21, "learning_rate": 0.00019434739155217156, "loss": 1.5299, "step": 15421 }, { "epoch": 1.21, "learning_rate": 0.0001943355842073885, "loss": 1.5717, "step": 15422 }, { "epoch": 1.21, "learning_rate": 0.00019432377656159136, "loss": 1.5259, "step": 15423 }, { "epoch": 1.21, "learning_rate": 0.0001943119686148602, "loss": 1.5691, "step": 15424 }, { "epoch": 1.21, "learning_rate": 0.0001943001603672753, "loss": 1.5141, "step": 15425 }, { "epoch": 1.21, "learning_rate": 0.0001942883518189167, "loss": 1.6127, "step": 15426 }, { "epoch": 1.21, "learning_rate": 0.0001942765429698646, "loss": 1.4978, "step": 15427 }, { "epoch": 1.21, "learning_rate": 0.00019426473382019928, "loss": 1.5773, "step": 15428 }, { "epoch": 1.21, "learning_rate": 0.00019425292437000077, "loss": 1.5638, "step": 15429 }, { "epoch": 1.21, "learning_rate": 0.00019424111461934936, "loss": 1.566, "step": 15430 }, { "epoch": 1.21, "learning_rate": 0.0001942293045683252, "loss": 1.6251, "step": 15431 }, { "epoch": 1.21, "learning_rate": 0.00019421749421700846, "loss": 1.5609, "step": 15432 }, { "epoch": 1.21, "learning_rate": 0.00019420568356547934, "loss": 1.5977, "step": 15433 }, { "epoch": 1.21, "learning_rate": 0.000194193872613818, "loss": 1.5159, "step": 15434 }, { "epoch": 1.21, "learning_rate": 0.00019418206136210473, "loss": 1.542, "step": 15435 }, { "epoch": 1.21, "learning_rate": 0.00019417024981041958, "loss": 1.5252, "step": 15436 }, { "epoch": 1.21, "learning_rate": 0.0001941584379588428, "loss": 1.6064, "step": 15437 }, { "epoch": 1.21, "learning_rate": 0.00019414662580745463, "loss": 1.592, "step": 15438 }, { "epoch": 1.21, "learning_rate": 0.00019413481335633519, "loss": 1.5337, "step": 15439 }, { "epoch": 1.21, "learning_rate": 0.00019412300060556476, "loss": 1.5329, "step": 15440 }, { "epoch": 1.21, "learning_rate": 0.0001941111875552235, "loss": 1.5457, "step": 15441 }, { "epoch": 1.21, "learning_rate": 0.00019409937420539165, "loss": 1.5311, "step": 15442 }, { "epoch": 1.22, "learning_rate": 0.00019408756055614934, "loss": 1.5305, "step": 15443 }, { "epoch": 1.22, "learning_rate": 0.00019407574660757683, "loss": 1.5493, "step": 15444 }, { "epoch": 1.22, "learning_rate": 0.0001940639323597543, "loss": 1.5809, "step": 15445 }, { "epoch": 1.22, "learning_rate": 0.00019405211781276202, "loss": 1.6023, "step": 15446 }, { "epoch": 1.22, "learning_rate": 0.0001940403029666802, "loss": 1.525, "step": 15447 }, { "epoch": 1.22, "learning_rate": 0.00019402848782158898, "loss": 1.5585, "step": 15448 }, { "epoch": 1.22, "learning_rate": 0.00019401667237756861, "loss": 1.5284, "step": 15449 }, { "epoch": 1.22, "learning_rate": 0.00019400485663469938, "loss": 1.5727, "step": 15450 }, { "epoch": 1.22, "learning_rate": 0.0001939930405930614, "loss": 1.5573, "step": 15451 }, { "epoch": 1.22, "learning_rate": 0.00019398122425273503, "loss": 1.4825, "step": 15452 }, { "epoch": 1.22, "learning_rate": 0.0001939694076138003, "loss": 1.5609, "step": 15453 }, { "epoch": 1.22, "learning_rate": 0.00019395759067633765, "loss": 1.5462, "step": 15454 }, { "epoch": 1.22, "learning_rate": 0.0001939457734404272, "loss": 1.4955, "step": 15455 }, { "epoch": 1.22, "learning_rate": 0.00019393395590614919, "loss": 1.5868, "step": 15456 }, { "epoch": 1.22, "learning_rate": 0.0001939221380735839, "loss": 1.5487, "step": 15457 }, { "epoch": 1.22, "learning_rate": 0.00019391031994281147, "loss": 1.5172, "step": 15458 }, { "epoch": 1.22, "learning_rate": 0.00019389850151391223, "loss": 1.567, "step": 15459 }, { "epoch": 1.22, "learning_rate": 0.0001938866827869664, "loss": 1.541, "step": 15460 }, { "epoch": 1.22, "learning_rate": 0.0001938748637620542, "loss": 1.4659, "step": 15461 }, { "epoch": 1.22, "learning_rate": 0.00019386304443925583, "loss": 1.5114, "step": 15462 }, { "epoch": 1.22, "learning_rate": 0.00019385122481865166, "loss": 1.5083, "step": 15463 }, { "epoch": 1.22, "learning_rate": 0.0001938394049003219, "loss": 1.5443, "step": 15464 }, { "epoch": 1.22, "learning_rate": 0.00019382758468434671, "loss": 1.5705, "step": 15465 }, { "epoch": 1.22, "learning_rate": 0.00019381576417080643, "loss": 1.6054, "step": 15466 }, { "epoch": 1.22, "learning_rate": 0.0001938039433597813, "loss": 1.5311, "step": 15467 }, { "epoch": 1.22, "learning_rate": 0.00019379212225135154, "loss": 1.5546, "step": 15468 }, { "epoch": 1.22, "learning_rate": 0.00019378030084559746, "loss": 1.561, "step": 15469 }, { "epoch": 1.22, "learning_rate": 0.00019376847914259927, "loss": 1.5863, "step": 15470 }, { "epoch": 1.22, "learning_rate": 0.00019375665714243734, "loss": 1.5295, "step": 15471 }, { "epoch": 1.22, "learning_rate": 0.00019374483484519176, "loss": 1.5066, "step": 15472 }, { "epoch": 1.22, "learning_rate": 0.00019373301225094293, "loss": 1.5474, "step": 15473 }, { "epoch": 1.22, "learning_rate": 0.0001937211893597711, "loss": 1.5227, "step": 15474 }, { "epoch": 1.22, "learning_rate": 0.00019370936617175652, "loss": 1.5323, "step": 15475 }, { "epoch": 1.22, "learning_rate": 0.00019369754268697945, "loss": 1.5752, "step": 15476 }, { "epoch": 1.22, "learning_rate": 0.0001936857189055201, "loss": 1.5643, "step": 15477 }, { "epoch": 1.22, "learning_rate": 0.00019367389482745893, "loss": 1.5914, "step": 15478 }, { "epoch": 1.22, "learning_rate": 0.0001936620704528761, "loss": 1.5179, "step": 15479 }, { "epoch": 1.22, "learning_rate": 0.00019365024578185192, "loss": 1.535, "step": 15480 }, { "epoch": 1.22, "learning_rate": 0.00019363842081446662, "loss": 1.5557, "step": 15481 }, { "epoch": 1.22, "learning_rate": 0.00019362659555080053, "loss": 1.5732, "step": 15482 }, { "epoch": 1.22, "learning_rate": 0.00019361476999093396, "loss": 1.5334, "step": 15483 }, { "epoch": 1.22, "learning_rate": 0.00019360294413494714, "loss": 1.5584, "step": 15484 }, { "epoch": 1.22, "learning_rate": 0.00019359111798292035, "loss": 1.557, "step": 15485 }, { "epoch": 1.22, "learning_rate": 0.00019357929153493404, "loss": 1.5614, "step": 15486 }, { "epoch": 1.22, "learning_rate": 0.0001935674647910683, "loss": 1.545, "step": 15487 }, { "epoch": 1.22, "learning_rate": 0.00019355563775140357, "loss": 1.5188, "step": 15488 }, { "epoch": 1.22, "learning_rate": 0.00019354381041602003, "loss": 1.5233, "step": 15489 }, { "epoch": 1.22, "learning_rate": 0.00019353198278499812, "loss": 1.5116, "step": 15490 }, { "epoch": 1.22, "learning_rate": 0.000193520154858418, "loss": 1.5635, "step": 15491 }, { "epoch": 1.22, "learning_rate": 0.0001935083266363601, "loss": 1.5191, "step": 15492 }, { "epoch": 1.22, "learning_rate": 0.0001934964981189046, "loss": 1.5825, "step": 15493 }, { "epoch": 1.22, "learning_rate": 0.00019348466930613198, "loss": 1.518, "step": 15494 }, { "epoch": 1.22, "learning_rate": 0.00019347284019812237, "loss": 1.5448, "step": 15495 }, { "epoch": 1.22, "learning_rate": 0.00019346101079495623, "loss": 1.5352, "step": 15496 }, { "epoch": 1.22, "learning_rate": 0.00019344918109671374, "loss": 1.5374, "step": 15497 }, { "epoch": 1.22, "learning_rate": 0.00019343735110347537, "loss": 1.5425, "step": 15498 }, { "epoch": 1.22, "learning_rate": 0.0001934255208153213, "loss": 1.5018, "step": 15499 }, { "epoch": 1.22, "learning_rate": 0.0001934136902323319, "loss": 1.4945, "step": 15500 }, { "epoch": 1.22, "learning_rate": 0.00019340185935458752, "loss": 1.5477, "step": 15501 }, { "epoch": 1.22, "learning_rate": 0.00019339002818216848, "loss": 1.4983, "step": 15502 }, { "epoch": 1.22, "learning_rate": 0.0001933781967151551, "loss": 1.5183, "step": 15503 }, { "epoch": 1.22, "learning_rate": 0.0001933663649536277, "loss": 1.591, "step": 15504 }, { "epoch": 1.22, "learning_rate": 0.00019335453289766655, "loss": 1.5616, "step": 15505 }, { "epoch": 1.22, "learning_rate": 0.00019334270054735214, "loss": 1.5243, "step": 15506 }, { "epoch": 1.22, "learning_rate": 0.00019333086790276465, "loss": 1.552, "step": 15507 }, { "epoch": 1.22, "learning_rate": 0.00019331903496398446, "loss": 1.5668, "step": 15508 }, { "epoch": 1.22, "learning_rate": 0.000193307201731092, "loss": 1.5258, "step": 15509 }, { "epoch": 1.22, "learning_rate": 0.0001932953682041675, "loss": 1.504, "step": 15510 }, { "epoch": 1.22, "learning_rate": 0.00019328353438329135, "loss": 1.4725, "step": 15511 }, { "epoch": 1.22, "learning_rate": 0.00019327170026854388, "loss": 1.4998, "step": 15512 }, { "epoch": 1.22, "learning_rate": 0.00019325986586000543, "loss": 1.4844, "step": 15513 }, { "epoch": 1.22, "learning_rate": 0.00019324803115775636, "loss": 1.5186, "step": 15514 }, { "epoch": 1.22, "learning_rate": 0.0001932361961618771, "loss": 1.5354, "step": 15515 }, { "epoch": 1.22, "learning_rate": 0.00019322436087244784, "loss": 1.5261, "step": 15516 }, { "epoch": 1.22, "learning_rate": 0.0001932125252895491, "loss": 1.5606, "step": 15517 }, { "epoch": 1.22, "learning_rate": 0.00019320068941326108, "loss": 1.5619, "step": 15518 }, { "epoch": 1.22, "learning_rate": 0.00019318885324366423, "loss": 1.5253, "step": 15519 }, { "epoch": 1.22, "learning_rate": 0.00019317701678083895, "loss": 1.5238, "step": 15520 }, { "epoch": 1.22, "learning_rate": 0.00019316518002486554, "loss": 1.5532, "step": 15521 }, { "epoch": 1.22, "learning_rate": 0.00019315334297582436, "loss": 1.4829, "step": 15522 }, { "epoch": 1.22, "learning_rate": 0.0001931415056337958, "loss": 1.4946, "step": 15523 }, { "epoch": 1.22, "learning_rate": 0.0001931296679988602, "loss": 1.487, "step": 15524 }, { "epoch": 1.22, "learning_rate": 0.000193117830071098, "loss": 1.5295, "step": 15525 }, { "epoch": 1.22, "learning_rate": 0.00019310599185058948, "loss": 1.5594, "step": 15526 }, { "epoch": 1.22, "learning_rate": 0.00019309415333741513, "loss": 1.4972, "step": 15527 }, { "epoch": 1.22, "learning_rate": 0.0001930823145316552, "loss": 1.5163, "step": 15528 }, { "epoch": 1.22, "learning_rate": 0.00019307047543339016, "loss": 1.5269, "step": 15529 }, { "epoch": 1.22, "learning_rate": 0.00019305863604270035, "loss": 1.5707, "step": 15530 }, { "epoch": 1.22, "learning_rate": 0.00019304679635966617, "loss": 1.5785, "step": 15531 }, { "epoch": 1.22, "learning_rate": 0.00019303495638436796, "loss": 1.565, "step": 15532 }, { "epoch": 1.22, "learning_rate": 0.0001930231161168862, "loss": 1.5888, "step": 15533 }, { "epoch": 1.22, "learning_rate": 0.0001930112755573012, "loss": 1.5246, "step": 15534 }, { "epoch": 1.22, "learning_rate": 0.00019299943470569338, "loss": 1.518, "step": 15535 }, { "epoch": 1.22, "learning_rate": 0.00019298759356214314, "loss": 1.5427, "step": 15536 }, { "epoch": 1.22, "learning_rate": 0.00019297575212673084, "loss": 1.5665, "step": 15537 }, { "epoch": 1.22, "learning_rate": 0.0001929639103995369, "loss": 1.55, "step": 15538 }, { "epoch": 1.22, "learning_rate": 0.0001929520683806417, "loss": 1.4961, "step": 15539 }, { "epoch": 1.22, "learning_rate": 0.00019294022607012568, "loss": 1.5259, "step": 15540 }, { "epoch": 1.22, "learning_rate": 0.0001929283834680692, "loss": 1.5453, "step": 15541 }, { "epoch": 1.22, "learning_rate": 0.00019291654057455274, "loss": 1.5317, "step": 15542 }, { "epoch": 1.22, "learning_rate": 0.0001929046973896566, "loss": 1.5826, "step": 15543 }, { "epoch": 1.22, "learning_rate": 0.0001928928539134613, "loss": 1.5054, "step": 15544 }, { "epoch": 1.22, "learning_rate": 0.00019288101014604714, "loss": 1.5448, "step": 15545 }, { "epoch": 1.22, "learning_rate": 0.00019286916608749461, "loss": 1.5612, "step": 15546 }, { "epoch": 1.22, "learning_rate": 0.0001928573217378841, "loss": 1.5564, "step": 15547 }, { "epoch": 1.22, "learning_rate": 0.00019284547709729597, "loss": 1.552, "step": 15548 }, { "epoch": 1.22, "learning_rate": 0.00019283363216581078, "loss": 1.5604, "step": 15549 }, { "epoch": 1.22, "learning_rate": 0.00019282178694350879, "loss": 1.5091, "step": 15550 }, { "epoch": 1.22, "learning_rate": 0.00019280994143047053, "loss": 1.5367, "step": 15551 }, { "epoch": 1.22, "learning_rate": 0.00019279809562677643, "loss": 1.5315, "step": 15552 }, { "epoch": 1.22, "learning_rate": 0.00019278624953250682, "loss": 1.557, "step": 15553 }, { "epoch": 1.22, "learning_rate": 0.0001927744031477422, "loss": 1.54, "step": 15554 }, { "epoch": 1.22, "learning_rate": 0.00019276255647256298, "loss": 1.5223, "step": 15555 }, { "epoch": 1.22, "learning_rate": 0.00019275070950704965, "loss": 1.5596, "step": 15556 }, { "epoch": 1.22, "learning_rate": 0.00019273886225128258, "loss": 1.5352, "step": 15557 }, { "epoch": 1.22, "learning_rate": 0.00019272701470534215, "loss": 1.4809, "step": 15558 }, { "epoch": 1.22, "learning_rate": 0.00019271516686930894, "loss": 1.6166, "step": 15559 }, { "epoch": 1.22, "learning_rate": 0.00019270331874326332, "loss": 1.4841, "step": 15560 }, { "epoch": 1.22, "learning_rate": 0.00019269147032728568, "loss": 1.5591, "step": 15561 }, { "epoch": 1.22, "learning_rate": 0.00019267962162145658, "loss": 1.4944, "step": 15562 }, { "epoch": 1.22, "learning_rate": 0.00019266777262585632, "loss": 1.5555, "step": 15563 }, { "epoch": 1.22, "learning_rate": 0.0001926559233405655, "loss": 1.5434, "step": 15564 }, { "epoch": 1.22, "learning_rate": 0.00019264407376566448, "loss": 1.5383, "step": 15565 }, { "epoch": 1.22, "learning_rate": 0.00019263222390123374, "loss": 1.5314, "step": 15566 }, { "epoch": 1.22, "learning_rate": 0.0001926203737473537, "loss": 1.5142, "step": 15567 }, { "epoch": 1.22, "learning_rate": 0.00019260852330410487, "loss": 1.5592, "step": 15568 }, { "epoch": 1.22, "learning_rate": 0.0001925966725715677, "loss": 1.5444, "step": 15569 }, { "epoch": 1.23, "learning_rate": 0.00019258482154982257, "loss": 1.4941, "step": 15570 }, { "epoch": 1.23, "learning_rate": 0.00019257297023895, "loss": 1.5522, "step": 15571 }, { "epoch": 1.23, "learning_rate": 0.00019256111863903049, "loss": 1.5129, "step": 15572 }, { "epoch": 1.23, "learning_rate": 0.0001925492667501445, "loss": 1.5187, "step": 15573 }, { "epoch": 1.23, "learning_rate": 0.00019253741457237245, "loss": 1.5513, "step": 15574 }, { "epoch": 1.23, "learning_rate": 0.00019252556210579478, "loss": 1.5482, "step": 15575 }, { "epoch": 1.23, "learning_rate": 0.00019251370935049206, "loss": 1.5818, "step": 15576 }, { "epoch": 1.23, "learning_rate": 0.00019250185630654472, "loss": 1.5026, "step": 15577 }, { "epoch": 1.23, "learning_rate": 0.00019249000297403318, "loss": 1.5497, "step": 15578 }, { "epoch": 1.23, "learning_rate": 0.00019247814935303802, "loss": 1.578, "step": 15579 }, { "epoch": 1.23, "learning_rate": 0.00019246629544363963, "loss": 1.5166, "step": 15580 }, { "epoch": 1.23, "learning_rate": 0.00019245444124591857, "loss": 1.5285, "step": 15581 }, { "epoch": 1.23, "learning_rate": 0.00019244258675995524, "loss": 1.5381, "step": 15582 }, { "epoch": 1.23, "learning_rate": 0.0001924307319858302, "loss": 1.5632, "step": 15583 }, { "epoch": 1.23, "learning_rate": 0.00019241887692362389, "loss": 1.5528, "step": 15584 }, { "epoch": 1.23, "learning_rate": 0.00019240702157341682, "loss": 1.4855, "step": 15585 }, { "epoch": 1.23, "learning_rate": 0.00019239516593528948, "loss": 1.5644, "step": 15586 }, { "epoch": 1.23, "learning_rate": 0.00019238331000932232, "loss": 1.5605, "step": 15587 }, { "epoch": 1.23, "learning_rate": 0.00019237145379559593, "loss": 1.5346, "step": 15588 }, { "epoch": 1.23, "learning_rate": 0.00019235959729419072, "loss": 1.5826, "step": 15589 }, { "epoch": 1.23, "learning_rate": 0.0001923477405051872, "loss": 1.6003, "step": 15590 }, { "epoch": 1.23, "learning_rate": 0.00019233588342866594, "loss": 1.5496, "step": 15591 }, { "epoch": 1.23, "learning_rate": 0.00019232402606470737, "loss": 1.5369, "step": 15592 }, { "epoch": 1.23, "learning_rate": 0.00019231216841339202, "loss": 1.5915, "step": 15593 }, { "epoch": 1.23, "learning_rate": 0.0001923003104748004, "loss": 1.5392, "step": 15594 }, { "epoch": 1.23, "learning_rate": 0.00019228845224901302, "loss": 1.5668, "step": 15595 }, { "epoch": 1.23, "learning_rate": 0.00019227659373611037, "loss": 1.5047, "step": 15596 }, { "epoch": 1.23, "learning_rate": 0.00019226473493617297, "loss": 1.5325, "step": 15597 }, { "epoch": 1.23, "learning_rate": 0.00019225287584928138, "loss": 1.561, "step": 15598 }, { "epoch": 1.23, "learning_rate": 0.00019224101647551605, "loss": 1.5615, "step": 15599 }, { "epoch": 1.23, "learning_rate": 0.00019222915681495754, "loss": 1.5591, "step": 15600 }, { "epoch": 1.23, "learning_rate": 0.00019221729686768634, "loss": 1.556, "step": 15601 }, { "epoch": 1.23, "learning_rate": 0.00019220543663378304, "loss": 1.5321, "step": 15602 }, { "epoch": 1.23, "learning_rate": 0.00019219357611332806, "loss": 1.5405, "step": 15603 }, { "epoch": 1.23, "learning_rate": 0.00019218171530640198, "loss": 1.5203, "step": 15604 }, { "epoch": 1.23, "learning_rate": 0.0001921698542130854, "loss": 1.527, "step": 15605 }, { "epoch": 1.23, "learning_rate": 0.00019215799283345874, "loss": 1.5634, "step": 15606 }, { "epoch": 1.23, "learning_rate": 0.00019214613116760255, "loss": 1.5241, "step": 15607 }, { "epoch": 1.23, "learning_rate": 0.00019213426921559746, "loss": 1.5244, "step": 15608 }, { "epoch": 1.23, "learning_rate": 0.00019212240697752387, "loss": 1.5644, "step": 15609 }, { "epoch": 1.23, "learning_rate": 0.00019211054445346238, "loss": 1.5512, "step": 15610 }, { "epoch": 1.23, "learning_rate": 0.00019209868164349352, "loss": 1.5835, "step": 15611 }, { "epoch": 1.23, "learning_rate": 0.00019208681854769792, "loss": 1.5405, "step": 15612 }, { "epoch": 1.23, "learning_rate": 0.00019207495516615597, "loss": 1.5512, "step": 15613 }, { "epoch": 1.23, "learning_rate": 0.00019206309149894833, "loss": 1.5597, "step": 15614 }, { "epoch": 1.23, "learning_rate": 0.0001920512275461555, "loss": 1.485, "step": 15615 }, { "epoch": 1.23, "learning_rate": 0.00019203936330785805, "loss": 1.5326, "step": 15616 }, { "epoch": 1.23, "learning_rate": 0.00019202749878413652, "loss": 1.5021, "step": 15617 }, { "epoch": 1.23, "learning_rate": 0.00019201563397507144, "loss": 1.5705, "step": 15618 }, { "epoch": 1.23, "learning_rate": 0.00019200376888074341, "loss": 1.5536, "step": 15619 }, { "epoch": 1.23, "learning_rate": 0.000191991903501233, "loss": 1.5824, "step": 15620 }, { "epoch": 1.23, "learning_rate": 0.00019198003783662068, "loss": 1.5515, "step": 15621 }, { "epoch": 1.23, "learning_rate": 0.0001919681718869871, "loss": 1.5779, "step": 15622 }, { "epoch": 1.23, "learning_rate": 0.00019195630565241282, "loss": 1.4841, "step": 15623 }, { "epoch": 1.23, "learning_rate": 0.00019194443913297834, "loss": 1.5615, "step": 15624 }, { "epoch": 1.23, "learning_rate": 0.0001919325723287643, "loss": 1.5366, "step": 15625 }, { "epoch": 1.23, "learning_rate": 0.00019192070523985118, "loss": 1.556, "step": 15626 }, { "epoch": 1.23, "learning_rate": 0.00019190883786631964, "loss": 1.5118, "step": 15627 }, { "epoch": 1.23, "learning_rate": 0.0001918969702082502, "loss": 1.5626, "step": 15628 }, { "epoch": 1.23, "learning_rate": 0.0001918851022657235, "loss": 1.4779, "step": 15629 }, { "epoch": 1.23, "learning_rate": 0.00019187323403882005, "loss": 1.5575, "step": 15630 }, { "epoch": 1.23, "learning_rate": 0.00019186136552762042, "loss": 1.5381, "step": 15631 }, { "epoch": 1.23, "learning_rate": 0.00019184949673220527, "loss": 1.4963, "step": 15632 }, { "epoch": 1.23, "learning_rate": 0.00019183762765265507, "loss": 1.6265, "step": 15633 }, { "epoch": 1.23, "learning_rate": 0.0001918257582890505, "loss": 1.5425, "step": 15634 }, { "epoch": 1.23, "learning_rate": 0.00019181388864147208, "loss": 1.564, "step": 15635 }, { "epoch": 1.23, "learning_rate": 0.00019180201871000043, "loss": 1.5523, "step": 15636 }, { "epoch": 1.23, "learning_rate": 0.0001917901484947162, "loss": 1.512, "step": 15637 }, { "epoch": 1.23, "learning_rate": 0.0001917782779956999, "loss": 1.5589, "step": 15638 }, { "epoch": 1.23, "learning_rate": 0.00019176640721303215, "loss": 1.5267, "step": 15639 }, { "epoch": 1.23, "learning_rate": 0.0001917545361467935, "loss": 1.5373, "step": 15640 }, { "epoch": 1.23, "learning_rate": 0.00019174266479706463, "loss": 1.5363, "step": 15641 }, { "epoch": 1.23, "learning_rate": 0.0001917307931639261, "loss": 1.5405, "step": 15642 }, { "epoch": 1.23, "learning_rate": 0.00019171892124745848, "loss": 1.6082, "step": 15643 }, { "epoch": 1.23, "learning_rate": 0.00019170704904774246, "loss": 1.5102, "step": 15644 }, { "epoch": 1.23, "learning_rate": 0.00019169517656485855, "loss": 1.5453, "step": 15645 }, { "epoch": 1.23, "learning_rate": 0.00019168330379888741, "loss": 1.5466, "step": 15646 }, { "epoch": 1.23, "learning_rate": 0.00019167143074990967, "loss": 1.4927, "step": 15647 }, { "epoch": 1.23, "learning_rate": 0.0001916595574180059, "loss": 1.524, "step": 15648 }, { "epoch": 1.23, "learning_rate": 0.00019164768380325672, "loss": 1.5138, "step": 15649 }, { "epoch": 1.23, "learning_rate": 0.0001916358099057427, "loss": 1.5623, "step": 15650 }, { "epoch": 1.23, "learning_rate": 0.0001916239357255446, "loss": 1.5904, "step": 15651 }, { "epoch": 1.23, "learning_rate": 0.0001916120612627429, "loss": 1.5203, "step": 15652 }, { "epoch": 1.23, "learning_rate": 0.00019160018651741823, "loss": 1.5741, "step": 15653 }, { "epoch": 1.23, "learning_rate": 0.00019158831148965132, "loss": 1.4969, "step": 15654 }, { "epoch": 1.23, "learning_rate": 0.00019157643617952267, "loss": 1.5573, "step": 15655 }, { "epoch": 1.23, "learning_rate": 0.00019156456058711302, "loss": 1.5118, "step": 15656 }, { "epoch": 1.23, "learning_rate": 0.00019155268471250287, "loss": 1.5423, "step": 15657 }, { "epoch": 1.23, "learning_rate": 0.00019154080855577295, "loss": 1.5487, "step": 15658 }, { "epoch": 1.23, "learning_rate": 0.00019152893211700386, "loss": 1.5004, "step": 15659 }, { "epoch": 1.23, "learning_rate": 0.00019151705539627626, "loss": 1.5202, "step": 15660 }, { "epoch": 1.23, "learning_rate": 0.00019150517839367078, "loss": 1.564, "step": 15661 }, { "epoch": 1.23, "learning_rate": 0.00019149330110926802, "loss": 1.5734, "step": 15662 }, { "epoch": 1.23, "learning_rate": 0.0001914814235431486, "loss": 1.5204, "step": 15663 }, { "epoch": 1.23, "learning_rate": 0.00019146954569539327, "loss": 1.5057, "step": 15664 }, { "epoch": 1.23, "learning_rate": 0.00019145766756608254, "loss": 1.5695, "step": 15665 }, { "epoch": 1.23, "learning_rate": 0.00019144578915529723, "loss": 1.5616, "step": 15666 }, { "epoch": 1.23, "learning_rate": 0.0001914339104631178, "loss": 1.5376, "step": 15667 }, { "epoch": 1.23, "learning_rate": 0.000191422031489625, "loss": 1.5469, "step": 15668 }, { "epoch": 1.23, "learning_rate": 0.00019141015223489948, "loss": 1.5365, "step": 15669 }, { "epoch": 1.23, "learning_rate": 0.00019139827269902188, "loss": 1.5957, "step": 15670 }, { "epoch": 1.23, "learning_rate": 0.00019138639288207286, "loss": 1.5247, "step": 15671 }, { "epoch": 1.23, "learning_rate": 0.00019137451278413304, "loss": 1.5943, "step": 15672 }, { "epoch": 1.23, "learning_rate": 0.0001913626324052831, "loss": 1.5685, "step": 15673 }, { "epoch": 1.23, "learning_rate": 0.00019135075174560372, "loss": 1.5335, "step": 15674 }, { "epoch": 1.23, "learning_rate": 0.00019133887080517557, "loss": 1.5765, "step": 15675 }, { "epoch": 1.23, "learning_rate": 0.00019132698958407936, "loss": 1.5329, "step": 15676 }, { "epoch": 1.23, "learning_rate": 0.00019131510808239563, "loss": 1.5387, "step": 15677 }, { "epoch": 1.23, "learning_rate": 0.00019130322630020512, "loss": 1.5245, "step": 15678 }, { "epoch": 1.23, "learning_rate": 0.0001912913442375885, "loss": 1.573, "step": 15679 }, { "epoch": 1.23, "learning_rate": 0.00019127946189462645, "loss": 1.562, "step": 15680 }, { "epoch": 1.23, "learning_rate": 0.0001912675792713996, "loss": 1.5585, "step": 15681 }, { "epoch": 1.23, "learning_rate": 0.00019125569636798867, "loss": 1.5646, "step": 15682 }, { "epoch": 1.23, "learning_rate": 0.00019124381318447436, "loss": 1.5904, "step": 15683 }, { "epoch": 1.23, "learning_rate": 0.0001912319297209373, "loss": 1.5195, "step": 15684 }, { "epoch": 1.23, "learning_rate": 0.00019122004597745817, "loss": 1.4962, "step": 15685 }, { "epoch": 1.23, "learning_rate": 0.00019120816195411774, "loss": 1.5388, "step": 15686 }, { "epoch": 1.23, "learning_rate": 0.00019119627765099657, "loss": 1.5533, "step": 15687 }, { "epoch": 1.23, "learning_rate": 0.00019118439306817545, "loss": 1.5698, "step": 15688 }, { "epoch": 1.23, "learning_rate": 0.00019117250820573496, "loss": 1.5423, "step": 15689 }, { "epoch": 1.23, "learning_rate": 0.00019116062306375592, "loss": 1.495, "step": 15690 }, { "epoch": 1.23, "learning_rate": 0.00019114873764231892, "loss": 1.5339, "step": 15691 }, { "epoch": 1.23, "learning_rate": 0.00019113685194150476, "loss": 1.5414, "step": 15692 }, { "epoch": 1.23, "learning_rate": 0.00019112496596139405, "loss": 1.5587, "step": 15693 }, { "epoch": 1.23, "learning_rate": 0.00019111307970206748, "loss": 1.5393, "step": 15694 }, { "epoch": 1.23, "learning_rate": 0.00019110119316360588, "loss": 1.4787, "step": 15695 }, { "epoch": 1.23, "learning_rate": 0.00019108930634608977, "loss": 1.5851, "step": 15696 }, { "epoch": 1.24, "learning_rate": 0.00019107741924959996, "loss": 1.5245, "step": 15697 }, { "epoch": 1.24, "learning_rate": 0.00019106553187421717, "loss": 1.5708, "step": 15698 }, { "epoch": 1.24, "learning_rate": 0.00019105364422002203, "loss": 1.5585, "step": 15699 }, { "epoch": 1.24, "learning_rate": 0.00019104175628709534, "loss": 1.5582, "step": 15700 }, { "epoch": 1.24, "learning_rate": 0.00019102986807551778, "loss": 1.5151, "step": 15701 }, { "epoch": 1.24, "learning_rate": 0.00019101797958537002, "loss": 1.5846, "step": 15702 }, { "epoch": 1.24, "learning_rate": 0.00019100609081673287, "loss": 1.536, "step": 15703 }, { "epoch": 1.24, "learning_rate": 0.00019099420176968697, "loss": 1.5119, "step": 15704 }, { "epoch": 1.24, "learning_rate": 0.00019098231244431304, "loss": 1.5388, "step": 15705 }, { "epoch": 1.24, "learning_rate": 0.00019097042284069182, "loss": 1.5839, "step": 15706 }, { "epoch": 1.24, "learning_rate": 0.0001909585329589041, "loss": 1.5737, "step": 15707 }, { "epoch": 1.24, "learning_rate": 0.00019094664279903047, "loss": 1.5683, "step": 15708 }, { "epoch": 1.24, "learning_rate": 0.00019093475236115178, "loss": 1.5555, "step": 15709 }, { "epoch": 1.24, "learning_rate": 0.00019092286164534868, "loss": 1.535, "step": 15710 }, { "epoch": 1.24, "learning_rate": 0.00019091097065170195, "loss": 1.5372, "step": 15711 }, { "epoch": 1.24, "learning_rate": 0.00019089907938029234, "loss": 1.5729, "step": 15712 }, { "epoch": 1.24, "learning_rate": 0.00019088718783120048, "loss": 1.5736, "step": 15713 }, { "epoch": 1.24, "learning_rate": 0.0001908752960045072, "loss": 1.5669, "step": 15714 }, { "epoch": 1.24, "learning_rate": 0.00019086340390029325, "loss": 1.5714, "step": 15715 }, { "epoch": 1.24, "learning_rate": 0.0001908515115186393, "loss": 1.5546, "step": 15716 }, { "epoch": 1.24, "learning_rate": 0.0001908396188596262, "loss": 1.4973, "step": 15717 }, { "epoch": 1.24, "learning_rate": 0.00019082772592333454, "loss": 1.5292, "step": 15718 }, { "epoch": 1.24, "learning_rate": 0.00019081583270984516, "loss": 1.5718, "step": 15719 }, { "epoch": 1.24, "learning_rate": 0.0001908039392192388, "loss": 1.5676, "step": 15720 }, { "epoch": 1.24, "learning_rate": 0.00019079204545159625, "loss": 1.5055, "step": 15721 }, { "epoch": 1.24, "learning_rate": 0.00019078015140699823, "loss": 1.5338, "step": 15722 }, { "epoch": 1.24, "learning_rate": 0.0001907682570855255, "loss": 1.591, "step": 15723 }, { "epoch": 1.24, "learning_rate": 0.00019075636248725873, "loss": 1.579, "step": 15724 }, { "epoch": 1.24, "learning_rate": 0.00019074446761227878, "loss": 1.5756, "step": 15725 }, { "epoch": 1.24, "learning_rate": 0.00019073257246066637, "loss": 1.5243, "step": 15726 }, { "epoch": 1.24, "learning_rate": 0.00019072067703250232, "loss": 1.5699, "step": 15727 }, { "epoch": 1.24, "learning_rate": 0.00019070878132786728, "loss": 1.596, "step": 15728 }, { "epoch": 1.24, "learning_rate": 0.0001906968853468421, "loss": 1.5484, "step": 15729 }, { "epoch": 1.24, "learning_rate": 0.00019068498908950756, "loss": 1.5405, "step": 15730 }, { "epoch": 1.24, "learning_rate": 0.00019067309255594436, "loss": 1.5398, "step": 15731 }, { "epoch": 1.24, "learning_rate": 0.00019066119574623333, "loss": 1.532, "step": 15732 }, { "epoch": 1.24, "learning_rate": 0.0001906492986604552, "loss": 1.5269, "step": 15733 }, { "epoch": 1.24, "learning_rate": 0.0001906374012986908, "loss": 1.506, "step": 15734 }, { "epoch": 1.24, "learning_rate": 0.00019062550366102083, "loss": 1.5572, "step": 15735 }, { "epoch": 1.24, "learning_rate": 0.00019061360574752613, "loss": 1.5257, "step": 15736 }, { "epoch": 1.24, "learning_rate": 0.00019060170755828745, "loss": 1.5525, "step": 15737 }, { "epoch": 1.24, "learning_rate": 0.00019058980909338557, "loss": 1.5779, "step": 15738 }, { "epoch": 1.24, "learning_rate": 0.0001905779103529013, "loss": 1.5692, "step": 15739 }, { "epoch": 1.24, "learning_rate": 0.00019056601133691543, "loss": 1.5157, "step": 15740 }, { "epoch": 1.24, "learning_rate": 0.00019055411204550867, "loss": 1.5506, "step": 15741 }, { "epoch": 1.24, "learning_rate": 0.00019054221247876194, "loss": 1.4872, "step": 15742 }, { "epoch": 1.24, "learning_rate": 0.00019053031263675593, "loss": 1.5634, "step": 15743 }, { "epoch": 1.24, "learning_rate": 0.00019051841251957146, "loss": 1.5241, "step": 15744 }, { "epoch": 1.24, "learning_rate": 0.00019050651212728934, "loss": 1.5515, "step": 15745 }, { "epoch": 1.24, "learning_rate": 0.00019049461145999034, "loss": 1.5341, "step": 15746 }, { "epoch": 1.24, "learning_rate": 0.0001904827105177553, "loss": 1.5458, "step": 15747 }, { "epoch": 1.24, "learning_rate": 0.00019047080930066493, "loss": 1.5631, "step": 15748 }, { "epoch": 1.24, "learning_rate": 0.00019045890780880018, "loss": 1.5403, "step": 15749 }, { "epoch": 1.24, "learning_rate": 0.00019044700604224174, "loss": 1.5799, "step": 15750 }, { "epoch": 1.24, "learning_rate": 0.00019043510400107048, "loss": 1.568, "step": 15751 }, { "epoch": 1.24, "learning_rate": 0.00019042320168536709, "loss": 1.5096, "step": 15752 }, { "epoch": 1.24, "learning_rate": 0.00019041129909521258, "loss": 1.5115, "step": 15753 }, { "epoch": 1.24, "learning_rate": 0.0001903993962306876, "loss": 1.5873, "step": 15754 }, { "epoch": 1.24, "learning_rate": 0.00019038749309187298, "loss": 1.5625, "step": 15755 }, { "epoch": 1.24, "learning_rate": 0.00019037558967884962, "loss": 1.5459, "step": 15756 }, { "epoch": 1.24, "learning_rate": 0.00019036368599169827, "loss": 1.5563, "step": 15757 }, { "epoch": 1.24, "learning_rate": 0.00019035178203049975, "loss": 1.5733, "step": 15758 }, { "epoch": 1.24, "learning_rate": 0.0001903398777953349, "loss": 1.5341, "step": 15759 }, { "epoch": 1.24, "learning_rate": 0.00019032797328628453, "loss": 1.5545, "step": 15760 }, { "epoch": 1.24, "learning_rate": 0.00019031606850342952, "loss": 1.5542, "step": 15761 }, { "epoch": 1.24, "learning_rate": 0.00019030416344685062, "loss": 1.5284, "step": 15762 }, { "epoch": 1.24, "learning_rate": 0.00019029225811662874, "loss": 1.5279, "step": 15763 }, { "epoch": 1.24, "learning_rate": 0.0001902803525128446, "loss": 1.5346, "step": 15764 }, { "epoch": 1.24, "learning_rate": 0.0001902684466355791, "loss": 1.5057, "step": 15765 }, { "epoch": 1.24, "learning_rate": 0.00019025654048491312, "loss": 1.5061, "step": 15766 }, { "epoch": 1.24, "learning_rate": 0.0001902446340609274, "loss": 1.5703, "step": 15767 }, { "epoch": 1.24, "learning_rate": 0.00019023272736370283, "loss": 1.5178, "step": 15768 }, { "epoch": 1.24, "learning_rate": 0.00019022082039332026, "loss": 1.5885, "step": 15769 }, { "epoch": 1.24, "learning_rate": 0.0001902089131498605, "loss": 1.5536, "step": 15770 }, { "epoch": 1.24, "learning_rate": 0.0001901970056334044, "loss": 1.5338, "step": 15771 }, { "epoch": 1.24, "learning_rate": 0.00019018509784403287, "loss": 1.5013, "step": 15772 }, { "epoch": 1.24, "learning_rate": 0.00019017318978182667, "loss": 1.4668, "step": 15773 }, { "epoch": 1.24, "learning_rate": 0.00019016128144686665, "loss": 1.5578, "step": 15774 }, { "epoch": 1.24, "learning_rate": 0.00019014937283923371, "loss": 1.4846, "step": 15775 }, { "epoch": 1.24, "learning_rate": 0.0001901374639590087, "loss": 1.561, "step": 15776 }, { "epoch": 1.24, "learning_rate": 0.00019012555480627243, "loss": 1.4877, "step": 15777 }, { "epoch": 1.24, "learning_rate": 0.00019011364538110582, "loss": 1.5195, "step": 15778 }, { "epoch": 1.24, "learning_rate": 0.00019010173568358968, "loss": 1.5048, "step": 15779 }, { "epoch": 1.24, "learning_rate": 0.0001900898257138049, "loss": 1.5207, "step": 15780 }, { "epoch": 1.24, "learning_rate": 0.0001900779154718323, "loss": 1.4877, "step": 15781 }, { "epoch": 1.24, "learning_rate": 0.0001900660049577528, "loss": 1.5001, "step": 15782 }, { "epoch": 1.24, "learning_rate": 0.00019005409417164717, "loss": 1.5126, "step": 15783 }, { "epoch": 1.24, "learning_rate": 0.0001900421831135964, "loss": 1.5801, "step": 15784 }, { "epoch": 1.24, "learning_rate": 0.00019003027178368133, "loss": 1.5464, "step": 15785 }, { "epoch": 1.24, "learning_rate": 0.00019001836018198273, "loss": 1.5249, "step": 15786 }, { "epoch": 1.24, "learning_rate": 0.0001900064483085816, "loss": 1.5266, "step": 15787 }, { "epoch": 1.24, "learning_rate": 0.00018999453616355875, "loss": 1.576, "step": 15788 }, { "epoch": 1.24, "learning_rate": 0.00018998262374699508, "loss": 1.5322, "step": 15789 }, { "epoch": 1.24, "learning_rate": 0.00018997071105897147, "loss": 1.5467, "step": 15790 }, { "epoch": 1.24, "learning_rate": 0.00018995879809956872, "loss": 1.5526, "step": 15791 }, { "epoch": 1.24, "learning_rate": 0.00018994688486886788, "loss": 1.5294, "step": 15792 }, { "epoch": 1.24, "learning_rate": 0.00018993497136694969, "loss": 1.4968, "step": 15793 }, { "epoch": 1.24, "learning_rate": 0.00018992305759389506, "loss": 1.5448, "step": 15794 }, { "epoch": 1.24, "learning_rate": 0.00018991114354978495, "loss": 1.563, "step": 15795 }, { "epoch": 1.24, "learning_rate": 0.00018989922923470017, "loss": 1.4871, "step": 15796 }, { "epoch": 1.24, "learning_rate": 0.00018988731464872165, "loss": 1.535, "step": 15797 }, { "epoch": 1.24, "learning_rate": 0.00018987539979193024, "loss": 1.5231, "step": 15798 }, { "epoch": 1.24, "learning_rate": 0.00018986348466440688, "loss": 1.5591, "step": 15799 }, { "epoch": 1.24, "learning_rate": 0.0001898515692662325, "loss": 1.521, "step": 15800 }, { "epoch": 1.24, "learning_rate": 0.00018983965359748792, "loss": 1.5099, "step": 15801 }, { "epoch": 1.24, "learning_rate": 0.0001898277376582541, "loss": 1.5732, "step": 15802 }, { "epoch": 1.24, "learning_rate": 0.00018981582144861193, "loss": 1.5631, "step": 15803 }, { "epoch": 1.24, "learning_rate": 0.00018980390496864229, "loss": 1.543, "step": 15804 }, { "epoch": 1.24, "learning_rate": 0.0001897919882184261, "loss": 1.6359, "step": 15805 }, { "epoch": 1.24, "learning_rate": 0.00018978007119804425, "loss": 1.5357, "step": 15806 }, { "epoch": 1.24, "learning_rate": 0.0001897681539075777, "loss": 1.4954, "step": 15807 }, { "epoch": 1.24, "learning_rate": 0.0001897562363471073, "loss": 1.5612, "step": 15808 }, { "epoch": 1.24, "learning_rate": 0.00018974431851671403, "loss": 1.5287, "step": 15809 }, { "epoch": 1.24, "learning_rate": 0.00018973240041647872, "loss": 1.532, "step": 15810 }, { "epoch": 1.24, "learning_rate": 0.0001897204820464824, "loss": 1.5264, "step": 15811 }, { "epoch": 1.24, "learning_rate": 0.0001897085634068059, "loss": 1.5696, "step": 15812 }, { "epoch": 1.24, "learning_rate": 0.00018969664449753015, "loss": 1.5657, "step": 15813 }, { "epoch": 1.24, "learning_rate": 0.0001896847253187361, "loss": 1.5496, "step": 15814 }, { "epoch": 1.24, "learning_rate": 0.00018967280587050466, "loss": 1.575, "step": 15815 }, { "epoch": 1.24, "learning_rate": 0.00018966088615291675, "loss": 1.5412, "step": 15816 }, { "epoch": 1.24, "learning_rate": 0.00018964896616605336, "loss": 1.5547, "step": 15817 }, { "epoch": 1.24, "learning_rate": 0.00018963704590999533, "loss": 1.5609, "step": 15818 }, { "epoch": 1.24, "learning_rate": 0.00018962512538482363, "loss": 1.5378, "step": 15819 }, { "epoch": 1.24, "learning_rate": 0.00018961320459061923, "loss": 1.4814, "step": 15820 }, { "epoch": 1.24, "learning_rate": 0.000189601283527463, "loss": 1.5026, "step": 15821 }, { "epoch": 1.24, "learning_rate": 0.00018958936219543593, "loss": 1.459, "step": 15822 }, { "epoch": 1.24, "learning_rate": 0.00018957744059461889, "loss": 1.5945, "step": 15823 }, { "epoch": 1.25, "learning_rate": 0.00018956551872509293, "loss": 1.518, "step": 15824 }, { "epoch": 1.25, "learning_rate": 0.0001895535965869389, "loss": 1.4968, "step": 15825 }, { "epoch": 1.25, "learning_rate": 0.00018954167418023773, "loss": 1.509, "step": 15826 }, { "epoch": 1.25, "learning_rate": 0.00018952975150507052, "loss": 1.5373, "step": 15827 }, { "epoch": 1.25, "learning_rate": 0.00018951782856151803, "loss": 1.5718, "step": 15828 }, { "epoch": 1.25, "learning_rate": 0.00018950590534966134, "loss": 1.5304, "step": 15829 }, { "epoch": 1.25, "learning_rate": 0.0001894939818695813, "loss": 1.5283, "step": 15830 }, { "epoch": 1.25, "learning_rate": 0.00018948205812135898, "loss": 1.5605, "step": 15831 }, { "epoch": 1.25, "learning_rate": 0.0001894701341050752, "loss": 1.5406, "step": 15832 }, { "epoch": 1.25, "learning_rate": 0.00018945820982081105, "loss": 1.5533, "step": 15833 }, { "epoch": 1.25, "learning_rate": 0.00018944628526864745, "loss": 1.5817, "step": 15834 }, { "epoch": 1.25, "learning_rate": 0.0001894343604486653, "loss": 1.5319, "step": 15835 }, { "epoch": 1.25, "learning_rate": 0.0001894224353609456, "loss": 1.5298, "step": 15836 }, { "epoch": 1.25, "learning_rate": 0.00018941051000556932, "loss": 1.491, "step": 15837 }, { "epoch": 1.25, "learning_rate": 0.00018939858438261743, "loss": 1.6156, "step": 15838 }, { "epoch": 1.25, "learning_rate": 0.00018938665849217089, "loss": 1.602, "step": 15839 }, { "epoch": 1.25, "learning_rate": 0.00018937473233431067, "loss": 1.5206, "step": 15840 }, { "epoch": 1.25, "learning_rate": 0.00018936280590911775, "loss": 1.5651, "step": 15841 }, { "epoch": 1.25, "learning_rate": 0.00018935087921667312, "loss": 1.5918, "step": 15842 }, { "epoch": 1.25, "learning_rate": 0.0001893389522570577, "loss": 1.5343, "step": 15843 }, { "epoch": 1.25, "learning_rate": 0.00018932702503035259, "loss": 1.4804, "step": 15844 }, { "epoch": 1.25, "learning_rate": 0.00018931509753663858, "loss": 1.6006, "step": 15845 }, { "epoch": 1.25, "learning_rate": 0.0001893031697759968, "loss": 1.5025, "step": 15846 }, { "epoch": 1.25, "learning_rate": 0.00018929124174850816, "loss": 1.5122, "step": 15847 }, { "epoch": 1.25, "learning_rate": 0.00018927931345425372, "loss": 1.5613, "step": 15848 }, { "epoch": 1.25, "learning_rate": 0.0001892673848933144, "loss": 1.4411, "step": 15849 }, { "epoch": 1.25, "learning_rate": 0.00018925545606577118, "loss": 1.567, "step": 15850 }, { "epoch": 1.25, "learning_rate": 0.0001892435269717051, "loss": 1.5886, "step": 15851 }, { "epoch": 1.25, "learning_rate": 0.00018923159761119712, "loss": 1.5452, "step": 15852 }, { "epoch": 1.25, "learning_rate": 0.00018921966798432824, "loss": 1.5224, "step": 15853 }, { "epoch": 1.25, "learning_rate": 0.00018920773809117942, "loss": 1.5968, "step": 15854 }, { "epoch": 1.25, "learning_rate": 0.00018919580793183173, "loss": 1.5424, "step": 15855 }, { "epoch": 1.25, "learning_rate": 0.00018918387750636615, "loss": 1.6028, "step": 15856 }, { "epoch": 1.25, "learning_rate": 0.00018917194681486365, "loss": 1.577, "step": 15857 }, { "epoch": 1.25, "learning_rate": 0.0001891600158574053, "loss": 1.5302, "step": 15858 }, { "epoch": 1.25, "learning_rate": 0.00018914808463407198, "loss": 1.5487, "step": 15859 }, { "epoch": 1.25, "learning_rate": 0.00018913615314494476, "loss": 1.5217, "step": 15860 }, { "epoch": 1.25, "learning_rate": 0.00018912422139010475, "loss": 1.5959, "step": 15861 }, { "epoch": 1.25, "learning_rate": 0.00018911228936963274, "loss": 1.5415, "step": 15862 }, { "epoch": 1.25, "learning_rate": 0.00018910035708360996, "loss": 1.569, "step": 15863 }, { "epoch": 1.25, "learning_rate": 0.00018908842453211732, "loss": 1.5469, "step": 15864 }, { "epoch": 1.25, "learning_rate": 0.00018907649171523585, "loss": 1.5738, "step": 15865 }, { "epoch": 1.25, "learning_rate": 0.00018906455863304652, "loss": 1.5368, "step": 15866 }, { "epoch": 1.25, "learning_rate": 0.00018905262528563042, "loss": 1.5784, "step": 15867 }, { "epoch": 1.25, "learning_rate": 0.0001890406916730686, "loss": 1.5544, "step": 15868 }, { "epoch": 1.25, "learning_rate": 0.00018902875779544198, "loss": 1.5348, "step": 15869 }, { "epoch": 1.25, "learning_rate": 0.0001890168236528316, "loss": 1.5425, "step": 15870 }, { "epoch": 1.25, "learning_rate": 0.00018900488924531857, "loss": 1.5462, "step": 15871 }, { "epoch": 1.25, "learning_rate": 0.00018899295457298383, "loss": 1.4881, "step": 15872 }, { "epoch": 1.25, "learning_rate": 0.00018898101963590847, "loss": 1.5275, "step": 15873 }, { "epoch": 1.25, "learning_rate": 0.0001889690844341735, "loss": 1.541, "step": 15874 }, { "epoch": 1.25, "learning_rate": 0.00018895714896785995, "loss": 1.5289, "step": 15875 }, { "epoch": 1.25, "learning_rate": 0.00018894521323704886, "loss": 1.6397, "step": 15876 }, { "epoch": 1.25, "learning_rate": 0.00018893327724182126, "loss": 1.5883, "step": 15877 }, { "epoch": 1.25, "learning_rate": 0.00018892134098225815, "loss": 1.5596, "step": 15878 }, { "epoch": 1.25, "learning_rate": 0.00018890940445844066, "loss": 1.5165, "step": 15879 }, { "epoch": 1.25, "learning_rate": 0.00018889746767044977, "loss": 1.4925, "step": 15880 }, { "epoch": 1.25, "learning_rate": 0.00018888553061836657, "loss": 1.5415, "step": 15881 }, { "epoch": 1.25, "learning_rate": 0.00018887359330227202, "loss": 1.5788, "step": 15882 }, { "epoch": 1.25, "learning_rate": 0.00018886165572224727, "loss": 1.5161, "step": 15883 }, { "epoch": 1.25, "learning_rate": 0.0001888497178783733, "loss": 1.5636, "step": 15884 }, { "epoch": 1.25, "learning_rate": 0.0001888377797707312, "loss": 1.4557, "step": 15885 }, { "epoch": 1.25, "learning_rate": 0.000188825841399402, "loss": 1.5241, "step": 15886 }, { "epoch": 1.25, "learning_rate": 0.00018881390276446677, "loss": 1.4744, "step": 15887 }, { "epoch": 1.25, "learning_rate": 0.00018880196386600656, "loss": 1.5224, "step": 15888 }, { "epoch": 1.25, "learning_rate": 0.0001887900247041024, "loss": 1.5253, "step": 15889 }, { "epoch": 1.25, "learning_rate": 0.0001887780852788354, "loss": 1.5266, "step": 15890 }, { "epoch": 1.25, "learning_rate": 0.00018876614559028664, "loss": 1.5128, "step": 15891 }, { "epoch": 1.25, "learning_rate": 0.00018875420563853714, "loss": 1.5576, "step": 15892 }, { "epoch": 1.25, "learning_rate": 0.00018874226542366787, "loss": 1.6258, "step": 15893 }, { "epoch": 1.25, "learning_rate": 0.00018873032494576007, "loss": 1.6111, "step": 15894 }, { "epoch": 1.25, "learning_rate": 0.00018871838420489472, "loss": 1.5743, "step": 15895 }, { "epoch": 1.25, "learning_rate": 0.00018870644320115293, "loss": 1.5261, "step": 15896 }, { "epoch": 1.25, "learning_rate": 0.00018869450193461574, "loss": 1.5348, "step": 15897 }, { "epoch": 1.25, "learning_rate": 0.00018868256040536425, "loss": 1.5564, "step": 15898 }, { "epoch": 1.25, "learning_rate": 0.0001886706186134795, "loss": 1.5165, "step": 15899 }, { "epoch": 1.25, "learning_rate": 0.0001886586765590426, "loss": 1.5267, "step": 15900 }, { "epoch": 1.25, "learning_rate": 0.0001886467342421346, "loss": 1.5372, "step": 15901 }, { "epoch": 1.25, "learning_rate": 0.00018863479166283663, "loss": 1.563, "step": 15902 }, { "epoch": 1.25, "learning_rate": 0.00018862284882122972, "loss": 1.5201, "step": 15903 }, { "epoch": 1.25, "learning_rate": 0.00018861090571739502, "loss": 1.5588, "step": 15904 }, { "epoch": 1.25, "learning_rate": 0.00018859896235141354, "loss": 1.5442, "step": 15905 }, { "epoch": 1.25, "learning_rate": 0.0001885870187233664, "loss": 1.5021, "step": 15906 }, { "epoch": 1.25, "learning_rate": 0.00018857507483333472, "loss": 1.5268, "step": 15907 }, { "epoch": 1.25, "learning_rate": 0.00018856313068139956, "loss": 1.5341, "step": 15908 }, { "epoch": 1.25, "learning_rate": 0.000188551186267642, "loss": 1.5674, "step": 15909 }, { "epoch": 1.25, "learning_rate": 0.00018853924159214317, "loss": 1.5776, "step": 15910 }, { "epoch": 1.25, "learning_rate": 0.0001885272966549842, "loss": 1.6151, "step": 15911 }, { "epoch": 1.25, "learning_rate": 0.00018851535145624615, "loss": 1.5334, "step": 15912 }, { "epoch": 1.25, "learning_rate": 0.00018850340599601008, "loss": 1.5314, "step": 15913 }, { "epoch": 1.25, "learning_rate": 0.00018849146027435714, "loss": 1.5524, "step": 15914 }, { "epoch": 1.25, "learning_rate": 0.00018847951429136844, "loss": 1.5038, "step": 15915 }, { "epoch": 1.25, "learning_rate": 0.00018846756804712504, "loss": 1.5775, "step": 15916 }, { "epoch": 1.25, "learning_rate": 0.00018845562154170807, "loss": 1.5653, "step": 15917 }, { "epoch": 1.25, "learning_rate": 0.0001884436747751987, "loss": 1.5234, "step": 15918 }, { "epoch": 1.25, "learning_rate": 0.00018843172774767798, "loss": 1.5195, "step": 15919 }, { "epoch": 1.25, "learning_rate": 0.00018841978045922703, "loss": 1.5072, "step": 15920 }, { "epoch": 1.25, "learning_rate": 0.00018840783290992698, "loss": 1.5882, "step": 15921 }, { "epoch": 1.25, "learning_rate": 0.0001883958850998589, "loss": 1.5268, "step": 15922 }, { "epoch": 1.25, "learning_rate": 0.00018838393702910402, "loss": 1.5604, "step": 15923 }, { "epoch": 1.25, "learning_rate": 0.00018837198869774333, "loss": 1.5405, "step": 15924 }, { "epoch": 1.25, "learning_rate": 0.000188360040105858, "loss": 1.5308, "step": 15925 }, { "epoch": 1.25, "learning_rate": 0.00018834809125352925, "loss": 1.5461, "step": 15926 }, { "epoch": 1.25, "learning_rate": 0.00018833614214083802, "loss": 1.5669, "step": 15927 }, { "epoch": 1.25, "learning_rate": 0.0001883241927678656, "loss": 1.5485, "step": 15928 }, { "epoch": 1.25, "learning_rate": 0.0001883122431346931, "loss": 1.5032, "step": 15929 }, { "epoch": 1.25, "learning_rate": 0.00018830029324140153, "loss": 1.5449, "step": 15930 }, { "epoch": 1.25, "learning_rate": 0.00018828834308807216, "loss": 1.5472, "step": 15931 }, { "epoch": 1.25, "learning_rate": 0.00018827639267478605, "loss": 1.5531, "step": 15932 }, { "epoch": 1.25, "learning_rate": 0.00018826444200162437, "loss": 1.6052, "step": 15933 }, { "epoch": 1.25, "learning_rate": 0.00018825249106866818, "loss": 1.5357, "step": 15934 }, { "epoch": 1.25, "learning_rate": 0.00018824053987599875, "loss": 1.5898, "step": 15935 }, { "epoch": 1.25, "learning_rate": 0.00018822858842369717, "loss": 1.6027, "step": 15936 }, { "epoch": 1.25, "learning_rate": 0.00018821663671184452, "loss": 1.552, "step": 15937 }, { "epoch": 1.25, "learning_rate": 0.00018820468474052202, "loss": 1.5263, "step": 15938 }, { "epoch": 1.25, "learning_rate": 0.0001881927325098108, "loss": 1.5576, "step": 15939 }, { "epoch": 1.25, "learning_rate": 0.00018818078001979195, "loss": 1.5184, "step": 15940 }, { "epoch": 1.25, "learning_rate": 0.00018816882727054678, "loss": 1.5782, "step": 15941 }, { "epoch": 1.25, "learning_rate": 0.00018815687426215622, "loss": 1.5074, "step": 15942 }, { "epoch": 1.25, "learning_rate": 0.00018814492099470165, "loss": 1.5377, "step": 15943 }, { "epoch": 1.25, "learning_rate": 0.00018813296746826404, "loss": 1.5935, "step": 15944 }, { "epoch": 1.25, "learning_rate": 0.00018812101368292464, "loss": 1.5405, "step": 15945 }, { "epoch": 1.25, "learning_rate": 0.00018810905963876463, "loss": 1.4968, "step": 15946 }, { "epoch": 1.25, "learning_rate": 0.00018809710533586508, "loss": 1.5554, "step": 15947 }, { "epoch": 1.25, "learning_rate": 0.00018808515077430726, "loss": 1.5266, "step": 15948 }, { "epoch": 1.25, "learning_rate": 0.00018807319595417224, "loss": 1.5415, "step": 15949 }, { "epoch": 1.25, "learning_rate": 0.00018806124087554125, "loss": 1.5325, "step": 15950 }, { "epoch": 1.26, "learning_rate": 0.00018804928553849544, "loss": 1.5814, "step": 15951 }, { "epoch": 1.26, "learning_rate": 0.00018803732994311596, "loss": 1.5257, "step": 15952 }, { "epoch": 1.26, "learning_rate": 0.00018802537408948406, "loss": 1.5159, "step": 15953 }, { "epoch": 1.26, "learning_rate": 0.0001880134179776808, "loss": 1.5492, "step": 15954 }, { "epoch": 1.26, "learning_rate": 0.0001880014616077874, "loss": 1.5443, "step": 15955 }, { "epoch": 1.26, "learning_rate": 0.00018798950497988503, "loss": 1.536, "step": 15956 }, { "epoch": 1.26, "learning_rate": 0.00018797754809405493, "loss": 1.5713, "step": 15957 }, { "epoch": 1.26, "learning_rate": 0.00018796559095037827, "loss": 1.5305, "step": 15958 }, { "epoch": 1.26, "learning_rate": 0.00018795363354893614, "loss": 1.5269, "step": 15959 }, { "epoch": 1.26, "learning_rate": 0.0001879416758898098, "loss": 1.5304, "step": 15960 }, { "epoch": 1.26, "learning_rate": 0.0001879297179730804, "loss": 1.5577, "step": 15961 }, { "epoch": 1.26, "learning_rate": 0.00018791775979882917, "loss": 1.5741, "step": 15962 }, { "epoch": 1.26, "learning_rate": 0.0001879058013671373, "loss": 1.4847, "step": 15963 }, { "epoch": 1.26, "learning_rate": 0.00018789384267808588, "loss": 1.5443, "step": 15964 }, { "epoch": 1.26, "learning_rate": 0.00018788188373175624, "loss": 1.4956, "step": 15965 }, { "epoch": 1.26, "learning_rate": 0.0001878699245282295, "loss": 1.4862, "step": 15966 }, { "epoch": 1.26, "learning_rate": 0.00018785796506758687, "loss": 1.5355, "step": 15967 }, { "epoch": 1.26, "learning_rate": 0.00018784600534990957, "loss": 1.5959, "step": 15968 }, { "epoch": 1.26, "learning_rate": 0.00018783404537527873, "loss": 1.541, "step": 15969 }, { "epoch": 1.26, "learning_rate": 0.00018782208514377566, "loss": 1.4895, "step": 15970 }, { "epoch": 1.26, "learning_rate": 0.0001878101246554815, "loss": 1.5319, "step": 15971 }, { "epoch": 1.26, "learning_rate": 0.0001877981639104774, "loss": 1.5269, "step": 15972 }, { "epoch": 1.26, "learning_rate": 0.00018778620290884465, "loss": 1.4808, "step": 15973 }, { "epoch": 1.26, "learning_rate": 0.0001877742416506644, "loss": 1.4698, "step": 15974 }, { "epoch": 1.26, "learning_rate": 0.000187762280136018, "loss": 1.5444, "step": 15975 }, { "epoch": 1.26, "learning_rate": 0.00018775031836498646, "loss": 1.5619, "step": 15976 }, { "epoch": 1.26, "learning_rate": 0.00018773835633765116, "loss": 1.5346, "step": 15977 }, { "epoch": 1.26, "learning_rate": 0.0001877263940540932, "loss": 1.5251, "step": 15978 }, { "epoch": 1.26, "learning_rate": 0.00018771443151439384, "loss": 1.5425, "step": 15979 }, { "epoch": 1.26, "learning_rate": 0.0001877024687186343, "loss": 1.4757, "step": 15980 }, { "epoch": 1.26, "learning_rate": 0.00018769050566689582, "loss": 1.5543, "step": 15981 }, { "epoch": 1.26, "learning_rate": 0.00018767854235925962, "loss": 1.5386, "step": 15982 }, { "epoch": 1.26, "learning_rate": 0.0001876665787958069, "loss": 1.5693, "step": 15983 }, { "epoch": 1.26, "learning_rate": 0.00018765461497661888, "loss": 1.5434, "step": 15984 }, { "epoch": 1.26, "learning_rate": 0.00018764265090177686, "loss": 1.4914, "step": 15985 }, { "epoch": 1.26, "learning_rate": 0.00018763068657136193, "loss": 1.5551, "step": 15986 }, { "epoch": 1.26, "learning_rate": 0.0001876187219854555, "loss": 1.5183, "step": 15987 }, { "epoch": 1.26, "learning_rate": 0.0001876067571441386, "loss": 1.6135, "step": 15988 }, { "epoch": 1.26, "learning_rate": 0.00018759479204749264, "loss": 1.4975, "step": 15989 }, { "epoch": 1.26, "learning_rate": 0.00018758282669559877, "loss": 1.5336, "step": 15990 }, { "epoch": 1.26, "learning_rate": 0.00018757086108853822, "loss": 1.517, "step": 15991 }, { "epoch": 1.26, "learning_rate": 0.0001875588952263923, "loss": 1.567, "step": 15992 }, { "epoch": 1.26, "learning_rate": 0.0001875469291092422, "loss": 1.6004, "step": 15993 }, { "epoch": 1.26, "learning_rate": 0.00018753496273716917, "loss": 1.4991, "step": 15994 }, { "epoch": 1.26, "learning_rate": 0.00018752299611025442, "loss": 1.5488, "step": 15995 }, { "epoch": 1.26, "learning_rate": 0.0001875110292285793, "loss": 1.5294, "step": 15996 }, { "epoch": 1.26, "learning_rate": 0.00018749906209222493, "loss": 1.5572, "step": 15997 }, { "epoch": 1.26, "learning_rate": 0.00018748709470127266, "loss": 1.5409, "step": 15998 }, { "epoch": 1.26, "learning_rate": 0.0001874751270558037, "loss": 1.5799, "step": 15999 }, { "epoch": 1.26, "learning_rate": 0.0001874631591558993, "loss": 1.4787, "step": 16000 }, { "epoch": 1.26, "learning_rate": 0.0001874511910016407, "loss": 1.5003, "step": 16001 }, { "epoch": 1.26, "learning_rate": 0.00018743922259310922, "loss": 1.4867, "step": 16002 }, { "epoch": 1.26, "learning_rate": 0.00018742725393038607, "loss": 1.5557, "step": 16003 }, { "epoch": 1.26, "learning_rate": 0.00018741528501355252, "loss": 1.5168, "step": 16004 }, { "epoch": 1.26, "learning_rate": 0.0001874033158426898, "loss": 1.5286, "step": 16005 }, { "epoch": 1.26, "learning_rate": 0.00018739134641787924, "loss": 1.5096, "step": 16006 }, { "epoch": 1.26, "learning_rate": 0.0001873793767392021, "loss": 1.5714, "step": 16007 }, { "epoch": 1.26, "learning_rate": 0.00018736740680673955, "loss": 1.5272, "step": 16008 }, { "epoch": 1.26, "learning_rate": 0.000187355436620573, "loss": 1.5544, "step": 16009 }, { "epoch": 1.26, "learning_rate": 0.0001873434661807836, "loss": 1.5909, "step": 16010 }, { "epoch": 1.26, "learning_rate": 0.0001873314954874527, "loss": 1.5793, "step": 16011 }, { "epoch": 1.26, "learning_rate": 0.0001873195245406615, "loss": 1.5961, "step": 16012 }, { "epoch": 1.26, "learning_rate": 0.00018730755334049135, "loss": 1.4928, "step": 16013 }, { "epoch": 1.26, "learning_rate": 0.0001872955818870235, "loss": 1.5728, "step": 16014 }, { "epoch": 1.26, "learning_rate": 0.00018728361018033923, "loss": 1.5679, "step": 16015 }, { "epoch": 1.26, "learning_rate": 0.00018727163822051984, "loss": 1.5537, "step": 16016 }, { "epoch": 1.26, "learning_rate": 0.00018725966600764658, "loss": 1.5618, "step": 16017 }, { "epoch": 1.26, "learning_rate": 0.00018724769354180074, "loss": 1.5435, "step": 16018 }, { "epoch": 1.26, "learning_rate": 0.00018723572082306362, "loss": 1.4966, "step": 16019 }, { "epoch": 1.26, "learning_rate": 0.0001872237478515165, "loss": 1.5627, "step": 16020 }, { "epoch": 1.26, "learning_rate": 0.0001872117746272407, "loss": 1.5154, "step": 16021 }, { "epoch": 1.26, "learning_rate": 0.0001871998011503175, "loss": 1.5456, "step": 16022 }, { "epoch": 1.26, "learning_rate": 0.00018718782742082812, "loss": 1.5797, "step": 16023 }, { "epoch": 1.26, "learning_rate": 0.00018717585343885397, "loss": 1.5726, "step": 16024 }, { "epoch": 1.26, "learning_rate": 0.00018716387920447627, "loss": 1.4868, "step": 16025 }, { "epoch": 1.26, "learning_rate": 0.00018715190471777632, "loss": 1.5797, "step": 16026 }, { "epoch": 1.26, "learning_rate": 0.00018713992997883543, "loss": 1.5633, "step": 16027 }, { "epoch": 1.26, "learning_rate": 0.00018712795498773495, "loss": 1.561, "step": 16028 }, { "epoch": 1.26, "learning_rate": 0.00018711597974455611, "loss": 1.5315, "step": 16029 }, { "epoch": 1.26, "learning_rate": 0.00018710400424938026, "loss": 1.5496, "step": 16030 }, { "epoch": 1.26, "learning_rate": 0.00018709202850228875, "loss": 1.5872, "step": 16031 }, { "epoch": 1.26, "learning_rate": 0.00018708005250336275, "loss": 1.5392, "step": 16032 }, { "epoch": 1.26, "learning_rate": 0.00018706807625268372, "loss": 1.5468, "step": 16033 }, { "epoch": 1.26, "learning_rate": 0.00018705609975033286, "loss": 1.5304, "step": 16034 }, { "epoch": 1.26, "learning_rate": 0.00018704412299639153, "loss": 1.5104, "step": 16035 }, { "epoch": 1.26, "learning_rate": 0.0001870321459909411, "loss": 1.4969, "step": 16036 }, { "epoch": 1.26, "learning_rate": 0.00018702016873406278, "loss": 1.5404, "step": 16037 }, { "epoch": 1.26, "learning_rate": 0.00018700819122583802, "loss": 1.6017, "step": 16038 }, { "epoch": 1.26, "learning_rate": 0.00018699621346634802, "loss": 1.5327, "step": 16039 }, { "epoch": 1.26, "learning_rate": 0.00018698423545567412, "loss": 1.5352, "step": 16040 }, { "epoch": 1.26, "learning_rate": 0.0001869722571938977, "loss": 1.5137, "step": 16041 }, { "epoch": 1.26, "learning_rate": 0.00018696027868110005, "loss": 1.5624, "step": 16042 }, { "epoch": 1.26, "learning_rate": 0.0001869482999173625, "loss": 1.5032, "step": 16043 }, { "epoch": 1.26, "learning_rate": 0.00018693632090276637, "loss": 1.5137, "step": 16044 }, { "epoch": 1.26, "learning_rate": 0.00018692434163739306, "loss": 1.5151, "step": 16045 }, { "epoch": 1.26, "learning_rate": 0.0001869123621213238, "loss": 1.5524, "step": 16046 }, { "epoch": 1.26, "learning_rate": 0.00018690038235463996, "loss": 1.558, "step": 16047 }, { "epoch": 1.26, "learning_rate": 0.00018688840233742292, "loss": 1.5553, "step": 16048 }, { "epoch": 1.26, "learning_rate": 0.00018687642206975398, "loss": 1.5292, "step": 16049 }, { "epoch": 1.26, "learning_rate": 0.00018686444155171443, "loss": 1.539, "step": 16050 }, { "epoch": 1.26, "learning_rate": 0.00018685246078338572, "loss": 1.5558, "step": 16051 }, { "epoch": 1.26, "learning_rate": 0.0001868404797648491, "loss": 1.5187, "step": 16052 }, { "epoch": 1.26, "learning_rate": 0.00018682849849618603, "loss": 1.4791, "step": 16053 }, { "epoch": 1.26, "learning_rate": 0.00018681651697747772, "loss": 1.5564, "step": 16054 }, { "epoch": 1.26, "learning_rate": 0.0001868045352088056, "loss": 1.5378, "step": 16055 }, { "epoch": 1.26, "learning_rate": 0.00018679255319025098, "loss": 1.5616, "step": 16056 }, { "epoch": 1.26, "learning_rate": 0.00018678057092189523, "loss": 1.5334, "step": 16057 }, { "epoch": 1.26, "learning_rate": 0.0001867685884038197, "loss": 1.5234, "step": 16058 }, { "epoch": 1.26, "learning_rate": 0.00018675660563610575, "loss": 1.5612, "step": 16059 }, { "epoch": 1.26, "learning_rate": 0.00018674462261883472, "loss": 1.5281, "step": 16060 }, { "epoch": 1.26, "learning_rate": 0.00018673263935208798, "loss": 1.5321, "step": 16061 }, { "epoch": 1.26, "learning_rate": 0.00018672065583594688, "loss": 1.517, "step": 16062 }, { "epoch": 1.26, "learning_rate": 0.00018670867207049285, "loss": 1.5185, "step": 16063 }, { "epoch": 1.26, "learning_rate": 0.00018669668805580713, "loss": 1.6226, "step": 16064 }, { "epoch": 1.26, "learning_rate": 0.0001866847037919712, "loss": 1.5189, "step": 16065 }, { "epoch": 1.26, "learning_rate": 0.00018667271927906633, "loss": 1.5444, "step": 16066 }, { "epoch": 1.26, "learning_rate": 0.00018666073451717395, "loss": 1.561, "step": 16067 }, { "epoch": 1.26, "learning_rate": 0.00018664874950637543, "loss": 1.4931, "step": 16068 }, { "epoch": 1.26, "learning_rate": 0.00018663676424675207, "loss": 1.5598, "step": 16069 }, { "epoch": 1.26, "learning_rate": 0.0001866247787383854, "loss": 1.5138, "step": 16070 }, { "epoch": 1.26, "learning_rate": 0.0001866127929813566, "loss": 1.5917, "step": 16071 }, { "epoch": 1.26, "learning_rate": 0.00018660080697574722, "loss": 1.5625, "step": 16072 }, { "epoch": 1.26, "learning_rate": 0.0001865888207216385, "loss": 1.565, "step": 16073 }, { "epoch": 1.26, "learning_rate": 0.00018657683421911185, "loss": 1.5991, "step": 16074 }, { "epoch": 1.26, "learning_rate": 0.00018656484746824872, "loss": 1.552, "step": 16075 }, { "epoch": 1.26, "learning_rate": 0.00018655286046913045, "loss": 1.5415, "step": 16076 }, { "epoch": 1.26, "learning_rate": 0.00018654087322183847, "loss": 1.4865, "step": 16077 }, { "epoch": 1.27, "learning_rate": 0.00018652888572645405, "loss": 1.541, "step": 16078 }, { "epoch": 1.27, "learning_rate": 0.00018651689798305872, "loss": 1.483, "step": 16079 }, { "epoch": 1.27, "learning_rate": 0.00018650490999173378, "loss": 1.5677, "step": 16080 }, { "epoch": 1.27, "learning_rate": 0.00018649292175256066, "loss": 1.5612, "step": 16081 }, { "epoch": 1.27, "learning_rate": 0.00018648093326562067, "loss": 1.5357, "step": 16082 }, { "epoch": 1.27, "learning_rate": 0.00018646894453099535, "loss": 1.5028, "step": 16083 }, { "epoch": 1.27, "learning_rate": 0.00018645695554876603, "loss": 1.5369, "step": 16084 }, { "epoch": 1.27, "learning_rate": 0.00018644496631901403, "loss": 1.5109, "step": 16085 }, { "epoch": 1.27, "learning_rate": 0.00018643297684182089, "loss": 1.5716, "step": 16086 }, { "epoch": 1.27, "learning_rate": 0.00018642098711726794, "loss": 1.5661, "step": 16087 }, { "epoch": 1.27, "learning_rate": 0.0001864089971454365, "loss": 1.5542, "step": 16088 }, { "epoch": 1.27, "learning_rate": 0.00018639700692640816, "loss": 1.5849, "step": 16089 }, { "epoch": 1.27, "learning_rate": 0.00018638501646026415, "loss": 1.5293, "step": 16090 }, { "epoch": 1.27, "learning_rate": 0.00018637302574708598, "loss": 1.4936, "step": 16091 }, { "epoch": 1.27, "learning_rate": 0.0001863610347869551, "loss": 1.5526, "step": 16092 }, { "epoch": 1.27, "learning_rate": 0.0001863490435799528, "loss": 1.496, "step": 16093 }, { "epoch": 1.27, "learning_rate": 0.0001863370521261606, "loss": 1.5401, "step": 16094 }, { "epoch": 1.27, "learning_rate": 0.00018632506042565983, "loss": 1.5782, "step": 16095 }, { "epoch": 1.27, "learning_rate": 0.00018631306847853194, "loss": 1.5531, "step": 16096 }, { "epoch": 1.27, "learning_rate": 0.00018630107628485838, "loss": 1.5362, "step": 16097 }, { "epoch": 1.27, "learning_rate": 0.00018628908384472052, "loss": 1.536, "step": 16098 }, { "epoch": 1.27, "learning_rate": 0.00018627709115819982, "loss": 1.5392, "step": 16099 }, { "epoch": 1.27, "learning_rate": 0.0001862650982253777, "loss": 1.5728, "step": 16100 }, { "epoch": 1.27, "learning_rate": 0.00018625310504633558, "loss": 1.5661, "step": 16101 }, { "epoch": 1.27, "learning_rate": 0.00018624111162115486, "loss": 1.5453, "step": 16102 }, { "epoch": 1.27, "learning_rate": 0.00018622911794991697, "loss": 1.609, "step": 16103 }, { "epoch": 1.27, "learning_rate": 0.0001862171240327034, "loss": 1.5424, "step": 16104 }, { "epoch": 1.27, "learning_rate": 0.00018620512986959552, "loss": 1.5235, "step": 16105 }, { "epoch": 1.27, "learning_rate": 0.00018619313546067482, "loss": 1.5003, "step": 16106 }, { "epoch": 1.27, "learning_rate": 0.00018618114080602268, "loss": 1.5863, "step": 16107 }, { "epoch": 1.27, "learning_rate": 0.00018616914590572056, "loss": 1.5202, "step": 16108 }, { "epoch": 1.27, "learning_rate": 0.00018615715075984992, "loss": 1.5319, "step": 16109 }, { "epoch": 1.27, "learning_rate": 0.00018614515536849213, "loss": 1.5064, "step": 16110 }, { "epoch": 1.27, "learning_rate": 0.00018613315973172877, "loss": 1.5264, "step": 16111 }, { "epoch": 1.27, "learning_rate": 0.00018612116384964113, "loss": 1.5662, "step": 16112 }, { "epoch": 1.27, "learning_rate": 0.0001861091677223107, "loss": 1.5342, "step": 16113 }, { "epoch": 1.27, "learning_rate": 0.000186097171349819, "loss": 1.5122, "step": 16114 }, { "epoch": 1.27, "learning_rate": 0.00018608517473224737, "loss": 1.5785, "step": 16115 }, { "epoch": 1.27, "learning_rate": 0.00018607317786967738, "loss": 1.52, "step": 16116 }, { "epoch": 1.27, "learning_rate": 0.0001860611807621904, "loss": 1.5243, "step": 16117 }, { "epoch": 1.27, "learning_rate": 0.00018604918340986787, "loss": 1.5548, "step": 16118 }, { "epoch": 1.27, "learning_rate": 0.00018603718581279135, "loss": 1.5259, "step": 16119 }, { "epoch": 1.27, "learning_rate": 0.00018602518797104214, "loss": 1.5481, "step": 16120 }, { "epoch": 1.27, "learning_rate": 0.00018601318988470183, "loss": 1.5218, "step": 16121 }, { "epoch": 1.27, "learning_rate": 0.0001860011915538518, "loss": 1.524, "step": 16122 }, { "epoch": 1.27, "learning_rate": 0.0001859891929785736, "loss": 1.6125, "step": 16123 }, { "epoch": 1.27, "learning_rate": 0.00018597719415894861, "loss": 1.5717, "step": 16124 }, { "epoch": 1.27, "learning_rate": 0.00018596519509505834, "loss": 1.5595, "step": 16125 }, { "epoch": 1.27, "learning_rate": 0.00018595319578698424, "loss": 1.545, "step": 16126 }, { "epoch": 1.27, "learning_rate": 0.00018594119623480777, "loss": 1.5036, "step": 16127 }, { "epoch": 1.27, "learning_rate": 0.00018592919643861043, "loss": 1.5419, "step": 16128 }, { "epoch": 1.27, "learning_rate": 0.00018591719639847362, "loss": 1.5032, "step": 16129 }, { "epoch": 1.27, "learning_rate": 0.00018590519611447892, "loss": 1.5154, "step": 16130 }, { "epoch": 1.27, "learning_rate": 0.00018589319558670774, "loss": 1.5756, "step": 16131 }, { "epoch": 1.27, "learning_rate": 0.00018588119481524154, "loss": 1.5617, "step": 16132 }, { "epoch": 1.27, "learning_rate": 0.00018586919380016186, "loss": 1.6139, "step": 16133 }, { "epoch": 1.27, "learning_rate": 0.0001858571925415502, "loss": 1.5108, "step": 16134 }, { "epoch": 1.27, "learning_rate": 0.0001858451910394879, "loss": 1.503, "step": 16135 }, { "epoch": 1.27, "learning_rate": 0.00018583318929405658, "loss": 1.5713, "step": 16136 }, { "epoch": 1.27, "learning_rate": 0.0001858211873053376, "loss": 1.5215, "step": 16137 }, { "epoch": 1.27, "learning_rate": 0.00018580918507341265, "loss": 1.4984, "step": 16138 }, { "epoch": 1.27, "learning_rate": 0.00018579718259836302, "loss": 1.5506, "step": 16139 }, { "epoch": 1.27, "learning_rate": 0.00018578517988027032, "loss": 1.556, "step": 16140 }, { "epoch": 1.27, "learning_rate": 0.00018577317691921598, "loss": 1.5268, "step": 16141 }, { "epoch": 1.27, "learning_rate": 0.00018576117371528147, "loss": 1.4886, "step": 16142 }, { "epoch": 1.27, "learning_rate": 0.00018574917026854837, "loss": 1.5295, "step": 16143 }, { "epoch": 1.27, "learning_rate": 0.00018573716657909812, "loss": 1.5579, "step": 16144 }, { "epoch": 1.27, "learning_rate": 0.0001857251626470122, "loss": 1.5711, "step": 16145 }, { "epoch": 1.27, "learning_rate": 0.00018571315847237216, "loss": 1.5487, "step": 16146 }, { "epoch": 1.27, "learning_rate": 0.00018570115405525946, "loss": 1.5532, "step": 16147 }, { "epoch": 1.27, "learning_rate": 0.0001856891493957557, "loss": 1.5378, "step": 16148 }, { "epoch": 1.27, "learning_rate": 0.00018567714449394223, "loss": 1.5337, "step": 16149 }, { "epoch": 1.27, "learning_rate": 0.00018566513934990074, "loss": 1.5262, "step": 16150 }, { "epoch": 1.27, "learning_rate": 0.00018565313396371253, "loss": 1.5598, "step": 16151 }, { "epoch": 1.27, "learning_rate": 0.00018564112833545926, "loss": 1.5849, "step": 16152 }, { "epoch": 1.27, "learning_rate": 0.00018562912246522238, "loss": 1.5005, "step": 16153 }, { "epoch": 1.27, "learning_rate": 0.0001856171163530834, "loss": 1.5619, "step": 16154 }, { "epoch": 1.27, "learning_rate": 0.00018560510999912394, "loss": 1.5534, "step": 16155 }, { "epoch": 1.27, "learning_rate": 0.00018559310340342537, "loss": 1.5313, "step": 16156 }, { "epoch": 1.27, "learning_rate": 0.00018558109656606928, "loss": 1.5594, "step": 16157 }, { "epoch": 1.27, "learning_rate": 0.00018556908948713717, "loss": 1.5581, "step": 16158 }, { "epoch": 1.27, "learning_rate": 0.00018555708216671057, "loss": 1.5564, "step": 16159 }, { "epoch": 1.27, "learning_rate": 0.00018554507460487101, "loss": 1.561, "step": 16160 }, { "epoch": 1.27, "learning_rate": 0.00018553306680169998, "loss": 1.5255, "step": 16161 }, { "epoch": 1.27, "learning_rate": 0.0001855210587572791, "loss": 1.5315, "step": 16162 }, { "epoch": 1.27, "learning_rate": 0.00018550905047168978, "loss": 1.5123, "step": 16163 }, { "epoch": 1.27, "learning_rate": 0.00018549704194501361, "loss": 1.5042, "step": 16164 }, { "epoch": 1.27, "learning_rate": 0.00018548503317733216, "loss": 1.601, "step": 16165 }, { "epoch": 1.27, "learning_rate": 0.00018547302416872688, "loss": 1.4985, "step": 16166 }, { "epoch": 1.27, "learning_rate": 0.00018546101491927937, "loss": 1.5718, "step": 16167 }, { "epoch": 1.27, "learning_rate": 0.00018544900542907106, "loss": 1.5578, "step": 16168 }, { "epoch": 1.27, "learning_rate": 0.00018543699569818363, "loss": 1.5932, "step": 16169 }, { "epoch": 1.27, "learning_rate": 0.00018542498572669854, "loss": 1.5504, "step": 16170 }, { "epoch": 1.27, "learning_rate": 0.00018541297551469735, "loss": 1.5074, "step": 16171 }, { "epoch": 1.27, "learning_rate": 0.0001854009650622616, "loss": 1.5613, "step": 16172 }, { "epoch": 1.27, "learning_rate": 0.0001853889543694728, "loss": 1.5938, "step": 16173 }, { "epoch": 1.27, "learning_rate": 0.00018537694343641258, "loss": 1.5873, "step": 16174 }, { "epoch": 1.27, "learning_rate": 0.00018536493226316246, "loss": 1.5475, "step": 16175 }, { "epoch": 1.27, "learning_rate": 0.00018535292084980384, "loss": 1.531, "step": 16176 }, { "epoch": 1.27, "learning_rate": 0.0001853409091964185, "loss": 1.5847, "step": 16177 }, { "epoch": 1.27, "learning_rate": 0.00018532889730308788, "loss": 1.5179, "step": 16178 }, { "epoch": 1.27, "learning_rate": 0.00018531688516989356, "loss": 1.5188, "step": 16179 }, { "epoch": 1.27, "learning_rate": 0.00018530487279691703, "loss": 1.5563, "step": 16180 }, { "epoch": 1.27, "learning_rate": 0.0001852928601842399, "loss": 1.5603, "step": 16181 }, { "epoch": 1.27, "learning_rate": 0.00018528084733194377, "loss": 1.5418, "step": 16182 }, { "epoch": 1.27, "learning_rate": 0.00018526883424011014, "loss": 1.5707, "step": 16183 }, { "epoch": 1.27, "learning_rate": 0.00018525682090882056, "loss": 1.5678, "step": 16184 }, { "epoch": 1.27, "learning_rate": 0.00018524480733815663, "loss": 1.5679, "step": 16185 }, { "epoch": 1.27, "learning_rate": 0.00018523279352819993, "loss": 1.5433, "step": 16186 }, { "epoch": 1.27, "learning_rate": 0.00018522077947903198, "loss": 1.5412, "step": 16187 }, { "epoch": 1.27, "learning_rate": 0.0001852087651907344, "loss": 1.4944, "step": 16188 }, { "epoch": 1.27, "learning_rate": 0.00018519675066338873, "loss": 1.5503, "step": 16189 }, { "epoch": 1.27, "learning_rate": 0.00018518473589707653, "loss": 1.5878, "step": 16190 }, { "epoch": 1.27, "learning_rate": 0.0001851727208918794, "loss": 1.5277, "step": 16191 }, { "epoch": 1.27, "learning_rate": 0.00018516070564787888, "loss": 1.5297, "step": 16192 }, { "epoch": 1.27, "learning_rate": 0.00018514869016515658, "loss": 1.4969, "step": 16193 }, { "epoch": 1.27, "learning_rate": 0.0001851366744437941, "loss": 1.5299, "step": 16194 }, { "epoch": 1.27, "learning_rate": 0.00018512465848387298, "loss": 1.5614, "step": 16195 }, { "epoch": 1.27, "learning_rate": 0.00018511264228547483, "loss": 1.5086, "step": 16196 }, { "epoch": 1.27, "learning_rate": 0.00018510062584868117, "loss": 1.5255, "step": 16197 }, { "epoch": 1.27, "learning_rate": 0.00018508860917357365, "loss": 1.5199, "step": 16198 }, { "epoch": 1.27, "learning_rate": 0.00018507659226023386, "loss": 1.5475, "step": 16199 }, { "epoch": 1.27, "learning_rate": 0.00018506457510874332, "loss": 1.5532, "step": 16200 }, { "epoch": 1.27, "learning_rate": 0.0001850525577191837, "loss": 1.5411, "step": 16201 }, { "epoch": 1.27, "learning_rate": 0.00018504054009163654, "loss": 1.5379, "step": 16202 }, { "epoch": 1.27, "learning_rate": 0.00018502852222618344, "loss": 1.6073, "step": 16203 }, { "epoch": 1.27, "learning_rate": 0.00018501650412290605, "loss": 1.5748, "step": 16204 }, { "epoch": 1.28, "learning_rate": 0.00018500448578188586, "loss": 1.5352, "step": 16205 }, { "epoch": 1.28, "learning_rate": 0.0001849924672032046, "loss": 1.5247, "step": 16206 }, { "epoch": 1.28, "learning_rate": 0.00018498044838694377, "loss": 1.51, "step": 16207 }, { "epoch": 1.28, "learning_rate": 0.00018496842933318495, "loss": 1.5267, "step": 16208 }, { "epoch": 1.28, "learning_rate": 0.00018495641004200982, "loss": 1.521, "step": 16209 }, { "epoch": 1.28, "learning_rate": 0.00018494439051349997, "loss": 1.5191, "step": 16210 }, { "epoch": 1.28, "learning_rate": 0.00018493237074773702, "loss": 1.5537, "step": 16211 }, { "epoch": 1.28, "learning_rate": 0.0001849203507448025, "loss": 1.5179, "step": 16212 }, { "epoch": 1.28, "learning_rate": 0.0001849083305047781, "loss": 1.5208, "step": 16213 }, { "epoch": 1.28, "learning_rate": 0.00018489631002774538, "loss": 1.4723, "step": 16214 }, { "epoch": 1.28, "learning_rate": 0.000184884289313786, "loss": 1.5339, "step": 16215 }, { "epoch": 1.28, "learning_rate": 0.00018487226836298148, "loss": 1.5938, "step": 16216 }, { "epoch": 1.28, "learning_rate": 0.00018486024717541353, "loss": 1.5272, "step": 16217 }, { "epoch": 1.28, "learning_rate": 0.0001848482257511638, "loss": 1.559, "step": 16218 }, { "epoch": 1.28, "learning_rate": 0.0001848362040903138, "loss": 1.5537, "step": 16219 }, { "epoch": 1.28, "learning_rate": 0.0001848241821929452, "loss": 1.5153, "step": 16220 }, { "epoch": 1.28, "learning_rate": 0.00018481216005913963, "loss": 1.6079, "step": 16221 }, { "epoch": 1.28, "learning_rate": 0.0001848001376889787, "loss": 1.5449, "step": 16222 }, { "epoch": 1.28, "learning_rate": 0.00018478811508254402, "loss": 1.5562, "step": 16223 }, { "epoch": 1.28, "learning_rate": 0.00018477609223991725, "loss": 1.5585, "step": 16224 }, { "epoch": 1.28, "learning_rate": 0.00018476406916118003, "loss": 1.5982, "step": 16225 }, { "epoch": 1.28, "learning_rate": 0.00018475204584641393, "loss": 1.5529, "step": 16226 }, { "epoch": 1.28, "learning_rate": 0.00018474002229570063, "loss": 1.5682, "step": 16227 }, { "epoch": 1.28, "learning_rate": 0.00018472799850912178, "loss": 1.5291, "step": 16228 }, { "epoch": 1.28, "learning_rate": 0.00018471597448675896, "loss": 1.5762, "step": 16229 }, { "epoch": 1.28, "learning_rate": 0.0001847039502286938, "loss": 1.4917, "step": 16230 }, { "epoch": 1.28, "learning_rate": 0.00018469192573500798, "loss": 1.5223, "step": 16231 }, { "epoch": 1.28, "learning_rate": 0.00018467990100578315, "loss": 1.4914, "step": 16232 }, { "epoch": 1.28, "learning_rate": 0.00018466787604110095, "loss": 1.5575, "step": 16233 }, { "epoch": 1.28, "learning_rate": 0.00018465585084104295, "loss": 1.5049, "step": 16234 }, { "epoch": 1.28, "learning_rate": 0.0001846438254056909, "loss": 1.5342, "step": 16235 }, { "epoch": 1.28, "learning_rate": 0.00018463179973512636, "loss": 1.5454, "step": 16236 }, { "epoch": 1.28, "learning_rate": 0.000184619773829431, "loss": 1.5202, "step": 16237 }, { "epoch": 1.28, "learning_rate": 0.0001846077476886865, "loss": 1.5499, "step": 16238 }, { "epoch": 1.28, "learning_rate": 0.00018459572131297448, "loss": 1.5045, "step": 16239 }, { "epoch": 1.28, "learning_rate": 0.00018458369470237662, "loss": 1.5654, "step": 16240 }, { "epoch": 1.28, "learning_rate": 0.00018457166785697458, "loss": 1.5415, "step": 16241 }, { "epoch": 1.28, "learning_rate": 0.00018455964077684995, "loss": 1.5255, "step": 16242 }, { "epoch": 1.28, "learning_rate": 0.00018454761346208446, "loss": 1.5054, "step": 16243 }, { "epoch": 1.28, "learning_rate": 0.0001845355859127597, "loss": 1.4795, "step": 16244 }, { "epoch": 1.28, "learning_rate": 0.0001845235581289574, "loss": 1.6051, "step": 16245 }, { "epoch": 1.28, "learning_rate": 0.0001845115301107592, "loss": 1.549, "step": 16246 }, { "epoch": 1.28, "learning_rate": 0.00018449950185824674, "loss": 1.5173, "step": 16247 }, { "epoch": 1.28, "learning_rate": 0.0001844874733715017, "loss": 1.5672, "step": 16248 }, { "epoch": 1.28, "learning_rate": 0.00018447544465060575, "loss": 1.4803, "step": 16249 }, { "epoch": 1.28, "learning_rate": 0.0001844634156956406, "loss": 1.5282, "step": 16250 }, { "epoch": 1.28, "learning_rate": 0.0001844513865066878, "loss": 1.5816, "step": 16251 }, { "epoch": 1.28, "learning_rate": 0.00018443935708382914, "loss": 1.5581, "step": 16252 }, { "epoch": 1.28, "learning_rate": 0.00018442732742714624, "loss": 1.5028, "step": 16253 }, { "epoch": 1.28, "learning_rate": 0.0001844152975367208, "loss": 1.5223, "step": 16254 }, { "epoch": 1.28, "learning_rate": 0.00018440326741263444, "loss": 1.5815, "step": 16255 }, { "epoch": 1.28, "learning_rate": 0.0001843912370549689, "loss": 1.5986, "step": 16256 }, { "epoch": 1.28, "learning_rate": 0.00018437920646380588, "loss": 1.5791, "step": 16257 }, { "epoch": 1.28, "learning_rate": 0.00018436717563922696, "loss": 1.5264, "step": 16258 }, { "epoch": 1.28, "learning_rate": 0.00018435514458131391, "loss": 1.5815, "step": 16259 }, { "epoch": 1.28, "learning_rate": 0.0001843431132901484, "loss": 1.5245, "step": 16260 }, { "epoch": 1.28, "learning_rate": 0.0001843310817658121, "loss": 1.5498, "step": 16261 }, { "epoch": 1.28, "learning_rate": 0.00018431905000838668, "loss": 1.5339, "step": 16262 }, { "epoch": 1.28, "learning_rate": 0.00018430701801795384, "loss": 1.5394, "step": 16263 }, { "epoch": 1.28, "learning_rate": 0.0001842949857945953, "loss": 1.5574, "step": 16264 }, { "epoch": 1.28, "learning_rate": 0.00018428295333839273, "loss": 1.5012, "step": 16265 }, { "epoch": 1.28, "learning_rate": 0.00018427092064942784, "loss": 1.5295, "step": 16266 }, { "epoch": 1.28, "learning_rate": 0.0001842588877277823, "loss": 1.4922, "step": 16267 }, { "epoch": 1.28, "learning_rate": 0.00018424685457353783, "loss": 1.5144, "step": 16268 }, { "epoch": 1.28, "learning_rate": 0.00018423482118677613, "loss": 1.5183, "step": 16269 }, { "epoch": 1.28, "learning_rate": 0.0001842227875675788, "loss": 1.4895, "step": 16270 }, { "epoch": 1.28, "learning_rate": 0.00018421075371602771, "loss": 1.5725, "step": 16271 }, { "epoch": 1.28, "learning_rate": 0.00018419871963220447, "loss": 1.53, "step": 16272 }, { "epoch": 1.28, "learning_rate": 0.00018418668531619076, "loss": 1.5995, "step": 16273 }, { "epoch": 1.28, "learning_rate": 0.00018417465076806837, "loss": 1.5411, "step": 16274 }, { "epoch": 1.28, "learning_rate": 0.00018416261598791893, "loss": 1.4631, "step": 16275 }, { "epoch": 1.28, "learning_rate": 0.00018415058097582418, "loss": 1.5379, "step": 16276 }, { "epoch": 1.28, "learning_rate": 0.00018413854573186584, "loss": 1.5593, "step": 16277 }, { "epoch": 1.28, "learning_rate": 0.00018412651025612558, "loss": 1.5401, "step": 16278 }, { "epoch": 1.28, "learning_rate": 0.00018411447454868518, "loss": 1.5205, "step": 16279 }, { "epoch": 1.28, "learning_rate": 0.00018410243860962635, "loss": 1.5612, "step": 16280 }, { "epoch": 1.28, "learning_rate": 0.00018409040243903076, "loss": 1.5466, "step": 16281 }, { "epoch": 1.28, "learning_rate": 0.00018407836603698014, "loss": 1.5547, "step": 16282 }, { "epoch": 1.28, "learning_rate": 0.00018406632940355623, "loss": 1.5945, "step": 16283 }, { "epoch": 1.28, "learning_rate": 0.00018405429253884074, "loss": 1.5114, "step": 16284 }, { "epoch": 1.28, "learning_rate": 0.0001840422554429154, "loss": 1.4773, "step": 16285 }, { "epoch": 1.28, "learning_rate": 0.00018403021811586195, "loss": 1.5382, "step": 16286 }, { "epoch": 1.28, "learning_rate": 0.00018401818055776203, "loss": 1.5321, "step": 16287 }, { "epoch": 1.28, "learning_rate": 0.00018400614276869749, "loss": 1.5712, "step": 16288 }, { "epoch": 1.28, "learning_rate": 0.00018399410474875, "loss": 1.533, "step": 16289 }, { "epoch": 1.28, "learning_rate": 0.0001839820664980013, "loss": 1.5828, "step": 16290 }, { "epoch": 1.28, "learning_rate": 0.00018397002801653312, "loss": 1.5185, "step": 16291 }, { "epoch": 1.28, "learning_rate": 0.0001839579893044272, "loss": 1.5052, "step": 16292 }, { "epoch": 1.28, "learning_rate": 0.00018394595036176525, "loss": 1.5258, "step": 16293 }, { "epoch": 1.28, "learning_rate": 0.00018393391118862905, "loss": 1.5445, "step": 16294 }, { "epoch": 1.28, "learning_rate": 0.0001839218717851003, "loss": 1.5258, "step": 16295 }, { "epoch": 1.28, "learning_rate": 0.0001839098321512608, "loss": 1.5074, "step": 16296 }, { "epoch": 1.28, "learning_rate": 0.0001838977922871922, "loss": 1.5497, "step": 16297 }, { "epoch": 1.28, "learning_rate": 0.00018388575219297637, "loss": 1.5346, "step": 16298 }, { "epoch": 1.28, "learning_rate": 0.00018387371186869494, "loss": 1.5035, "step": 16299 }, { "epoch": 1.28, "learning_rate": 0.00018386167131442967, "loss": 1.5465, "step": 16300 }, { "epoch": 1.28, "learning_rate": 0.00018384963053026237, "loss": 1.4912, "step": 16301 }, { "epoch": 1.28, "learning_rate": 0.00018383758951627473, "loss": 1.5838, "step": 16302 }, { "epoch": 1.28, "learning_rate": 0.00018382554827254857, "loss": 1.5119, "step": 16303 }, { "epoch": 1.28, "learning_rate": 0.00018381350679916558, "loss": 1.5726, "step": 16304 }, { "epoch": 1.28, "learning_rate": 0.00018380146509620754, "loss": 1.5504, "step": 16305 }, { "epoch": 1.28, "learning_rate": 0.00018378942316375622, "loss": 1.5109, "step": 16306 }, { "epoch": 1.28, "learning_rate": 0.00018377738100189338, "loss": 1.4942, "step": 16307 }, { "epoch": 1.28, "learning_rate": 0.00018376533861070074, "loss": 1.5622, "step": 16308 }, { "epoch": 1.28, "learning_rate": 0.0001837532959902601, "loss": 1.5505, "step": 16309 }, { "epoch": 1.28, "learning_rate": 0.00018374125314065315, "loss": 1.4801, "step": 16310 }, { "epoch": 1.28, "learning_rate": 0.00018372921006196176, "loss": 1.5755, "step": 16311 }, { "epoch": 1.28, "learning_rate": 0.0001837171667542676, "loss": 1.5821, "step": 16312 }, { "epoch": 1.28, "learning_rate": 0.00018370512321765254, "loss": 1.5063, "step": 16313 }, { "epoch": 1.28, "learning_rate": 0.00018369307945219828, "loss": 1.5042, "step": 16314 }, { "epoch": 1.28, "learning_rate": 0.00018368103545798658, "loss": 1.6055, "step": 16315 }, { "epoch": 1.28, "learning_rate": 0.0001836689912350993, "loss": 1.5394, "step": 16316 }, { "epoch": 1.28, "learning_rate": 0.0001836569467836181, "loss": 1.5421, "step": 16317 }, { "epoch": 1.28, "learning_rate": 0.00018364490210362477, "loss": 1.5314, "step": 16318 }, { "epoch": 1.28, "learning_rate": 0.00018363285719520117, "loss": 1.5188, "step": 16319 }, { "epoch": 1.28, "learning_rate": 0.00018362081205842905, "loss": 1.5417, "step": 16320 }, { "epoch": 1.28, "learning_rate": 0.0001836087666933901, "loss": 1.5722, "step": 16321 }, { "epoch": 1.28, "learning_rate": 0.00018359672110016624, "loss": 1.5609, "step": 16322 }, { "epoch": 1.28, "learning_rate": 0.00018358467527883915, "loss": 1.5376, "step": 16323 }, { "epoch": 1.28, "learning_rate": 0.00018357262922949065, "loss": 1.5572, "step": 16324 }, { "epoch": 1.28, "learning_rate": 0.00018356058295220253, "loss": 1.5278, "step": 16325 }, { "epoch": 1.28, "learning_rate": 0.00018354853644705655, "loss": 1.5325, "step": 16326 }, { "epoch": 1.28, "learning_rate": 0.00018353648971413457, "loss": 1.5122, "step": 16327 }, { "epoch": 1.28, "learning_rate": 0.0001835244427535183, "loss": 1.564, "step": 16328 }, { "epoch": 1.28, "learning_rate": 0.00018351239556528952, "loss": 1.5299, "step": 16329 }, { "epoch": 1.28, "learning_rate": 0.00018350034814953016, "loss": 1.5777, "step": 16330 }, { "epoch": 1.28, "learning_rate": 0.00018348830050632188, "loss": 1.5341, "step": 16331 }, { "epoch": 1.29, "learning_rate": 0.0001834762526357465, "loss": 1.5022, "step": 16332 }, { "epoch": 1.29, "learning_rate": 0.00018346420453788586, "loss": 1.5201, "step": 16333 }, { "epoch": 1.29, "learning_rate": 0.00018345215621282172, "loss": 1.5105, "step": 16334 }, { "epoch": 1.29, "learning_rate": 0.0001834401076606359, "loss": 1.5677, "step": 16335 }, { "epoch": 1.29, "learning_rate": 0.00018342805888141024, "loss": 1.4795, "step": 16336 }, { "epoch": 1.29, "learning_rate": 0.0001834160098752265, "loss": 1.5423, "step": 16337 }, { "epoch": 1.29, "learning_rate": 0.00018340396064216646, "loss": 1.5634, "step": 16338 }, { "epoch": 1.29, "learning_rate": 0.00018339191118231198, "loss": 1.513, "step": 16339 }, { "epoch": 1.29, "learning_rate": 0.00018337986149574487, "loss": 1.5364, "step": 16340 }, { "epoch": 1.29, "learning_rate": 0.00018336781158254686, "loss": 1.5728, "step": 16341 }, { "epoch": 1.29, "learning_rate": 0.00018335576144279988, "loss": 1.516, "step": 16342 }, { "epoch": 1.29, "learning_rate": 0.00018334371107658564, "loss": 1.5397, "step": 16343 }, { "epoch": 1.29, "learning_rate": 0.000183331660483986, "loss": 1.5654, "step": 16344 }, { "epoch": 1.29, "learning_rate": 0.00018331960966508286, "loss": 1.5094, "step": 16345 }, { "epoch": 1.29, "learning_rate": 0.00018330755861995792, "loss": 1.5193, "step": 16346 }, { "epoch": 1.29, "learning_rate": 0.00018329550734869305, "loss": 1.5513, "step": 16347 }, { "epoch": 1.29, "learning_rate": 0.00018328345585137, "loss": 1.545, "step": 16348 }, { "epoch": 1.29, "learning_rate": 0.0001832714041280707, "loss": 1.5378, "step": 16349 }, { "epoch": 1.29, "learning_rate": 0.0001832593521788769, "loss": 1.513, "step": 16350 }, { "epoch": 1.29, "learning_rate": 0.00018324730000387045, "loss": 1.5407, "step": 16351 }, { "epoch": 1.29, "learning_rate": 0.00018323524760313322, "loss": 1.5508, "step": 16352 }, { "epoch": 1.29, "learning_rate": 0.00018322319497674695, "loss": 1.5331, "step": 16353 }, { "epoch": 1.29, "learning_rate": 0.0001832111421247936, "loss": 1.556, "step": 16354 }, { "epoch": 1.29, "learning_rate": 0.00018319908904735485, "loss": 1.5439, "step": 16355 }, { "epoch": 1.29, "learning_rate": 0.00018318703574451262, "loss": 1.5211, "step": 16356 }, { "epoch": 1.29, "learning_rate": 0.00018317498221634873, "loss": 1.5496, "step": 16357 }, { "epoch": 1.29, "learning_rate": 0.00018316292846294501, "loss": 1.5032, "step": 16358 }, { "epoch": 1.29, "learning_rate": 0.00018315087448438332, "loss": 1.5317, "step": 16359 }, { "epoch": 1.29, "learning_rate": 0.00018313882028074552, "loss": 1.4904, "step": 16360 }, { "epoch": 1.29, "learning_rate": 0.00018312676585211337, "loss": 1.5743, "step": 16361 }, { "epoch": 1.29, "learning_rate": 0.0001831147111985688, "loss": 1.5361, "step": 16362 }, { "epoch": 1.29, "learning_rate": 0.00018310265632019357, "loss": 1.5651, "step": 16363 }, { "epoch": 1.29, "learning_rate": 0.00018309060121706963, "loss": 1.5473, "step": 16364 }, { "epoch": 1.29, "learning_rate": 0.00018307854588927867, "loss": 1.5266, "step": 16365 }, { "epoch": 1.29, "learning_rate": 0.00018306649033690274, "loss": 1.5248, "step": 16366 }, { "epoch": 1.29, "learning_rate": 0.00018305443456002353, "loss": 1.5359, "step": 16367 }, { "epoch": 1.29, "learning_rate": 0.00018304237855872296, "loss": 1.5815, "step": 16368 }, { "epoch": 1.29, "learning_rate": 0.0001830303223330829, "loss": 1.5461, "step": 16369 }, { "epoch": 1.29, "learning_rate": 0.00018301826588318517, "loss": 1.5146, "step": 16370 }, { "epoch": 1.29, "learning_rate": 0.0001830062092091116, "loss": 1.4761, "step": 16371 }, { "epoch": 1.29, "learning_rate": 0.00018299415231094412, "loss": 1.5011, "step": 16372 }, { "epoch": 1.29, "learning_rate": 0.00018298209518876452, "loss": 1.5985, "step": 16373 }, { "epoch": 1.29, "learning_rate": 0.00018297003784265476, "loss": 1.5368, "step": 16374 }, { "epoch": 1.29, "learning_rate": 0.00018295798027269657, "loss": 1.4948, "step": 16375 }, { "epoch": 1.29, "learning_rate": 0.00018294592247897193, "loss": 1.5193, "step": 16376 }, { "epoch": 1.29, "learning_rate": 0.00018293386446156264, "loss": 1.5293, "step": 16377 }, { "epoch": 1.29, "learning_rate": 0.00018292180622055056, "loss": 1.4884, "step": 16378 }, { "epoch": 1.29, "learning_rate": 0.00018290974775601762, "loss": 1.5049, "step": 16379 }, { "epoch": 1.29, "learning_rate": 0.0001828976890680456, "loss": 1.5668, "step": 16380 }, { "epoch": 1.29, "learning_rate": 0.00018288563015671648, "loss": 1.5619, "step": 16381 }, { "epoch": 1.29, "learning_rate": 0.00018287357102211204, "loss": 1.5342, "step": 16382 }, { "epoch": 1.29, "learning_rate": 0.00018286151166431425, "loss": 1.521, "step": 16383 }, { "epoch": 1.29, "learning_rate": 0.0001828494520834049, "loss": 1.512, "step": 16384 }, { "epoch": 1.29, "learning_rate": 0.00018283739227946587, "loss": 1.559, "step": 16385 }, { "epoch": 1.29, "learning_rate": 0.0001828253322525791, "loss": 1.5604, "step": 16386 }, { "epoch": 1.29, "learning_rate": 0.00018281327200282644, "loss": 1.4768, "step": 16387 }, { "epoch": 1.29, "learning_rate": 0.00018280121153028977, "loss": 1.5172, "step": 16388 }, { "epoch": 1.29, "learning_rate": 0.00018278915083505095, "loss": 1.5028, "step": 16389 }, { "epoch": 1.29, "learning_rate": 0.00018277708991719187, "loss": 1.515, "step": 16390 }, { "epoch": 1.29, "learning_rate": 0.00018276502877679452, "loss": 1.567, "step": 16391 }, { "epoch": 1.29, "learning_rate": 0.00018275296741394065, "loss": 1.5708, "step": 16392 }, { "epoch": 1.29, "learning_rate": 0.00018274090582871223, "loss": 1.4971, "step": 16393 }, { "epoch": 1.29, "learning_rate": 0.0001827288440211911, "loss": 1.5569, "step": 16394 }, { "epoch": 1.29, "learning_rate": 0.00018271678199145917, "loss": 1.4772, "step": 16395 }, { "epoch": 1.29, "learning_rate": 0.00018270471973959836, "loss": 1.5696, "step": 16396 }, { "epoch": 1.29, "learning_rate": 0.00018269265726569055, "loss": 1.5181, "step": 16397 }, { "epoch": 1.29, "learning_rate": 0.0001826805945698177, "loss": 1.5358, "step": 16398 }, { "epoch": 1.29, "learning_rate": 0.00018266853165206157, "loss": 1.5294, "step": 16399 }, { "epoch": 1.29, "learning_rate": 0.00018265646851250416, "loss": 1.5453, "step": 16400 }, { "epoch": 1.29, "learning_rate": 0.00018264440515122738, "loss": 1.4731, "step": 16401 }, { "epoch": 1.29, "learning_rate": 0.00018263234156831306, "loss": 1.5225, "step": 16402 }, { "epoch": 1.29, "learning_rate": 0.00018262027776384319, "loss": 1.571, "step": 16403 }, { "epoch": 1.29, "learning_rate": 0.00018260821373789957, "loss": 1.5307, "step": 16404 }, { "epoch": 1.29, "learning_rate": 0.00018259614949056423, "loss": 1.4928, "step": 16405 }, { "epoch": 1.29, "learning_rate": 0.000182584085021919, "loss": 1.5419, "step": 16406 }, { "epoch": 1.29, "learning_rate": 0.00018257202033204582, "loss": 1.5038, "step": 16407 }, { "epoch": 1.29, "learning_rate": 0.0001825599554210266, "loss": 1.55, "step": 16408 }, { "epoch": 1.29, "learning_rate": 0.00018254789028894323, "loss": 1.5199, "step": 16409 }, { "epoch": 1.29, "learning_rate": 0.00018253582493587772, "loss": 1.5413, "step": 16410 }, { "epoch": 1.29, "learning_rate": 0.00018252375936191184, "loss": 1.5659, "step": 16411 }, { "epoch": 1.29, "learning_rate": 0.00018251169356712756, "loss": 1.5711, "step": 16412 }, { "epoch": 1.29, "learning_rate": 0.00018249962755160687, "loss": 1.5231, "step": 16413 }, { "epoch": 1.29, "learning_rate": 0.00018248756131543167, "loss": 1.5041, "step": 16414 }, { "epoch": 1.29, "learning_rate": 0.0001824754948586838, "loss": 1.5469, "step": 16415 }, { "epoch": 1.29, "learning_rate": 0.00018246342818144525, "loss": 1.5053, "step": 16416 }, { "epoch": 1.29, "learning_rate": 0.00018245136128379797, "loss": 1.5482, "step": 16417 }, { "epoch": 1.29, "learning_rate": 0.00018243929416582387, "loss": 1.5736, "step": 16418 }, { "epoch": 1.29, "learning_rate": 0.00018242722682760483, "loss": 1.5387, "step": 16419 }, { "epoch": 1.29, "learning_rate": 0.0001824151592692228, "loss": 1.4981, "step": 16420 }, { "epoch": 1.29, "learning_rate": 0.00018240309149075975, "loss": 1.5387, "step": 16421 }, { "epoch": 1.29, "learning_rate": 0.00018239102349229755, "loss": 1.546, "step": 16422 }, { "epoch": 1.29, "learning_rate": 0.00018237895527391823, "loss": 1.5698, "step": 16423 }, { "epoch": 1.29, "learning_rate": 0.00018236688683570364, "loss": 1.5071, "step": 16424 }, { "epoch": 1.29, "learning_rate": 0.00018235481817773576, "loss": 1.5622, "step": 16425 }, { "epoch": 1.29, "learning_rate": 0.00018234274930009655, "loss": 1.5408, "step": 16426 }, { "epoch": 1.29, "learning_rate": 0.00018233068020286785, "loss": 1.5567, "step": 16427 }, { "epoch": 1.29, "learning_rate": 0.00018231861088613172, "loss": 1.5514, "step": 16428 }, { "epoch": 1.29, "learning_rate": 0.00018230654134997006, "loss": 1.5312, "step": 16429 }, { "epoch": 1.29, "learning_rate": 0.0001822944715944648, "loss": 1.5393, "step": 16430 }, { "epoch": 1.29, "learning_rate": 0.00018228240161969787, "loss": 1.5333, "step": 16431 }, { "epoch": 1.29, "learning_rate": 0.00018227033142575135, "loss": 1.5223, "step": 16432 }, { "epoch": 1.29, "learning_rate": 0.000182258261012707, "loss": 1.5477, "step": 16433 }, { "epoch": 1.29, "learning_rate": 0.00018224619038064685, "loss": 1.5928, "step": 16434 }, { "epoch": 1.29, "learning_rate": 0.0001822341195296529, "loss": 1.58, "step": 16435 }, { "epoch": 1.29, "learning_rate": 0.000182222048459807, "loss": 1.5776, "step": 16436 }, { "epoch": 1.29, "learning_rate": 0.00018220997717119126, "loss": 1.5512, "step": 16437 }, { "epoch": 1.29, "learning_rate": 0.00018219790566388754, "loss": 1.5876, "step": 16438 }, { "epoch": 1.29, "learning_rate": 0.00018218583393797775, "loss": 1.5476, "step": 16439 }, { "epoch": 1.29, "learning_rate": 0.000182173761993544, "loss": 1.5602, "step": 16440 }, { "epoch": 1.29, "learning_rate": 0.00018216168983066806, "loss": 1.5374, "step": 16441 }, { "epoch": 1.29, "learning_rate": 0.00018214961744943207, "loss": 1.5602, "step": 16442 }, { "epoch": 1.29, "learning_rate": 0.00018213754484991786, "loss": 1.5552, "step": 16443 }, { "epoch": 1.29, "learning_rate": 0.0001821254720322075, "loss": 1.5146, "step": 16444 }, { "epoch": 1.29, "learning_rate": 0.00018211339899638289, "loss": 1.4569, "step": 16445 }, { "epoch": 1.29, "learning_rate": 0.00018210132574252605, "loss": 1.5064, "step": 16446 }, { "epoch": 1.29, "learning_rate": 0.00018208925227071893, "loss": 1.5106, "step": 16447 }, { "epoch": 1.29, "learning_rate": 0.00018207717858104345, "loss": 1.5936, "step": 16448 }, { "epoch": 1.29, "learning_rate": 0.00018206510467358165, "loss": 1.5031, "step": 16449 }, { "epoch": 1.29, "learning_rate": 0.00018205303054841547, "loss": 1.6035, "step": 16450 }, { "epoch": 1.29, "learning_rate": 0.00018204095620562692, "loss": 1.5168, "step": 16451 }, { "epoch": 1.29, "learning_rate": 0.00018202888164529793, "loss": 1.5432, "step": 16452 }, { "epoch": 1.29, "learning_rate": 0.00018201680686751054, "loss": 1.4718, "step": 16453 }, { "epoch": 1.29, "learning_rate": 0.0001820047318723467, "loss": 1.5212, "step": 16454 }, { "epoch": 1.29, "learning_rate": 0.0001819926566598884, "loss": 1.5676, "step": 16455 }, { "epoch": 1.29, "learning_rate": 0.0001819805812302176, "loss": 1.5238, "step": 16456 }, { "epoch": 1.29, "learning_rate": 0.00018196850558341632, "loss": 1.5692, "step": 16457 }, { "epoch": 1.29, "learning_rate": 0.0001819564297195665, "loss": 1.5492, "step": 16458 }, { "epoch": 1.3, "learning_rate": 0.00018194435363875014, "loss": 1.5072, "step": 16459 }, { "epoch": 1.3, "learning_rate": 0.00018193227734104926, "loss": 1.533, "step": 16460 }, { "epoch": 1.3, "learning_rate": 0.0001819202008265459, "loss": 1.5012, "step": 16461 }, { "epoch": 1.3, "learning_rate": 0.00018190812409532193, "loss": 1.5019, "step": 16462 }, { "epoch": 1.3, "learning_rate": 0.0001818960471474594, "loss": 1.5126, "step": 16463 }, { "epoch": 1.3, "learning_rate": 0.00018188396998304037, "loss": 1.539, "step": 16464 }, { "epoch": 1.3, "learning_rate": 0.00018187189260214674, "loss": 1.5618, "step": 16465 }, { "epoch": 1.3, "learning_rate": 0.00018185981500486056, "loss": 1.5138, "step": 16466 }, { "epoch": 1.3, "learning_rate": 0.00018184773719126374, "loss": 1.5384, "step": 16467 }, { "epoch": 1.3, "learning_rate": 0.00018183565916143844, "loss": 1.5299, "step": 16468 }, { "epoch": 1.3, "learning_rate": 0.0001818235809154666, "loss": 1.5134, "step": 16469 }, { "epoch": 1.3, "learning_rate": 0.00018181150245343014, "loss": 1.4696, "step": 16470 }, { "epoch": 1.3, "learning_rate": 0.0001817994237754112, "loss": 1.5231, "step": 16471 }, { "epoch": 1.3, "learning_rate": 0.0001817873448814917, "loss": 1.5332, "step": 16472 }, { "epoch": 1.3, "learning_rate": 0.00018177526577175366, "loss": 1.4881, "step": 16473 }, { "epoch": 1.3, "learning_rate": 0.0001817631864462791, "loss": 1.5193, "step": 16474 }, { "epoch": 1.3, "learning_rate": 0.00018175110690514998, "loss": 1.5426, "step": 16475 }, { "epoch": 1.3, "learning_rate": 0.00018173902714844846, "loss": 1.54, "step": 16476 }, { "epoch": 1.3, "learning_rate": 0.00018172694717625643, "loss": 1.5257, "step": 16477 }, { "epoch": 1.3, "learning_rate": 0.00018171486698865592, "loss": 1.5229, "step": 16478 }, { "epoch": 1.3, "learning_rate": 0.00018170278658572898, "loss": 1.5238, "step": 16479 }, { "epoch": 1.3, "learning_rate": 0.0001816907059675576, "loss": 1.5331, "step": 16480 }, { "epoch": 1.3, "learning_rate": 0.00018167862513422382, "loss": 1.5203, "step": 16481 }, { "epoch": 1.3, "learning_rate": 0.00018166654408580967, "loss": 1.5583, "step": 16482 }, { "epoch": 1.3, "learning_rate": 0.00018165446282239714, "loss": 1.5003, "step": 16483 }, { "epoch": 1.3, "learning_rate": 0.00018164238134406825, "loss": 1.5469, "step": 16484 }, { "epoch": 1.3, "learning_rate": 0.0001816302996509051, "loss": 1.4957, "step": 16485 }, { "epoch": 1.3, "learning_rate": 0.00018161821774298966, "loss": 1.5432, "step": 16486 }, { "epoch": 1.3, "learning_rate": 0.00018160613562040397, "loss": 1.5399, "step": 16487 }, { "epoch": 1.3, "learning_rate": 0.00018159405328323008, "loss": 1.5455, "step": 16488 }, { "epoch": 1.3, "learning_rate": 0.00018158197073155, "loss": 1.5002, "step": 16489 }, { "epoch": 1.3, "learning_rate": 0.00018156988796544572, "loss": 1.5408, "step": 16490 }, { "epoch": 1.3, "learning_rate": 0.00018155780498499934, "loss": 1.532, "step": 16491 }, { "epoch": 1.3, "learning_rate": 0.00018154572179029287, "loss": 1.5449, "step": 16492 }, { "epoch": 1.3, "learning_rate": 0.0001815336383814084, "loss": 1.5748, "step": 16493 }, { "epoch": 1.3, "learning_rate": 0.00018152155475842791, "loss": 1.5404, "step": 16494 }, { "epoch": 1.3, "learning_rate": 0.0001815094709214334, "loss": 1.5019, "step": 16495 }, { "epoch": 1.3, "learning_rate": 0.0001814973868705071, "loss": 1.5543, "step": 16496 }, { "epoch": 1.3, "learning_rate": 0.0001814853026057308, "loss": 1.5089, "step": 16497 }, { "epoch": 1.3, "learning_rate": 0.00018147321812718673, "loss": 1.4939, "step": 16498 }, { "epoch": 1.3, "learning_rate": 0.00018146113343495688, "loss": 1.53, "step": 16499 }, { "epoch": 1.3, "learning_rate": 0.0001814490485291233, "loss": 1.5072, "step": 16500 }, { "epoch": 1.3, "learning_rate": 0.000181436963409768, "loss": 1.5356, "step": 16501 }, { "epoch": 1.3, "learning_rate": 0.00018142487807697307, "loss": 1.5447, "step": 16502 }, { "epoch": 1.3, "learning_rate": 0.00018141279253082058, "loss": 1.5582, "step": 16503 }, { "epoch": 1.3, "learning_rate": 0.00018140070677139257, "loss": 1.5907, "step": 16504 }, { "epoch": 1.3, "learning_rate": 0.0001813886207987711, "loss": 1.4979, "step": 16505 }, { "epoch": 1.3, "learning_rate": 0.00018137653461303813, "loss": 1.552, "step": 16506 }, { "epoch": 1.3, "learning_rate": 0.0001813644482142759, "loss": 1.5411, "step": 16507 }, { "epoch": 1.3, "learning_rate": 0.00018135236160256633, "loss": 1.5918, "step": 16508 }, { "epoch": 1.3, "learning_rate": 0.00018134027477799153, "loss": 1.5267, "step": 16509 }, { "epoch": 1.3, "learning_rate": 0.00018132818774063358, "loss": 1.5006, "step": 16510 }, { "epoch": 1.3, "learning_rate": 0.0001813161004905745, "loss": 1.5032, "step": 16511 }, { "epoch": 1.3, "learning_rate": 0.00018130401302789639, "loss": 1.5121, "step": 16512 }, { "epoch": 1.3, "learning_rate": 0.00018129192535268134, "loss": 1.6073, "step": 16513 }, { "epoch": 1.3, "learning_rate": 0.0001812798374650113, "loss": 1.4933, "step": 16514 }, { "epoch": 1.3, "learning_rate": 0.00018126774936496853, "loss": 1.5607, "step": 16515 }, { "epoch": 1.3, "learning_rate": 0.00018125566105263493, "loss": 1.57, "step": 16516 }, { "epoch": 1.3, "learning_rate": 0.00018124357252809266, "loss": 1.5837, "step": 16517 }, { "epoch": 1.3, "learning_rate": 0.00018123148379142377, "loss": 1.5358, "step": 16518 }, { "epoch": 1.3, "learning_rate": 0.00018121939484271033, "loss": 1.5383, "step": 16519 }, { "epoch": 1.3, "learning_rate": 0.00018120730568203444, "loss": 1.5504, "step": 16520 }, { "epoch": 1.3, "learning_rate": 0.00018119521630947818, "loss": 1.5201, "step": 16521 }, { "epoch": 1.3, "learning_rate": 0.00018118312672512355, "loss": 1.5585, "step": 16522 }, { "epoch": 1.3, "learning_rate": 0.00018117103692905277, "loss": 1.5229, "step": 16523 }, { "epoch": 1.3, "learning_rate": 0.0001811589469213478, "loss": 1.5348, "step": 16524 }, { "epoch": 1.3, "learning_rate": 0.00018114685670209084, "loss": 1.5854, "step": 16525 }, { "epoch": 1.3, "learning_rate": 0.00018113476627136388, "loss": 1.5402, "step": 16526 }, { "epoch": 1.3, "learning_rate": 0.00018112267562924906, "loss": 1.5781, "step": 16527 }, { "epoch": 1.3, "learning_rate": 0.00018111058477582838, "loss": 1.4861, "step": 16528 }, { "epoch": 1.3, "learning_rate": 0.00018109849371118406, "loss": 1.5285, "step": 16529 }, { "epoch": 1.3, "learning_rate": 0.00018108640243539808, "loss": 1.4923, "step": 16530 }, { "epoch": 1.3, "learning_rate": 0.00018107431094855259, "loss": 1.4901, "step": 16531 }, { "epoch": 1.3, "learning_rate": 0.00018106221925072972, "loss": 1.506, "step": 16532 }, { "epoch": 1.3, "learning_rate": 0.00018105012734201148, "loss": 1.5613, "step": 16533 }, { "epoch": 1.3, "learning_rate": 0.00018103803522248008, "loss": 1.5436, "step": 16534 }, { "epoch": 1.3, "learning_rate": 0.00018102594289221748, "loss": 1.6066, "step": 16535 }, { "epoch": 1.3, "learning_rate": 0.00018101385035130586, "loss": 1.5616, "step": 16536 }, { "epoch": 1.3, "learning_rate": 0.00018100175759982735, "loss": 1.4983, "step": 16537 }, { "epoch": 1.3, "learning_rate": 0.0001809896646378639, "loss": 1.587, "step": 16538 }, { "epoch": 1.3, "learning_rate": 0.00018097757146549786, "loss": 1.5932, "step": 16539 }, { "epoch": 1.3, "learning_rate": 0.00018096547808281113, "loss": 1.552, "step": 16540 }, { "epoch": 1.3, "learning_rate": 0.00018095338448988592, "loss": 1.5926, "step": 16541 }, { "epoch": 1.3, "learning_rate": 0.00018094129068680435, "loss": 1.5342, "step": 16542 }, { "epoch": 1.3, "learning_rate": 0.00018092919667364842, "loss": 1.531, "step": 16543 }, { "epoch": 1.3, "learning_rate": 0.00018091710245050037, "loss": 1.5433, "step": 16544 }, { "epoch": 1.3, "learning_rate": 0.0001809050080174422, "loss": 1.5484, "step": 16545 }, { "epoch": 1.3, "learning_rate": 0.00018089291337455613, "loss": 1.5168, "step": 16546 }, { "epoch": 1.3, "learning_rate": 0.0001808808185219242, "loss": 1.5261, "step": 16547 }, { "epoch": 1.3, "learning_rate": 0.00018086872345962854, "loss": 1.5664, "step": 16548 }, { "epoch": 1.3, "learning_rate": 0.00018085662818775132, "loss": 1.5343, "step": 16549 }, { "epoch": 1.3, "learning_rate": 0.00018084453270637458, "loss": 1.5537, "step": 16550 }, { "epoch": 1.3, "learning_rate": 0.00018083243701558054, "loss": 1.5217, "step": 16551 }, { "epoch": 1.3, "learning_rate": 0.00018082034111545123, "loss": 1.5626, "step": 16552 }, { "epoch": 1.3, "learning_rate": 0.00018080824500606879, "loss": 1.5192, "step": 16553 }, { "epoch": 1.3, "learning_rate": 0.0001807961486875154, "loss": 1.4931, "step": 16554 }, { "epoch": 1.3, "learning_rate": 0.00018078405215987315, "loss": 1.5255, "step": 16555 }, { "epoch": 1.3, "learning_rate": 0.0001807719554232242, "loss": 1.4813, "step": 16556 }, { "epoch": 1.3, "learning_rate": 0.00018075985847765063, "loss": 1.5391, "step": 16557 }, { "epoch": 1.3, "learning_rate": 0.00018074776132323455, "loss": 1.5426, "step": 16558 }, { "epoch": 1.3, "learning_rate": 0.00018073566396005822, "loss": 1.5817, "step": 16559 }, { "epoch": 1.3, "learning_rate": 0.00018072356638820366, "loss": 1.5466, "step": 16560 }, { "epoch": 1.3, "learning_rate": 0.000180711468607753, "loss": 1.5461, "step": 16561 }, { "epoch": 1.3, "learning_rate": 0.00018069937061878847, "loss": 1.5393, "step": 16562 }, { "epoch": 1.3, "learning_rate": 0.00018068727242139213, "loss": 1.4822, "step": 16563 }, { "epoch": 1.3, "learning_rate": 0.00018067517401564617, "loss": 1.5307, "step": 16564 }, { "epoch": 1.3, "learning_rate": 0.00018066307540163265, "loss": 1.5076, "step": 16565 }, { "epoch": 1.3, "learning_rate": 0.00018065097657943383, "loss": 1.5291, "step": 16566 }, { "epoch": 1.3, "learning_rate": 0.00018063887754913175, "loss": 1.5325, "step": 16567 }, { "epoch": 1.3, "learning_rate": 0.00018062677831080863, "loss": 1.5513, "step": 16568 }, { "epoch": 1.3, "learning_rate": 0.00018061467886454656, "loss": 1.5321, "step": 16569 }, { "epoch": 1.3, "learning_rate": 0.00018060257921042772, "loss": 1.5225, "step": 16570 }, { "epoch": 1.3, "learning_rate": 0.00018059047934853429, "loss": 1.5359, "step": 16571 }, { "epoch": 1.3, "learning_rate": 0.00018057837927894834, "loss": 1.5596, "step": 16572 }, { "epoch": 1.3, "learning_rate": 0.00018056627900175213, "loss": 1.5211, "step": 16573 }, { "epoch": 1.3, "learning_rate": 0.0001805541785170277, "loss": 1.4846, "step": 16574 }, { "epoch": 1.3, "learning_rate": 0.00018054207782485724, "loss": 1.5538, "step": 16575 }, { "epoch": 1.3, "learning_rate": 0.00018052997692532302, "loss": 1.5473, "step": 16576 }, { "epoch": 1.3, "learning_rate": 0.00018051787581850699, "loss": 1.52, "step": 16577 }, { "epoch": 1.3, "learning_rate": 0.00018050577450449149, "loss": 1.5654, "step": 16578 }, { "epoch": 1.3, "learning_rate": 0.00018049367298335862, "loss": 1.5162, "step": 16579 }, { "epoch": 1.3, "learning_rate": 0.00018048157125519053, "loss": 1.5303, "step": 16580 }, { "epoch": 1.3, "learning_rate": 0.0001804694693200694, "loss": 1.514, "step": 16581 }, { "epoch": 1.3, "learning_rate": 0.00018045736717807735, "loss": 1.5479, "step": 16582 }, { "epoch": 1.3, "learning_rate": 0.00018044526482929662, "loss": 1.527, "step": 16583 }, { "epoch": 1.3, "learning_rate": 0.0001804331622738093, "loss": 1.5027, "step": 16584 }, { "epoch": 1.3, "learning_rate": 0.00018042105951169765, "loss": 1.5051, "step": 16585 }, { "epoch": 1.31, "learning_rate": 0.00018040895654304376, "loss": 1.5746, "step": 16586 }, { "epoch": 1.31, "learning_rate": 0.00018039685336792985, "loss": 1.4905, "step": 16587 }, { "epoch": 1.31, "learning_rate": 0.00018038474998643812, "loss": 1.5271, "step": 16588 }, { "epoch": 1.31, "learning_rate": 0.00018037264639865066, "loss": 1.5369, "step": 16589 }, { "epoch": 1.31, "learning_rate": 0.0001803605426046497, "loss": 1.5348, "step": 16590 }, { "epoch": 1.31, "learning_rate": 0.00018034843860451739, "loss": 1.5265, "step": 16591 }, { "epoch": 1.31, "learning_rate": 0.00018033633439833597, "loss": 1.5696, "step": 16592 }, { "epoch": 1.31, "learning_rate": 0.00018032422998618753, "loss": 1.4765, "step": 16593 }, { "epoch": 1.31, "learning_rate": 0.00018031212536815433, "loss": 1.5445, "step": 16594 }, { "epoch": 1.31, "learning_rate": 0.00018030002054431857, "loss": 1.568, "step": 16595 }, { "epoch": 1.31, "learning_rate": 0.00018028791551476234, "loss": 1.5599, "step": 16596 }, { "epoch": 1.31, "learning_rate": 0.00018027581027956787, "loss": 1.4862, "step": 16597 }, { "epoch": 1.31, "learning_rate": 0.0001802637048388174, "loss": 1.527, "step": 16598 }, { "epoch": 1.31, "learning_rate": 0.00018025159919259304, "loss": 1.5254, "step": 16599 }, { "epoch": 1.31, "learning_rate": 0.00018023949334097705, "loss": 1.5208, "step": 16600 }, { "epoch": 1.31, "learning_rate": 0.0001802273872840515, "loss": 1.5753, "step": 16601 }, { "epoch": 1.31, "learning_rate": 0.00018021528102189877, "loss": 1.5344, "step": 16602 }, { "epoch": 1.31, "learning_rate": 0.00018020317455460093, "loss": 1.5307, "step": 16603 }, { "epoch": 1.31, "learning_rate": 0.00018019106788224015, "loss": 1.5295, "step": 16604 }, { "epoch": 1.31, "learning_rate": 0.00018017896100489873, "loss": 1.5273, "step": 16605 }, { "epoch": 1.31, "learning_rate": 0.00018016685392265882, "loss": 1.4794, "step": 16606 }, { "epoch": 1.31, "learning_rate": 0.0001801547466356026, "loss": 1.5783, "step": 16607 }, { "epoch": 1.31, "learning_rate": 0.00018014263914381228, "loss": 1.567, "step": 16608 }, { "epoch": 1.31, "learning_rate": 0.0001801305314473701, "loss": 1.5356, "step": 16609 }, { "epoch": 1.31, "learning_rate": 0.00018011842354635825, "loss": 1.5949, "step": 16610 }, { "epoch": 1.31, "learning_rate": 0.0001801063154408589, "loss": 1.5522, "step": 16611 }, { "epoch": 1.31, "learning_rate": 0.00018009420713095432, "loss": 1.5694, "step": 16612 }, { "epoch": 1.31, "learning_rate": 0.00018008209861672663, "loss": 1.5319, "step": 16613 }, { "epoch": 1.31, "learning_rate": 0.00018006998989825813, "loss": 1.5035, "step": 16614 }, { "epoch": 1.31, "learning_rate": 0.000180057880975631, "loss": 1.5348, "step": 16615 }, { "epoch": 1.31, "learning_rate": 0.00018004577184892734, "loss": 1.5133, "step": 16616 }, { "epoch": 1.31, "learning_rate": 0.0001800336625182296, "loss": 1.51, "step": 16617 }, { "epoch": 1.31, "learning_rate": 0.00018002155298361982, "loss": 1.557, "step": 16618 }, { "epoch": 1.31, "learning_rate": 0.00018000944324518027, "loss": 1.5345, "step": 16619 }, { "epoch": 1.31, "learning_rate": 0.00017999733330299313, "loss": 1.5707, "step": 16620 }, { "epoch": 1.31, "learning_rate": 0.00017998522315714068, "loss": 1.513, "step": 16621 }, { "epoch": 1.31, "learning_rate": 0.00017997311280770512, "loss": 1.5437, "step": 16622 }, { "epoch": 1.31, "learning_rate": 0.00017996100225476863, "loss": 1.5899, "step": 16623 }, { "epoch": 1.31, "learning_rate": 0.00017994889149841348, "loss": 1.5644, "step": 16624 }, { "epoch": 1.31, "learning_rate": 0.00017993678053872188, "loss": 1.5012, "step": 16625 }, { "epoch": 1.31, "learning_rate": 0.00017992466937577606, "loss": 1.543, "step": 16626 }, { "epoch": 1.31, "learning_rate": 0.0001799125580096583, "loss": 1.5251, "step": 16627 }, { "epoch": 1.31, "learning_rate": 0.0001799004464404507, "loss": 1.5415, "step": 16628 }, { "epoch": 1.31, "learning_rate": 0.00017988833466823563, "loss": 1.5317, "step": 16629 }, { "epoch": 1.31, "learning_rate": 0.00017987622269309523, "loss": 1.4821, "step": 16630 }, { "epoch": 1.31, "learning_rate": 0.00017986411051511178, "loss": 1.5651, "step": 16631 }, { "epoch": 1.31, "learning_rate": 0.00017985199813436747, "loss": 1.5198, "step": 16632 }, { "epoch": 1.31, "learning_rate": 0.00017983988555094458, "loss": 1.5216, "step": 16633 }, { "epoch": 1.31, "learning_rate": 0.00017982777276492537, "loss": 1.4658, "step": 16634 }, { "epoch": 1.31, "learning_rate": 0.00017981565977639202, "loss": 1.5508, "step": 16635 }, { "epoch": 1.31, "learning_rate": 0.00017980354658542677, "loss": 1.5374, "step": 16636 }, { "epoch": 1.31, "learning_rate": 0.00017979143319211193, "loss": 1.518, "step": 16637 }, { "epoch": 1.31, "learning_rate": 0.00017977931959652966, "loss": 1.4948, "step": 16638 }, { "epoch": 1.31, "learning_rate": 0.00017976720579876228, "loss": 1.5337, "step": 16639 }, { "epoch": 1.31, "learning_rate": 0.00017975509179889192, "loss": 1.495, "step": 16640 }, { "epoch": 1.31, "learning_rate": 0.000179742977597001, "loss": 1.5439, "step": 16641 }, { "epoch": 1.31, "learning_rate": 0.00017973086319317166, "loss": 1.5465, "step": 16642 }, { "epoch": 1.31, "learning_rate": 0.00017971874858748612, "loss": 1.5023, "step": 16643 }, { "epoch": 1.31, "learning_rate": 0.00017970663378002671, "loss": 1.5244, "step": 16644 }, { "epoch": 1.31, "learning_rate": 0.00017969451877087567, "loss": 1.541, "step": 16645 }, { "epoch": 1.31, "learning_rate": 0.00017968240356011522, "loss": 1.5324, "step": 16646 }, { "epoch": 1.31, "learning_rate": 0.00017967028814782759, "loss": 1.5176, "step": 16647 }, { "epoch": 1.31, "learning_rate": 0.0001796581725340951, "loss": 1.5147, "step": 16648 }, { "epoch": 1.31, "learning_rate": 0.000179646056719, "loss": 1.5321, "step": 16649 }, { "epoch": 1.31, "learning_rate": 0.0001796339407026245, "loss": 1.5635, "step": 16650 }, { "epoch": 1.31, "learning_rate": 0.00017962182448505096, "loss": 1.5656, "step": 16651 }, { "epoch": 1.31, "learning_rate": 0.00017960970806636152, "loss": 1.5635, "step": 16652 }, { "epoch": 1.31, "learning_rate": 0.0001795975914466385, "loss": 1.5155, "step": 16653 }, { "epoch": 1.31, "learning_rate": 0.00017958547462596422, "loss": 1.5374, "step": 16654 }, { "epoch": 1.31, "learning_rate": 0.00017957335760442086, "loss": 1.5247, "step": 16655 }, { "epoch": 1.31, "learning_rate": 0.0001795612403820907, "loss": 1.5657, "step": 16656 }, { "epoch": 1.31, "learning_rate": 0.00017954912295905606, "loss": 1.5002, "step": 16657 }, { "epoch": 1.31, "learning_rate": 0.0001795370053353992, "loss": 1.5122, "step": 16658 }, { "epoch": 1.31, "learning_rate": 0.00017952488751120233, "loss": 1.4617, "step": 16659 }, { "epoch": 1.31, "learning_rate": 0.0001795127694865478, "loss": 1.5393, "step": 16660 }, { "epoch": 1.31, "learning_rate": 0.00017950065126151786, "loss": 1.5846, "step": 16661 }, { "epoch": 1.31, "learning_rate": 0.0001794885328361947, "loss": 1.4943, "step": 16662 }, { "epoch": 1.31, "learning_rate": 0.00017947641421066075, "loss": 1.5414, "step": 16663 }, { "epoch": 1.31, "learning_rate": 0.0001794642953849982, "loss": 1.5907, "step": 16664 }, { "epoch": 1.31, "learning_rate": 0.00017945217635928932, "loss": 1.51, "step": 16665 }, { "epoch": 1.31, "learning_rate": 0.00017944005713361644, "loss": 1.4794, "step": 16666 }, { "epoch": 1.31, "learning_rate": 0.00017942793770806182, "loss": 1.5346, "step": 16667 }, { "epoch": 1.31, "learning_rate": 0.00017941581808270774, "loss": 1.5225, "step": 16668 }, { "epoch": 1.31, "learning_rate": 0.00017940369825763652, "loss": 1.5633, "step": 16669 }, { "epoch": 1.31, "learning_rate": 0.00017939157823293036, "loss": 1.5494, "step": 16670 }, { "epoch": 1.31, "learning_rate": 0.0001793794580086716, "loss": 1.5969, "step": 16671 }, { "epoch": 1.31, "learning_rate": 0.00017936733758494255, "loss": 1.5494, "step": 16672 }, { "epoch": 1.31, "learning_rate": 0.00017935521696182553, "loss": 1.5629, "step": 16673 }, { "epoch": 1.31, "learning_rate": 0.00017934309613940275, "loss": 1.5137, "step": 16674 }, { "epoch": 1.31, "learning_rate": 0.00017933097511775654, "loss": 1.5092, "step": 16675 }, { "epoch": 1.31, "learning_rate": 0.00017931885389696917, "loss": 1.5158, "step": 16676 }, { "epoch": 1.31, "learning_rate": 0.000179306732477123, "loss": 1.551, "step": 16677 }, { "epoch": 1.31, "learning_rate": 0.00017929461085830028, "loss": 1.5631, "step": 16678 }, { "epoch": 1.31, "learning_rate": 0.00017928248904058327, "loss": 1.5424, "step": 16679 }, { "epoch": 1.31, "learning_rate": 0.00017927036702405436, "loss": 1.5436, "step": 16680 }, { "epoch": 1.31, "learning_rate": 0.0001792582448087958, "loss": 1.5198, "step": 16681 }, { "epoch": 1.31, "learning_rate": 0.00017924612239488992, "loss": 1.5375, "step": 16682 }, { "epoch": 1.31, "learning_rate": 0.00017923399978241904, "loss": 1.5626, "step": 16683 }, { "epoch": 1.31, "learning_rate": 0.0001792218769714654, "loss": 1.4965, "step": 16684 }, { "epoch": 1.31, "learning_rate": 0.00017920975396211133, "loss": 1.5146, "step": 16685 }, { "epoch": 1.31, "learning_rate": 0.00017919763075443916, "loss": 1.5222, "step": 16686 }, { "epoch": 1.31, "learning_rate": 0.0001791855073485312, "loss": 1.4949, "step": 16687 }, { "epoch": 1.31, "learning_rate": 0.00017917338374446971, "loss": 1.5652, "step": 16688 }, { "epoch": 1.31, "learning_rate": 0.00017916125994233705, "loss": 1.5382, "step": 16689 }, { "epoch": 1.31, "learning_rate": 0.00017914913594221558, "loss": 1.5388, "step": 16690 }, { "epoch": 1.31, "learning_rate": 0.00017913701174418755, "loss": 1.5105, "step": 16691 }, { "epoch": 1.31, "learning_rate": 0.00017912488734833523, "loss": 1.5638, "step": 16692 }, { "epoch": 1.31, "learning_rate": 0.00017911276275474108, "loss": 1.5136, "step": 16693 }, { "epoch": 1.31, "learning_rate": 0.00017910063796348728, "loss": 1.5409, "step": 16694 }, { "epoch": 1.31, "learning_rate": 0.0001790885129746562, "loss": 1.5132, "step": 16695 }, { "epoch": 1.31, "learning_rate": 0.0001790763877883302, "loss": 1.5338, "step": 16696 }, { "epoch": 1.31, "learning_rate": 0.0001790642624045916, "loss": 1.5213, "step": 16697 }, { "epoch": 1.31, "learning_rate": 0.00017905213682352264, "loss": 1.6199, "step": 16698 }, { "epoch": 1.31, "learning_rate": 0.00017904001104520573, "loss": 1.5319, "step": 16699 }, { "epoch": 1.31, "learning_rate": 0.00017902788506972316, "loss": 1.5638, "step": 16700 }, { "epoch": 1.31, "learning_rate": 0.0001790157588971573, "loss": 1.5427, "step": 16701 }, { "epoch": 1.31, "learning_rate": 0.00017900363252759045, "loss": 1.5492, "step": 16702 }, { "epoch": 1.31, "learning_rate": 0.00017899150596110486, "loss": 1.5081, "step": 16703 }, { "epoch": 1.31, "learning_rate": 0.00017897937919778302, "loss": 1.5494, "step": 16704 }, { "epoch": 1.31, "learning_rate": 0.00017896725223770716, "loss": 1.5051, "step": 16705 }, { "epoch": 1.31, "learning_rate": 0.00017895512508095965, "loss": 1.5114, "step": 16706 }, { "epoch": 1.31, "learning_rate": 0.00017894299772762282, "loss": 1.5071, "step": 16707 }, { "epoch": 1.31, "learning_rate": 0.00017893087017777903, "loss": 1.5255, "step": 16708 }, { "epoch": 1.31, "learning_rate": 0.00017891874243151055, "loss": 1.5744, "step": 16709 }, { "epoch": 1.31, "learning_rate": 0.0001789066144888998, "loss": 1.5224, "step": 16710 }, { "epoch": 1.31, "learning_rate": 0.00017889448635002904, "loss": 1.4975, "step": 16711 }, { "epoch": 1.31, "learning_rate": 0.00017888235801498075, "loss": 1.4711, "step": 16712 }, { "epoch": 1.32, "learning_rate": 0.00017887022948383713, "loss": 1.4891, "step": 16713 }, { "epoch": 1.32, "learning_rate": 0.0001788581007566806, "loss": 1.5184, "step": 16714 }, { "epoch": 1.32, "learning_rate": 0.00017884597183359348, "loss": 1.5165, "step": 16715 }, { "epoch": 1.32, "learning_rate": 0.0001788338427146581, "loss": 1.4972, "step": 16716 }, { "epoch": 1.32, "learning_rate": 0.00017882171339995693, "loss": 1.5232, "step": 16717 }, { "epoch": 1.32, "learning_rate": 0.00017880958388957212, "loss": 1.549, "step": 16718 }, { "epoch": 1.32, "learning_rate": 0.00017879745418358624, "loss": 1.502, "step": 16719 }, { "epoch": 1.32, "learning_rate": 0.00017878532428208146, "loss": 1.5195, "step": 16720 }, { "epoch": 1.32, "learning_rate": 0.00017877319418514023, "loss": 1.4714, "step": 16721 }, { "epoch": 1.32, "learning_rate": 0.00017876106389284495, "loss": 1.5025, "step": 16722 }, { "epoch": 1.32, "learning_rate": 0.00017874893340527785, "loss": 1.5509, "step": 16723 }, { "epoch": 1.32, "learning_rate": 0.00017873680272252138, "loss": 1.5132, "step": 16724 }, { "epoch": 1.32, "learning_rate": 0.00017872467184465787, "loss": 1.5324, "step": 16725 }, { "epoch": 1.32, "learning_rate": 0.0001787125407717697, "loss": 1.5103, "step": 16726 }, { "epoch": 1.32, "learning_rate": 0.0001787004095039392, "loss": 1.5533, "step": 16727 }, { "epoch": 1.32, "learning_rate": 0.00017868827804124878, "loss": 1.5167, "step": 16728 }, { "epoch": 1.32, "learning_rate": 0.00017867614638378078, "loss": 1.5644, "step": 16729 }, { "epoch": 1.32, "learning_rate": 0.00017866401453161756, "loss": 1.5175, "step": 16730 }, { "epoch": 1.32, "learning_rate": 0.00017865188248484154, "loss": 1.4567, "step": 16731 }, { "epoch": 1.32, "learning_rate": 0.00017863975024353502, "loss": 1.545, "step": 16732 }, { "epoch": 1.32, "learning_rate": 0.00017862761780778038, "loss": 1.4891, "step": 16733 }, { "epoch": 1.32, "learning_rate": 0.00017861548517766, "loss": 1.5809, "step": 16734 }, { "epoch": 1.32, "learning_rate": 0.0001786033523532563, "loss": 1.5125, "step": 16735 }, { "epoch": 1.32, "learning_rate": 0.00017859121933465165, "loss": 1.5227, "step": 16736 }, { "epoch": 1.32, "learning_rate": 0.00017857908612192835, "loss": 1.5163, "step": 16737 }, { "epoch": 1.32, "learning_rate": 0.00017856695271516884, "loss": 1.5451, "step": 16738 }, { "epoch": 1.32, "learning_rate": 0.00017855481911445553, "loss": 1.5315, "step": 16739 }, { "epoch": 1.32, "learning_rate": 0.00017854268531987072, "loss": 1.5693, "step": 16740 }, { "epoch": 1.32, "learning_rate": 0.00017853055133149683, "loss": 1.4843, "step": 16741 }, { "epoch": 1.32, "learning_rate": 0.0001785184171494162, "loss": 1.5337, "step": 16742 }, { "epoch": 1.32, "learning_rate": 0.0001785062827737113, "loss": 1.5326, "step": 16743 }, { "epoch": 1.32, "learning_rate": 0.00017849414820446448, "loss": 1.5325, "step": 16744 }, { "epoch": 1.32, "learning_rate": 0.00017848201344175806, "loss": 1.5192, "step": 16745 }, { "epoch": 1.32, "learning_rate": 0.0001784698784856746, "loss": 1.5165, "step": 16746 }, { "epoch": 1.32, "learning_rate": 0.00017845774333629625, "loss": 1.5573, "step": 16747 }, { "epoch": 1.32, "learning_rate": 0.00017844560799370557, "loss": 1.5768, "step": 16748 }, { "epoch": 1.32, "learning_rate": 0.00017843347245798493, "loss": 1.512, "step": 16749 }, { "epoch": 1.32, "learning_rate": 0.00017842133672921667, "loss": 1.5548, "step": 16750 }, { "epoch": 1.32, "learning_rate": 0.00017840920080748325, "loss": 1.5565, "step": 16751 }, { "epoch": 1.32, "learning_rate": 0.00017839706469286704, "loss": 1.472, "step": 16752 }, { "epoch": 1.32, "learning_rate": 0.00017838492838545043, "loss": 1.5727, "step": 16753 }, { "epoch": 1.32, "learning_rate": 0.0001783727918853158, "loss": 1.5443, "step": 16754 }, { "epoch": 1.32, "learning_rate": 0.00017836065519254556, "loss": 1.5453, "step": 16755 }, { "epoch": 1.32, "learning_rate": 0.00017834851830722217, "loss": 1.4833, "step": 16756 }, { "epoch": 1.32, "learning_rate": 0.00017833638122942793, "loss": 1.5497, "step": 16757 }, { "epoch": 1.32, "learning_rate": 0.00017832424395924532, "loss": 1.5488, "step": 16758 }, { "epoch": 1.32, "learning_rate": 0.00017831210649675672, "loss": 1.5492, "step": 16759 }, { "epoch": 1.32, "learning_rate": 0.00017829996884204458, "loss": 1.4983, "step": 16760 }, { "epoch": 1.32, "learning_rate": 0.0001782878309951912, "loss": 1.5459, "step": 16761 }, { "epoch": 1.32, "learning_rate": 0.0001782756929562791, "loss": 1.5452, "step": 16762 }, { "epoch": 1.32, "learning_rate": 0.00017826355472539063, "loss": 1.5501, "step": 16763 }, { "epoch": 1.32, "learning_rate": 0.00017825141630260826, "loss": 1.5413, "step": 16764 }, { "epoch": 1.32, "learning_rate": 0.0001782392776880143, "loss": 1.5659, "step": 16765 }, { "epoch": 1.32, "learning_rate": 0.00017822713888169126, "loss": 1.4408, "step": 16766 }, { "epoch": 1.32, "learning_rate": 0.00017821499988372153, "loss": 1.5699, "step": 16767 }, { "epoch": 1.32, "learning_rate": 0.00017820286069418755, "loss": 1.5451, "step": 16768 }, { "epoch": 1.32, "learning_rate": 0.00017819072131317168, "loss": 1.5131, "step": 16769 }, { "epoch": 1.32, "learning_rate": 0.00017817858174075637, "loss": 1.5757, "step": 16770 }, { "epoch": 1.32, "learning_rate": 0.00017816644197702405, "loss": 1.5114, "step": 16771 }, { "epoch": 1.32, "learning_rate": 0.0001781543020220571, "loss": 1.5098, "step": 16772 }, { "epoch": 1.32, "learning_rate": 0.00017814216187593798, "loss": 1.5878, "step": 16773 }, { "epoch": 1.32, "learning_rate": 0.00017813002153874914, "loss": 1.5945, "step": 16774 }, { "epoch": 1.32, "learning_rate": 0.000178117881010573, "loss": 1.5361, "step": 16775 }, { "epoch": 1.32, "learning_rate": 0.0001781057402914919, "loss": 1.5967, "step": 16776 }, { "epoch": 1.32, "learning_rate": 0.00017809359938158838, "loss": 1.486, "step": 16777 }, { "epoch": 1.32, "learning_rate": 0.00017808145828094481, "loss": 1.5486, "step": 16778 }, { "epoch": 1.32, "learning_rate": 0.00017806931698964362, "loss": 1.5307, "step": 16779 }, { "epoch": 1.32, "learning_rate": 0.0001780571755077673, "loss": 1.5512, "step": 16780 }, { "epoch": 1.32, "learning_rate": 0.00017804503383539818, "loss": 1.6243, "step": 16781 }, { "epoch": 1.32, "learning_rate": 0.00017803289197261882, "loss": 1.5505, "step": 16782 }, { "epoch": 1.32, "learning_rate": 0.0001780207499195115, "loss": 1.5021, "step": 16783 }, { "epoch": 1.32, "learning_rate": 0.00017800860767615883, "loss": 1.5306, "step": 16784 }, { "epoch": 1.32, "learning_rate": 0.0001779964652426432, "loss": 1.5352, "step": 16785 }, { "epoch": 1.32, "learning_rate": 0.00017798432261904694, "loss": 1.5816, "step": 16786 }, { "epoch": 1.32, "learning_rate": 0.00017797217980545265, "loss": 1.5438, "step": 16787 }, { "epoch": 1.32, "learning_rate": 0.00017796003680194263, "loss": 1.5259, "step": 16788 }, { "epoch": 1.32, "learning_rate": 0.00017794789360859936, "loss": 1.5361, "step": 16789 }, { "epoch": 1.32, "learning_rate": 0.0001779357502255054, "loss": 1.5418, "step": 16790 }, { "epoch": 1.32, "learning_rate": 0.00017792360665274307, "loss": 1.5507, "step": 16791 }, { "epoch": 1.32, "learning_rate": 0.0001779114628903949, "loss": 1.543, "step": 16792 }, { "epoch": 1.32, "learning_rate": 0.00017789931893854324, "loss": 1.5762, "step": 16793 }, { "epoch": 1.32, "learning_rate": 0.00017788717479727062, "loss": 1.525, "step": 16794 }, { "epoch": 1.32, "learning_rate": 0.0001778750304666595, "loss": 1.5333, "step": 16795 }, { "epoch": 1.32, "learning_rate": 0.00017786288594679229, "loss": 1.5189, "step": 16796 }, { "epoch": 1.32, "learning_rate": 0.00017785074123775145, "loss": 1.5627, "step": 16797 }, { "epoch": 1.32, "learning_rate": 0.00017783859633961946, "loss": 1.5496, "step": 16798 }, { "epoch": 1.32, "learning_rate": 0.00017782645125247879, "loss": 1.511, "step": 16799 }, { "epoch": 1.32, "learning_rate": 0.0001778143059764118, "loss": 1.5038, "step": 16800 }, { "epoch": 1.32, "learning_rate": 0.00017780216051150105, "loss": 1.5805, "step": 16801 }, { "epoch": 1.32, "learning_rate": 0.00017779001485782901, "loss": 1.5102, "step": 16802 }, { "epoch": 1.32, "learning_rate": 0.00017777786901547807, "loss": 1.5165, "step": 16803 }, { "epoch": 1.32, "learning_rate": 0.00017776572298453073, "loss": 1.5041, "step": 16804 }, { "epoch": 1.32, "learning_rate": 0.00017775357676506944, "loss": 1.55, "step": 16805 }, { "epoch": 1.32, "learning_rate": 0.00017774143035717668, "loss": 1.5521, "step": 16806 }, { "epoch": 1.32, "learning_rate": 0.00017772928376093498, "loss": 1.6077, "step": 16807 }, { "epoch": 1.32, "learning_rate": 0.0001777171369764267, "loss": 1.5281, "step": 16808 }, { "epoch": 1.32, "learning_rate": 0.0001777049900037344, "loss": 1.521, "step": 16809 }, { "epoch": 1.32, "learning_rate": 0.00017769284284294045, "loss": 1.5112, "step": 16810 }, { "epoch": 1.32, "learning_rate": 0.00017768069549412734, "loss": 1.5065, "step": 16811 }, { "epoch": 1.32, "learning_rate": 0.00017766854795737768, "loss": 1.5106, "step": 16812 }, { "epoch": 1.32, "learning_rate": 0.00017765640023277376, "loss": 1.5052, "step": 16813 }, { "epoch": 1.32, "learning_rate": 0.00017764425232039824, "loss": 1.5279, "step": 16814 }, { "epoch": 1.32, "learning_rate": 0.00017763210422033342, "loss": 1.571, "step": 16815 }, { "epoch": 1.32, "learning_rate": 0.0001776199559326619, "loss": 1.5413, "step": 16816 }, { "epoch": 1.32, "learning_rate": 0.00017760780745746613, "loss": 1.5198, "step": 16817 }, { "epoch": 1.32, "learning_rate": 0.00017759565879482857, "loss": 1.5507, "step": 16818 }, { "epoch": 1.32, "learning_rate": 0.00017758350994483173, "loss": 1.5093, "step": 16819 }, { "epoch": 1.32, "learning_rate": 0.00017757136090755806, "loss": 1.4829, "step": 16820 }, { "epoch": 1.32, "learning_rate": 0.00017755921168309004, "loss": 1.4869, "step": 16821 }, { "epoch": 1.32, "learning_rate": 0.0001775470622715102, "loss": 1.5069, "step": 16822 }, { "epoch": 1.32, "learning_rate": 0.00017753491267290098, "loss": 1.5489, "step": 16823 }, { "epoch": 1.32, "learning_rate": 0.00017752276288734498, "loss": 1.5179, "step": 16824 }, { "epoch": 1.32, "learning_rate": 0.00017751061291492457, "loss": 1.5328, "step": 16825 }, { "epoch": 1.32, "learning_rate": 0.00017749846275572228, "loss": 1.6075, "step": 16826 }, { "epoch": 1.32, "learning_rate": 0.00017748631240982056, "loss": 1.4778, "step": 16827 }, { "epoch": 1.32, "learning_rate": 0.000177474161877302, "loss": 1.5366, "step": 16828 }, { "epoch": 1.32, "learning_rate": 0.00017746201115824902, "loss": 1.5237, "step": 16829 }, { "epoch": 1.32, "learning_rate": 0.00017744986025274414, "loss": 1.5178, "step": 16830 }, { "epoch": 1.32, "learning_rate": 0.00017743770916086985, "loss": 1.4972, "step": 16831 }, { "epoch": 1.32, "learning_rate": 0.0001774255578827087, "loss": 1.5046, "step": 16832 }, { "epoch": 1.32, "learning_rate": 0.0001774134064183431, "loss": 1.5437, "step": 16833 }, { "epoch": 1.32, "learning_rate": 0.00017740125476785562, "loss": 1.5792, "step": 16834 }, { "epoch": 1.32, "learning_rate": 0.0001773891029313287, "loss": 1.5017, "step": 16835 }, { "epoch": 1.32, "learning_rate": 0.00017737695090884494, "loss": 1.5406, "step": 16836 }, { "epoch": 1.32, "learning_rate": 0.00017736479870048675, "loss": 1.5777, "step": 16837 }, { "epoch": 1.32, "learning_rate": 0.00017735264630633674, "loss": 1.5365, "step": 16838 }, { "epoch": 1.32, "learning_rate": 0.00017734049372647727, "loss": 1.4745, "step": 16839 }, { "epoch": 1.32, "learning_rate": 0.000177328340960991, "loss": 1.5516, "step": 16840 }, { "epoch": 1.33, "learning_rate": 0.0001773161880099604, "loss": 1.4901, "step": 16841 }, { "epoch": 1.33, "learning_rate": 0.0001773040348734679, "loss": 1.5417, "step": 16842 }, { "epoch": 1.33, "learning_rate": 0.00017729188155159607, "loss": 1.5546, "step": 16843 }, { "epoch": 1.33, "learning_rate": 0.00017727972804442742, "loss": 1.5312, "step": 16844 }, { "epoch": 1.33, "learning_rate": 0.0001772675743520445, "loss": 1.5614, "step": 16845 }, { "epoch": 1.33, "learning_rate": 0.00017725542047452978, "loss": 1.5539, "step": 16846 }, { "epoch": 1.33, "learning_rate": 0.00017724326641196578, "loss": 1.516, "step": 16847 }, { "epoch": 1.33, "learning_rate": 0.0001772311121644351, "loss": 1.4982, "step": 16848 }, { "epoch": 1.33, "learning_rate": 0.00017721895773202014, "loss": 1.5659, "step": 16849 }, { "epoch": 1.33, "learning_rate": 0.00017720680311480349, "loss": 1.4694, "step": 16850 }, { "epoch": 1.33, "learning_rate": 0.00017719464831286768, "loss": 1.5999, "step": 16851 }, { "epoch": 1.33, "learning_rate": 0.00017718249332629514, "loss": 1.5603, "step": 16852 }, { "epoch": 1.33, "learning_rate": 0.00017717033815516857, "loss": 1.5591, "step": 16853 }, { "epoch": 1.33, "learning_rate": 0.00017715818279957034, "loss": 1.5166, "step": 16854 }, { "epoch": 1.33, "learning_rate": 0.0001771460272595831, "loss": 1.5476, "step": 16855 }, { "epoch": 1.33, "learning_rate": 0.00017713387153528922, "loss": 1.5324, "step": 16856 }, { "epoch": 1.33, "learning_rate": 0.00017712171562677138, "loss": 1.5162, "step": 16857 }, { "epoch": 1.33, "learning_rate": 0.00017710955953411208, "loss": 1.504, "step": 16858 }, { "epoch": 1.33, "learning_rate": 0.0001770974032573938, "loss": 1.5466, "step": 16859 }, { "epoch": 1.33, "learning_rate": 0.00017708524679669907, "loss": 1.5129, "step": 16860 }, { "epoch": 1.33, "learning_rate": 0.0001770730901521105, "loss": 1.4881, "step": 16861 }, { "epoch": 1.33, "learning_rate": 0.0001770609333237106, "loss": 1.5245, "step": 16862 }, { "epoch": 1.33, "learning_rate": 0.00017704877631158188, "loss": 1.5441, "step": 16863 }, { "epoch": 1.33, "learning_rate": 0.0001770366191158069, "loss": 1.5383, "step": 16864 }, { "epoch": 1.33, "learning_rate": 0.00017702446173646822, "loss": 1.5749, "step": 16865 }, { "epoch": 1.33, "learning_rate": 0.0001770123041736483, "loss": 1.5654, "step": 16866 }, { "epoch": 1.33, "learning_rate": 0.0001770001464274298, "loss": 1.5382, "step": 16867 }, { "epoch": 1.33, "learning_rate": 0.00017698798849789517, "loss": 1.595, "step": 16868 }, { "epoch": 1.33, "learning_rate": 0.00017697583038512696, "loss": 1.5319, "step": 16869 }, { "epoch": 1.33, "learning_rate": 0.0001769636720892078, "loss": 1.5559, "step": 16870 }, { "epoch": 1.33, "learning_rate": 0.00017695151361022017, "loss": 1.5102, "step": 16871 }, { "epoch": 1.33, "learning_rate": 0.00017693935494824667, "loss": 1.579, "step": 16872 }, { "epoch": 1.33, "learning_rate": 0.0001769271961033698, "loss": 1.5354, "step": 16873 }, { "epoch": 1.33, "learning_rate": 0.0001769150370756721, "loss": 1.5841, "step": 16874 }, { "epoch": 1.33, "learning_rate": 0.0001769028778652362, "loss": 1.4942, "step": 16875 }, { "epoch": 1.33, "learning_rate": 0.00017689071847214454, "loss": 1.549, "step": 16876 }, { "epoch": 1.33, "learning_rate": 0.00017687855889647977, "loss": 1.5333, "step": 16877 }, { "epoch": 1.33, "learning_rate": 0.0001768663991383244, "loss": 1.5289, "step": 16878 }, { "epoch": 1.33, "learning_rate": 0.00017685423919776104, "loss": 1.5533, "step": 16879 }, { "epoch": 1.33, "learning_rate": 0.00017684207907487222, "loss": 1.4988, "step": 16880 }, { "epoch": 1.33, "learning_rate": 0.00017682991876974047, "loss": 1.5819, "step": 16881 }, { "epoch": 1.33, "learning_rate": 0.0001768177582824484, "loss": 1.5101, "step": 16882 }, { "epoch": 1.33, "learning_rate": 0.00017680559761307853, "loss": 1.5236, "step": 16883 }, { "epoch": 1.33, "learning_rate": 0.00017679343676171345, "loss": 1.4957, "step": 16884 }, { "epoch": 1.33, "learning_rate": 0.00017678127572843573, "loss": 1.5627, "step": 16885 }, { "epoch": 1.33, "learning_rate": 0.00017676911451332793, "loss": 1.517, "step": 16886 }, { "epoch": 1.33, "learning_rate": 0.0001767569531164726, "loss": 1.5449, "step": 16887 }, { "epoch": 1.33, "learning_rate": 0.00017674479153795232, "loss": 1.5781, "step": 16888 }, { "epoch": 1.33, "learning_rate": 0.00017673262977784966, "loss": 1.5252, "step": 16889 }, { "epoch": 1.33, "learning_rate": 0.0001767204678362472, "loss": 1.4743, "step": 16890 }, { "epoch": 1.33, "learning_rate": 0.0001767083057132275, "loss": 1.537, "step": 16891 }, { "epoch": 1.33, "learning_rate": 0.00017669614340887319, "loss": 1.5471, "step": 16892 }, { "epoch": 1.33, "learning_rate": 0.00017668398092326676, "loss": 1.489, "step": 16893 }, { "epoch": 1.33, "learning_rate": 0.00017667181825649085, "loss": 1.5137, "step": 16894 }, { "epoch": 1.33, "learning_rate": 0.00017665965540862797, "loss": 1.5677, "step": 16895 }, { "epoch": 1.33, "learning_rate": 0.0001766474923797608, "loss": 1.5488, "step": 16896 }, { "epoch": 1.33, "learning_rate": 0.00017663532916997182, "loss": 1.5243, "step": 16897 }, { "epoch": 1.33, "learning_rate": 0.00017662316577934367, "loss": 1.5453, "step": 16898 }, { "epoch": 1.33, "learning_rate": 0.0001766110022079589, "loss": 1.5408, "step": 16899 }, { "epoch": 1.33, "learning_rate": 0.00017659883845590012, "loss": 1.518, "step": 16900 }, { "epoch": 1.33, "learning_rate": 0.00017658667452324987, "loss": 1.4873, "step": 16901 }, { "epoch": 1.33, "learning_rate": 0.00017657451041009085, "loss": 1.5153, "step": 16902 }, { "epoch": 1.33, "learning_rate": 0.0001765623461165055, "loss": 1.5446, "step": 16903 }, { "epoch": 1.33, "learning_rate": 0.00017655018164257653, "loss": 1.5559, "step": 16904 }, { "epoch": 1.33, "learning_rate": 0.00017653801698838646, "loss": 1.5466, "step": 16905 }, { "epoch": 1.33, "learning_rate": 0.0001765258521540179, "loss": 1.5394, "step": 16906 }, { "epoch": 1.33, "learning_rate": 0.0001765136871395534, "loss": 1.5192, "step": 16907 }, { "epoch": 1.33, "learning_rate": 0.00017650152194507564, "loss": 1.5472, "step": 16908 }, { "epoch": 1.33, "learning_rate": 0.00017648935657066714, "loss": 1.5108, "step": 16909 }, { "epoch": 1.33, "learning_rate": 0.00017647719101641056, "loss": 1.5105, "step": 16910 }, { "epoch": 1.33, "learning_rate": 0.00017646502528238849, "loss": 1.5469, "step": 16911 }, { "epoch": 1.33, "learning_rate": 0.00017645285936868343, "loss": 1.5487, "step": 16912 }, { "epoch": 1.33, "learning_rate": 0.0001764406932753781, "loss": 1.4662, "step": 16913 }, { "epoch": 1.33, "learning_rate": 0.00017642852700255505, "loss": 1.5229, "step": 16914 }, { "epoch": 1.33, "learning_rate": 0.00017641636055029683, "loss": 1.544, "step": 16915 }, { "epoch": 1.33, "learning_rate": 0.00017640419391868616, "loss": 1.5466, "step": 16916 }, { "epoch": 1.33, "learning_rate": 0.0001763920271078056, "loss": 1.5433, "step": 16917 }, { "epoch": 1.33, "learning_rate": 0.0001763798601177377, "loss": 1.5114, "step": 16918 }, { "epoch": 1.33, "learning_rate": 0.00017636769294856512, "loss": 1.5626, "step": 16919 }, { "epoch": 1.33, "learning_rate": 0.00017635552560037047, "loss": 1.5096, "step": 16920 }, { "epoch": 1.33, "learning_rate": 0.00017634335807323632, "loss": 1.5325, "step": 16921 }, { "epoch": 1.33, "learning_rate": 0.00017633119036724533, "loss": 1.4989, "step": 16922 }, { "epoch": 1.33, "learning_rate": 0.00017631902248248005, "loss": 1.5228, "step": 16923 }, { "epoch": 1.33, "learning_rate": 0.00017630685441902315, "loss": 1.5481, "step": 16924 }, { "epoch": 1.33, "learning_rate": 0.00017629468617695723, "loss": 1.5035, "step": 16925 }, { "epoch": 1.33, "learning_rate": 0.00017628251775636493, "loss": 1.5009, "step": 16926 }, { "epoch": 1.33, "learning_rate": 0.0001762703491573288, "loss": 1.5316, "step": 16927 }, { "epoch": 1.33, "learning_rate": 0.0001762581803799315, "loss": 1.5404, "step": 16928 }, { "epoch": 1.33, "learning_rate": 0.00017624601142425569, "loss": 1.5459, "step": 16929 }, { "epoch": 1.33, "learning_rate": 0.00017623384229038388, "loss": 1.539, "step": 16930 }, { "epoch": 1.33, "learning_rate": 0.00017622167297839876, "loss": 1.5481, "step": 16931 }, { "epoch": 1.33, "learning_rate": 0.00017620950348838302, "loss": 1.5984, "step": 16932 }, { "epoch": 1.33, "learning_rate": 0.00017619733382041918, "loss": 1.5358, "step": 16933 }, { "epoch": 1.33, "learning_rate": 0.00017618516397458988, "loss": 1.5302, "step": 16934 }, { "epoch": 1.33, "learning_rate": 0.00017617299395097778, "loss": 1.499, "step": 16935 }, { "epoch": 1.33, "learning_rate": 0.0001761608237496655, "loss": 1.4916, "step": 16936 }, { "epoch": 1.33, "learning_rate": 0.00017614865337073568, "loss": 1.5617, "step": 16937 }, { "epoch": 1.33, "learning_rate": 0.00017613648281427087, "loss": 1.528, "step": 16938 }, { "epoch": 1.33, "learning_rate": 0.00017612431208035382, "loss": 1.5468, "step": 16939 }, { "epoch": 1.33, "learning_rate": 0.0001761121411690671, "loss": 1.5189, "step": 16940 }, { "epoch": 1.33, "learning_rate": 0.00017609997008049335, "loss": 1.5031, "step": 16941 }, { "epoch": 1.33, "learning_rate": 0.0001760877988147152, "loss": 1.5819, "step": 16942 }, { "epoch": 1.33, "learning_rate": 0.00017607562737181532, "loss": 1.5215, "step": 16943 }, { "epoch": 1.33, "learning_rate": 0.00017606345575187627, "loss": 1.5359, "step": 16944 }, { "epoch": 1.33, "learning_rate": 0.00017605128395498074, "loss": 1.5365, "step": 16945 }, { "epoch": 1.33, "learning_rate": 0.0001760391119812114, "loss": 1.5682, "step": 16946 }, { "epoch": 1.33, "learning_rate": 0.00017602693983065083, "loss": 1.5378, "step": 16947 }, { "epoch": 1.33, "learning_rate": 0.00017601476750338176, "loss": 1.5518, "step": 16948 }, { "epoch": 1.33, "learning_rate": 0.00017600259499948672, "loss": 1.5115, "step": 16949 }, { "epoch": 1.33, "learning_rate": 0.00017599042231904844, "loss": 1.4951, "step": 16950 }, { "epoch": 1.33, "learning_rate": 0.0001759782494621495, "loss": 1.5535, "step": 16951 }, { "epoch": 1.33, "learning_rate": 0.00017596607642887262, "loss": 1.484, "step": 16952 }, { "epoch": 1.33, "learning_rate": 0.00017595390321930042, "loss": 1.4941, "step": 16953 }, { "epoch": 1.33, "learning_rate": 0.00017594172983351544, "loss": 1.5596, "step": 16954 }, { "epoch": 1.33, "learning_rate": 0.00017592955627160058, "loss": 1.5271, "step": 16955 }, { "epoch": 1.33, "learning_rate": 0.00017591738253363825, "loss": 1.4967, "step": 16956 }, { "epoch": 1.33, "learning_rate": 0.0001759052086197112, "loss": 1.5269, "step": 16957 }, { "epoch": 1.33, "learning_rate": 0.0001758930345299021, "loss": 1.5156, "step": 16958 }, { "epoch": 1.33, "learning_rate": 0.00017588086026429356, "loss": 1.4913, "step": 16959 }, { "epoch": 1.33, "learning_rate": 0.0001758686858229683, "loss": 1.5319, "step": 16960 }, { "epoch": 1.33, "learning_rate": 0.0001758565112060089, "loss": 1.6106, "step": 16961 }, { "epoch": 1.33, "learning_rate": 0.00017584433641349806, "loss": 1.5156, "step": 16962 }, { "epoch": 1.33, "learning_rate": 0.00017583216144551845, "loss": 1.4972, "step": 16963 }, { "epoch": 1.33, "learning_rate": 0.0001758199863021527, "loss": 1.5639, "step": 16964 }, { "epoch": 1.33, "learning_rate": 0.00017580781098348357, "loss": 1.5224, "step": 16965 }, { "epoch": 1.33, "learning_rate": 0.00017579563548959356, "loss": 1.549, "step": 16966 }, { "epoch": 1.33, "learning_rate": 0.00017578345982056546, "loss": 1.5461, "step": 16967 }, { "epoch": 1.34, "learning_rate": 0.0001757712839764819, "loss": 1.5276, "step": 16968 }, { "epoch": 1.34, "learning_rate": 0.0001757591079574255, "loss": 1.5419, "step": 16969 }, { "epoch": 1.34, "learning_rate": 0.000175746931763479, "loss": 1.5809, "step": 16970 }, { "epoch": 1.34, "learning_rate": 0.00017573475539472502, "loss": 1.4794, "step": 16971 }, { "epoch": 1.34, "learning_rate": 0.0001757225788512463, "loss": 1.5131, "step": 16972 }, { "epoch": 1.34, "learning_rate": 0.00017571040213312542, "loss": 1.5279, "step": 16973 }, { "epoch": 1.34, "learning_rate": 0.0001756982252404451, "loss": 1.5759, "step": 16974 }, { "epoch": 1.34, "learning_rate": 0.00017568604817328804, "loss": 1.5113, "step": 16975 }, { "epoch": 1.34, "learning_rate": 0.00017567387093173688, "loss": 1.5393, "step": 16976 }, { "epoch": 1.34, "learning_rate": 0.00017566169351587434, "loss": 1.5392, "step": 16977 }, { "epoch": 1.34, "learning_rate": 0.00017564951592578294, "loss": 1.5329, "step": 16978 }, { "epoch": 1.34, "learning_rate": 0.0001756373381615456, "loss": 1.5479, "step": 16979 }, { "epoch": 1.34, "learning_rate": 0.00017562516022324483, "loss": 1.5563, "step": 16980 }, { "epoch": 1.34, "learning_rate": 0.00017561298211096337, "loss": 1.5138, "step": 16981 }, { "epoch": 1.34, "learning_rate": 0.00017560080382478393, "loss": 1.4542, "step": 16982 }, { "epoch": 1.34, "learning_rate": 0.00017558862536478913, "loss": 1.5495, "step": 16983 }, { "epoch": 1.34, "learning_rate": 0.0001755764467310617, "loss": 1.5381, "step": 16984 }, { "epoch": 1.34, "learning_rate": 0.0001755642679236843, "loss": 1.5615, "step": 16985 }, { "epoch": 1.34, "learning_rate": 0.00017555208894273958, "loss": 1.5469, "step": 16986 }, { "epoch": 1.34, "learning_rate": 0.00017553990978831036, "loss": 1.5218, "step": 16987 }, { "epoch": 1.34, "learning_rate": 0.0001755277304604792, "loss": 1.5387, "step": 16988 }, { "epoch": 1.34, "learning_rate": 0.00017551555095932886, "loss": 1.5845, "step": 16989 }, { "epoch": 1.34, "learning_rate": 0.00017550337128494198, "loss": 1.52, "step": 16990 }, { "epoch": 1.34, "learning_rate": 0.0001754911914374013, "loss": 1.4728, "step": 16991 }, { "epoch": 1.34, "learning_rate": 0.00017547901141678953, "loss": 1.543, "step": 16992 }, { "epoch": 1.34, "learning_rate": 0.00017546683122318925, "loss": 1.5253, "step": 16993 }, { "epoch": 1.34, "learning_rate": 0.00017545465085668332, "loss": 1.5154, "step": 16994 }, { "epoch": 1.34, "learning_rate": 0.00017544247031735434, "loss": 1.5086, "step": 16995 }, { "epoch": 1.34, "learning_rate": 0.000175430289605285, "loss": 1.5095, "step": 16996 }, { "epoch": 1.34, "learning_rate": 0.00017541810872055805, "loss": 1.4928, "step": 16997 }, { "epoch": 1.34, "learning_rate": 0.00017540592766325617, "loss": 1.52, "step": 16998 }, { "epoch": 1.34, "learning_rate": 0.00017539374643346206, "loss": 1.5822, "step": 16999 }, { "epoch": 1.34, "learning_rate": 0.00017538156503125842, "loss": 1.4905, "step": 17000 }, { "epoch": 1.34, "learning_rate": 0.0001753693834567279, "loss": 1.5511, "step": 17001 }, { "epoch": 1.34, "learning_rate": 0.00017535720170995335, "loss": 1.5317, "step": 17002 }, { "epoch": 1.34, "learning_rate": 0.00017534501979101736, "loss": 1.5585, "step": 17003 }, { "epoch": 1.34, "learning_rate": 0.0001753328377000027, "loss": 1.5458, "step": 17004 }, { "epoch": 1.34, "learning_rate": 0.000175320655436992, "loss": 1.5033, "step": 17005 }, { "epoch": 1.34, "learning_rate": 0.0001753084730020681, "loss": 1.5388, "step": 17006 }, { "epoch": 1.34, "learning_rate": 0.00017529629039531356, "loss": 1.5634, "step": 17007 }, { "epoch": 1.34, "learning_rate": 0.0001752841076168112, "loss": 1.4858, "step": 17008 }, { "epoch": 1.34, "learning_rate": 0.0001752719246666437, "loss": 1.4894, "step": 17009 }, { "epoch": 1.34, "learning_rate": 0.00017525974154489375, "loss": 1.541, "step": 17010 }, { "epoch": 1.34, "learning_rate": 0.00017524755825164417, "loss": 1.5027, "step": 17011 }, { "epoch": 1.34, "learning_rate": 0.00017523537478697753, "loss": 1.5733, "step": 17012 }, { "epoch": 1.34, "learning_rate": 0.00017522319115097665, "loss": 1.5385, "step": 17013 }, { "epoch": 1.34, "learning_rate": 0.00017521100734372422, "loss": 1.4957, "step": 17014 }, { "epoch": 1.34, "learning_rate": 0.00017519882336530297, "loss": 1.5678, "step": 17015 }, { "epoch": 1.34, "learning_rate": 0.0001751866392157956, "loss": 1.5918, "step": 17016 }, { "epoch": 1.34, "learning_rate": 0.0001751744548952848, "loss": 1.5545, "step": 17017 }, { "epoch": 1.34, "learning_rate": 0.00017516227040385344, "loss": 1.4933, "step": 17018 }, { "epoch": 1.34, "learning_rate": 0.0001751500857415841, "loss": 1.5343, "step": 17019 }, { "epoch": 1.34, "learning_rate": 0.00017513790090855955, "loss": 1.5413, "step": 17020 }, { "epoch": 1.34, "learning_rate": 0.00017512571590486256, "loss": 1.5172, "step": 17021 }, { "epoch": 1.34, "learning_rate": 0.0001751135307305758, "loss": 1.5617, "step": 17022 }, { "epoch": 1.34, "learning_rate": 0.00017510134538578203, "loss": 1.5786, "step": 17023 }, { "epoch": 1.34, "learning_rate": 0.00017508915987056396, "loss": 1.5034, "step": 17024 }, { "epoch": 1.34, "learning_rate": 0.00017507697418500437, "loss": 1.5852, "step": 17025 }, { "epoch": 1.34, "learning_rate": 0.00017506478832918595, "loss": 1.5136, "step": 17026 }, { "epoch": 1.34, "learning_rate": 0.00017505260230319143, "loss": 1.5282, "step": 17027 }, { "epoch": 1.34, "learning_rate": 0.00017504041610710359, "loss": 1.4995, "step": 17028 }, { "epoch": 1.34, "learning_rate": 0.00017502822974100514, "loss": 1.5112, "step": 17029 }, { "epoch": 1.34, "learning_rate": 0.0001750160432049788, "loss": 1.5431, "step": 17030 }, { "epoch": 1.34, "learning_rate": 0.0001750038564991074, "loss": 1.4808, "step": 17031 }, { "epoch": 1.34, "learning_rate": 0.00017499166962347355, "loss": 1.5407, "step": 17032 }, { "epoch": 1.34, "learning_rate": 0.00017497948257816002, "loss": 1.5268, "step": 17033 }, { "epoch": 1.34, "learning_rate": 0.00017496729536324964, "loss": 1.5038, "step": 17034 }, { "epoch": 1.34, "learning_rate": 0.00017495510797882512, "loss": 1.5262, "step": 17035 }, { "epoch": 1.34, "learning_rate": 0.00017494292042496916, "loss": 1.5306, "step": 17036 }, { "epoch": 1.34, "learning_rate": 0.00017493073270176453, "loss": 1.5508, "step": 17037 }, { "epoch": 1.34, "learning_rate": 0.00017491854480929404, "loss": 1.5083, "step": 17038 }, { "epoch": 1.34, "learning_rate": 0.0001749063567476403, "loss": 1.5487, "step": 17039 }, { "epoch": 1.34, "learning_rate": 0.0001748941685168862, "loss": 1.5336, "step": 17040 }, { "epoch": 1.34, "learning_rate": 0.0001748819801171144, "loss": 1.5252, "step": 17041 }, { "epoch": 1.34, "learning_rate": 0.00017486979154840765, "loss": 1.5252, "step": 17042 }, { "epoch": 1.34, "learning_rate": 0.00017485760281084884, "loss": 1.5018, "step": 17043 }, { "epoch": 1.34, "learning_rate": 0.00017484541390452055, "loss": 1.524, "step": 17044 }, { "epoch": 1.34, "learning_rate": 0.00017483322482950565, "loss": 1.5282, "step": 17045 }, { "epoch": 1.34, "learning_rate": 0.00017482103558588683, "loss": 1.5114, "step": 17046 }, { "epoch": 1.34, "learning_rate": 0.00017480884617374689, "loss": 1.5583, "step": 17047 }, { "epoch": 1.34, "learning_rate": 0.00017479665659316857, "loss": 1.5252, "step": 17048 }, { "epoch": 1.34, "learning_rate": 0.00017478446684423462, "loss": 1.5146, "step": 17049 }, { "epoch": 1.34, "learning_rate": 0.00017477227692702784, "loss": 1.5061, "step": 17050 }, { "epoch": 1.34, "learning_rate": 0.00017476008684163093, "loss": 1.5881, "step": 17051 }, { "epoch": 1.34, "learning_rate": 0.00017474789658812677, "loss": 1.5007, "step": 17052 }, { "epoch": 1.34, "learning_rate": 0.000174735706166598, "loss": 1.5015, "step": 17053 }, { "epoch": 1.34, "learning_rate": 0.00017472351557712743, "loss": 1.4902, "step": 17054 }, { "epoch": 1.34, "learning_rate": 0.00017471132481979785, "loss": 1.5271, "step": 17055 }, { "epoch": 1.34, "learning_rate": 0.000174699133894692, "loss": 1.5003, "step": 17056 }, { "epoch": 1.34, "learning_rate": 0.00017468694280189267, "loss": 1.5442, "step": 17057 }, { "epoch": 1.34, "learning_rate": 0.0001746747515414826, "loss": 1.5694, "step": 17058 }, { "epoch": 1.34, "learning_rate": 0.00017466256011354462, "loss": 1.5106, "step": 17059 }, { "epoch": 1.34, "learning_rate": 0.00017465036851816145, "loss": 1.5306, "step": 17060 }, { "epoch": 1.34, "learning_rate": 0.0001746381767554159, "loss": 1.4954, "step": 17061 }, { "epoch": 1.34, "learning_rate": 0.0001746259848253907, "loss": 1.5789, "step": 17062 }, { "epoch": 1.34, "learning_rate": 0.00017461379272816867, "loss": 1.5571, "step": 17063 }, { "epoch": 1.34, "learning_rate": 0.00017460160046383252, "loss": 1.5056, "step": 17064 }, { "epoch": 1.34, "learning_rate": 0.00017458940803246516, "loss": 1.5418, "step": 17065 }, { "epoch": 1.34, "learning_rate": 0.0001745772154341492, "loss": 1.5571, "step": 17066 }, { "epoch": 1.34, "learning_rate": 0.00017456502266896757, "loss": 1.5968, "step": 17067 }, { "epoch": 1.34, "learning_rate": 0.000174552829737003, "loss": 1.5205, "step": 17068 }, { "epoch": 1.34, "learning_rate": 0.00017454063663833823, "loss": 1.5502, "step": 17069 }, { "epoch": 1.34, "learning_rate": 0.0001745284433730561, "loss": 1.563, "step": 17070 }, { "epoch": 1.34, "learning_rate": 0.00017451624994123936, "loss": 1.5499, "step": 17071 }, { "epoch": 1.34, "learning_rate": 0.00017450405634297084, "loss": 1.5024, "step": 17072 }, { "epoch": 1.34, "learning_rate": 0.00017449186257833326, "loss": 1.5339, "step": 17073 }, { "epoch": 1.34, "learning_rate": 0.00017447966864740948, "loss": 1.5217, "step": 17074 }, { "epoch": 1.34, "learning_rate": 0.00017446747455028227, "loss": 1.4797, "step": 17075 }, { "epoch": 1.34, "learning_rate": 0.00017445528028703437, "loss": 1.522, "step": 17076 }, { "epoch": 1.34, "learning_rate": 0.00017444308585774866, "loss": 1.5376, "step": 17077 }, { "epoch": 1.34, "learning_rate": 0.00017443089126250786, "loss": 1.5431, "step": 17078 }, { "epoch": 1.34, "learning_rate": 0.0001744186965013948, "loss": 1.5494, "step": 17079 }, { "epoch": 1.34, "learning_rate": 0.0001744065015744922, "loss": 1.5454, "step": 17080 }, { "epoch": 1.34, "learning_rate": 0.00017439430648188303, "loss": 1.5837, "step": 17081 }, { "epoch": 1.34, "learning_rate": 0.0001743821112236499, "loss": 1.543, "step": 17082 }, { "epoch": 1.34, "learning_rate": 0.00017436991579987572, "loss": 1.4887, "step": 17083 }, { "epoch": 1.34, "learning_rate": 0.00017435772021064328, "loss": 1.5369, "step": 17084 }, { "epoch": 1.34, "learning_rate": 0.00017434552445603533, "loss": 1.5276, "step": 17085 }, { "epoch": 1.34, "learning_rate": 0.0001743333285361347, "loss": 1.5348, "step": 17086 }, { "epoch": 1.34, "learning_rate": 0.00017432113245102423, "loss": 1.5086, "step": 17087 }, { "epoch": 1.34, "learning_rate": 0.00017430893620078665, "loss": 1.5535, "step": 17088 }, { "epoch": 1.34, "learning_rate": 0.00017429673978550483, "loss": 1.5234, "step": 17089 }, { "epoch": 1.34, "learning_rate": 0.00017428454320526156, "loss": 1.4983, "step": 17090 }, { "epoch": 1.34, "learning_rate": 0.00017427234646013966, "loss": 1.5142, "step": 17091 }, { "epoch": 1.34, "learning_rate": 0.00017426014955022193, "loss": 1.5642, "step": 17092 }, { "epoch": 1.34, "learning_rate": 0.0001742479524755911, "loss": 1.4969, "step": 17093 }, { "epoch": 1.34, "learning_rate": 0.00017423575523633011, "loss": 1.5485, "step": 17094 }, { "epoch": 1.35, "learning_rate": 0.0001742235578325217, "loss": 1.5218, "step": 17095 }, { "epoch": 1.35, "learning_rate": 0.00017421136026424873, "loss": 1.5082, "step": 17096 }, { "epoch": 1.35, "learning_rate": 0.00017419916253159394, "loss": 1.583, "step": 17097 }, { "epoch": 1.35, "learning_rate": 0.00017418696463464018, "loss": 1.5687, "step": 17098 }, { "epoch": 1.35, "learning_rate": 0.00017417476657347034, "loss": 1.5099, "step": 17099 }, { "epoch": 1.35, "learning_rate": 0.00017416256834816714, "loss": 1.583, "step": 17100 }, { "epoch": 1.35, "learning_rate": 0.00017415036995881345, "loss": 1.5553, "step": 17101 }, { "epoch": 1.35, "learning_rate": 0.00017413817140549205, "loss": 1.5076, "step": 17102 }, { "epoch": 1.35, "learning_rate": 0.0001741259726882858, "loss": 1.5539, "step": 17103 }, { "epoch": 1.35, "learning_rate": 0.0001741137738072775, "loss": 1.5487, "step": 17104 }, { "epoch": 1.35, "learning_rate": 0.00017410157476255, "loss": 1.5221, "step": 17105 }, { "epoch": 1.35, "learning_rate": 0.0001740893755541861, "loss": 1.5662, "step": 17106 }, { "epoch": 1.35, "learning_rate": 0.0001740771761822686, "loss": 1.5561, "step": 17107 }, { "epoch": 1.35, "learning_rate": 0.00017406497664688045, "loss": 1.4688, "step": 17108 }, { "epoch": 1.35, "learning_rate": 0.00017405277694810433, "loss": 1.5229, "step": 17109 }, { "epoch": 1.35, "learning_rate": 0.0001740405770860231, "loss": 1.5272, "step": 17110 }, { "epoch": 1.35, "learning_rate": 0.00017402837706071962, "loss": 1.5753, "step": 17111 }, { "epoch": 1.35, "learning_rate": 0.00017401617687227676, "loss": 1.6127, "step": 17112 }, { "epoch": 1.35, "learning_rate": 0.00017400397652077732, "loss": 1.5643, "step": 17113 }, { "epoch": 1.35, "learning_rate": 0.00017399177600630413, "loss": 1.541, "step": 17114 }, { "epoch": 1.35, "learning_rate": 0.00017397957532894, "loss": 1.53, "step": 17115 }, { "epoch": 1.35, "learning_rate": 0.0001739673744887678, "loss": 1.4654, "step": 17116 }, { "epoch": 1.35, "learning_rate": 0.0001739551734858703, "loss": 1.5555, "step": 17117 }, { "epoch": 1.35, "learning_rate": 0.0001739429723203305, "loss": 1.5291, "step": 17118 }, { "epoch": 1.35, "learning_rate": 0.00017393077099223098, "loss": 1.5445, "step": 17119 }, { "epoch": 1.35, "learning_rate": 0.00017391856950165483, "loss": 1.5669, "step": 17120 }, { "epoch": 1.35, "learning_rate": 0.00017390636784868477, "loss": 1.551, "step": 17121 }, { "epoch": 1.35, "learning_rate": 0.00017389416603340367, "loss": 1.5353, "step": 17122 }, { "epoch": 1.35, "learning_rate": 0.00017388196405589438, "loss": 1.5334, "step": 17123 }, { "epoch": 1.35, "learning_rate": 0.0001738697619162397, "loss": 1.5425, "step": 17124 }, { "epoch": 1.35, "learning_rate": 0.00017385755961452253, "loss": 1.5194, "step": 17125 }, { "epoch": 1.35, "learning_rate": 0.00017384535715082573, "loss": 1.5256, "step": 17126 }, { "epoch": 1.35, "learning_rate": 0.00017383315452523202, "loss": 1.5191, "step": 17127 }, { "epoch": 1.35, "learning_rate": 0.00017382095173782444, "loss": 1.5448, "step": 17128 }, { "epoch": 1.35, "learning_rate": 0.0001738087487886857, "loss": 1.5086, "step": 17129 }, { "epoch": 1.35, "learning_rate": 0.00017379654567789871, "loss": 1.5494, "step": 17130 }, { "epoch": 1.35, "learning_rate": 0.00017378434240554631, "loss": 1.5341, "step": 17131 }, { "epoch": 1.35, "learning_rate": 0.00017377213897171132, "loss": 1.5699, "step": 17132 }, { "epoch": 1.35, "learning_rate": 0.00017375993537647666, "loss": 1.5045, "step": 17133 }, { "epoch": 1.35, "learning_rate": 0.00017374773161992513, "loss": 1.5158, "step": 17134 }, { "epoch": 1.35, "learning_rate": 0.00017373552770213958, "loss": 1.499, "step": 17135 }, { "epoch": 1.35, "learning_rate": 0.00017372332362320292, "loss": 1.5534, "step": 17136 }, { "epoch": 1.35, "learning_rate": 0.000173711119383198, "loss": 1.5489, "step": 17137 }, { "epoch": 1.35, "learning_rate": 0.00017369891498220767, "loss": 1.557, "step": 17138 }, { "epoch": 1.35, "learning_rate": 0.00017368671042031477, "loss": 1.5578, "step": 17139 }, { "epoch": 1.35, "learning_rate": 0.0001736745056976022, "loss": 1.4834, "step": 17140 }, { "epoch": 1.35, "learning_rate": 0.00017366230081415274, "loss": 1.5468, "step": 17141 }, { "epoch": 1.35, "learning_rate": 0.00017365009577004938, "loss": 1.5077, "step": 17142 }, { "epoch": 1.35, "learning_rate": 0.00017363789056537487, "loss": 1.4729, "step": 17143 }, { "epoch": 1.35, "learning_rate": 0.0001736256852002121, "loss": 1.5503, "step": 17144 }, { "epoch": 1.35, "learning_rate": 0.0001736134796746441, "loss": 1.4944, "step": 17145 }, { "epoch": 1.35, "learning_rate": 0.00017360127398875349, "loss": 1.5543, "step": 17146 }, { "epoch": 1.35, "learning_rate": 0.00017358906814262328, "loss": 1.5363, "step": 17147 }, { "epoch": 1.35, "learning_rate": 0.00017357686213633635, "loss": 1.5412, "step": 17148 }, { "epoch": 1.35, "learning_rate": 0.0001735646559699755, "loss": 1.5184, "step": 17149 }, { "epoch": 1.35, "learning_rate": 0.00017355244964362363, "loss": 1.5248, "step": 17150 }, { "epoch": 1.35, "learning_rate": 0.00017354024315736362, "loss": 1.5704, "step": 17151 }, { "epoch": 1.35, "learning_rate": 0.00017352803651127837, "loss": 1.5201, "step": 17152 }, { "epoch": 1.35, "learning_rate": 0.00017351582970545073, "loss": 1.5442, "step": 17153 }, { "epoch": 1.35, "learning_rate": 0.0001735036227399636, "loss": 1.6035, "step": 17154 }, { "epoch": 1.35, "learning_rate": 0.00017349141561489987, "loss": 1.4942, "step": 17155 }, { "epoch": 1.35, "learning_rate": 0.00017347920833034233, "loss": 1.5099, "step": 17156 }, { "epoch": 1.35, "learning_rate": 0.00017346700088637394, "loss": 1.4712, "step": 17157 }, { "epoch": 1.35, "learning_rate": 0.00017345479328307754, "loss": 1.5261, "step": 17158 }, { "epoch": 1.35, "learning_rate": 0.0001734425855205361, "loss": 1.5015, "step": 17159 }, { "epoch": 1.35, "learning_rate": 0.0001734303775988324, "loss": 1.5635, "step": 17160 }, { "epoch": 1.35, "learning_rate": 0.00017341816951804936, "loss": 1.5621, "step": 17161 }, { "epoch": 1.35, "learning_rate": 0.0001734059612782699, "loss": 1.5212, "step": 17162 }, { "epoch": 1.35, "learning_rate": 0.00017339375287957686, "loss": 1.5856, "step": 17163 }, { "epoch": 1.35, "learning_rate": 0.00017338154432205318, "loss": 1.5623, "step": 17164 }, { "epoch": 1.35, "learning_rate": 0.0001733693356057817, "loss": 1.5092, "step": 17165 }, { "epoch": 1.35, "learning_rate": 0.0001733571267308453, "loss": 1.5434, "step": 17166 }, { "epoch": 1.35, "learning_rate": 0.0001733449176973269, "loss": 1.4802, "step": 17167 }, { "epoch": 1.35, "learning_rate": 0.0001733327085053094, "loss": 1.4992, "step": 17168 }, { "epoch": 1.35, "learning_rate": 0.00017332049915487572, "loss": 1.5504, "step": 17169 }, { "epoch": 1.35, "learning_rate": 0.0001733082896461087, "loss": 1.5019, "step": 17170 }, { "epoch": 1.35, "learning_rate": 0.00017329607997909125, "loss": 1.5464, "step": 17171 }, { "epoch": 1.35, "learning_rate": 0.00017328387015390627, "loss": 1.5431, "step": 17172 }, { "epoch": 1.35, "learning_rate": 0.00017327166017063665, "loss": 1.5066, "step": 17173 }, { "epoch": 1.35, "learning_rate": 0.00017325945002936532, "loss": 1.5267, "step": 17174 }, { "epoch": 1.35, "learning_rate": 0.00017324723973017515, "loss": 1.5209, "step": 17175 }, { "epoch": 1.35, "learning_rate": 0.00017323502927314905, "loss": 1.5405, "step": 17176 }, { "epoch": 1.35, "learning_rate": 0.00017322281865836994, "loss": 1.5222, "step": 17177 }, { "epoch": 1.35, "learning_rate": 0.00017321060788592067, "loss": 1.5216, "step": 17178 }, { "epoch": 1.35, "learning_rate": 0.00017319839695588424, "loss": 1.5031, "step": 17179 }, { "epoch": 1.35, "learning_rate": 0.00017318618586834345, "loss": 1.5291, "step": 17180 }, { "epoch": 1.35, "learning_rate": 0.00017317397462338126, "loss": 1.5053, "step": 17181 }, { "epoch": 1.35, "learning_rate": 0.00017316176322108056, "loss": 1.5045, "step": 17182 }, { "epoch": 1.35, "learning_rate": 0.0001731495516615243, "loss": 1.5722, "step": 17183 }, { "epoch": 1.35, "learning_rate": 0.00017313733994479531, "loss": 1.4852, "step": 17184 }, { "epoch": 1.35, "learning_rate": 0.0001731251280709766, "loss": 1.5937, "step": 17185 }, { "epoch": 1.35, "learning_rate": 0.00017311291604015105, "loss": 1.5416, "step": 17186 }, { "epoch": 1.35, "learning_rate": 0.0001731007038524015, "loss": 1.5481, "step": 17187 }, { "epoch": 1.35, "learning_rate": 0.00017308849150781094, "loss": 1.5503, "step": 17188 }, { "epoch": 1.35, "learning_rate": 0.00017307627900646228, "loss": 1.6046, "step": 17189 }, { "epoch": 1.35, "learning_rate": 0.0001730640663484384, "loss": 1.5427, "step": 17190 }, { "epoch": 1.35, "learning_rate": 0.00017305185353382223, "loss": 1.5582, "step": 17191 }, { "epoch": 1.35, "learning_rate": 0.00017303964056269668, "loss": 1.5239, "step": 17192 }, { "epoch": 1.35, "learning_rate": 0.0001730274274351447, "loss": 1.5528, "step": 17193 }, { "epoch": 1.35, "learning_rate": 0.00017301521415124925, "loss": 1.5167, "step": 17194 }, { "epoch": 1.35, "learning_rate": 0.00017300300071109315, "loss": 1.4923, "step": 17195 }, { "epoch": 1.35, "learning_rate": 0.0001729907871147594, "loss": 1.5405, "step": 17196 }, { "epoch": 1.35, "learning_rate": 0.00017297857336233085, "loss": 1.5119, "step": 17197 }, { "epoch": 1.35, "learning_rate": 0.0001729663594538905, "loss": 1.4842, "step": 17198 }, { "epoch": 1.35, "learning_rate": 0.0001729541453895212, "loss": 1.5193, "step": 17199 }, { "epoch": 1.35, "learning_rate": 0.00017294193116930594, "loss": 1.5912, "step": 17200 }, { "epoch": 1.35, "learning_rate": 0.00017292971679332765, "loss": 1.5508, "step": 17201 }, { "epoch": 1.35, "learning_rate": 0.00017291750226166918, "loss": 1.5504, "step": 17202 }, { "epoch": 1.35, "learning_rate": 0.0001729052875744136, "loss": 1.5434, "step": 17203 }, { "epoch": 1.35, "learning_rate": 0.00017289307273164373, "loss": 1.5311, "step": 17204 }, { "epoch": 1.35, "learning_rate": 0.0001728808577334425, "loss": 1.4916, "step": 17205 }, { "epoch": 1.35, "learning_rate": 0.00017286864257989287, "loss": 1.5247, "step": 17206 }, { "epoch": 1.35, "learning_rate": 0.0001728564272710778, "loss": 1.5345, "step": 17207 }, { "epoch": 1.35, "learning_rate": 0.0001728442118070802, "loss": 1.5934, "step": 17208 }, { "epoch": 1.35, "learning_rate": 0.000172831996187983, "loss": 1.5649, "step": 17209 }, { "epoch": 1.35, "learning_rate": 0.00017281978041386913, "loss": 1.5375, "step": 17210 }, { "epoch": 1.35, "learning_rate": 0.0001728075644848216, "loss": 1.5787, "step": 17211 }, { "epoch": 1.35, "learning_rate": 0.00017279534840092324, "loss": 1.5557, "step": 17212 }, { "epoch": 1.35, "learning_rate": 0.00017278313216225705, "loss": 1.5696, "step": 17213 }, { "epoch": 1.35, "learning_rate": 0.00017277091576890598, "loss": 1.5153, "step": 17214 }, { "epoch": 1.35, "learning_rate": 0.00017275869922095296, "loss": 1.5379, "step": 17215 }, { "epoch": 1.35, "learning_rate": 0.00017274648251848092, "loss": 1.4985, "step": 17216 }, { "epoch": 1.35, "learning_rate": 0.0001727342656615728, "loss": 1.5191, "step": 17217 }, { "epoch": 1.35, "learning_rate": 0.00017272204865031163, "loss": 1.6207, "step": 17218 }, { "epoch": 1.35, "learning_rate": 0.00017270983148478023, "loss": 1.5099, "step": 17219 }, { "epoch": 1.35, "learning_rate": 0.00017269761416506164, "loss": 1.5572, "step": 17220 }, { "epoch": 1.35, "learning_rate": 0.0001726853966912387, "loss": 1.483, "step": 17221 }, { "epoch": 1.36, "learning_rate": 0.0001726731790633945, "loss": 1.524, "step": 17222 }, { "epoch": 1.36, "learning_rate": 0.00017266096128161192, "loss": 1.5318, "step": 17223 }, { "epoch": 1.36, "learning_rate": 0.0001726487433459739, "loss": 1.52, "step": 17224 }, { "epoch": 1.36, "learning_rate": 0.00017263652525656347, "loss": 1.5552, "step": 17225 }, { "epoch": 1.36, "learning_rate": 0.00017262430701346347, "loss": 1.484, "step": 17226 }, { "epoch": 1.36, "learning_rate": 0.0001726120886167569, "loss": 1.5453, "step": 17227 }, { "epoch": 1.36, "learning_rate": 0.00017259987006652678, "loss": 1.4997, "step": 17228 }, { "epoch": 1.36, "learning_rate": 0.00017258765136285597, "loss": 1.4844, "step": 17229 }, { "epoch": 1.36, "learning_rate": 0.0001725754325058275, "loss": 1.5499, "step": 17230 }, { "epoch": 1.36, "learning_rate": 0.00017256321349552427, "loss": 1.553, "step": 17231 }, { "epoch": 1.36, "learning_rate": 0.0001725509943320293, "loss": 1.4895, "step": 17232 }, { "epoch": 1.36, "learning_rate": 0.00017253877501542553, "loss": 1.5023, "step": 17233 }, { "epoch": 1.36, "learning_rate": 0.00017252655554579588, "loss": 1.5057, "step": 17234 }, { "epoch": 1.36, "learning_rate": 0.00017251433592322337, "loss": 1.5527, "step": 17235 }, { "epoch": 1.36, "learning_rate": 0.00017250211614779093, "loss": 1.5732, "step": 17236 }, { "epoch": 1.36, "learning_rate": 0.00017248989621958155, "loss": 1.5469, "step": 17237 }, { "epoch": 1.36, "learning_rate": 0.00017247767613867818, "loss": 1.5501, "step": 17238 }, { "epoch": 1.36, "learning_rate": 0.0001724654559051638, "loss": 1.4859, "step": 17239 }, { "epoch": 1.36, "learning_rate": 0.00017245323551912136, "loss": 1.5474, "step": 17240 }, { "epoch": 1.36, "learning_rate": 0.00017244101498063385, "loss": 1.5508, "step": 17241 }, { "epoch": 1.36, "learning_rate": 0.00017242879428978428, "loss": 1.5616, "step": 17242 }, { "epoch": 1.36, "learning_rate": 0.00017241657344665553, "loss": 1.4713, "step": 17243 }, { "epoch": 1.36, "learning_rate": 0.00017240435245133057, "loss": 1.5773, "step": 17244 }, { "epoch": 1.36, "learning_rate": 0.00017239213130389245, "loss": 1.5271, "step": 17245 }, { "epoch": 1.36, "learning_rate": 0.00017237991000442412, "loss": 1.5192, "step": 17246 }, { "epoch": 1.36, "learning_rate": 0.00017236768855300862, "loss": 1.5474, "step": 17247 }, { "epoch": 1.36, "learning_rate": 0.00017235546694972876, "loss": 1.4942, "step": 17248 }, { "epoch": 1.36, "learning_rate": 0.00017234324519466764, "loss": 1.575, "step": 17249 }, { "epoch": 1.36, "learning_rate": 0.00017233102328790826, "loss": 1.5747, "step": 17250 }, { "epoch": 1.36, "learning_rate": 0.00017231880122953354, "loss": 1.5788, "step": 17251 }, { "epoch": 1.36, "learning_rate": 0.0001723065790196265, "loss": 1.4819, "step": 17252 }, { "epoch": 1.36, "learning_rate": 0.00017229435665826998, "loss": 1.5552, "step": 17253 }, { "epoch": 1.36, "learning_rate": 0.00017228213414554718, "loss": 1.4696, "step": 17254 }, { "epoch": 1.36, "learning_rate": 0.00017226991148154097, "loss": 1.5171, "step": 17255 }, { "epoch": 1.36, "learning_rate": 0.00017225768866633434, "loss": 1.5369, "step": 17256 }, { "epoch": 1.36, "learning_rate": 0.0001722454657000103, "loss": 1.5317, "step": 17257 }, { "epoch": 1.36, "learning_rate": 0.00017223324258265182, "loss": 1.5336, "step": 17258 }, { "epoch": 1.36, "learning_rate": 0.00017222101931434194, "loss": 1.5324, "step": 17259 }, { "epoch": 1.36, "learning_rate": 0.00017220879589516352, "loss": 1.5155, "step": 17260 }, { "epoch": 1.36, "learning_rate": 0.00017219657232519963, "loss": 1.5784, "step": 17261 }, { "epoch": 1.36, "learning_rate": 0.00017218434860453332, "loss": 1.5605, "step": 17262 }, { "epoch": 1.36, "learning_rate": 0.0001721721247332475, "loss": 1.5264, "step": 17263 }, { "epoch": 1.36, "learning_rate": 0.00017215990071142522, "loss": 1.4776, "step": 17264 }, { "epoch": 1.36, "learning_rate": 0.0001721476765391494, "loss": 1.5422, "step": 17265 }, { "epoch": 1.36, "learning_rate": 0.00017213545221650306, "loss": 1.4895, "step": 17266 }, { "epoch": 1.36, "learning_rate": 0.00017212322774356927, "loss": 1.5099, "step": 17267 }, { "epoch": 1.36, "learning_rate": 0.0001721110031204309, "loss": 1.5163, "step": 17268 }, { "epoch": 1.36, "learning_rate": 0.00017209877834717112, "loss": 1.5114, "step": 17269 }, { "epoch": 1.36, "learning_rate": 0.00017208655342387276, "loss": 1.5462, "step": 17270 }, { "epoch": 1.36, "learning_rate": 0.00017207432835061894, "loss": 1.48, "step": 17271 }, { "epoch": 1.36, "learning_rate": 0.00017206210312749258, "loss": 1.5122, "step": 17272 }, { "epoch": 1.36, "learning_rate": 0.0001720498777545767, "loss": 1.4971, "step": 17273 }, { "epoch": 1.36, "learning_rate": 0.00017203765223195434, "loss": 1.5756, "step": 17274 }, { "epoch": 1.36, "learning_rate": 0.00017202542655970847, "loss": 1.5803, "step": 17275 }, { "epoch": 1.36, "learning_rate": 0.00017201320073792213, "loss": 1.5031, "step": 17276 }, { "epoch": 1.36, "learning_rate": 0.00017200097476667827, "loss": 1.5591, "step": 17277 }, { "epoch": 1.36, "learning_rate": 0.00017198874864605995, "loss": 1.534, "step": 17278 }, { "epoch": 1.36, "learning_rate": 0.00017197652237615018, "loss": 1.5248, "step": 17279 }, { "epoch": 1.36, "learning_rate": 0.00017196429595703195, "loss": 1.4905, "step": 17280 }, { "epoch": 1.36, "learning_rate": 0.00017195206938878826, "loss": 1.5315, "step": 17281 }, { "epoch": 1.36, "learning_rate": 0.00017193984267150212, "loss": 1.4967, "step": 17282 }, { "epoch": 1.36, "learning_rate": 0.00017192761580525658, "loss": 1.5137, "step": 17283 }, { "epoch": 1.36, "learning_rate": 0.00017191538879013458, "loss": 1.5539, "step": 17284 }, { "epoch": 1.36, "learning_rate": 0.0001719031616262192, "loss": 1.5176, "step": 17285 }, { "epoch": 1.36, "learning_rate": 0.0001718909343135935, "loss": 1.506, "step": 17286 }, { "epoch": 1.36, "learning_rate": 0.0001718787068523404, "loss": 1.5509, "step": 17287 }, { "epoch": 1.36, "learning_rate": 0.00017186647924254296, "loss": 1.5307, "step": 17288 }, { "epoch": 1.36, "learning_rate": 0.00017185425148428417, "loss": 1.6049, "step": 17289 }, { "epoch": 1.36, "learning_rate": 0.00017184202357764706, "loss": 1.4907, "step": 17290 }, { "epoch": 1.36, "learning_rate": 0.0001718297955227147, "loss": 1.4793, "step": 17291 }, { "epoch": 1.36, "learning_rate": 0.00017181756731957004, "loss": 1.5237, "step": 17292 }, { "epoch": 1.36, "learning_rate": 0.0001718053389682962, "loss": 1.5224, "step": 17293 }, { "epoch": 1.36, "learning_rate": 0.00017179311046897606, "loss": 1.5648, "step": 17294 }, { "epoch": 1.36, "learning_rate": 0.00017178088182169277, "loss": 1.5137, "step": 17295 }, { "epoch": 1.36, "learning_rate": 0.00017176865302652935, "loss": 1.5922, "step": 17296 }, { "epoch": 1.36, "learning_rate": 0.00017175642408356873, "loss": 1.5253, "step": 17297 }, { "epoch": 1.36, "learning_rate": 0.00017174419499289405, "loss": 1.6006, "step": 17298 }, { "epoch": 1.36, "learning_rate": 0.00017173196575458822, "loss": 1.5337, "step": 17299 }, { "epoch": 1.36, "learning_rate": 0.00017171973636873438, "loss": 1.5472, "step": 17300 }, { "epoch": 1.36, "learning_rate": 0.0001717075068354155, "loss": 1.5345, "step": 17301 }, { "epoch": 1.36, "learning_rate": 0.0001716952771547146, "loss": 1.5058, "step": 17302 }, { "epoch": 1.36, "learning_rate": 0.0001716830473267148, "loss": 1.5385, "step": 17303 }, { "epoch": 1.36, "learning_rate": 0.00017167081735149905, "loss": 1.5288, "step": 17304 }, { "epoch": 1.36, "learning_rate": 0.00017165858722915039, "loss": 1.4915, "step": 17305 }, { "epoch": 1.36, "learning_rate": 0.00017164635695975192, "loss": 1.5557, "step": 17306 }, { "epoch": 1.36, "learning_rate": 0.0001716341265433866, "loss": 1.5398, "step": 17307 }, { "epoch": 1.36, "learning_rate": 0.0001716218959801375, "loss": 1.478, "step": 17308 }, { "epoch": 1.36, "learning_rate": 0.0001716096652700876, "loss": 1.4914, "step": 17309 }, { "epoch": 1.36, "learning_rate": 0.0001715974344133201, "loss": 1.5564, "step": 17310 }, { "epoch": 1.36, "learning_rate": 0.00017158520340991787, "loss": 1.5397, "step": 17311 }, { "epoch": 1.36, "learning_rate": 0.00017157297225996407, "loss": 1.5178, "step": 17312 }, { "epoch": 1.36, "learning_rate": 0.0001715607409635417, "loss": 1.5193, "step": 17313 }, { "epoch": 1.36, "learning_rate": 0.00017154850952073373, "loss": 1.5339, "step": 17314 }, { "epoch": 1.36, "learning_rate": 0.00017153627793162335, "loss": 1.565, "step": 17315 }, { "epoch": 1.36, "learning_rate": 0.00017152404619629342, "loss": 1.5835, "step": 17316 }, { "epoch": 1.36, "learning_rate": 0.0001715118143148272, "loss": 1.5715, "step": 17317 }, { "epoch": 1.36, "learning_rate": 0.00017149958228730757, "loss": 1.5339, "step": 17318 }, { "epoch": 1.36, "learning_rate": 0.00017148735011381766, "loss": 1.4888, "step": 17319 }, { "epoch": 1.36, "learning_rate": 0.00017147511779444055, "loss": 1.5024, "step": 17320 }, { "epoch": 1.36, "learning_rate": 0.00017146288532925917, "loss": 1.5749, "step": 17321 }, { "epoch": 1.36, "learning_rate": 0.00017145065271835665, "loss": 1.5258, "step": 17322 }, { "epoch": 1.36, "learning_rate": 0.00017143841996181608, "loss": 1.5486, "step": 17323 }, { "epoch": 1.36, "learning_rate": 0.0001714261870597204, "loss": 1.4907, "step": 17324 }, { "epoch": 1.36, "learning_rate": 0.0001714139540121528, "loss": 1.5611, "step": 17325 }, { "epoch": 1.36, "learning_rate": 0.00017140172081919622, "loss": 1.4928, "step": 17326 }, { "epoch": 1.36, "learning_rate": 0.00017138948748093383, "loss": 1.5602, "step": 17327 }, { "epoch": 1.36, "learning_rate": 0.00017137725399744857, "loss": 1.5576, "step": 17328 }, { "epoch": 1.36, "learning_rate": 0.00017136502036882358, "loss": 1.5678, "step": 17329 }, { "epoch": 1.36, "learning_rate": 0.0001713527865951419, "loss": 1.59, "step": 17330 }, { "epoch": 1.36, "learning_rate": 0.00017134055267648652, "loss": 1.5534, "step": 17331 }, { "epoch": 1.36, "learning_rate": 0.0001713283186129406, "loss": 1.5184, "step": 17332 }, { "epoch": 1.36, "learning_rate": 0.00017131608440458719, "loss": 1.5001, "step": 17333 }, { "epoch": 1.36, "learning_rate": 0.0001713038500515093, "loss": 1.5713, "step": 17334 }, { "epoch": 1.36, "learning_rate": 0.00017129161555379005, "loss": 1.5653, "step": 17335 }, { "epoch": 1.36, "learning_rate": 0.00017127938091151247, "loss": 1.5436, "step": 17336 }, { "epoch": 1.36, "learning_rate": 0.00017126714612475966, "loss": 1.5092, "step": 17337 }, { "epoch": 1.36, "learning_rate": 0.00017125491119361462, "loss": 1.5583, "step": 17338 }, { "epoch": 1.36, "learning_rate": 0.00017124267611816048, "loss": 1.5524, "step": 17339 }, { "epoch": 1.36, "learning_rate": 0.0001712304408984803, "loss": 1.5506, "step": 17340 }, { "epoch": 1.36, "learning_rate": 0.00017121820553465714, "loss": 1.5285, "step": 17341 }, { "epoch": 1.36, "learning_rate": 0.00017120597002677406, "loss": 1.5081, "step": 17342 }, { "epoch": 1.36, "learning_rate": 0.00017119373437491414, "loss": 1.5421, "step": 17343 }, { "epoch": 1.36, "learning_rate": 0.0001711814985791605, "loss": 1.5186, "step": 17344 }, { "epoch": 1.36, "learning_rate": 0.00017116926263959615, "loss": 1.5289, "step": 17345 }, { "epoch": 1.36, "learning_rate": 0.00017115702655630415, "loss": 1.5381, "step": 17346 }, { "epoch": 1.36, "learning_rate": 0.00017114479032936768, "loss": 1.5394, "step": 17347 }, { "epoch": 1.36, "learning_rate": 0.00017113255395886972, "loss": 1.5095, "step": 17348 }, { "epoch": 1.37, "learning_rate": 0.00017112031744489337, "loss": 1.5272, "step": 17349 }, { "epoch": 1.37, "learning_rate": 0.00017110808078752172, "loss": 1.5196, "step": 17350 }, { "epoch": 1.37, "learning_rate": 0.00017109584398683787, "loss": 1.4618, "step": 17351 }, { "epoch": 1.37, "learning_rate": 0.00017108360704292492, "loss": 1.5376, "step": 17352 }, { "epoch": 1.37, "learning_rate": 0.00017107136995586584, "loss": 1.5254, "step": 17353 }, { "epoch": 1.37, "learning_rate": 0.00017105913272574382, "loss": 1.4973, "step": 17354 }, { "epoch": 1.37, "learning_rate": 0.00017104689535264186, "loss": 1.4862, "step": 17355 }, { "epoch": 1.37, "learning_rate": 0.00017103465783664318, "loss": 1.5719, "step": 17356 }, { "epoch": 1.37, "learning_rate": 0.00017102242017783074, "loss": 1.532, "step": 17357 }, { "epoch": 1.37, "learning_rate": 0.00017101018237628763, "loss": 1.5239, "step": 17358 }, { "epoch": 1.37, "learning_rate": 0.00017099794443209705, "loss": 1.5175, "step": 17359 }, { "epoch": 1.37, "learning_rate": 0.000170985706345342, "loss": 1.4996, "step": 17360 }, { "epoch": 1.37, "learning_rate": 0.00017097346811610555, "loss": 1.5234, "step": 17361 }, { "epoch": 1.37, "learning_rate": 0.00017096122974447084, "loss": 1.5276, "step": 17362 }, { "epoch": 1.37, "learning_rate": 0.0001709489912305209, "loss": 1.4901, "step": 17363 }, { "epoch": 1.37, "learning_rate": 0.00017093675257433892, "loss": 1.5651, "step": 17364 }, { "epoch": 1.37, "learning_rate": 0.00017092451377600794, "loss": 1.5251, "step": 17365 }, { "epoch": 1.37, "learning_rate": 0.0001709122748356111, "loss": 1.5422, "step": 17366 }, { "epoch": 1.37, "learning_rate": 0.00017090003575323138, "loss": 1.5801, "step": 17367 }, { "epoch": 1.37, "learning_rate": 0.000170887796528952, "loss": 1.5184, "step": 17368 }, { "epoch": 1.37, "learning_rate": 0.000170875557162856, "loss": 1.5063, "step": 17369 }, { "epoch": 1.37, "learning_rate": 0.0001708633176550265, "loss": 1.5147, "step": 17370 }, { "epoch": 1.37, "learning_rate": 0.00017085107800554654, "loss": 1.5313, "step": 17371 }, { "epoch": 1.37, "learning_rate": 0.00017083883821449928, "loss": 1.4681, "step": 17372 }, { "epoch": 1.37, "learning_rate": 0.00017082659828196787, "loss": 1.5258, "step": 17373 }, { "epoch": 1.37, "learning_rate": 0.0001708143582080353, "loss": 1.5137, "step": 17374 }, { "epoch": 1.37, "learning_rate": 0.0001708021179927847, "loss": 1.5408, "step": 17375 }, { "epoch": 1.37, "learning_rate": 0.00017078987763629927, "loss": 1.5824, "step": 17376 }, { "epoch": 1.37, "learning_rate": 0.00017077763713866197, "loss": 1.5124, "step": 17377 }, { "epoch": 1.37, "learning_rate": 0.000170765396499956, "loss": 1.5072, "step": 17378 }, { "epoch": 1.37, "learning_rate": 0.00017075315572026442, "loss": 1.5202, "step": 17379 }, { "epoch": 1.37, "learning_rate": 0.0001707409147996704, "loss": 1.5091, "step": 17380 }, { "epoch": 1.37, "learning_rate": 0.00017072867373825703, "loss": 1.5121, "step": 17381 }, { "epoch": 1.37, "learning_rate": 0.00017071643253610742, "loss": 1.5001, "step": 17382 }, { "epoch": 1.37, "learning_rate": 0.0001707041911933046, "loss": 1.5561, "step": 17383 }, { "epoch": 1.37, "learning_rate": 0.00017069194970993181, "loss": 1.4914, "step": 17384 }, { "epoch": 1.37, "learning_rate": 0.00017067970808607203, "loss": 1.5131, "step": 17385 }, { "epoch": 1.37, "learning_rate": 0.00017066746632180848, "loss": 1.5351, "step": 17386 }, { "epoch": 1.37, "learning_rate": 0.00017065522441722425, "loss": 1.4892, "step": 17387 }, { "epoch": 1.37, "learning_rate": 0.00017064298237240248, "loss": 1.4898, "step": 17388 }, { "epoch": 1.37, "learning_rate": 0.0001706307401874262, "loss": 1.527, "step": 17389 }, { "epoch": 1.37, "learning_rate": 0.00017061849786237856, "loss": 1.512, "step": 17390 }, { "epoch": 1.37, "learning_rate": 0.00017060625539734277, "loss": 1.522, "step": 17391 }, { "epoch": 1.37, "learning_rate": 0.0001705940127924018, "loss": 1.5269, "step": 17392 }, { "epoch": 1.37, "learning_rate": 0.0001705817700476389, "loss": 1.4887, "step": 17393 }, { "epoch": 1.37, "learning_rate": 0.00017056952716313712, "loss": 1.5201, "step": 17394 }, { "epoch": 1.37, "learning_rate": 0.0001705572841389796, "loss": 1.5039, "step": 17395 }, { "epoch": 1.37, "learning_rate": 0.00017054504097524948, "loss": 1.562, "step": 17396 }, { "epoch": 1.37, "learning_rate": 0.00017053279767202984, "loss": 1.54, "step": 17397 }, { "epoch": 1.37, "learning_rate": 0.0001705205542294039, "loss": 1.5189, "step": 17398 }, { "epoch": 1.37, "learning_rate": 0.00017050831064745463, "loss": 1.4841, "step": 17399 }, { "epoch": 1.37, "learning_rate": 0.00017049606692626533, "loss": 1.4806, "step": 17400 }, { "epoch": 1.37, "learning_rate": 0.000170483823065919, "loss": 1.523, "step": 17401 }, { "epoch": 1.37, "learning_rate": 0.00017047157906649883, "loss": 1.5533, "step": 17402 }, { "epoch": 1.37, "learning_rate": 0.00017045933492808792, "loss": 1.518, "step": 17403 }, { "epoch": 1.37, "learning_rate": 0.0001704470906507694, "loss": 1.4726, "step": 17404 }, { "epoch": 1.37, "learning_rate": 0.00017043484623462647, "loss": 1.5992, "step": 17405 }, { "epoch": 1.37, "learning_rate": 0.00017042260167974218, "loss": 1.517, "step": 17406 }, { "epoch": 1.37, "learning_rate": 0.0001704103569861997, "loss": 1.54, "step": 17407 }, { "epoch": 1.37, "learning_rate": 0.00017039811215408218, "loss": 1.5604, "step": 17408 }, { "epoch": 1.37, "learning_rate": 0.0001703858671834727, "loss": 1.4863, "step": 17409 }, { "epoch": 1.37, "learning_rate": 0.00017037362207445445, "loss": 1.5199, "step": 17410 }, { "epoch": 1.37, "learning_rate": 0.00017036137682711054, "loss": 1.4933, "step": 17411 }, { "epoch": 1.37, "learning_rate": 0.00017034913144152415, "loss": 1.5222, "step": 17412 }, { "epoch": 1.37, "learning_rate": 0.0001703368859177783, "loss": 1.5125, "step": 17413 }, { "epoch": 1.37, "learning_rate": 0.0001703246402559563, "loss": 1.5001, "step": 17414 }, { "epoch": 1.37, "learning_rate": 0.00017031239445614122, "loss": 1.5034, "step": 17415 }, { "epoch": 1.37, "learning_rate": 0.00017030014851841615, "loss": 1.5759, "step": 17416 }, { "epoch": 1.37, "learning_rate": 0.00017028790244286426, "loss": 1.5908, "step": 17417 }, { "epoch": 1.37, "learning_rate": 0.0001702756562295687, "loss": 1.5297, "step": 17418 }, { "epoch": 1.37, "learning_rate": 0.00017026340987861266, "loss": 1.529, "step": 17419 }, { "epoch": 1.37, "learning_rate": 0.00017025116339007925, "loss": 1.5333, "step": 17420 }, { "epoch": 1.37, "learning_rate": 0.0001702389167640516, "loss": 1.5202, "step": 17421 }, { "epoch": 1.37, "learning_rate": 0.00017022667000061293, "loss": 1.5518, "step": 17422 }, { "epoch": 1.37, "learning_rate": 0.00017021442309984628, "loss": 1.5299, "step": 17423 }, { "epoch": 1.37, "learning_rate": 0.0001702021760618348, "loss": 1.5479, "step": 17424 }, { "epoch": 1.37, "learning_rate": 0.0001701899288866618, "loss": 1.5597, "step": 17425 }, { "epoch": 1.37, "learning_rate": 0.00017017768157441025, "loss": 1.5021, "step": 17426 }, { "epoch": 1.37, "learning_rate": 0.00017016543412516342, "loss": 1.557, "step": 17427 }, { "epoch": 1.37, "learning_rate": 0.00017015318653900439, "loss": 1.5447, "step": 17428 }, { "epoch": 1.37, "learning_rate": 0.00017014093881601635, "loss": 1.5608, "step": 17429 }, { "epoch": 1.37, "learning_rate": 0.00017012869095628247, "loss": 1.535, "step": 17430 }, { "epoch": 1.37, "learning_rate": 0.00017011644295988583, "loss": 1.5686, "step": 17431 }, { "epoch": 1.37, "learning_rate": 0.00017010419482690973, "loss": 1.4905, "step": 17432 }, { "epoch": 1.37, "learning_rate": 0.00017009194655743718, "loss": 1.493, "step": 17433 }, { "epoch": 1.37, "learning_rate": 0.00017007969815155145, "loss": 1.561, "step": 17434 }, { "epoch": 1.37, "learning_rate": 0.00017006744960933558, "loss": 1.5095, "step": 17435 }, { "epoch": 1.37, "learning_rate": 0.00017005520093087284, "loss": 1.5023, "step": 17436 }, { "epoch": 1.37, "learning_rate": 0.00017004295211624635, "loss": 1.5082, "step": 17437 }, { "epoch": 1.37, "learning_rate": 0.0001700307031655393, "loss": 1.5218, "step": 17438 }, { "epoch": 1.37, "learning_rate": 0.00017001845407883483, "loss": 1.5587, "step": 17439 }, { "epoch": 1.37, "learning_rate": 0.00017000620485621608, "loss": 1.5257, "step": 17440 }, { "epoch": 1.37, "learning_rate": 0.00016999395549776623, "loss": 1.5398, "step": 17441 }, { "epoch": 1.37, "learning_rate": 0.00016998170600356847, "loss": 1.4871, "step": 17442 }, { "epoch": 1.37, "learning_rate": 0.00016996945637370593, "loss": 1.5079, "step": 17443 }, { "epoch": 1.37, "learning_rate": 0.00016995720660826184, "loss": 1.5628, "step": 17444 }, { "epoch": 1.37, "learning_rate": 0.00016994495670731932, "loss": 1.5037, "step": 17445 }, { "epoch": 1.37, "learning_rate": 0.00016993270667096152, "loss": 1.5031, "step": 17446 }, { "epoch": 1.37, "learning_rate": 0.0001699204564992717, "loss": 1.5414, "step": 17447 }, { "epoch": 1.37, "learning_rate": 0.00016990820619233293, "loss": 1.5249, "step": 17448 }, { "epoch": 1.37, "learning_rate": 0.00016989595575022843, "loss": 1.5024, "step": 17449 }, { "epoch": 1.37, "learning_rate": 0.00016988370517304134, "loss": 1.5403, "step": 17450 }, { "epoch": 1.37, "learning_rate": 0.00016987145446085492, "loss": 1.5538, "step": 17451 }, { "epoch": 1.37, "learning_rate": 0.00016985920361375228, "loss": 1.548, "step": 17452 }, { "epoch": 1.37, "learning_rate": 0.00016984695263181656, "loss": 1.5753, "step": 17453 }, { "epoch": 1.37, "learning_rate": 0.00016983470151513103, "loss": 1.5647, "step": 17454 }, { "epoch": 1.37, "learning_rate": 0.00016982245026377885, "loss": 1.5428, "step": 17455 }, { "epoch": 1.37, "learning_rate": 0.00016981019887784312, "loss": 1.5622, "step": 17456 }, { "epoch": 1.37, "learning_rate": 0.00016979794735740708, "loss": 1.5694, "step": 17457 }, { "epoch": 1.37, "learning_rate": 0.0001697856957025539, "loss": 1.5506, "step": 17458 }, { "epoch": 1.37, "learning_rate": 0.00016977344391336675, "loss": 1.5566, "step": 17459 }, { "epoch": 1.37, "learning_rate": 0.00016976119198992888, "loss": 1.5531, "step": 17460 }, { "epoch": 1.37, "learning_rate": 0.0001697489399323234, "loss": 1.5702, "step": 17461 }, { "epoch": 1.37, "learning_rate": 0.0001697366877406335, "loss": 1.5447, "step": 17462 }, { "epoch": 1.37, "learning_rate": 0.00016972443541494239, "loss": 1.5294, "step": 17463 }, { "epoch": 1.37, "learning_rate": 0.0001697121829553333, "loss": 1.5523, "step": 17464 }, { "epoch": 1.37, "learning_rate": 0.00016969993036188924, "loss": 1.4913, "step": 17465 }, { "epoch": 1.37, "learning_rate": 0.00016968767763469363, "loss": 1.497, "step": 17466 }, { "epoch": 1.37, "learning_rate": 0.0001696754247738295, "loss": 1.5043, "step": 17467 }, { "epoch": 1.37, "learning_rate": 0.00016966317177938015, "loss": 1.5152, "step": 17468 }, { "epoch": 1.37, "learning_rate": 0.00016965091865142867, "loss": 1.5746, "step": 17469 }, { "epoch": 1.37, "learning_rate": 0.0001696386653900583, "loss": 1.4945, "step": 17470 }, { "epoch": 1.37, "learning_rate": 0.00016962641199535225, "loss": 1.5512, "step": 17471 }, { "epoch": 1.37, "learning_rate": 0.00016961415846739365, "loss": 1.4878, "step": 17472 }, { "epoch": 1.37, "learning_rate": 0.00016960190480626576, "loss": 1.5478, "step": 17473 }, { "epoch": 1.37, "learning_rate": 0.0001695896510120518, "loss": 1.5924, "step": 17474 }, { "epoch": 1.37, "learning_rate": 0.00016957739708483484, "loss": 1.5197, "step": 17475 }, { "epoch": 1.38, "learning_rate": 0.00016956514302469823, "loss": 1.5804, "step": 17476 }, { "epoch": 1.38, "learning_rate": 0.00016955288883172508, "loss": 1.5047, "step": 17477 }, { "epoch": 1.38, "learning_rate": 0.00016954063450599858, "loss": 1.5177, "step": 17478 }, { "epoch": 1.38, "learning_rate": 0.00016952838004760198, "loss": 1.5006, "step": 17479 }, { "epoch": 1.38, "learning_rate": 0.0001695161254566184, "loss": 1.5721, "step": 17480 }, { "epoch": 1.38, "learning_rate": 0.00016950387073313115, "loss": 1.4999, "step": 17481 }, { "epoch": 1.38, "learning_rate": 0.00016949161587722337, "loss": 1.5715, "step": 17482 }, { "epoch": 1.38, "learning_rate": 0.00016947936088897826, "loss": 1.5428, "step": 17483 }, { "epoch": 1.38, "learning_rate": 0.00016946710576847907, "loss": 1.4997, "step": 17484 }, { "epoch": 1.38, "learning_rate": 0.000169454850515809, "loss": 1.5298, "step": 17485 }, { "epoch": 1.38, "learning_rate": 0.00016944259513105116, "loss": 1.5715, "step": 17486 }, { "epoch": 1.38, "learning_rate": 0.00016943033961428882, "loss": 1.5442, "step": 17487 }, { "epoch": 1.38, "learning_rate": 0.00016941808396560523, "loss": 1.5186, "step": 17488 }, { "epoch": 1.38, "learning_rate": 0.0001694058281850836, "loss": 1.5165, "step": 17489 }, { "epoch": 1.38, "learning_rate": 0.00016939357227280707, "loss": 1.5665, "step": 17490 }, { "epoch": 1.38, "learning_rate": 0.00016938131622885888, "loss": 1.4658, "step": 17491 }, { "epoch": 1.38, "learning_rate": 0.00016936906005332226, "loss": 1.5474, "step": 17492 }, { "epoch": 1.38, "learning_rate": 0.00016935680374628042, "loss": 1.557, "step": 17493 }, { "epoch": 1.38, "learning_rate": 0.0001693445473078166, "loss": 1.5283, "step": 17494 }, { "epoch": 1.38, "learning_rate": 0.00016933229073801394, "loss": 1.5368, "step": 17495 }, { "epoch": 1.38, "learning_rate": 0.00016932003403695564, "loss": 1.4972, "step": 17496 }, { "epoch": 1.38, "learning_rate": 0.00016930777720472505, "loss": 1.5096, "step": 17497 }, { "epoch": 1.38, "learning_rate": 0.00016929552024140524, "loss": 1.5034, "step": 17498 }, { "epoch": 1.38, "learning_rate": 0.00016928326314707954, "loss": 1.4966, "step": 17499 }, { "epoch": 1.38, "learning_rate": 0.00016927100592183114, "loss": 1.5236, "step": 17500 }, { "epoch": 1.38, "learning_rate": 0.0001692587485657432, "loss": 1.5986, "step": 17501 }, { "epoch": 1.38, "learning_rate": 0.00016924649107889902, "loss": 1.5516, "step": 17502 }, { "epoch": 1.38, "learning_rate": 0.00016923423346138178, "loss": 1.4911, "step": 17503 }, { "epoch": 1.38, "learning_rate": 0.0001692219757132747, "loss": 1.4777, "step": 17504 }, { "epoch": 1.38, "learning_rate": 0.00016920971783466101, "loss": 1.5808, "step": 17505 }, { "epoch": 1.38, "learning_rate": 0.00016919745982562392, "loss": 1.5754, "step": 17506 }, { "epoch": 1.38, "learning_rate": 0.00016918520168624675, "loss": 1.508, "step": 17507 }, { "epoch": 1.38, "learning_rate": 0.00016917294341661256, "loss": 1.5387, "step": 17508 }, { "epoch": 1.38, "learning_rate": 0.0001691606850168047, "loss": 1.5134, "step": 17509 }, { "epoch": 1.38, "learning_rate": 0.00016914842648690638, "loss": 1.5017, "step": 17510 }, { "epoch": 1.38, "learning_rate": 0.0001691361678270008, "loss": 1.55, "step": 17511 }, { "epoch": 1.38, "learning_rate": 0.00016912390903717117, "loss": 1.5219, "step": 17512 }, { "epoch": 1.38, "learning_rate": 0.00016911165011750074, "loss": 1.5277, "step": 17513 }, { "epoch": 1.38, "learning_rate": 0.0001690993910680728, "loss": 1.508, "step": 17514 }, { "epoch": 1.38, "learning_rate": 0.00016908713188897053, "loss": 1.5312, "step": 17515 }, { "epoch": 1.38, "learning_rate": 0.00016907487258027715, "loss": 1.5092, "step": 17516 }, { "epoch": 1.38, "learning_rate": 0.00016906261314207595, "loss": 1.4974, "step": 17517 }, { "epoch": 1.38, "learning_rate": 0.00016905035357445006, "loss": 1.5368, "step": 17518 }, { "epoch": 1.38, "learning_rate": 0.00016903809387748282, "loss": 1.5229, "step": 17519 }, { "epoch": 1.38, "learning_rate": 0.00016902583405125742, "loss": 1.5226, "step": 17520 }, { "epoch": 1.38, "learning_rate": 0.0001690135740958571, "loss": 1.518, "step": 17521 }, { "epoch": 1.38, "learning_rate": 0.00016900131401136515, "loss": 1.5084, "step": 17522 }, { "epoch": 1.38, "learning_rate": 0.0001689890537978647, "loss": 1.49, "step": 17523 }, { "epoch": 1.38, "learning_rate": 0.00016897679345543912, "loss": 1.5476, "step": 17524 }, { "epoch": 1.38, "learning_rate": 0.00016896453298417152, "loss": 1.5068, "step": 17525 }, { "epoch": 1.38, "learning_rate": 0.00016895227238414526, "loss": 1.5274, "step": 17526 }, { "epoch": 1.38, "learning_rate": 0.0001689400116554435, "loss": 1.4907, "step": 17527 }, { "epoch": 1.38, "learning_rate": 0.00016892775079814946, "loss": 1.5221, "step": 17528 }, { "epoch": 1.38, "learning_rate": 0.00016891548981234656, "loss": 1.4886, "step": 17529 }, { "epoch": 1.38, "learning_rate": 0.00016890322869811782, "loss": 1.541, "step": 17530 }, { "epoch": 1.38, "learning_rate": 0.0001688909674555466, "loss": 1.4807, "step": 17531 }, { "epoch": 1.38, "learning_rate": 0.00016887870608471619, "loss": 1.5277, "step": 17532 }, { "epoch": 1.38, "learning_rate": 0.00016886644458570976, "loss": 1.5135, "step": 17533 }, { "epoch": 1.38, "learning_rate": 0.0001688541829586106, "loss": 1.4854, "step": 17534 }, { "epoch": 1.38, "learning_rate": 0.00016884192120350189, "loss": 1.5056, "step": 17535 }, { "epoch": 1.38, "learning_rate": 0.00016882965932046696, "loss": 1.5318, "step": 17536 }, { "epoch": 1.38, "learning_rate": 0.00016881739730958904, "loss": 1.4831, "step": 17537 }, { "epoch": 1.38, "learning_rate": 0.00016880513517095137, "loss": 1.4664, "step": 17538 }, { "epoch": 1.38, "learning_rate": 0.00016879287290463724, "loss": 1.5387, "step": 17539 }, { "epoch": 1.38, "learning_rate": 0.00016878061051072983, "loss": 1.5377, "step": 17540 }, { "epoch": 1.38, "learning_rate": 0.00016876834798931246, "loss": 1.5276, "step": 17541 }, { "epoch": 1.38, "learning_rate": 0.00016875608534046838, "loss": 1.5621, "step": 17542 }, { "epoch": 1.38, "learning_rate": 0.00016874382256428078, "loss": 1.5356, "step": 17543 }, { "epoch": 1.38, "learning_rate": 0.000168731559660833, "loss": 1.5298, "step": 17544 }, { "epoch": 1.38, "learning_rate": 0.00016871929663020825, "loss": 1.5004, "step": 17545 }, { "epoch": 1.38, "learning_rate": 0.00016870703347248984, "loss": 1.5036, "step": 17546 }, { "epoch": 1.38, "learning_rate": 0.00016869477018776097, "loss": 1.4937, "step": 17547 }, { "epoch": 1.38, "learning_rate": 0.00016868250677610496, "loss": 1.5586, "step": 17548 }, { "epoch": 1.38, "learning_rate": 0.00016867024323760502, "loss": 1.458, "step": 17549 }, { "epoch": 1.38, "learning_rate": 0.00016865797957234442, "loss": 1.5677, "step": 17550 }, { "epoch": 1.38, "learning_rate": 0.00016864571578040645, "loss": 1.5688, "step": 17551 }, { "epoch": 1.38, "learning_rate": 0.0001686334518618743, "loss": 1.5451, "step": 17552 }, { "epoch": 1.38, "learning_rate": 0.0001686211878168314, "loss": 1.5688, "step": 17553 }, { "epoch": 1.38, "learning_rate": 0.00016860892364536082, "loss": 1.5236, "step": 17554 }, { "epoch": 1.38, "learning_rate": 0.00016859665934754596, "loss": 1.5244, "step": 17555 }, { "epoch": 1.38, "learning_rate": 0.00016858439492347006, "loss": 1.5026, "step": 17556 }, { "epoch": 1.38, "learning_rate": 0.00016857213037321634, "loss": 1.5425, "step": 17557 }, { "epoch": 1.38, "learning_rate": 0.00016855986569686812, "loss": 1.5694, "step": 17558 }, { "epoch": 1.38, "learning_rate": 0.00016854760089450864, "loss": 1.544, "step": 17559 }, { "epoch": 1.38, "learning_rate": 0.0001685353359662212, "loss": 1.5604, "step": 17560 }, { "epoch": 1.38, "learning_rate": 0.00016852307091208907, "loss": 1.4932, "step": 17561 }, { "epoch": 1.38, "learning_rate": 0.00016851080573219548, "loss": 1.5282, "step": 17562 }, { "epoch": 1.38, "learning_rate": 0.00016849854042662375, "loss": 1.5161, "step": 17563 }, { "epoch": 1.38, "learning_rate": 0.00016848627499545712, "loss": 1.5041, "step": 17564 }, { "epoch": 1.38, "learning_rate": 0.00016847400943877891, "loss": 1.5234, "step": 17565 }, { "epoch": 1.38, "learning_rate": 0.00016846174375667236, "loss": 1.4888, "step": 17566 }, { "epoch": 1.38, "learning_rate": 0.00016844947794922074, "loss": 1.4846, "step": 17567 }, { "epoch": 1.38, "learning_rate": 0.0001684372120165074, "loss": 1.5578, "step": 17568 }, { "epoch": 1.38, "learning_rate": 0.00016842494595861553, "loss": 1.5059, "step": 17569 }, { "epoch": 1.38, "learning_rate": 0.00016841267977562842, "loss": 1.5558, "step": 17570 }, { "epoch": 1.38, "learning_rate": 0.00016840041346762944, "loss": 1.4837, "step": 17571 }, { "epoch": 1.38, "learning_rate": 0.00016838814703470177, "loss": 1.5591, "step": 17572 }, { "epoch": 1.38, "learning_rate": 0.00016837588047692874, "loss": 1.5266, "step": 17573 }, { "epoch": 1.38, "learning_rate": 0.00016836361379439358, "loss": 1.5016, "step": 17574 }, { "epoch": 1.38, "learning_rate": 0.00016835134698717962, "loss": 1.4967, "step": 17575 }, { "epoch": 1.38, "learning_rate": 0.0001683390800553702, "loss": 1.5658, "step": 17576 }, { "epoch": 1.38, "learning_rate": 0.00016832681299904848, "loss": 1.568, "step": 17577 }, { "epoch": 1.38, "learning_rate": 0.0001683145458182979, "loss": 1.528, "step": 17578 }, { "epoch": 1.38, "learning_rate": 0.00016830227851320157, "loss": 1.5189, "step": 17579 }, { "epoch": 1.38, "learning_rate": 0.00016829001108384294, "loss": 1.5706, "step": 17580 }, { "epoch": 1.38, "learning_rate": 0.00016827774353030518, "loss": 1.5125, "step": 17581 }, { "epoch": 1.38, "learning_rate": 0.00016826547585267163, "loss": 1.4921, "step": 17582 }, { "epoch": 1.38, "learning_rate": 0.00016825320805102556, "loss": 1.4682, "step": 17583 }, { "epoch": 1.38, "learning_rate": 0.00016824094012545034, "loss": 1.494, "step": 17584 }, { "epoch": 1.38, "learning_rate": 0.0001682286720760292, "loss": 1.5612, "step": 17585 }, { "epoch": 1.38, "learning_rate": 0.0001682164039028454, "loss": 1.5238, "step": 17586 }, { "epoch": 1.38, "learning_rate": 0.00016820413560598226, "loss": 1.5461, "step": 17587 }, { "epoch": 1.38, "learning_rate": 0.00016819186718552311, "loss": 1.584, "step": 17588 }, { "epoch": 1.38, "learning_rate": 0.0001681795986415512, "loss": 1.5143, "step": 17589 }, { "epoch": 1.38, "learning_rate": 0.0001681673299741499, "loss": 1.514, "step": 17590 }, { "epoch": 1.38, "learning_rate": 0.00016815506118340236, "loss": 1.5147, "step": 17591 }, { "epoch": 1.38, "learning_rate": 0.00016814279226939205, "loss": 1.5037, "step": 17592 }, { "epoch": 1.38, "learning_rate": 0.0001681305232322022, "loss": 1.5575, "step": 17593 }, { "epoch": 1.38, "learning_rate": 0.00016811825407191605, "loss": 1.5401, "step": 17594 }, { "epoch": 1.38, "learning_rate": 0.00016810598478861702, "loss": 1.5315, "step": 17595 }, { "epoch": 1.38, "learning_rate": 0.00016809371538238827, "loss": 1.5285, "step": 17596 }, { "epoch": 1.38, "learning_rate": 0.00016808144585331325, "loss": 1.5528, "step": 17597 }, { "epoch": 1.38, "learning_rate": 0.0001680691762014751, "loss": 1.451, "step": 17598 }, { "epoch": 1.38, "learning_rate": 0.00016805690642695726, "loss": 1.5248, "step": 17599 }, { "epoch": 1.38, "learning_rate": 0.00016804463652984303, "loss": 1.5726, "step": 17600 }, { "epoch": 1.38, "learning_rate": 0.00016803236651021563, "loss": 1.5147, "step": 17601 }, { "epoch": 1.38, "learning_rate": 0.00016802009636815844, "loss": 1.6087, "step": 17602 }, { "epoch": 1.39, "learning_rate": 0.0001680078261037547, "loss": 1.56, "step": 17603 }, { "epoch": 1.39, "learning_rate": 0.00016799555571708782, "loss": 1.6017, "step": 17604 }, { "epoch": 1.39, "learning_rate": 0.00016798328520824102, "loss": 1.538, "step": 17605 }, { "epoch": 1.39, "learning_rate": 0.0001679710145772976, "loss": 1.5265, "step": 17606 }, { "epoch": 1.39, "learning_rate": 0.00016795874382434094, "loss": 1.5472, "step": 17607 }, { "epoch": 1.39, "learning_rate": 0.00016794647294945432, "loss": 1.5011, "step": 17608 }, { "epoch": 1.39, "learning_rate": 0.00016793420195272107, "loss": 1.5646, "step": 17609 }, { "epoch": 1.39, "learning_rate": 0.00016792193083422444, "loss": 1.5351, "step": 17610 }, { "epoch": 1.39, "learning_rate": 0.00016790965959404783, "loss": 1.5026, "step": 17611 }, { "epoch": 1.39, "learning_rate": 0.00016789738823227453, "loss": 1.4908, "step": 17612 }, { "epoch": 1.39, "learning_rate": 0.00016788511674898778, "loss": 1.5444, "step": 17613 }, { "epoch": 1.39, "learning_rate": 0.000167872845144271, "loss": 1.5231, "step": 17614 }, { "epoch": 1.39, "learning_rate": 0.00016786057341820743, "loss": 1.487, "step": 17615 }, { "epoch": 1.39, "learning_rate": 0.00016784830157088045, "loss": 1.6044, "step": 17616 }, { "epoch": 1.39, "learning_rate": 0.00016783602960237338, "loss": 1.5282, "step": 17617 }, { "epoch": 1.39, "learning_rate": 0.00016782375751276944, "loss": 1.554, "step": 17618 }, { "epoch": 1.39, "learning_rate": 0.00016781148530215209, "loss": 1.5021, "step": 17619 }, { "epoch": 1.39, "learning_rate": 0.00016779921297060455, "loss": 1.5251, "step": 17620 }, { "epoch": 1.39, "learning_rate": 0.00016778694051821017, "loss": 1.53, "step": 17621 }, { "epoch": 1.39, "learning_rate": 0.00016777466794505228, "loss": 1.5231, "step": 17622 }, { "epoch": 1.39, "learning_rate": 0.0001677623952512142, "loss": 1.5284, "step": 17623 }, { "epoch": 1.39, "learning_rate": 0.00016775012243677931, "loss": 1.4942, "step": 17624 }, { "epoch": 1.39, "learning_rate": 0.00016773784950183083, "loss": 1.5193, "step": 17625 }, { "epoch": 1.39, "learning_rate": 0.00016772557644645217, "loss": 1.4875, "step": 17626 }, { "epoch": 1.39, "learning_rate": 0.00016771330327072662, "loss": 1.5324, "step": 17627 }, { "epoch": 1.39, "learning_rate": 0.0001677010299747375, "loss": 1.5104, "step": 17628 }, { "epoch": 1.39, "learning_rate": 0.0001676887565585682, "loss": 1.5434, "step": 17629 }, { "epoch": 1.39, "learning_rate": 0.00016767648302230194, "loss": 1.5204, "step": 17630 }, { "epoch": 1.39, "learning_rate": 0.00016766420936602214, "loss": 1.517, "step": 17631 }, { "epoch": 1.39, "learning_rate": 0.0001676519355898121, "loss": 1.5445, "step": 17632 }, { "epoch": 1.39, "learning_rate": 0.00016763966169375518, "loss": 1.5066, "step": 17633 }, { "epoch": 1.39, "learning_rate": 0.0001676273876779347, "loss": 1.4592, "step": 17634 }, { "epoch": 1.39, "learning_rate": 0.00016761511354243397, "loss": 1.541, "step": 17635 }, { "epoch": 1.39, "learning_rate": 0.00016760283928733636, "loss": 1.547, "step": 17636 }, { "epoch": 1.39, "learning_rate": 0.00016759056491272515, "loss": 1.5584, "step": 17637 }, { "epoch": 1.39, "learning_rate": 0.0001675782904186837, "loss": 1.5518, "step": 17638 }, { "epoch": 1.39, "learning_rate": 0.00016756601580529537, "loss": 1.5574, "step": 17639 }, { "epoch": 1.39, "learning_rate": 0.0001675537410726435, "loss": 1.5822, "step": 17640 }, { "epoch": 1.39, "learning_rate": 0.00016754146622081144, "loss": 1.5409, "step": 17641 }, { "epoch": 1.39, "learning_rate": 0.00016752919124988247, "loss": 1.4933, "step": 17642 }, { "epoch": 1.39, "learning_rate": 0.00016751691615993995, "loss": 1.5626, "step": 17643 }, { "epoch": 1.39, "learning_rate": 0.0001675046409510673, "loss": 1.5665, "step": 17644 }, { "epoch": 1.39, "learning_rate": 0.00016749236562334775, "loss": 1.596, "step": 17645 }, { "epoch": 1.39, "learning_rate": 0.00016748009017686466, "loss": 1.5712, "step": 17646 }, { "epoch": 1.39, "learning_rate": 0.00016746781461170145, "loss": 1.5721, "step": 17647 }, { "epoch": 1.39, "learning_rate": 0.00016745553892794145, "loss": 1.4711, "step": 17648 }, { "epoch": 1.39, "learning_rate": 0.0001674432631256679, "loss": 1.5173, "step": 17649 }, { "epoch": 1.39, "learning_rate": 0.00016743098720496425, "loss": 1.5158, "step": 17650 }, { "epoch": 1.39, "learning_rate": 0.00016741871116591385, "loss": 1.5218, "step": 17651 }, { "epoch": 1.39, "learning_rate": 0.00016740643500859996, "loss": 1.5054, "step": 17652 }, { "epoch": 1.39, "learning_rate": 0.000167394158733106, "loss": 1.4632, "step": 17653 }, { "epoch": 1.39, "learning_rate": 0.00016738188233951528, "loss": 1.5281, "step": 17654 }, { "epoch": 1.39, "learning_rate": 0.0001673696058279112, "loss": 1.5473, "step": 17655 }, { "epoch": 1.39, "learning_rate": 0.0001673573291983771, "loss": 1.5614, "step": 17656 }, { "epoch": 1.39, "learning_rate": 0.0001673450524509963, "loss": 1.548, "step": 17657 }, { "epoch": 1.39, "learning_rate": 0.00016733277558585215, "loss": 1.5244, "step": 17658 }, { "epoch": 1.39, "learning_rate": 0.000167320498603028, "loss": 1.5406, "step": 17659 }, { "epoch": 1.39, "learning_rate": 0.00016730822150260726, "loss": 1.535, "step": 17660 }, { "epoch": 1.39, "learning_rate": 0.00016729594428467324, "loss": 1.5062, "step": 17661 }, { "epoch": 1.39, "learning_rate": 0.0001672836669493093, "loss": 1.4609, "step": 17662 }, { "epoch": 1.39, "learning_rate": 0.0001672713894965988, "loss": 1.5677, "step": 17663 }, { "epoch": 1.39, "learning_rate": 0.00016725911192662506, "loss": 1.51, "step": 17664 }, { "epoch": 1.39, "learning_rate": 0.00016724683423947155, "loss": 1.5568, "step": 17665 }, { "epoch": 1.39, "learning_rate": 0.0001672345564352215, "loss": 1.5335, "step": 17666 }, { "epoch": 1.39, "learning_rate": 0.00016722227851395833, "loss": 1.5298, "step": 17667 }, { "epoch": 1.39, "learning_rate": 0.00016721000047576542, "loss": 1.5706, "step": 17668 }, { "epoch": 1.39, "learning_rate": 0.00016719772232072602, "loss": 1.5308, "step": 17669 }, { "epoch": 1.39, "learning_rate": 0.0001671854440489237, "loss": 1.5574, "step": 17670 }, { "epoch": 1.39, "learning_rate": 0.00016717316566044162, "loss": 1.5094, "step": 17671 }, { "epoch": 1.39, "learning_rate": 0.00016716088715536324, "loss": 1.513, "step": 17672 }, { "epoch": 1.39, "learning_rate": 0.00016714860853377192, "loss": 1.5365, "step": 17673 }, { "epoch": 1.39, "learning_rate": 0.00016713632979575098, "loss": 1.5349, "step": 17674 }, { "epoch": 1.39, "learning_rate": 0.00016712405094138384, "loss": 1.4707, "step": 17675 }, { "epoch": 1.39, "learning_rate": 0.00016711177197075382, "loss": 1.5198, "step": 17676 }, { "epoch": 1.39, "learning_rate": 0.00016709949288394436, "loss": 1.5668, "step": 17677 }, { "epoch": 1.39, "learning_rate": 0.00016708721368103872, "loss": 1.5113, "step": 17678 }, { "epoch": 1.39, "learning_rate": 0.00016707493436212033, "loss": 1.5251, "step": 17679 }, { "epoch": 1.39, "learning_rate": 0.00016706265492727265, "loss": 1.5161, "step": 17680 }, { "epoch": 1.39, "learning_rate": 0.00016705037537657885, "loss": 1.5079, "step": 17681 }, { "epoch": 1.39, "learning_rate": 0.00016703809571012247, "loss": 1.5333, "step": 17682 }, { "epoch": 1.39, "learning_rate": 0.0001670258159279868, "loss": 1.5272, "step": 17683 }, { "epoch": 1.39, "learning_rate": 0.00016701353603025524, "loss": 1.4927, "step": 17684 }, { "epoch": 1.39, "learning_rate": 0.00016700125601701118, "loss": 1.5313, "step": 17685 }, { "epoch": 1.39, "learning_rate": 0.00016698897588833793, "loss": 1.5636, "step": 17686 }, { "epoch": 1.39, "learning_rate": 0.00016697669564431897, "loss": 1.5156, "step": 17687 }, { "epoch": 1.39, "learning_rate": 0.00016696441528503756, "loss": 1.5287, "step": 17688 }, { "epoch": 1.39, "learning_rate": 0.00016695213481057714, "loss": 1.4859, "step": 17689 }, { "epoch": 1.39, "learning_rate": 0.0001669398542210211, "loss": 1.5357, "step": 17690 }, { "epoch": 1.39, "learning_rate": 0.0001669275735164528, "loss": 1.5085, "step": 17691 }, { "epoch": 1.39, "learning_rate": 0.00016691529269695563, "loss": 1.5673, "step": 17692 }, { "epoch": 1.39, "learning_rate": 0.0001669030117626129, "loss": 1.4941, "step": 17693 }, { "epoch": 1.39, "learning_rate": 0.0001668907307135081, "loss": 1.5422, "step": 17694 }, { "epoch": 1.39, "learning_rate": 0.00016687844954972454, "loss": 1.4932, "step": 17695 }, { "epoch": 1.39, "learning_rate": 0.00016686616827134559, "loss": 1.5374, "step": 17696 }, { "epoch": 1.39, "learning_rate": 0.00016685388687845472, "loss": 1.4861, "step": 17697 }, { "epoch": 1.39, "learning_rate": 0.00016684160537113523, "loss": 1.5113, "step": 17698 }, { "epoch": 1.39, "learning_rate": 0.00016682932374947052, "loss": 1.5296, "step": 17699 }, { "epoch": 1.39, "learning_rate": 0.00016681704201354405, "loss": 1.488, "step": 17700 }, { "epoch": 1.39, "learning_rate": 0.00016680476016343906, "loss": 1.5556, "step": 17701 }, { "epoch": 1.39, "learning_rate": 0.00016679247819923908, "loss": 1.5163, "step": 17702 }, { "epoch": 1.39, "learning_rate": 0.00016678019612102743, "loss": 1.5054, "step": 17703 }, { "epoch": 1.39, "learning_rate": 0.00016676791392888752, "loss": 1.527, "step": 17704 }, { "epoch": 1.39, "learning_rate": 0.00016675563162290273, "loss": 1.5599, "step": 17705 }, { "epoch": 1.39, "learning_rate": 0.0001667433492031564, "loss": 1.5054, "step": 17706 }, { "epoch": 1.39, "learning_rate": 0.000166731066669732, "loss": 1.5071, "step": 17707 }, { "epoch": 1.39, "learning_rate": 0.00016671878402271288, "loss": 1.5088, "step": 17708 }, { "epoch": 1.39, "learning_rate": 0.00016670650126218248, "loss": 1.5478, "step": 17709 }, { "epoch": 1.39, "learning_rate": 0.00016669421838822412, "loss": 1.5635, "step": 17710 }, { "epoch": 1.39, "learning_rate": 0.0001666819354009212, "loss": 1.5489, "step": 17711 }, { "epoch": 1.39, "learning_rate": 0.00016666965230035722, "loss": 1.5413, "step": 17712 }, { "epoch": 1.39, "learning_rate": 0.00016665736908661542, "loss": 1.5305, "step": 17713 }, { "epoch": 1.39, "learning_rate": 0.00016664508575977937, "loss": 1.526, "step": 17714 }, { "epoch": 1.39, "learning_rate": 0.00016663280231993233, "loss": 1.5493, "step": 17715 }, { "epoch": 1.39, "learning_rate": 0.00016662051876715773, "loss": 1.4558, "step": 17716 }, { "epoch": 1.39, "learning_rate": 0.00016660823510153893, "loss": 1.5332, "step": 17717 }, { "epoch": 1.39, "learning_rate": 0.00016659595132315945, "loss": 1.4958, "step": 17718 }, { "epoch": 1.39, "learning_rate": 0.0001665836674321026, "loss": 1.5456, "step": 17719 }, { "epoch": 1.39, "learning_rate": 0.0001665713834284518, "loss": 1.552, "step": 17720 }, { "epoch": 1.39, "learning_rate": 0.00016655909931229048, "loss": 1.4847, "step": 17721 }, { "epoch": 1.39, "learning_rate": 0.00016654681508370198, "loss": 1.5171, "step": 17722 }, { "epoch": 1.39, "learning_rate": 0.00016653453074276972, "loss": 1.5072, "step": 17723 }, { "epoch": 1.39, "learning_rate": 0.00016652224628957714, "loss": 1.5711, "step": 17724 }, { "epoch": 1.39, "learning_rate": 0.00016650996172420764, "loss": 1.4921, "step": 17725 }, { "epoch": 1.39, "learning_rate": 0.00016649767704674458, "loss": 1.5267, "step": 17726 }, { "epoch": 1.39, "learning_rate": 0.00016648539225727144, "loss": 1.548, "step": 17727 }, { "epoch": 1.39, "learning_rate": 0.00016647310735587152, "loss": 1.5009, "step": 17728 }, { "epoch": 1.39, "learning_rate": 0.00016646082234262838, "loss": 1.521, "step": 17729 }, { "epoch": 1.4, "learning_rate": 0.0001664485372176253, "loss": 1.4739, "step": 17730 }, { "epoch": 1.4, "learning_rate": 0.00016643625198094572, "loss": 1.515, "step": 17731 }, { "epoch": 1.4, "learning_rate": 0.000166423966632673, "loss": 1.4861, "step": 17732 }, { "epoch": 1.4, "learning_rate": 0.0001664116811728907, "loss": 1.5258, "step": 17733 }, { "epoch": 1.4, "learning_rate": 0.00016639939560168213, "loss": 1.5329, "step": 17734 }, { "epoch": 1.4, "learning_rate": 0.00016638710991913065, "loss": 1.5259, "step": 17735 }, { "epoch": 1.4, "learning_rate": 0.00016637482412531983, "loss": 1.4902, "step": 17736 }, { "epoch": 1.4, "learning_rate": 0.00016636253822033294, "loss": 1.5349, "step": 17737 }, { "epoch": 1.4, "learning_rate": 0.00016635025220425344, "loss": 1.5358, "step": 17738 }, { "epoch": 1.4, "learning_rate": 0.00016633796607716476, "loss": 1.536, "step": 17739 }, { "epoch": 1.4, "learning_rate": 0.00016632567983915027, "loss": 1.5587, "step": 17740 }, { "epoch": 1.4, "learning_rate": 0.00016631339349029348, "loss": 1.5244, "step": 17741 }, { "epoch": 1.4, "learning_rate": 0.00016630110703067772, "loss": 1.4981, "step": 17742 }, { "epoch": 1.4, "learning_rate": 0.00016628882046038648, "loss": 1.5432, "step": 17743 }, { "epoch": 1.4, "learning_rate": 0.0001662765337795031, "loss": 1.4834, "step": 17744 }, { "epoch": 1.4, "learning_rate": 0.000166264246988111, "loss": 1.5487, "step": 17745 }, { "epoch": 1.4, "learning_rate": 0.00016625196008629374, "loss": 1.527, "step": 17746 }, { "epoch": 1.4, "learning_rate": 0.00016623967307413456, "loss": 1.5179, "step": 17747 }, { "epoch": 1.4, "learning_rate": 0.00016622738595171698, "loss": 1.5105, "step": 17748 }, { "epoch": 1.4, "learning_rate": 0.00016621509871912437, "loss": 1.565, "step": 17749 }, { "epoch": 1.4, "learning_rate": 0.00016620281137644024, "loss": 1.4826, "step": 17750 }, { "epoch": 1.4, "learning_rate": 0.00016619052392374795, "loss": 1.5001, "step": 17751 }, { "epoch": 1.4, "learning_rate": 0.00016617823636113092, "loss": 1.5121, "step": 17752 }, { "epoch": 1.4, "learning_rate": 0.00016616594868867267, "loss": 1.5559, "step": 17753 }, { "epoch": 1.4, "learning_rate": 0.00016615366090645645, "loss": 1.4834, "step": 17754 }, { "epoch": 1.4, "learning_rate": 0.00016614137301456582, "loss": 1.4894, "step": 17755 }, { "epoch": 1.4, "learning_rate": 0.00016612908501308419, "loss": 1.5266, "step": 17756 }, { "epoch": 1.4, "learning_rate": 0.00016611679690209494, "loss": 1.5491, "step": 17757 }, { "epoch": 1.4, "learning_rate": 0.00016610450868168156, "loss": 1.5069, "step": 17758 }, { "epoch": 1.4, "learning_rate": 0.00016609222035192744, "loss": 1.5373, "step": 17759 }, { "epoch": 1.4, "learning_rate": 0.00016607993191291605, "loss": 1.5376, "step": 17760 }, { "epoch": 1.4, "learning_rate": 0.0001660676433647308, "loss": 1.5801, "step": 17761 }, { "epoch": 1.4, "learning_rate": 0.00016605535470745505, "loss": 1.5326, "step": 17762 }, { "epoch": 1.4, "learning_rate": 0.00016604306594117239, "loss": 1.5356, "step": 17763 }, { "epoch": 1.4, "learning_rate": 0.00016603077706596605, "loss": 1.5699, "step": 17764 }, { "epoch": 1.4, "learning_rate": 0.0001660184880819197, "loss": 1.4911, "step": 17765 }, { "epoch": 1.4, "learning_rate": 0.00016600619898911662, "loss": 1.526, "step": 17766 }, { "epoch": 1.4, "learning_rate": 0.00016599390978764024, "loss": 1.5352, "step": 17767 }, { "epoch": 1.4, "learning_rate": 0.00016598162047757407, "loss": 1.5559, "step": 17768 }, { "epoch": 1.4, "learning_rate": 0.00016596933105900152, "loss": 1.526, "step": 17769 }, { "epoch": 1.4, "learning_rate": 0.00016595704153200608, "loss": 1.5629, "step": 17770 }, { "epoch": 1.4, "learning_rate": 0.00016594475189667102, "loss": 1.5353, "step": 17771 }, { "epoch": 1.4, "learning_rate": 0.00016593246215307998, "loss": 1.5621, "step": 17772 }, { "epoch": 1.4, "learning_rate": 0.00016592017230131624, "loss": 1.5282, "step": 17773 }, { "epoch": 1.4, "learning_rate": 0.00016590788234146337, "loss": 1.5276, "step": 17774 }, { "epoch": 1.4, "learning_rate": 0.00016589559227360475, "loss": 1.5485, "step": 17775 }, { "epoch": 1.4, "learning_rate": 0.00016588330209782383, "loss": 1.5558, "step": 17776 }, { "epoch": 1.4, "learning_rate": 0.0001658710118142041, "loss": 1.4528, "step": 17777 }, { "epoch": 1.4, "learning_rate": 0.00016585872142282887, "loss": 1.4797, "step": 17778 }, { "epoch": 1.4, "learning_rate": 0.0001658464309237817, "loss": 1.6063, "step": 17779 }, { "epoch": 1.4, "learning_rate": 0.00016583414031714604, "loss": 1.524, "step": 17780 }, { "epoch": 1.4, "learning_rate": 0.00016582184960300527, "loss": 1.5382, "step": 17781 }, { "epoch": 1.4, "learning_rate": 0.00016580955878144288, "loss": 1.5602, "step": 17782 }, { "epoch": 1.4, "learning_rate": 0.00016579726785254234, "loss": 1.5449, "step": 17783 }, { "epoch": 1.4, "learning_rate": 0.000165784976816387, "loss": 1.5068, "step": 17784 }, { "epoch": 1.4, "learning_rate": 0.0001657726856730605, "loss": 1.555, "step": 17785 }, { "epoch": 1.4, "learning_rate": 0.00016576039442264606, "loss": 1.5495, "step": 17786 }, { "epoch": 1.4, "learning_rate": 0.00016574810306522726, "loss": 1.4981, "step": 17787 }, { "epoch": 1.4, "learning_rate": 0.00016573581160088754, "loss": 1.547, "step": 17788 }, { "epoch": 1.4, "learning_rate": 0.00016572352002971037, "loss": 1.556, "step": 17789 }, { "epoch": 1.4, "learning_rate": 0.00016571122835177914, "loss": 1.504, "step": 17790 }, { "epoch": 1.4, "learning_rate": 0.00016569893656717737, "loss": 1.5472, "step": 17791 }, { "epoch": 1.4, "learning_rate": 0.00016568664467598847, "loss": 1.5291, "step": 17792 }, { "epoch": 1.4, "learning_rate": 0.0001656743526782959, "loss": 1.508, "step": 17793 }, { "epoch": 1.4, "learning_rate": 0.0001656620605741831, "loss": 1.5247, "step": 17794 }, { "epoch": 1.4, "learning_rate": 0.00016564976836373359, "loss": 1.5337, "step": 17795 }, { "epoch": 1.4, "learning_rate": 0.00016563747604703076, "loss": 1.5347, "step": 17796 }, { "epoch": 1.4, "learning_rate": 0.00016562518362415814, "loss": 1.4746, "step": 17797 }, { "epoch": 1.4, "learning_rate": 0.00016561289109519913, "loss": 1.5107, "step": 17798 }, { "epoch": 1.4, "learning_rate": 0.00016560059846023725, "loss": 1.5381, "step": 17799 }, { "epoch": 1.4, "learning_rate": 0.00016558830571935582, "loss": 1.5172, "step": 17800 }, { "epoch": 1.4, "learning_rate": 0.00016557601287263844, "loss": 1.5339, "step": 17801 }, { "epoch": 1.4, "learning_rate": 0.00016556371992016856, "loss": 1.446, "step": 17802 }, { "epoch": 1.4, "learning_rate": 0.00016555142686202953, "loss": 1.5049, "step": 17803 }, { "epoch": 1.4, "learning_rate": 0.00016553913369830495, "loss": 1.4869, "step": 17804 }, { "epoch": 1.4, "learning_rate": 0.00016552684042907823, "loss": 1.5156, "step": 17805 }, { "epoch": 1.4, "learning_rate": 0.00016551454705443286, "loss": 1.4509, "step": 17806 }, { "epoch": 1.4, "learning_rate": 0.00016550225357445222, "loss": 1.5559, "step": 17807 }, { "epoch": 1.4, "learning_rate": 0.00016548995998921985, "loss": 1.5252, "step": 17808 }, { "epoch": 1.4, "learning_rate": 0.00016547766629881923, "loss": 1.5498, "step": 17809 }, { "epoch": 1.4, "learning_rate": 0.00016546537250333376, "loss": 1.523, "step": 17810 }, { "epoch": 1.4, "learning_rate": 0.00016545307860284694, "loss": 1.4884, "step": 17811 }, { "epoch": 1.4, "learning_rate": 0.00016544078459744226, "loss": 1.5367, "step": 17812 }, { "epoch": 1.4, "learning_rate": 0.00016542849048720317, "loss": 1.5366, "step": 17813 }, { "epoch": 1.4, "learning_rate": 0.00016541619627221318, "loss": 1.576, "step": 17814 }, { "epoch": 1.4, "learning_rate": 0.00016540390195255564, "loss": 1.521, "step": 17815 }, { "epoch": 1.4, "learning_rate": 0.00016539160752831423, "loss": 1.5324, "step": 17816 }, { "epoch": 1.4, "learning_rate": 0.0001653793129995722, "loss": 1.5606, "step": 17817 }, { "epoch": 1.4, "learning_rate": 0.00016536701836641313, "loss": 1.53, "step": 17818 }, { "epoch": 1.4, "learning_rate": 0.0001653547236289205, "loss": 1.5343, "step": 17819 }, { "epoch": 1.4, "learning_rate": 0.00016534242878717776, "loss": 1.5441, "step": 17820 }, { "epoch": 1.4, "learning_rate": 0.00016533013384126844, "loss": 1.5381, "step": 17821 }, { "epoch": 1.4, "learning_rate": 0.00016531783879127591, "loss": 1.5287, "step": 17822 }, { "epoch": 1.4, "learning_rate": 0.00016530554363728377, "loss": 1.5185, "step": 17823 }, { "epoch": 1.4, "learning_rate": 0.0001652932483793754, "loss": 1.5345, "step": 17824 }, { "epoch": 1.4, "learning_rate": 0.0001652809530176343, "loss": 1.5548, "step": 17825 }, { "epoch": 1.4, "learning_rate": 0.000165268657552144, "loss": 1.5583, "step": 17826 }, { "epoch": 1.4, "learning_rate": 0.0001652563619829879, "loss": 1.5628, "step": 17827 }, { "epoch": 1.4, "learning_rate": 0.00016524406631024955, "loss": 1.5419, "step": 17828 }, { "epoch": 1.4, "learning_rate": 0.00016523177053401239, "loss": 1.5493, "step": 17829 }, { "epoch": 1.4, "learning_rate": 0.00016521947465435993, "loss": 1.535, "step": 17830 }, { "epoch": 1.4, "learning_rate": 0.0001652071786713756, "loss": 1.4931, "step": 17831 }, { "epoch": 1.4, "learning_rate": 0.00016519488258514293, "loss": 1.5399, "step": 17832 }, { "epoch": 1.4, "learning_rate": 0.00016518258639574546, "loss": 1.5807, "step": 17833 }, { "epoch": 1.4, "learning_rate": 0.0001651702901032665, "loss": 1.4953, "step": 17834 }, { "epoch": 1.4, "learning_rate": 0.00016515799370778972, "loss": 1.5375, "step": 17835 }, { "epoch": 1.4, "learning_rate": 0.0001651456972093985, "loss": 1.5701, "step": 17836 }, { "epoch": 1.4, "learning_rate": 0.00016513340060817633, "loss": 1.5419, "step": 17837 }, { "epoch": 1.4, "learning_rate": 0.00016512110390420675, "loss": 1.5334, "step": 17838 }, { "epoch": 1.4, "learning_rate": 0.00016510880709757323, "loss": 1.5005, "step": 17839 }, { "epoch": 1.4, "learning_rate": 0.00016509651018835922, "loss": 1.5476, "step": 17840 }, { "epoch": 1.4, "learning_rate": 0.00016508421317664826, "loss": 1.4998, "step": 17841 }, { "epoch": 1.4, "learning_rate": 0.00016507191606252378, "loss": 1.5244, "step": 17842 }, { "epoch": 1.4, "learning_rate": 0.00016505961884606934, "loss": 1.5675, "step": 17843 }, { "epoch": 1.4, "learning_rate": 0.00016504732152736838, "loss": 1.5314, "step": 17844 }, { "epoch": 1.4, "learning_rate": 0.00016503502410650445, "loss": 1.533, "step": 17845 }, { "epoch": 1.4, "learning_rate": 0.00016502272658356097, "loss": 1.505, "step": 17846 }, { "epoch": 1.4, "learning_rate": 0.00016501042895862147, "loss": 1.5114, "step": 17847 }, { "epoch": 1.4, "learning_rate": 0.00016499813123176942, "loss": 1.508, "step": 17848 }, { "epoch": 1.4, "learning_rate": 0.00016498583340308838, "loss": 1.5202, "step": 17849 }, { "epoch": 1.4, "learning_rate": 0.00016497353547266177, "loss": 1.5023, "step": 17850 }, { "epoch": 1.4, "learning_rate": 0.00016496123744057313, "loss": 1.5569, "step": 17851 }, { "epoch": 1.4, "learning_rate": 0.0001649489393069059, "loss": 1.5299, "step": 17852 }, { "epoch": 1.4, "learning_rate": 0.0001649366410717437, "loss": 1.5084, "step": 17853 }, { "epoch": 1.4, "learning_rate": 0.0001649243427351699, "loss": 1.4912, "step": 17854 }, { "epoch": 1.4, "learning_rate": 0.00016491204429726808, "loss": 1.5459, "step": 17855 }, { "epoch": 1.4, "learning_rate": 0.0001648997457581217, "loss": 1.5043, "step": 17856 }, { "epoch": 1.41, "learning_rate": 0.00016488744711781424, "loss": 1.5447, "step": 17857 }, { "epoch": 1.41, "learning_rate": 0.00016487514837642924, "loss": 1.5229, "step": 17858 }, { "epoch": 1.41, "learning_rate": 0.0001648628495340502, "loss": 1.5091, "step": 17859 }, { "epoch": 1.41, "learning_rate": 0.00016485055059076064, "loss": 1.5032, "step": 17860 }, { "epoch": 1.41, "learning_rate": 0.000164838251546644, "loss": 1.5107, "step": 17861 }, { "epoch": 1.41, "learning_rate": 0.00016482595240178383, "loss": 1.4618, "step": 17862 }, { "epoch": 1.41, "learning_rate": 0.00016481365315626362, "loss": 1.5024, "step": 17863 }, { "epoch": 1.41, "learning_rate": 0.00016480135381016686, "loss": 1.5168, "step": 17864 }, { "epoch": 1.41, "learning_rate": 0.00016478905436357713, "loss": 1.5071, "step": 17865 }, { "epoch": 1.41, "learning_rate": 0.0001647767548165778, "loss": 1.5558, "step": 17866 }, { "epoch": 1.41, "learning_rate": 0.00016476445516925255, "loss": 1.5141, "step": 17867 }, { "epoch": 1.41, "learning_rate": 0.00016475215542168477, "loss": 1.5115, "step": 17868 }, { "epoch": 1.41, "learning_rate": 0.00016473985557395796, "loss": 1.515, "step": 17869 }, { "epoch": 1.41, "learning_rate": 0.0001647275556261557, "loss": 1.5137, "step": 17870 }, { "epoch": 1.41, "learning_rate": 0.00016471525557836144, "loss": 1.4616, "step": 17871 }, { "epoch": 1.41, "learning_rate": 0.00016470295543065877, "loss": 1.5569, "step": 17872 }, { "epoch": 1.41, "learning_rate": 0.00016469065518313108, "loss": 1.5379, "step": 17873 }, { "epoch": 1.41, "learning_rate": 0.00016467835483586197, "loss": 1.5526, "step": 17874 }, { "epoch": 1.41, "learning_rate": 0.00016466605438893492, "loss": 1.5346, "step": 17875 }, { "epoch": 1.41, "learning_rate": 0.00016465375384243347, "loss": 1.4748, "step": 17876 }, { "epoch": 1.41, "learning_rate": 0.0001646414531964411, "loss": 1.5469, "step": 17877 }, { "epoch": 1.41, "learning_rate": 0.0001646291524510414, "loss": 1.5632, "step": 17878 }, { "epoch": 1.41, "learning_rate": 0.00016461685160631774, "loss": 1.5036, "step": 17879 }, { "epoch": 1.41, "learning_rate": 0.00016460455066235382, "loss": 1.5238, "step": 17880 }, { "epoch": 1.41, "learning_rate": 0.00016459224961923297, "loss": 1.4855, "step": 17881 }, { "epoch": 1.41, "learning_rate": 0.00016457994847703884, "loss": 1.4829, "step": 17882 }, { "epoch": 1.41, "learning_rate": 0.0001645676472358549, "loss": 1.4841, "step": 17883 }, { "epoch": 1.41, "learning_rate": 0.0001645553458957647, "loss": 1.4838, "step": 17884 }, { "epoch": 1.41, "learning_rate": 0.0001645430444568517, "loss": 1.5752, "step": 17885 }, { "epoch": 1.41, "learning_rate": 0.00016453074291919946, "loss": 1.5069, "step": 17886 }, { "epoch": 1.41, "learning_rate": 0.00016451844128289152, "loss": 1.5307, "step": 17887 }, { "epoch": 1.41, "learning_rate": 0.00016450613954801138, "loss": 1.4894, "step": 17888 }, { "epoch": 1.41, "learning_rate": 0.00016449383771464249, "loss": 1.4983, "step": 17889 }, { "epoch": 1.41, "learning_rate": 0.0001644815357828685, "loss": 1.5483, "step": 17890 }, { "epoch": 1.41, "learning_rate": 0.00016446923375277285, "loss": 1.5061, "step": 17891 }, { "epoch": 1.41, "learning_rate": 0.0001644569316244391, "loss": 1.4869, "step": 17892 }, { "epoch": 1.41, "learning_rate": 0.00016444462939795075, "loss": 1.519, "step": 17893 }, { "epoch": 1.41, "learning_rate": 0.00016443232707339137, "loss": 1.5212, "step": 17894 }, { "epoch": 1.41, "learning_rate": 0.00016442002465084444, "loss": 1.521, "step": 17895 }, { "epoch": 1.41, "learning_rate": 0.00016440772213039347, "loss": 1.529, "step": 17896 }, { "epoch": 1.41, "learning_rate": 0.000164395419512122, "loss": 1.4673, "step": 17897 }, { "epoch": 1.41, "learning_rate": 0.00016438311679611362, "loss": 1.4759, "step": 17898 }, { "epoch": 1.41, "learning_rate": 0.00016437081398245184, "loss": 1.5137, "step": 17899 }, { "epoch": 1.41, "learning_rate": 0.0001643585110712201, "loss": 1.5071, "step": 17900 }, { "epoch": 1.41, "learning_rate": 0.00016434620806250207, "loss": 1.5076, "step": 17901 }, { "epoch": 1.41, "learning_rate": 0.0001643339049563811, "loss": 1.5405, "step": 17902 }, { "epoch": 1.41, "learning_rate": 0.00016432160175294092, "loss": 1.4751, "step": 17903 }, { "epoch": 1.41, "learning_rate": 0.00016430929845226492, "loss": 1.4663, "step": 17904 }, { "epoch": 1.41, "learning_rate": 0.00016429699505443666, "loss": 1.5043, "step": 17905 }, { "epoch": 1.41, "learning_rate": 0.00016428469155953978, "loss": 1.4971, "step": 17906 }, { "epoch": 1.41, "learning_rate": 0.00016427238796765762, "loss": 1.53, "step": 17907 }, { "epoch": 1.41, "learning_rate": 0.0001642600842788739, "loss": 1.4734, "step": 17908 }, { "epoch": 1.41, "learning_rate": 0.00016424778049327205, "loss": 1.5172, "step": 17909 }, { "epoch": 1.41, "learning_rate": 0.00016423547661093563, "loss": 1.5166, "step": 17910 }, { "epoch": 1.41, "learning_rate": 0.0001642231726319482, "loss": 1.5459, "step": 17911 }, { "epoch": 1.41, "learning_rate": 0.00016421086855639326, "loss": 1.5174, "step": 17912 }, { "epoch": 1.41, "learning_rate": 0.00016419856438435436, "loss": 1.5131, "step": 17913 }, { "epoch": 1.41, "learning_rate": 0.00016418626011591503, "loss": 1.4838, "step": 17914 }, { "epoch": 1.41, "learning_rate": 0.0001641739557511588, "loss": 1.5464, "step": 17915 }, { "epoch": 1.41, "learning_rate": 0.00016416165129016933, "loss": 1.4939, "step": 17916 }, { "epoch": 1.41, "learning_rate": 0.00016414934673302997, "loss": 1.5694, "step": 17917 }, { "epoch": 1.41, "learning_rate": 0.00016413704207982442, "loss": 1.5155, "step": 17918 }, { "epoch": 1.41, "learning_rate": 0.00016412473733063614, "loss": 1.5316, "step": 17919 }, { "epoch": 1.41, "learning_rate": 0.00016411243248554865, "loss": 1.5142, "step": 17920 }, { "epoch": 1.41, "learning_rate": 0.00016410012754464553, "loss": 1.4547, "step": 17921 }, { "epoch": 1.41, "learning_rate": 0.00016408782250801034, "loss": 1.5323, "step": 17922 }, { "epoch": 1.41, "learning_rate": 0.00016407551737572667, "loss": 1.5182, "step": 17923 }, { "epoch": 1.41, "learning_rate": 0.00016406321214787792, "loss": 1.51, "step": 17924 }, { "epoch": 1.41, "learning_rate": 0.00016405090682454775, "loss": 1.5081, "step": 17925 }, { "epoch": 1.41, "learning_rate": 0.0001640386014058197, "loss": 1.5066, "step": 17926 }, { "epoch": 1.41, "learning_rate": 0.00016402629589177726, "loss": 1.5271, "step": 17927 }, { "epoch": 1.41, "learning_rate": 0.00016401399028250407, "loss": 1.4333, "step": 17928 }, { "epoch": 1.41, "learning_rate": 0.0001640016845780835, "loss": 1.5216, "step": 17929 }, { "epoch": 1.41, "learning_rate": 0.00016398937877859932, "loss": 1.5597, "step": 17930 }, { "epoch": 1.41, "learning_rate": 0.00016397707288413494, "loss": 1.474, "step": 17931 }, { "epoch": 1.41, "learning_rate": 0.00016396476689477395, "loss": 1.4478, "step": 17932 }, { "epoch": 1.41, "learning_rate": 0.00016395246081059994, "loss": 1.5455, "step": 17933 }, { "epoch": 1.41, "learning_rate": 0.0001639401546316964, "loss": 1.5129, "step": 17934 }, { "epoch": 1.41, "learning_rate": 0.00016392784835814685, "loss": 1.5635, "step": 17935 }, { "epoch": 1.41, "learning_rate": 0.00016391554199003493, "loss": 1.5371, "step": 17936 }, { "epoch": 1.41, "learning_rate": 0.0001639032355274442, "loss": 1.559, "step": 17937 }, { "epoch": 1.41, "learning_rate": 0.00016389092897045815, "loss": 1.4796, "step": 17938 }, { "epoch": 1.41, "learning_rate": 0.00016387862231916032, "loss": 1.5294, "step": 17939 }, { "epoch": 1.41, "learning_rate": 0.00016386631557363434, "loss": 1.5699, "step": 17940 }, { "epoch": 1.41, "learning_rate": 0.00016385400873396373, "loss": 1.5134, "step": 17941 }, { "epoch": 1.41, "learning_rate": 0.00016384170180023202, "loss": 1.5157, "step": 17942 }, { "epoch": 1.41, "learning_rate": 0.00016382939477252282, "loss": 1.6142, "step": 17943 }, { "epoch": 1.41, "learning_rate": 0.00016381708765091964, "loss": 1.5579, "step": 17944 }, { "epoch": 1.41, "learning_rate": 0.00016380478043550608, "loss": 1.5161, "step": 17945 }, { "epoch": 1.41, "learning_rate": 0.00016379247312636567, "loss": 1.4985, "step": 17946 }, { "epoch": 1.41, "learning_rate": 0.00016378016572358195, "loss": 1.5347, "step": 17947 }, { "epoch": 1.41, "learning_rate": 0.00016376785822723856, "loss": 1.5268, "step": 17948 }, { "epoch": 1.41, "learning_rate": 0.000163755550637419, "loss": 1.4809, "step": 17949 }, { "epoch": 1.41, "learning_rate": 0.00016374324295420685, "loss": 1.528, "step": 17950 }, { "epoch": 1.41, "learning_rate": 0.00016373093517768562, "loss": 1.5315, "step": 17951 }, { "epoch": 1.41, "learning_rate": 0.00016371862730793895, "loss": 1.5681, "step": 17952 }, { "epoch": 1.41, "learning_rate": 0.00016370631934505036, "loss": 1.5139, "step": 17953 }, { "epoch": 1.41, "learning_rate": 0.00016369401128910342, "loss": 1.5488, "step": 17954 }, { "epoch": 1.41, "learning_rate": 0.00016368170314018173, "loss": 1.5109, "step": 17955 }, { "epoch": 1.41, "learning_rate": 0.00016366939489836877, "loss": 1.5453, "step": 17956 }, { "epoch": 1.41, "learning_rate": 0.00016365708656374822, "loss": 1.5188, "step": 17957 }, { "epoch": 1.41, "learning_rate": 0.00016364477813640355, "loss": 1.5198, "step": 17958 }, { "epoch": 1.41, "learning_rate": 0.00016363246961641838, "loss": 1.4592, "step": 17959 }, { "epoch": 1.41, "learning_rate": 0.00016362016100387628, "loss": 1.5217, "step": 17960 }, { "epoch": 1.41, "learning_rate": 0.00016360785229886074, "loss": 1.536, "step": 17961 }, { "epoch": 1.41, "learning_rate": 0.0001635955435014555, "loss": 1.5417, "step": 17962 }, { "epoch": 1.41, "learning_rate": 0.00016358323461174393, "loss": 1.4889, "step": 17963 }, { "epoch": 1.41, "learning_rate": 0.00016357092562980973, "loss": 1.5123, "step": 17964 }, { "epoch": 1.41, "learning_rate": 0.00016355861655573643, "loss": 1.5503, "step": 17965 }, { "epoch": 1.41, "learning_rate": 0.00016354630738960765, "loss": 1.5804, "step": 17966 }, { "epoch": 1.41, "learning_rate": 0.00016353399813150686, "loss": 1.5006, "step": 17967 }, { "epoch": 1.41, "learning_rate": 0.00016352168878151768, "loss": 1.53, "step": 17968 }, { "epoch": 1.41, "learning_rate": 0.00016350937933972375, "loss": 1.5629, "step": 17969 }, { "epoch": 1.41, "learning_rate": 0.00016349706980620855, "loss": 1.5346, "step": 17970 }, { "epoch": 1.41, "learning_rate": 0.0001634847601810557, "loss": 1.501, "step": 17971 }, { "epoch": 1.41, "learning_rate": 0.0001634724504643488, "loss": 1.5079, "step": 17972 }, { "epoch": 1.41, "learning_rate": 0.00016346014065617135, "loss": 1.5392, "step": 17973 }, { "epoch": 1.41, "learning_rate": 0.00016344783075660703, "loss": 1.5597, "step": 17974 }, { "epoch": 1.41, "learning_rate": 0.0001634355207657393, "loss": 1.5536, "step": 17975 }, { "epoch": 1.41, "learning_rate": 0.00016342321068365178, "loss": 1.5294, "step": 17976 }, { "epoch": 1.41, "learning_rate": 0.00016341090051042814, "loss": 1.523, "step": 17977 }, { "epoch": 1.41, "learning_rate": 0.00016339859024615185, "loss": 1.5405, "step": 17978 }, { "epoch": 1.41, "learning_rate": 0.00016338627989090652, "loss": 1.5343, "step": 17979 }, { "epoch": 1.41, "learning_rate": 0.00016337396944477575, "loss": 1.4578, "step": 17980 }, { "epoch": 1.41, "learning_rate": 0.0001633616589078431, "loss": 1.5396, "step": 17981 }, { "epoch": 1.41, "learning_rate": 0.0001633493482801922, "loss": 1.519, "step": 17982 }, { "epoch": 1.41, "learning_rate": 0.00016333703756190655, "loss": 1.5027, "step": 17983 }, { "epoch": 1.42, "learning_rate": 0.00016332472675306976, "loss": 1.5273, "step": 17984 }, { "epoch": 1.42, "learning_rate": 0.00016331241585376544, "loss": 1.5029, "step": 17985 }, { "epoch": 1.42, "learning_rate": 0.0001633001048640772, "loss": 1.5218, "step": 17986 }, { "epoch": 1.42, "learning_rate": 0.00016328779378408856, "loss": 1.5636, "step": 17987 }, { "epoch": 1.42, "learning_rate": 0.00016327548261388315, "loss": 1.5112, "step": 17988 }, { "epoch": 1.42, "learning_rate": 0.00016326317135354452, "loss": 1.5881, "step": 17989 }, { "epoch": 1.42, "learning_rate": 0.0001632508600031563, "loss": 1.5075, "step": 17990 }, { "epoch": 1.42, "learning_rate": 0.000163238548562802, "loss": 1.5313, "step": 17991 }, { "epoch": 1.42, "learning_rate": 0.00016322623703256527, "loss": 1.4912, "step": 17992 }, { "epoch": 1.42, "learning_rate": 0.00016321392541252973, "loss": 1.515, "step": 17993 }, { "epoch": 1.42, "learning_rate": 0.00016320161370277894, "loss": 1.5333, "step": 17994 }, { "epoch": 1.42, "learning_rate": 0.0001631893019033964, "loss": 1.4926, "step": 17995 }, { "epoch": 1.42, "learning_rate": 0.00016317699001446587, "loss": 1.5126, "step": 17996 }, { "epoch": 1.42, "learning_rate": 0.0001631646780360708, "loss": 1.5221, "step": 17997 }, { "epoch": 1.42, "learning_rate": 0.00016315236596829483, "loss": 1.5243, "step": 17998 }, { "epoch": 1.42, "learning_rate": 0.00016314005381122155, "loss": 1.536, "step": 17999 }, { "epoch": 1.42, "learning_rate": 0.00016312774156493457, "loss": 1.5241, "step": 18000 }, { "epoch": 1.42, "learning_rate": 0.00016311542922951746, "loss": 1.5134, "step": 18001 }, { "epoch": 1.42, "learning_rate": 0.00016310311680505386, "loss": 1.5492, "step": 18002 }, { "epoch": 1.42, "learning_rate": 0.00016309080429162726, "loss": 1.5285, "step": 18003 }, { "epoch": 1.42, "learning_rate": 0.00016307849168932138, "loss": 1.5442, "step": 18004 }, { "epoch": 1.42, "learning_rate": 0.00016306617899821974, "loss": 1.5305, "step": 18005 }, { "epoch": 1.42, "learning_rate": 0.00016305386621840598, "loss": 1.5252, "step": 18006 }, { "epoch": 1.42, "learning_rate": 0.00016304155334996361, "loss": 1.5581, "step": 18007 }, { "epoch": 1.42, "learning_rate": 0.00016302924039297633, "loss": 1.5699, "step": 18008 }, { "epoch": 1.42, "learning_rate": 0.0001630169273475277, "loss": 1.5246, "step": 18009 }, { "epoch": 1.42, "learning_rate": 0.00016300461421370132, "loss": 1.513, "step": 18010 }, { "epoch": 1.42, "learning_rate": 0.0001629923009915808, "loss": 1.555, "step": 18011 }, { "epoch": 1.42, "learning_rate": 0.00016297998768124967, "loss": 1.4721, "step": 18012 }, { "epoch": 1.42, "learning_rate": 0.00016296767428279163, "loss": 1.5169, "step": 18013 }, { "epoch": 1.42, "learning_rate": 0.00016295536079629022, "loss": 1.5519, "step": 18014 }, { "epoch": 1.42, "learning_rate": 0.0001629430472218291, "loss": 1.5392, "step": 18015 }, { "epoch": 1.42, "learning_rate": 0.00016293073355949178, "loss": 1.5591, "step": 18016 }, { "epoch": 1.42, "learning_rate": 0.00016291841980936193, "loss": 1.5302, "step": 18017 }, { "epoch": 1.42, "learning_rate": 0.00016290610597152316, "loss": 1.5106, "step": 18018 }, { "epoch": 1.42, "learning_rate": 0.00016289379204605903, "loss": 1.5555, "step": 18019 }, { "epoch": 1.42, "learning_rate": 0.00016288147803305314, "loss": 1.5001, "step": 18020 }, { "epoch": 1.42, "learning_rate": 0.00016286916393258919, "loss": 1.4957, "step": 18021 }, { "epoch": 1.42, "learning_rate": 0.00016285684974475068, "loss": 1.523, "step": 18022 }, { "epoch": 1.42, "learning_rate": 0.00016284453546962124, "loss": 1.4991, "step": 18023 }, { "epoch": 1.42, "learning_rate": 0.0001628322211072845, "loss": 1.5326, "step": 18024 }, { "epoch": 1.42, "learning_rate": 0.0001628199066578241, "loss": 1.5346, "step": 18025 }, { "epoch": 1.42, "learning_rate": 0.00016280759212132357, "loss": 1.4949, "step": 18026 }, { "epoch": 1.42, "learning_rate": 0.00016279527749786657, "loss": 1.522, "step": 18027 }, { "epoch": 1.42, "learning_rate": 0.0001627829627875367, "loss": 1.5507, "step": 18028 }, { "epoch": 1.42, "learning_rate": 0.00016277064799041752, "loss": 1.5348, "step": 18029 }, { "epoch": 1.42, "learning_rate": 0.00016275833310659275, "loss": 1.5247, "step": 18030 }, { "epoch": 1.42, "learning_rate": 0.0001627460181361459, "loss": 1.49, "step": 18031 }, { "epoch": 1.42, "learning_rate": 0.00016273370307916062, "loss": 1.5105, "step": 18032 }, { "epoch": 1.42, "learning_rate": 0.00016272138793572058, "loss": 1.5615, "step": 18033 }, { "epoch": 1.42, "learning_rate": 0.00016270907270590928, "loss": 1.4887, "step": 18034 }, { "epoch": 1.42, "learning_rate": 0.00016269675738981042, "loss": 1.5334, "step": 18035 }, { "epoch": 1.42, "learning_rate": 0.00016268444198750756, "loss": 1.5445, "step": 18036 }, { "epoch": 1.42, "learning_rate": 0.00016267212649908434, "loss": 1.5265, "step": 18037 }, { "epoch": 1.42, "learning_rate": 0.00016265981092462444, "loss": 1.5309, "step": 18038 }, { "epoch": 1.42, "learning_rate": 0.0001626474952642113, "loss": 1.5443, "step": 18039 }, { "epoch": 1.42, "learning_rate": 0.0001626351795179287, "loss": 1.512, "step": 18040 }, { "epoch": 1.42, "learning_rate": 0.0001626228636858602, "loss": 1.5762, "step": 18041 }, { "epoch": 1.42, "learning_rate": 0.00016261054776808945, "loss": 1.5445, "step": 18042 }, { "epoch": 1.42, "learning_rate": 0.0001625982317647, "loss": 1.5516, "step": 18043 }, { "epoch": 1.42, "learning_rate": 0.00016258591567577552, "loss": 1.5705, "step": 18044 }, { "epoch": 1.42, "learning_rate": 0.00016257359950139967, "loss": 1.5048, "step": 18045 }, { "epoch": 1.42, "learning_rate": 0.0001625612832416559, "loss": 1.4822, "step": 18046 }, { "epoch": 1.42, "learning_rate": 0.00016254896689662805, "loss": 1.5103, "step": 18047 }, { "epoch": 1.42, "learning_rate": 0.00016253665046639962, "loss": 1.5257, "step": 18048 }, { "epoch": 1.42, "learning_rate": 0.00016252433395105422, "loss": 1.4912, "step": 18049 }, { "epoch": 1.42, "learning_rate": 0.00016251201735067555, "loss": 1.5816, "step": 18050 }, { "epoch": 1.42, "learning_rate": 0.00016249970066534714, "loss": 1.4976, "step": 18051 }, { "epoch": 1.42, "learning_rate": 0.00016248738389515273, "loss": 1.5127, "step": 18052 }, { "epoch": 1.42, "learning_rate": 0.0001624750670401758, "loss": 1.5483, "step": 18053 }, { "epoch": 1.42, "learning_rate": 0.00016246275010050007, "loss": 1.5189, "step": 18054 }, { "epoch": 1.42, "learning_rate": 0.00016245043307620914, "loss": 1.4668, "step": 18055 }, { "epoch": 1.42, "learning_rate": 0.00016243811596738662, "loss": 1.5117, "step": 18056 }, { "epoch": 1.42, "learning_rate": 0.00016242579877411625, "loss": 1.6033, "step": 18057 }, { "epoch": 1.42, "learning_rate": 0.00016241348149648144, "loss": 1.5431, "step": 18058 }, { "epoch": 1.42, "learning_rate": 0.00016240116413456602, "loss": 1.532, "step": 18059 }, { "epoch": 1.42, "learning_rate": 0.00016238884668845355, "loss": 1.5132, "step": 18060 }, { "epoch": 1.42, "learning_rate": 0.0001623765291582276, "loss": 1.5637, "step": 18061 }, { "epoch": 1.42, "learning_rate": 0.00016236421154397187, "loss": 1.5839, "step": 18062 }, { "epoch": 1.42, "learning_rate": 0.00016235189384576992, "loss": 1.5085, "step": 18063 }, { "epoch": 1.42, "learning_rate": 0.00016233957606370548, "loss": 1.5302, "step": 18064 }, { "epoch": 1.42, "learning_rate": 0.00016232725819786213, "loss": 1.5084, "step": 18065 }, { "epoch": 1.42, "learning_rate": 0.0001623149402483235, "loss": 1.5117, "step": 18066 }, { "epoch": 1.42, "learning_rate": 0.0001623026222151732, "loss": 1.4963, "step": 18067 }, { "epoch": 1.42, "learning_rate": 0.00016229030409849489, "loss": 1.5456, "step": 18068 }, { "epoch": 1.42, "learning_rate": 0.00016227798589837222, "loss": 1.4714, "step": 18069 }, { "epoch": 1.42, "learning_rate": 0.00016226566761488875, "loss": 1.535, "step": 18070 }, { "epoch": 1.42, "learning_rate": 0.0001622533492481282, "loss": 1.4948, "step": 18071 }, { "epoch": 1.42, "learning_rate": 0.00016224103079817419, "loss": 1.4804, "step": 18072 }, { "epoch": 1.42, "learning_rate": 0.00016222871226511027, "loss": 1.5199, "step": 18073 }, { "epoch": 1.42, "learning_rate": 0.00016221639364902022, "loss": 1.5129, "step": 18074 }, { "epoch": 1.42, "learning_rate": 0.00016220407494998756, "loss": 1.5556, "step": 18075 }, { "epoch": 1.42, "learning_rate": 0.00016219175616809595, "loss": 1.5904, "step": 18076 }, { "epoch": 1.42, "learning_rate": 0.0001621794373034291, "loss": 1.5117, "step": 18077 }, { "epoch": 1.42, "learning_rate": 0.0001621671183560705, "loss": 1.4538, "step": 18078 }, { "epoch": 1.42, "learning_rate": 0.00016215479932610397, "loss": 1.4816, "step": 18079 }, { "epoch": 1.42, "learning_rate": 0.000162142480213613, "loss": 1.556, "step": 18080 }, { "epoch": 1.42, "learning_rate": 0.00016213016101868135, "loss": 1.5105, "step": 18081 }, { "epoch": 1.42, "learning_rate": 0.00016211784174139255, "loss": 1.5108, "step": 18082 }, { "epoch": 1.42, "learning_rate": 0.00016210552238183032, "loss": 1.567, "step": 18083 }, { "epoch": 1.42, "learning_rate": 0.00016209320294007827, "loss": 1.5303, "step": 18084 }, { "epoch": 1.42, "learning_rate": 0.00016208088341622003, "loss": 1.5312, "step": 18085 }, { "epoch": 1.42, "learning_rate": 0.00016206856381033926, "loss": 1.5181, "step": 18086 }, { "epoch": 1.42, "learning_rate": 0.00016205624412251958, "loss": 1.5665, "step": 18087 }, { "epoch": 1.42, "learning_rate": 0.00016204392435284468, "loss": 1.5549, "step": 18088 }, { "epoch": 1.42, "learning_rate": 0.0001620316045013982, "loss": 1.5216, "step": 18089 }, { "epoch": 1.42, "learning_rate": 0.00016201928456826374, "loss": 1.5467, "step": 18090 }, { "epoch": 1.42, "learning_rate": 0.00016200696455352502, "loss": 1.4764, "step": 18091 }, { "epoch": 1.42, "learning_rate": 0.00016199464445726557, "loss": 1.5297, "step": 18092 }, { "epoch": 1.42, "learning_rate": 0.00016198232427956915, "loss": 1.5387, "step": 18093 }, { "epoch": 1.42, "learning_rate": 0.00016197000402051932, "loss": 1.5692, "step": 18094 }, { "epoch": 1.42, "learning_rate": 0.00016195768368019976, "loss": 1.517, "step": 18095 }, { "epoch": 1.42, "learning_rate": 0.00016194536325869418, "loss": 1.5426, "step": 18096 }, { "epoch": 1.42, "learning_rate": 0.00016193304275608612, "loss": 1.5522, "step": 18097 }, { "epoch": 1.42, "learning_rate": 0.00016192072217245936, "loss": 1.5226, "step": 18098 }, { "epoch": 1.42, "learning_rate": 0.00016190840150789743, "loss": 1.5558, "step": 18099 }, { "epoch": 1.42, "learning_rate": 0.00016189608076248402, "loss": 1.5449, "step": 18100 }, { "epoch": 1.42, "learning_rate": 0.00016188375993630278, "loss": 1.5519, "step": 18101 }, { "epoch": 1.42, "learning_rate": 0.00016187143902943735, "loss": 1.5134, "step": 18102 }, { "epoch": 1.42, "learning_rate": 0.00016185911804197147, "loss": 1.4988, "step": 18103 }, { "epoch": 1.42, "learning_rate": 0.00016184679697398867, "loss": 1.4935, "step": 18104 }, { "epoch": 1.42, "learning_rate": 0.00016183447582557265, "loss": 1.5327, "step": 18105 }, { "epoch": 1.42, "learning_rate": 0.00016182215459680711, "loss": 1.5117, "step": 18106 }, { "epoch": 1.42, "learning_rate": 0.00016180983328777562, "loss": 1.5146, "step": 18107 }, { "epoch": 1.42, "learning_rate": 0.00016179751189856193, "loss": 1.4741, "step": 18108 }, { "epoch": 1.42, "learning_rate": 0.00016178519042924958, "loss": 1.5158, "step": 18109 }, { "epoch": 1.42, "learning_rate": 0.00016177286887992235, "loss": 1.481, "step": 18110 }, { "epoch": 1.42, "learning_rate": 0.0001617605472506638, "loss": 1.4964, "step": 18111 }, { "epoch": 1.43, "learning_rate": 0.00016174822554155765, "loss": 1.5199, "step": 18112 }, { "epoch": 1.43, "learning_rate": 0.00016173590375268755, "loss": 1.5429, "step": 18113 }, { "epoch": 1.43, "learning_rate": 0.00016172358188413708, "loss": 1.5291, "step": 18114 }, { "epoch": 1.43, "learning_rate": 0.00016171125993598998, "loss": 1.5396, "step": 18115 }, { "epoch": 1.43, "learning_rate": 0.0001616989379083299, "loss": 1.4699, "step": 18116 }, { "epoch": 1.43, "learning_rate": 0.00016168661580124048, "loss": 1.5617, "step": 18117 }, { "epoch": 1.43, "learning_rate": 0.0001616742936148054, "loss": 1.5212, "step": 18118 }, { "epoch": 1.43, "learning_rate": 0.00016166197134910828, "loss": 1.4964, "step": 18119 }, { "epoch": 1.43, "learning_rate": 0.00016164964900423285, "loss": 1.5749, "step": 18120 }, { "epoch": 1.43, "learning_rate": 0.0001616373265802627, "loss": 1.5337, "step": 18121 }, { "epoch": 1.43, "learning_rate": 0.00016162500407728155, "loss": 1.5339, "step": 18122 }, { "epoch": 1.43, "learning_rate": 0.00016161268149537304, "loss": 1.4823, "step": 18123 }, { "epoch": 1.43, "learning_rate": 0.00016160035883462081, "loss": 1.5517, "step": 18124 }, { "epoch": 1.43, "learning_rate": 0.00016158803609510854, "loss": 1.4869, "step": 18125 }, { "epoch": 1.43, "learning_rate": 0.0001615757132769199, "loss": 1.5179, "step": 18126 }, { "epoch": 1.43, "learning_rate": 0.00016156339038013857, "loss": 1.524, "step": 18127 }, { "epoch": 1.43, "learning_rate": 0.00016155106740484824, "loss": 1.5582, "step": 18128 }, { "epoch": 1.43, "learning_rate": 0.00016153874435113246, "loss": 1.5462, "step": 18129 }, { "epoch": 1.43, "learning_rate": 0.000161526421219075, "loss": 1.4984, "step": 18130 }, { "epoch": 1.43, "learning_rate": 0.00016151409800875953, "loss": 1.604, "step": 18131 }, { "epoch": 1.43, "learning_rate": 0.00016150177472026966, "loss": 1.5653, "step": 18132 }, { "epoch": 1.43, "learning_rate": 0.00016148945135368908, "loss": 1.53, "step": 18133 }, { "epoch": 1.43, "learning_rate": 0.00016147712790910145, "loss": 1.4409, "step": 18134 }, { "epoch": 1.43, "learning_rate": 0.0001614648043865905, "loss": 1.5302, "step": 18135 }, { "epoch": 1.43, "learning_rate": 0.00016145248078623987, "loss": 1.5586, "step": 18136 }, { "epoch": 1.43, "learning_rate": 0.0001614401571081332, "loss": 1.5014, "step": 18137 }, { "epoch": 1.43, "learning_rate": 0.00016142783335235412, "loss": 1.6021, "step": 18138 }, { "epoch": 1.43, "learning_rate": 0.0001614155095189864, "loss": 1.5256, "step": 18139 }, { "epoch": 1.43, "learning_rate": 0.0001614031856081137, "loss": 1.498, "step": 18140 }, { "epoch": 1.43, "learning_rate": 0.0001613908616198196, "loss": 1.5037, "step": 18141 }, { "epoch": 1.43, "learning_rate": 0.00016137853755418787, "loss": 1.5684, "step": 18142 }, { "epoch": 1.43, "learning_rate": 0.00016136621341130214, "loss": 1.5393, "step": 18143 }, { "epoch": 1.43, "learning_rate": 0.0001613538891912461, "loss": 1.5646, "step": 18144 }, { "epoch": 1.43, "learning_rate": 0.00016134156489410343, "loss": 1.5486, "step": 18145 }, { "epoch": 1.43, "learning_rate": 0.00016132924051995778, "loss": 1.5544, "step": 18146 }, { "epoch": 1.43, "learning_rate": 0.00016131691606889286, "loss": 1.5228, "step": 18147 }, { "epoch": 1.43, "learning_rate": 0.0001613045915409923, "loss": 1.5119, "step": 18148 }, { "epoch": 1.43, "learning_rate": 0.00016129226693633979, "loss": 1.521, "step": 18149 }, { "epoch": 1.43, "learning_rate": 0.000161279942255019, "loss": 1.5208, "step": 18150 }, { "epoch": 1.43, "learning_rate": 0.00016126761749711368, "loss": 1.5461, "step": 18151 }, { "epoch": 1.43, "learning_rate": 0.00016125529266270745, "loss": 1.4802, "step": 18152 }, { "epoch": 1.43, "learning_rate": 0.00016124296775188394, "loss": 1.5758, "step": 18153 }, { "epoch": 1.43, "learning_rate": 0.000161230642764727, "loss": 1.4978, "step": 18154 }, { "epoch": 1.43, "learning_rate": 0.00016121831770132009, "loss": 1.5425, "step": 18155 }, { "epoch": 1.43, "learning_rate": 0.000161205992561747, "loss": 1.5304, "step": 18156 }, { "epoch": 1.43, "learning_rate": 0.00016119366734609143, "loss": 1.526, "step": 18157 }, { "epoch": 1.43, "learning_rate": 0.000161181342054437, "loss": 1.5109, "step": 18158 }, { "epoch": 1.43, "learning_rate": 0.0001611690166868675, "loss": 1.5731, "step": 18159 }, { "epoch": 1.43, "learning_rate": 0.0001611566912434665, "loss": 1.5047, "step": 18160 }, { "epoch": 1.43, "learning_rate": 0.00016114436572431772, "loss": 1.498, "step": 18161 }, { "epoch": 1.43, "learning_rate": 0.00016113204012950486, "loss": 1.4861, "step": 18162 }, { "epoch": 1.43, "learning_rate": 0.00016111971445911157, "loss": 1.5575, "step": 18163 }, { "epoch": 1.43, "learning_rate": 0.00016110738871322156, "loss": 1.5183, "step": 18164 }, { "epoch": 1.43, "learning_rate": 0.0001610950628919185, "loss": 1.5162, "step": 18165 }, { "epoch": 1.43, "learning_rate": 0.00016108273699528612, "loss": 1.506, "step": 18166 }, { "epoch": 1.43, "learning_rate": 0.00016107041102340805, "loss": 1.5037, "step": 18167 }, { "epoch": 1.43, "learning_rate": 0.00016105808497636799, "loss": 1.4851, "step": 18168 }, { "epoch": 1.43, "learning_rate": 0.00016104575885424966, "loss": 1.535, "step": 18169 }, { "epoch": 1.43, "learning_rate": 0.0001610334326571367, "loss": 1.5403, "step": 18170 }, { "epoch": 1.43, "learning_rate": 0.00016102110638511284, "loss": 1.5356, "step": 18171 }, { "epoch": 1.43, "learning_rate": 0.0001610087800382617, "loss": 1.507, "step": 18172 }, { "epoch": 1.43, "learning_rate": 0.00016099645361666707, "loss": 1.5578, "step": 18173 }, { "epoch": 1.43, "learning_rate": 0.0001609841271204126, "loss": 1.5187, "step": 18174 }, { "epoch": 1.43, "learning_rate": 0.00016097180054958193, "loss": 1.5365, "step": 18175 }, { "epoch": 1.43, "learning_rate": 0.00016095947390425884, "loss": 1.5027, "step": 18176 }, { "epoch": 1.43, "learning_rate": 0.00016094714718452693, "loss": 1.5093, "step": 18177 }, { "epoch": 1.43, "learning_rate": 0.0001609348203904699, "loss": 1.4697, "step": 18178 }, { "epoch": 1.43, "learning_rate": 0.00016092249352217156, "loss": 1.5371, "step": 18179 }, { "epoch": 1.43, "learning_rate": 0.0001609101665797154, "loss": 1.5951, "step": 18180 }, { "epoch": 1.43, "learning_rate": 0.00016089783956318535, "loss": 1.5544, "step": 18181 }, { "epoch": 1.43, "learning_rate": 0.00016088551247266488, "loss": 1.4883, "step": 18182 }, { "epoch": 1.43, "learning_rate": 0.0001608731853082379, "loss": 1.5357, "step": 18183 }, { "epoch": 1.43, "learning_rate": 0.00016086085806998792, "loss": 1.4837, "step": 18184 }, { "epoch": 1.43, "learning_rate": 0.0001608485307579987, "loss": 1.5129, "step": 18185 }, { "epoch": 1.43, "learning_rate": 0.00016083620337235398, "loss": 1.5201, "step": 18186 }, { "epoch": 1.43, "learning_rate": 0.00016082387591313737, "loss": 1.4947, "step": 18187 }, { "epoch": 1.43, "learning_rate": 0.00016081154838043266, "loss": 1.4996, "step": 18188 }, { "epoch": 1.43, "learning_rate": 0.00016079922077432348, "loss": 1.5884, "step": 18189 }, { "epoch": 1.43, "learning_rate": 0.00016078689309489353, "loss": 1.4987, "step": 18190 }, { "epoch": 1.43, "learning_rate": 0.0001607745653422266, "loss": 1.5661, "step": 18191 }, { "epoch": 1.43, "learning_rate": 0.00016076223751640626, "loss": 1.4776, "step": 18192 }, { "epoch": 1.43, "learning_rate": 0.0001607499096175163, "loss": 1.4784, "step": 18193 }, { "epoch": 1.43, "learning_rate": 0.00016073758164564033, "loss": 1.5772, "step": 18194 }, { "epoch": 1.43, "learning_rate": 0.00016072525360086214, "loss": 1.5419, "step": 18195 }, { "epoch": 1.43, "learning_rate": 0.0001607129254832654, "loss": 1.4795, "step": 18196 }, { "epoch": 1.43, "learning_rate": 0.00016070059729293378, "loss": 1.4601, "step": 18197 }, { "epoch": 1.43, "learning_rate": 0.00016068826902995107, "loss": 1.5245, "step": 18198 }, { "epoch": 1.43, "learning_rate": 0.0001606759406944009, "loss": 1.5005, "step": 18199 }, { "epoch": 1.43, "learning_rate": 0.00016066361228636692, "loss": 1.5211, "step": 18200 }, { "epoch": 1.43, "learning_rate": 0.00016065128380593298, "loss": 1.504, "step": 18201 }, { "epoch": 1.43, "learning_rate": 0.00016063895525318263, "loss": 1.5804, "step": 18202 }, { "epoch": 1.43, "learning_rate": 0.00016062662662819972, "loss": 1.5222, "step": 18203 }, { "epoch": 1.43, "learning_rate": 0.00016061429793106776, "loss": 1.4743, "step": 18204 }, { "epoch": 1.43, "learning_rate": 0.00016060196916187067, "loss": 1.6002, "step": 18205 }, { "epoch": 1.43, "learning_rate": 0.00016058964032069205, "loss": 1.5704, "step": 18206 }, { "epoch": 1.43, "learning_rate": 0.0001605773114076156, "loss": 1.5039, "step": 18207 }, { "epoch": 1.43, "learning_rate": 0.00016056498242272504, "loss": 1.5555, "step": 18208 }, { "epoch": 1.43, "learning_rate": 0.0001605526533661041, "loss": 1.4598, "step": 18209 }, { "epoch": 1.43, "learning_rate": 0.00016054032423783648, "loss": 1.4721, "step": 18210 }, { "epoch": 1.43, "learning_rate": 0.00016052799503800578, "loss": 1.4736, "step": 18211 }, { "epoch": 1.43, "learning_rate": 0.0001605156657666959, "loss": 1.513, "step": 18212 }, { "epoch": 1.43, "learning_rate": 0.00016050333642399044, "loss": 1.4814, "step": 18213 }, { "epoch": 1.43, "learning_rate": 0.0001604910070099731, "loss": 1.4774, "step": 18214 }, { "epoch": 1.43, "learning_rate": 0.00016047867752472765, "loss": 1.5372, "step": 18215 }, { "epoch": 1.43, "learning_rate": 0.00016046634796833772, "loss": 1.5248, "step": 18216 }, { "epoch": 1.43, "learning_rate": 0.00016045401834088703, "loss": 1.5564, "step": 18217 }, { "epoch": 1.43, "learning_rate": 0.0001604416886424594, "loss": 1.5166, "step": 18218 }, { "epoch": 1.43, "learning_rate": 0.0001604293588731384, "loss": 1.5444, "step": 18219 }, { "epoch": 1.43, "learning_rate": 0.00016041702903300787, "loss": 1.4943, "step": 18220 }, { "epoch": 1.43, "learning_rate": 0.00016040469912215142, "loss": 1.4876, "step": 18221 }, { "epoch": 1.43, "learning_rate": 0.00016039236914065284, "loss": 1.5203, "step": 18222 }, { "epoch": 1.43, "learning_rate": 0.00016038003908859576, "loss": 1.5411, "step": 18223 }, { "epoch": 1.43, "learning_rate": 0.000160367708966064, "loss": 1.5446, "step": 18224 }, { "epoch": 1.43, "learning_rate": 0.0001603553787731412, "loss": 1.5477, "step": 18225 }, { "epoch": 1.43, "learning_rate": 0.00016034304850991106, "loss": 1.5555, "step": 18226 }, { "epoch": 1.43, "learning_rate": 0.00016033071817645735, "loss": 1.5256, "step": 18227 }, { "epoch": 1.43, "learning_rate": 0.00016031838777286377, "loss": 1.6021, "step": 18228 }, { "epoch": 1.43, "learning_rate": 0.000160306057299214, "loss": 1.5348, "step": 18229 }, { "epoch": 1.43, "learning_rate": 0.00016029372675559184, "loss": 1.5798, "step": 18230 }, { "epoch": 1.43, "learning_rate": 0.0001602813961420809, "loss": 1.4998, "step": 18231 }, { "epoch": 1.43, "learning_rate": 0.00016026906545876503, "loss": 1.4936, "step": 18232 }, { "epoch": 1.43, "learning_rate": 0.00016025673470572782, "loss": 1.5366, "step": 18233 }, { "epoch": 1.43, "learning_rate": 0.000160244403883053, "loss": 1.4507, "step": 18234 }, { "epoch": 1.43, "learning_rate": 0.00016023207299082438, "loss": 1.5251, "step": 18235 }, { "epoch": 1.43, "learning_rate": 0.00016021974202912564, "loss": 1.5448, "step": 18236 }, { "epoch": 1.43, "learning_rate": 0.0001602074109980405, "loss": 1.5494, "step": 18237 }, { "epoch": 1.43, "learning_rate": 0.00016019507989765261, "loss": 1.5501, "step": 18238 }, { "epoch": 1.44, "learning_rate": 0.00016018274872804585, "loss": 1.5355, "step": 18239 }, { "epoch": 1.44, "learning_rate": 0.0001601704174893038, "loss": 1.5767, "step": 18240 }, { "epoch": 1.44, "learning_rate": 0.00016015808618151018, "loss": 1.5325, "step": 18241 }, { "epoch": 1.44, "learning_rate": 0.00016014575480474883, "loss": 1.5685, "step": 18242 }, { "epoch": 1.44, "learning_rate": 0.00016013342335910333, "loss": 1.5301, "step": 18243 }, { "epoch": 1.44, "learning_rate": 0.00016012109184465755, "loss": 1.4817, "step": 18244 }, { "epoch": 1.44, "learning_rate": 0.0001601087602614951, "loss": 1.5511, "step": 18245 }, { "epoch": 1.44, "learning_rate": 0.00016009642860969974, "loss": 1.5371, "step": 18246 }, { "epoch": 1.44, "learning_rate": 0.00016008409688935524, "loss": 1.4936, "step": 18247 }, { "epoch": 1.44, "learning_rate": 0.00016007176510054528, "loss": 1.522, "step": 18248 }, { "epoch": 1.44, "learning_rate": 0.0001600594332433536, "loss": 1.5744, "step": 18249 }, { "epoch": 1.44, "learning_rate": 0.0001600471013178639, "loss": 1.5666, "step": 18250 }, { "epoch": 1.44, "learning_rate": 0.0001600347693241599, "loss": 1.5009, "step": 18251 }, { "epoch": 1.44, "learning_rate": 0.00016002243726232537, "loss": 1.499, "step": 18252 }, { "epoch": 1.44, "learning_rate": 0.00016001010513244405, "loss": 1.4907, "step": 18253 }, { "epoch": 1.44, "learning_rate": 0.00015999777293459962, "loss": 1.5355, "step": 18254 }, { "epoch": 1.44, "learning_rate": 0.00015998544066887584, "loss": 1.5465, "step": 18255 }, { "epoch": 1.44, "learning_rate": 0.0001599731083353564, "loss": 1.4528, "step": 18256 }, { "epoch": 1.44, "learning_rate": 0.00015996077593412512, "loss": 1.4916, "step": 18257 }, { "epoch": 1.44, "learning_rate": 0.00015994844346526557, "loss": 1.5139, "step": 18258 }, { "epoch": 1.44, "learning_rate": 0.00015993611092886167, "loss": 1.5104, "step": 18259 }, { "epoch": 1.44, "learning_rate": 0.000159923778324997, "loss": 1.5134, "step": 18260 }, { "epoch": 1.44, "learning_rate": 0.0001599114456537554, "loss": 1.5124, "step": 18261 }, { "epoch": 1.44, "learning_rate": 0.00015989911291522052, "loss": 1.5257, "step": 18262 }, { "epoch": 1.44, "learning_rate": 0.00015988678010947613, "loss": 1.5103, "step": 18263 }, { "epoch": 1.44, "learning_rate": 0.00015987444723660597, "loss": 1.5215, "step": 18264 }, { "epoch": 1.44, "learning_rate": 0.00015986211429669375, "loss": 1.5098, "step": 18265 }, { "epoch": 1.44, "learning_rate": 0.00015984978128982322, "loss": 1.5341, "step": 18266 }, { "epoch": 1.44, "learning_rate": 0.0001598374482160781, "loss": 1.5112, "step": 18267 }, { "epoch": 1.44, "learning_rate": 0.00015982511507554214, "loss": 1.5398, "step": 18268 }, { "epoch": 1.44, "learning_rate": 0.00015981278186829912, "loss": 1.4462, "step": 18269 }, { "epoch": 1.44, "learning_rate": 0.00015980044859443269, "loss": 1.5259, "step": 18270 }, { "epoch": 1.44, "learning_rate": 0.00015978811525402663, "loss": 1.5091, "step": 18271 }, { "epoch": 1.44, "learning_rate": 0.00015977578184716464, "loss": 1.5084, "step": 18272 }, { "epoch": 1.44, "learning_rate": 0.00015976344837393048, "loss": 1.487, "step": 18273 }, { "epoch": 1.44, "learning_rate": 0.00015975111483440793, "loss": 1.5205, "step": 18274 }, { "epoch": 1.44, "learning_rate": 0.00015973878122868066, "loss": 1.5164, "step": 18275 }, { "epoch": 1.44, "learning_rate": 0.00015972644755683248, "loss": 1.5241, "step": 18276 }, { "epoch": 1.44, "learning_rate": 0.0001597141138189471, "loss": 1.5361, "step": 18277 }, { "epoch": 1.44, "learning_rate": 0.0001597017800151082, "loss": 1.5736, "step": 18278 }, { "epoch": 1.44, "learning_rate": 0.00015968944614539956, "loss": 1.4561, "step": 18279 }, { "epoch": 1.44, "learning_rate": 0.00015967711220990494, "loss": 1.5149, "step": 18280 }, { "epoch": 1.44, "learning_rate": 0.00015966477820870812, "loss": 1.5356, "step": 18281 }, { "epoch": 1.44, "learning_rate": 0.0001596524441418927, "loss": 1.4704, "step": 18282 }, { "epoch": 1.44, "learning_rate": 0.0001596401100095426, "loss": 1.4897, "step": 18283 }, { "epoch": 1.44, "learning_rate": 0.00015962777581174142, "loss": 1.5498, "step": 18284 }, { "epoch": 1.44, "learning_rate": 0.00015961544154857293, "loss": 1.5769, "step": 18285 }, { "epoch": 1.44, "learning_rate": 0.00015960310722012096, "loss": 1.467, "step": 18286 }, { "epoch": 1.44, "learning_rate": 0.00015959077282646917, "loss": 1.5439, "step": 18287 }, { "epoch": 1.44, "learning_rate": 0.00015957843836770136, "loss": 1.5664, "step": 18288 }, { "epoch": 1.44, "learning_rate": 0.00015956610384390118, "loss": 1.4974, "step": 18289 }, { "epoch": 1.44, "learning_rate": 0.00015955376925515244, "loss": 1.5422, "step": 18290 }, { "epoch": 1.44, "learning_rate": 0.0001595414346015389, "loss": 1.4635, "step": 18291 }, { "epoch": 1.44, "learning_rate": 0.00015952909988314426, "loss": 1.5003, "step": 18292 }, { "epoch": 1.44, "learning_rate": 0.00015951676510005233, "loss": 1.5555, "step": 18293 }, { "epoch": 1.44, "learning_rate": 0.00015950443025234678, "loss": 1.5508, "step": 18294 }, { "epoch": 1.44, "learning_rate": 0.0001594920953401114, "loss": 1.513, "step": 18295 }, { "epoch": 1.44, "learning_rate": 0.00015947976036342996, "loss": 1.5119, "step": 18296 }, { "epoch": 1.44, "learning_rate": 0.00015946742532238617, "loss": 1.4915, "step": 18297 }, { "epoch": 1.44, "learning_rate": 0.00015945509021706377, "loss": 1.5352, "step": 18298 }, { "epoch": 1.44, "learning_rate": 0.00015944275504754652, "loss": 1.5344, "step": 18299 }, { "epoch": 1.44, "learning_rate": 0.00015943041981391818, "loss": 1.4539, "step": 18300 }, { "epoch": 1.44, "learning_rate": 0.0001594180845162625, "loss": 1.5189, "step": 18301 }, { "epoch": 1.44, "learning_rate": 0.0001594057491546632, "loss": 1.5021, "step": 18302 }, { "epoch": 1.44, "learning_rate": 0.0001593934137292041, "loss": 1.5041, "step": 18303 }, { "epoch": 1.44, "learning_rate": 0.00015938107823996886, "loss": 1.455, "step": 18304 }, { "epoch": 1.44, "learning_rate": 0.00015936874268704135, "loss": 1.5012, "step": 18305 }, { "epoch": 1.44, "learning_rate": 0.00015935640707050514, "loss": 1.5443, "step": 18306 }, { "epoch": 1.44, "learning_rate": 0.00015934407139044416, "loss": 1.4868, "step": 18307 }, { "epoch": 1.44, "learning_rate": 0.00015933173564694207, "loss": 1.5086, "step": 18308 }, { "epoch": 1.44, "learning_rate": 0.00015931939984008262, "loss": 1.4964, "step": 18309 }, { "epoch": 1.44, "learning_rate": 0.00015930706396994964, "loss": 1.5494, "step": 18310 }, { "epoch": 1.44, "learning_rate": 0.00015929472803662682, "loss": 1.5113, "step": 18311 }, { "epoch": 1.44, "learning_rate": 0.00015928239204019792, "loss": 1.5683, "step": 18312 }, { "epoch": 1.44, "learning_rate": 0.00015927005598074672, "loss": 1.561, "step": 18313 }, { "epoch": 1.44, "learning_rate": 0.00015925771985835687, "loss": 1.5105, "step": 18314 }, { "epoch": 1.44, "learning_rate": 0.0001592453836731123, "loss": 1.5882, "step": 18315 }, { "epoch": 1.44, "learning_rate": 0.00015923304742509664, "loss": 1.4719, "step": 18316 }, { "epoch": 1.44, "learning_rate": 0.0001592207111143937, "loss": 1.5264, "step": 18317 }, { "epoch": 1.44, "learning_rate": 0.0001592083747410872, "loss": 1.5489, "step": 18318 }, { "epoch": 1.44, "learning_rate": 0.0001591960383052609, "loss": 1.5316, "step": 18319 }, { "epoch": 1.44, "learning_rate": 0.00015918370180699863, "loss": 1.5094, "step": 18320 }, { "epoch": 1.44, "learning_rate": 0.00015917136524638405, "loss": 1.5548, "step": 18321 }, { "epoch": 1.44, "learning_rate": 0.000159159028623501, "loss": 1.5511, "step": 18322 }, { "epoch": 1.44, "learning_rate": 0.00015914669193843316, "loss": 1.554, "step": 18323 }, { "epoch": 1.44, "learning_rate": 0.00015913435519126435, "loss": 1.5284, "step": 18324 }, { "epoch": 1.44, "learning_rate": 0.00015912201838207832, "loss": 1.5427, "step": 18325 }, { "epoch": 1.44, "learning_rate": 0.00015910968151095878, "loss": 1.4935, "step": 18326 }, { "epoch": 1.44, "learning_rate": 0.00015909734457798957, "loss": 1.5239, "step": 18327 }, { "epoch": 1.44, "learning_rate": 0.00015908500758325442, "loss": 1.5106, "step": 18328 }, { "epoch": 1.44, "learning_rate": 0.00015907267052683703, "loss": 1.5101, "step": 18329 }, { "epoch": 1.44, "learning_rate": 0.00015906033340882123, "loss": 1.5172, "step": 18330 }, { "epoch": 1.44, "learning_rate": 0.00015904799622929076, "loss": 1.554, "step": 18331 }, { "epoch": 1.44, "learning_rate": 0.00015903565898832942, "loss": 1.5144, "step": 18332 }, { "epoch": 1.44, "learning_rate": 0.00015902332168602095, "loss": 1.5006, "step": 18333 }, { "epoch": 1.44, "learning_rate": 0.00015901098432244908, "loss": 1.5364, "step": 18334 }, { "epoch": 1.44, "learning_rate": 0.00015899864689769758, "loss": 1.5238, "step": 18335 }, { "epoch": 1.44, "learning_rate": 0.00015898630941185027, "loss": 1.4959, "step": 18336 }, { "epoch": 1.44, "learning_rate": 0.00015897397186499083, "loss": 1.5736, "step": 18337 }, { "epoch": 1.44, "learning_rate": 0.0001589616342572031, "loss": 1.5033, "step": 18338 }, { "epoch": 1.44, "learning_rate": 0.00015894929658857087, "loss": 1.4745, "step": 18339 }, { "epoch": 1.44, "learning_rate": 0.0001589369588591778, "loss": 1.5898, "step": 18340 }, { "epoch": 1.44, "learning_rate": 0.0001589246210691077, "loss": 1.5147, "step": 18341 }, { "epoch": 1.44, "learning_rate": 0.00015891228321844437, "loss": 1.5294, "step": 18342 }, { "epoch": 1.44, "learning_rate": 0.00015889994530727156, "loss": 1.5262, "step": 18343 }, { "epoch": 1.44, "learning_rate": 0.00015888760733567307, "loss": 1.5077, "step": 18344 }, { "epoch": 1.44, "learning_rate": 0.00015887526930373253, "loss": 1.5599, "step": 18345 }, { "epoch": 1.44, "learning_rate": 0.0001588629312115339, "loss": 1.4666, "step": 18346 }, { "epoch": 1.44, "learning_rate": 0.00015885059305916082, "loss": 1.5386, "step": 18347 }, { "epoch": 1.44, "learning_rate": 0.0001588382548466971, "loss": 1.5233, "step": 18348 }, { "epoch": 1.44, "learning_rate": 0.00015882591657422654, "loss": 1.5366, "step": 18349 }, { "epoch": 1.44, "learning_rate": 0.0001588135782418328, "loss": 1.4977, "step": 18350 }, { "epoch": 1.44, "learning_rate": 0.00015880123984959982, "loss": 1.4853, "step": 18351 }, { "epoch": 1.44, "learning_rate": 0.00015878890139761121, "loss": 1.5634, "step": 18352 }, { "epoch": 1.44, "learning_rate": 0.00015877656288595078, "loss": 1.495, "step": 18353 }, { "epoch": 1.44, "learning_rate": 0.00015876422431470243, "loss": 1.4737, "step": 18354 }, { "epoch": 1.44, "learning_rate": 0.00015875188568394976, "loss": 1.5278, "step": 18355 }, { "epoch": 1.44, "learning_rate": 0.00015873954699377666, "loss": 1.5395, "step": 18356 }, { "epoch": 1.44, "learning_rate": 0.00015872720824426683, "loss": 1.5662, "step": 18357 }, { "epoch": 1.44, "learning_rate": 0.00015871486943550407, "loss": 1.5348, "step": 18358 }, { "epoch": 1.44, "learning_rate": 0.00015870253056757223, "loss": 1.5271, "step": 18359 }, { "epoch": 1.44, "learning_rate": 0.00015869019164055492, "loss": 1.5123, "step": 18360 }, { "epoch": 1.44, "learning_rate": 0.00015867785265453603, "loss": 1.552, "step": 18361 }, { "epoch": 1.44, "learning_rate": 0.0001586655136095993, "loss": 1.5236, "step": 18362 }, { "epoch": 1.44, "learning_rate": 0.00015865317450582854, "loss": 1.5505, "step": 18363 }, { "epoch": 1.44, "learning_rate": 0.0001586408353433075, "loss": 1.5589, "step": 18364 }, { "epoch": 1.44, "learning_rate": 0.0001586284961221199, "loss": 1.5331, "step": 18365 }, { "epoch": 1.45, "learning_rate": 0.00015861615684234964, "loss": 1.5027, "step": 18366 }, { "epoch": 1.45, "learning_rate": 0.00015860381750408043, "loss": 1.5066, "step": 18367 }, { "epoch": 1.45, "learning_rate": 0.00015859147810739599, "loss": 1.5208, "step": 18368 }, { "epoch": 1.45, "learning_rate": 0.0001585791386523802, "loss": 1.5124, "step": 18369 }, { "epoch": 1.45, "learning_rate": 0.00015856679913911676, "loss": 1.499, "step": 18370 }, { "epoch": 1.45, "learning_rate": 0.0001585544595676895, "loss": 1.4659, "step": 18371 }, { "epoch": 1.45, "learning_rate": 0.0001585421199381822, "loss": 1.5514, "step": 18372 }, { "epoch": 1.45, "learning_rate": 0.0001585297802506786, "loss": 1.5361, "step": 18373 }, { "epoch": 1.45, "learning_rate": 0.00015851744050526253, "loss": 1.5277, "step": 18374 }, { "epoch": 1.45, "learning_rate": 0.00015850510070201766, "loss": 1.5434, "step": 18375 }, { "epoch": 1.45, "learning_rate": 0.00015849276084102792, "loss": 1.5471, "step": 18376 }, { "epoch": 1.45, "learning_rate": 0.00015848042092237696, "loss": 1.5412, "step": 18377 }, { "epoch": 1.45, "learning_rate": 0.00015846808094614872, "loss": 1.528, "step": 18378 }, { "epoch": 1.45, "learning_rate": 0.0001584557409124268, "loss": 1.4718, "step": 18379 }, { "epoch": 1.45, "learning_rate": 0.0001584434008212951, "loss": 1.5059, "step": 18380 }, { "epoch": 1.45, "learning_rate": 0.0001584310606728374, "loss": 1.5476, "step": 18381 }, { "epoch": 1.45, "learning_rate": 0.0001584187204671374, "loss": 1.5422, "step": 18382 }, { "epoch": 1.45, "learning_rate": 0.00015840638020427896, "loss": 1.5065, "step": 18383 }, { "epoch": 1.45, "learning_rate": 0.0001583940398843458, "loss": 1.5497, "step": 18384 }, { "epoch": 1.45, "learning_rate": 0.00015838169950742177, "loss": 1.5303, "step": 18385 }, { "epoch": 1.45, "learning_rate": 0.00015836935907359058, "loss": 1.5821, "step": 18386 }, { "epoch": 1.45, "learning_rate": 0.0001583570185829361, "loss": 1.4968, "step": 18387 }, { "epoch": 1.45, "learning_rate": 0.00015834467803554211, "loss": 1.5369, "step": 18388 }, { "epoch": 1.45, "learning_rate": 0.0001583323374314923, "loss": 1.5282, "step": 18389 }, { "epoch": 1.45, "learning_rate": 0.00015831999677087057, "loss": 1.5335, "step": 18390 }, { "epoch": 1.45, "learning_rate": 0.00015830765605376063, "loss": 1.5448, "step": 18391 }, { "epoch": 1.45, "learning_rate": 0.00015829531528024627, "loss": 1.5249, "step": 18392 }, { "epoch": 1.45, "learning_rate": 0.00015828297445041133, "loss": 1.5552, "step": 18393 }, { "epoch": 1.45, "learning_rate": 0.0001582706335643395, "loss": 1.5694, "step": 18394 }, { "epoch": 1.45, "learning_rate": 0.0001582582926221147, "loss": 1.5194, "step": 18395 }, { "epoch": 1.45, "learning_rate": 0.00015824595162382062, "loss": 1.5426, "step": 18396 }, { "epoch": 1.45, "learning_rate": 0.00015823361056954108, "loss": 1.5219, "step": 18397 }, { "epoch": 1.45, "learning_rate": 0.0001582212694593599, "loss": 1.538, "step": 18398 }, { "epoch": 1.45, "learning_rate": 0.00015820892829336081, "loss": 1.5479, "step": 18399 }, { "epoch": 1.45, "learning_rate": 0.00015819658707162763, "loss": 1.5045, "step": 18400 }, { "epoch": 1.45, "learning_rate": 0.00015818424579424413, "loss": 1.5251, "step": 18401 }, { "epoch": 1.45, "learning_rate": 0.0001581719044612942, "loss": 1.5016, "step": 18402 }, { "epoch": 1.45, "learning_rate": 0.00015815956307286145, "loss": 1.5382, "step": 18403 }, { "epoch": 1.45, "learning_rate": 0.0001581472216290298, "loss": 1.5605, "step": 18404 }, { "epoch": 1.45, "learning_rate": 0.00015813488012988302, "loss": 1.4537, "step": 18405 }, { "epoch": 1.45, "learning_rate": 0.0001581225385755049, "loss": 1.5217, "step": 18406 }, { "epoch": 1.45, "learning_rate": 0.0001581101969659792, "loss": 1.5176, "step": 18407 }, { "epoch": 1.45, "learning_rate": 0.00015809785530138972, "loss": 1.5417, "step": 18408 }, { "epoch": 1.45, "learning_rate": 0.0001580855135818203, "loss": 1.4983, "step": 18409 }, { "epoch": 1.45, "learning_rate": 0.00015807317180735472, "loss": 1.5643, "step": 18410 }, { "epoch": 1.45, "learning_rate": 0.00015806082997807676, "loss": 1.5653, "step": 18411 }, { "epoch": 1.45, "learning_rate": 0.00015804848809407022, "loss": 1.4866, "step": 18412 }, { "epoch": 1.45, "learning_rate": 0.00015803614615541884, "loss": 1.5215, "step": 18413 }, { "epoch": 1.45, "learning_rate": 0.00015802380416220647, "loss": 1.4794, "step": 18414 }, { "epoch": 1.45, "learning_rate": 0.00015801146211451696, "loss": 1.5618, "step": 18415 }, { "epoch": 1.45, "learning_rate": 0.00015799912001243397, "loss": 1.5264, "step": 18416 }, { "epoch": 1.45, "learning_rate": 0.00015798677785604142, "loss": 1.5325, "step": 18417 }, { "epoch": 1.45, "learning_rate": 0.00015797443564542304, "loss": 1.5, "step": 18418 }, { "epoch": 1.45, "learning_rate": 0.00015796209338066265, "loss": 1.5277, "step": 18419 }, { "epoch": 1.45, "learning_rate": 0.000157949751061844, "loss": 1.5011, "step": 18420 }, { "epoch": 1.45, "learning_rate": 0.00015793740868905095, "loss": 1.5034, "step": 18421 }, { "epoch": 1.45, "learning_rate": 0.00015792506626236731, "loss": 1.4961, "step": 18422 }, { "epoch": 1.45, "learning_rate": 0.0001579127237818768, "loss": 1.4607, "step": 18423 }, { "epoch": 1.45, "learning_rate": 0.00015790038124766328, "loss": 1.5298, "step": 18424 }, { "epoch": 1.45, "learning_rate": 0.00015788803865981053, "loss": 1.5173, "step": 18425 }, { "epoch": 1.45, "learning_rate": 0.00015787569601840234, "loss": 1.5528, "step": 18426 }, { "epoch": 1.45, "learning_rate": 0.00015786335332352251, "loss": 1.5607, "step": 18427 }, { "epoch": 1.45, "learning_rate": 0.00015785101057525487, "loss": 1.5008, "step": 18428 }, { "epoch": 1.45, "learning_rate": 0.00015783866777368323, "loss": 1.4762, "step": 18429 }, { "epoch": 1.45, "learning_rate": 0.00015782632491889132, "loss": 1.5158, "step": 18430 }, { "epoch": 1.45, "learning_rate": 0.000157813982010963, "loss": 1.5353, "step": 18431 }, { "epoch": 1.45, "learning_rate": 0.00015780163904998204, "loss": 1.5412, "step": 18432 }, { "epoch": 1.45, "learning_rate": 0.00015778929603603225, "loss": 1.5146, "step": 18433 }, { "epoch": 1.45, "learning_rate": 0.00015777695296919747, "loss": 1.5214, "step": 18434 }, { "epoch": 1.45, "learning_rate": 0.00015776460984956144, "loss": 1.5287, "step": 18435 }, { "epoch": 1.45, "learning_rate": 0.000157752266677208, "loss": 1.534, "step": 18436 }, { "epoch": 1.45, "learning_rate": 0.00015773992345222094, "loss": 1.4948, "step": 18437 }, { "epoch": 1.45, "learning_rate": 0.00015772758017468412, "loss": 1.4976, "step": 18438 }, { "epoch": 1.45, "learning_rate": 0.00015771523684468124, "loss": 1.4924, "step": 18439 }, { "epoch": 1.45, "learning_rate": 0.00015770289346229616, "loss": 1.5534, "step": 18440 }, { "epoch": 1.45, "learning_rate": 0.00015769055002761272, "loss": 1.5112, "step": 18441 }, { "epoch": 1.45, "learning_rate": 0.00015767820654071467, "loss": 1.5149, "step": 18442 }, { "epoch": 1.45, "learning_rate": 0.00015766586300168582, "loss": 1.509, "step": 18443 }, { "epoch": 1.45, "learning_rate": 0.00015765351941061004, "loss": 1.499, "step": 18444 }, { "epoch": 1.45, "learning_rate": 0.00015764117576757105, "loss": 1.5159, "step": 18445 }, { "epoch": 1.45, "learning_rate": 0.0001576288320726527, "loss": 1.5331, "step": 18446 }, { "epoch": 1.45, "learning_rate": 0.00015761648832593878, "loss": 1.5105, "step": 18447 }, { "epoch": 1.45, "learning_rate": 0.00015760414452751313, "loss": 1.5321, "step": 18448 }, { "epoch": 1.45, "learning_rate": 0.00015759180067745948, "loss": 1.5286, "step": 18449 }, { "epoch": 1.45, "learning_rate": 0.00015757945677586174, "loss": 1.5066, "step": 18450 }, { "epoch": 1.45, "learning_rate": 0.0001575671128228037, "loss": 1.5256, "step": 18451 }, { "epoch": 1.45, "learning_rate": 0.0001575547688183691, "loss": 1.5347, "step": 18452 }, { "epoch": 1.45, "learning_rate": 0.0001575424247626418, "loss": 1.5588, "step": 18453 }, { "epoch": 1.45, "learning_rate": 0.0001575300806557056, "loss": 1.6047, "step": 18454 }, { "epoch": 1.45, "learning_rate": 0.00015751773649764423, "loss": 1.543, "step": 18455 }, { "epoch": 1.45, "learning_rate": 0.0001575053922885417, "loss": 1.606, "step": 18456 }, { "epoch": 1.45, "learning_rate": 0.00015749304802848164, "loss": 1.5577, "step": 18457 }, { "epoch": 1.45, "learning_rate": 0.00015748070371754793, "loss": 1.5063, "step": 18458 }, { "epoch": 1.45, "learning_rate": 0.00015746835935582436, "loss": 1.5642, "step": 18459 }, { "epoch": 1.45, "learning_rate": 0.00015745601494339477, "loss": 1.5076, "step": 18460 }, { "epoch": 1.45, "learning_rate": 0.00015744367048034293, "loss": 1.4982, "step": 18461 }, { "epoch": 1.45, "learning_rate": 0.0001574313259667527, "loss": 1.4818, "step": 18462 }, { "epoch": 1.45, "learning_rate": 0.00015741898140270781, "loss": 1.5317, "step": 18463 }, { "epoch": 1.45, "learning_rate": 0.00015740663678829217, "loss": 1.5202, "step": 18464 }, { "epoch": 1.45, "learning_rate": 0.00015739429212358955, "loss": 1.4894, "step": 18465 }, { "epoch": 1.45, "learning_rate": 0.00015738194740868382, "loss": 1.5871, "step": 18466 }, { "epoch": 1.45, "learning_rate": 0.00015736960264365867, "loss": 1.5646, "step": 18467 }, { "epoch": 1.45, "learning_rate": 0.00015735725782859802, "loss": 1.5523, "step": 18468 }, { "epoch": 1.45, "learning_rate": 0.00015734491296358563, "loss": 1.5031, "step": 18469 }, { "epoch": 1.45, "learning_rate": 0.00015733256804870534, "loss": 1.5602, "step": 18470 }, { "epoch": 1.45, "learning_rate": 0.00015732022308404095, "loss": 1.5565, "step": 18471 }, { "epoch": 1.45, "learning_rate": 0.0001573078780696763, "loss": 1.5585, "step": 18472 }, { "epoch": 1.45, "learning_rate": 0.0001572955330056952, "loss": 1.4931, "step": 18473 }, { "epoch": 1.45, "learning_rate": 0.00015728318789218142, "loss": 1.4949, "step": 18474 }, { "epoch": 1.45, "learning_rate": 0.00015727084272921886, "loss": 1.4412, "step": 18475 }, { "epoch": 1.45, "learning_rate": 0.00015725849751689126, "loss": 1.5552, "step": 18476 }, { "epoch": 1.45, "learning_rate": 0.00015724615225528248, "loss": 1.5569, "step": 18477 }, { "epoch": 1.45, "learning_rate": 0.00015723380694447636, "loss": 1.5176, "step": 18478 }, { "epoch": 1.45, "learning_rate": 0.00015722146158455658, "loss": 1.5143, "step": 18479 }, { "epoch": 1.45, "learning_rate": 0.00015720911617560714, "loss": 1.5146, "step": 18480 }, { "epoch": 1.45, "learning_rate": 0.00015719677071771176, "loss": 1.4939, "step": 18481 }, { "epoch": 1.45, "learning_rate": 0.00015718442521095427, "loss": 1.5439, "step": 18482 }, { "epoch": 1.45, "learning_rate": 0.00015717207965541854, "loss": 1.5528, "step": 18483 }, { "epoch": 1.45, "learning_rate": 0.0001571597340511883, "loss": 1.52, "step": 18484 }, { "epoch": 1.45, "learning_rate": 0.00015714738839834745, "loss": 1.5077, "step": 18485 }, { "epoch": 1.45, "learning_rate": 0.00015713504269697972, "loss": 1.5077, "step": 18486 }, { "epoch": 1.45, "learning_rate": 0.00015712269694716905, "loss": 1.5845, "step": 18487 }, { "epoch": 1.45, "learning_rate": 0.0001571103511489992, "loss": 1.489, "step": 18488 }, { "epoch": 1.45, "learning_rate": 0.0001570980053025539, "loss": 1.5477, "step": 18489 }, { "epoch": 1.45, "learning_rate": 0.00015708565940791716, "loss": 1.529, "step": 18490 }, { "epoch": 1.45, "learning_rate": 0.0001570733134651727, "loss": 1.5188, "step": 18491 }, { "epoch": 1.45, "learning_rate": 0.00015706096747440426, "loss": 1.4948, "step": 18492 }, { "epoch": 1.46, "learning_rate": 0.00015704862143569584, "loss": 1.5042, "step": 18493 }, { "epoch": 1.46, "learning_rate": 0.00015703627534913107, "loss": 1.5349, "step": 18494 }, { "epoch": 1.46, "learning_rate": 0.00015702392921479398, "loss": 1.5329, "step": 18495 }, { "epoch": 1.46, "learning_rate": 0.00015701158303276823, "loss": 1.492, "step": 18496 }, { "epoch": 1.46, "learning_rate": 0.00015699923680313773, "loss": 1.4873, "step": 18497 }, { "epoch": 1.46, "learning_rate": 0.00015698689052598625, "loss": 1.4954, "step": 18498 }, { "epoch": 1.46, "learning_rate": 0.00015697454420139767, "loss": 1.5047, "step": 18499 }, { "epoch": 1.46, "learning_rate": 0.00015696219782945574, "loss": 1.5044, "step": 18500 }, { "epoch": 1.46, "learning_rate": 0.00015694985141024434, "loss": 1.515, "step": 18501 }, { "epoch": 1.46, "learning_rate": 0.0001569375049438473, "loss": 1.5381, "step": 18502 }, { "epoch": 1.46, "learning_rate": 0.0001569251584303484, "loss": 1.5139, "step": 18503 }, { "epoch": 1.46, "learning_rate": 0.00015691281186983158, "loss": 1.511, "step": 18504 }, { "epoch": 1.46, "learning_rate": 0.00015690046526238048, "loss": 1.5242, "step": 18505 }, { "epoch": 1.46, "learning_rate": 0.00015688811860807908, "loss": 1.4829, "step": 18506 }, { "epoch": 1.46, "learning_rate": 0.00015687577190701113, "loss": 1.5428, "step": 18507 }, { "epoch": 1.46, "learning_rate": 0.0001568634251592605, "loss": 1.5203, "step": 18508 }, { "epoch": 1.46, "learning_rate": 0.000156851078364911, "loss": 1.4561, "step": 18509 }, { "epoch": 1.46, "learning_rate": 0.00015683873152404646, "loss": 1.5367, "step": 18510 }, { "epoch": 1.46, "learning_rate": 0.0001568263846367507, "loss": 1.5207, "step": 18511 }, { "epoch": 1.46, "learning_rate": 0.00015681403770310756, "loss": 1.4962, "step": 18512 }, { "epoch": 1.46, "learning_rate": 0.0001568016907232009, "loss": 1.5193, "step": 18513 }, { "epoch": 1.46, "learning_rate": 0.00015678934369711448, "loss": 1.5195, "step": 18514 }, { "epoch": 1.46, "learning_rate": 0.00015677699662493212, "loss": 1.63, "step": 18515 }, { "epoch": 1.46, "learning_rate": 0.00015676464950673772, "loss": 1.5364, "step": 18516 }, { "epoch": 1.46, "learning_rate": 0.00015675230234261513, "loss": 1.5323, "step": 18517 }, { "epoch": 1.46, "learning_rate": 0.00015673995513264808, "loss": 1.4884, "step": 18518 }, { "epoch": 1.46, "learning_rate": 0.0001567276078769205, "loss": 1.5124, "step": 18519 }, { "epoch": 1.46, "learning_rate": 0.0001567152605755161, "loss": 1.4992, "step": 18520 }, { "epoch": 1.46, "learning_rate": 0.00015670291322851884, "loss": 1.5429, "step": 18521 }, { "epoch": 1.46, "learning_rate": 0.00015669056583601253, "loss": 1.4732, "step": 18522 }, { "epoch": 1.46, "learning_rate": 0.00015667821839808092, "loss": 1.5495, "step": 18523 }, { "epoch": 1.46, "learning_rate": 0.00015666587091480791, "loss": 1.5366, "step": 18524 }, { "epoch": 1.46, "learning_rate": 0.00015665352338627733, "loss": 1.5251, "step": 18525 }, { "epoch": 1.46, "learning_rate": 0.00015664117581257295, "loss": 1.5215, "step": 18526 }, { "epoch": 1.46, "learning_rate": 0.00015662882819377866, "loss": 1.5734, "step": 18527 }, { "epoch": 1.46, "learning_rate": 0.0001566164805299783, "loss": 1.5296, "step": 18528 }, { "epoch": 1.46, "learning_rate": 0.00015660413282125575, "loss": 1.5198, "step": 18529 }, { "epoch": 1.46, "learning_rate": 0.0001565917850676947, "loss": 1.5249, "step": 18530 }, { "epoch": 1.46, "learning_rate": 0.00015657943726937913, "loss": 1.4983, "step": 18531 }, { "epoch": 1.46, "learning_rate": 0.00015656708942639276, "loss": 1.5473, "step": 18532 }, { "epoch": 1.46, "learning_rate": 0.00015655474153881946, "loss": 1.4946, "step": 18533 }, { "epoch": 1.46, "learning_rate": 0.0001565423936067431, "loss": 1.5369, "step": 18534 }, { "epoch": 1.46, "learning_rate": 0.0001565300456302475, "loss": 1.5488, "step": 18535 }, { "epoch": 1.46, "learning_rate": 0.00015651769760941656, "loss": 1.5582, "step": 18536 }, { "epoch": 1.46, "learning_rate": 0.00015650534954433397, "loss": 1.506, "step": 18537 }, { "epoch": 1.46, "learning_rate": 0.00015649300143508367, "loss": 1.5748, "step": 18538 }, { "epoch": 1.46, "learning_rate": 0.0001564806532817495, "loss": 1.5279, "step": 18539 }, { "epoch": 1.46, "learning_rate": 0.00015646830508441522, "loss": 1.5013, "step": 18540 }, { "epoch": 1.46, "learning_rate": 0.00015645595684316474, "loss": 1.4827, "step": 18541 }, { "epoch": 1.46, "learning_rate": 0.0001564436085580819, "loss": 1.5226, "step": 18542 }, { "epoch": 1.46, "learning_rate": 0.0001564312602292505, "loss": 1.5047, "step": 18543 }, { "epoch": 1.46, "learning_rate": 0.00015641891185675438, "loss": 1.4942, "step": 18544 }, { "epoch": 1.46, "learning_rate": 0.00015640656344067738, "loss": 1.5462, "step": 18545 }, { "epoch": 1.46, "learning_rate": 0.0001563942149811034, "loss": 1.5109, "step": 18546 }, { "epoch": 1.46, "learning_rate": 0.00015638186647811618, "loss": 1.52, "step": 18547 }, { "epoch": 1.46, "learning_rate": 0.0001563695179317996, "loss": 1.535, "step": 18548 }, { "epoch": 1.46, "learning_rate": 0.00015635716934223753, "loss": 1.5147, "step": 18549 }, { "epoch": 1.46, "learning_rate": 0.00015634482070951377, "loss": 1.5568, "step": 18550 }, { "epoch": 1.46, "learning_rate": 0.00015633247203371221, "loss": 1.5636, "step": 18551 }, { "epoch": 1.46, "learning_rate": 0.00015632012331491668, "loss": 1.5634, "step": 18552 }, { "epoch": 1.46, "learning_rate": 0.00015630777455321096, "loss": 1.501, "step": 18553 }, { "epoch": 1.46, "learning_rate": 0.00015629542574867894, "loss": 1.57, "step": 18554 }, { "epoch": 1.46, "learning_rate": 0.00015628307690140441, "loss": 1.5235, "step": 18555 }, { "epoch": 1.46, "learning_rate": 0.00015627072801147133, "loss": 1.5404, "step": 18556 }, { "epoch": 1.46, "learning_rate": 0.0001562583790789634, "loss": 1.5753, "step": 18557 }, { "epoch": 1.46, "learning_rate": 0.0001562460301039646, "loss": 1.5417, "step": 18558 }, { "epoch": 1.46, "learning_rate": 0.00015623368108655866, "loss": 1.5163, "step": 18559 }, { "epoch": 1.46, "learning_rate": 0.0001562213320268295, "loss": 1.4863, "step": 18560 }, { "epoch": 1.46, "learning_rate": 0.00015620898292486088, "loss": 1.4899, "step": 18561 }, { "epoch": 1.46, "learning_rate": 0.0001561966337807367, "loss": 1.4857, "step": 18562 }, { "epoch": 1.46, "learning_rate": 0.00015618428459454085, "loss": 1.4977, "step": 18563 }, { "epoch": 1.46, "learning_rate": 0.00015617193536635707, "loss": 1.5166, "step": 18564 }, { "epoch": 1.46, "learning_rate": 0.00015615958609626926, "loss": 1.5337, "step": 18565 }, { "epoch": 1.46, "learning_rate": 0.00015614723678436125, "loss": 1.5019, "step": 18566 }, { "epoch": 1.46, "learning_rate": 0.0001561348874307169, "loss": 1.5334, "step": 18567 }, { "epoch": 1.46, "learning_rate": 0.00015612253803542008, "loss": 1.5942, "step": 18568 }, { "epoch": 1.46, "learning_rate": 0.00015611018859855457, "loss": 1.5074, "step": 18569 }, { "epoch": 1.46, "learning_rate": 0.00015609783912020432, "loss": 1.5037, "step": 18570 }, { "epoch": 1.46, "learning_rate": 0.00015608548960045304, "loss": 1.5278, "step": 18571 }, { "epoch": 1.46, "learning_rate": 0.00015607314003938464, "loss": 1.5471, "step": 18572 }, { "epoch": 1.46, "learning_rate": 0.00015606079043708297, "loss": 1.5342, "step": 18573 }, { "epoch": 1.46, "learning_rate": 0.0001560484407936319, "loss": 1.4888, "step": 18574 }, { "epoch": 1.46, "learning_rate": 0.00015603609110911526, "loss": 1.4603, "step": 18575 }, { "epoch": 1.46, "learning_rate": 0.00015602374138361689, "loss": 1.5451, "step": 18576 }, { "epoch": 1.46, "learning_rate": 0.00015601139161722062, "loss": 1.5411, "step": 18577 }, { "epoch": 1.46, "learning_rate": 0.00015599904181001035, "loss": 1.473, "step": 18578 }, { "epoch": 1.46, "learning_rate": 0.00015598669196206988, "loss": 1.5198, "step": 18579 }, { "epoch": 1.46, "learning_rate": 0.00015597434207348309, "loss": 1.5052, "step": 18580 }, { "epoch": 1.46, "learning_rate": 0.00015596199214433376, "loss": 1.4874, "step": 18581 }, { "epoch": 1.46, "learning_rate": 0.00015594964217470583, "loss": 1.4482, "step": 18582 }, { "epoch": 1.46, "learning_rate": 0.00015593729216468313, "loss": 1.5694, "step": 18583 }, { "epoch": 1.46, "learning_rate": 0.00015592494211434947, "loss": 1.5321, "step": 18584 }, { "epoch": 1.46, "learning_rate": 0.00015591259202378874, "loss": 1.5608, "step": 18585 }, { "epoch": 1.46, "learning_rate": 0.00015590024189308474, "loss": 1.4458, "step": 18586 }, { "epoch": 1.46, "learning_rate": 0.0001558878917223214, "loss": 1.5578, "step": 18587 }, { "epoch": 1.46, "learning_rate": 0.0001558755415115825, "loss": 1.5731, "step": 18588 }, { "epoch": 1.46, "learning_rate": 0.0001558631912609519, "loss": 1.4784, "step": 18589 }, { "epoch": 1.46, "learning_rate": 0.00015585084097051346, "loss": 1.4835, "step": 18590 }, { "epoch": 1.46, "learning_rate": 0.00015583849064035107, "loss": 1.5097, "step": 18591 }, { "epoch": 1.46, "learning_rate": 0.00015582614027054856, "loss": 1.5711, "step": 18592 }, { "epoch": 1.46, "learning_rate": 0.00015581378986118975, "loss": 1.5442, "step": 18593 }, { "epoch": 1.46, "learning_rate": 0.00015580143941235853, "loss": 1.5194, "step": 18594 }, { "epoch": 1.46, "learning_rate": 0.00015578908892413873, "loss": 1.5162, "step": 18595 }, { "epoch": 1.46, "learning_rate": 0.00015577673839661416, "loss": 1.5182, "step": 18596 }, { "epoch": 1.46, "learning_rate": 0.0001557643878298688, "loss": 1.58, "step": 18597 }, { "epoch": 1.46, "learning_rate": 0.0001557520372239864, "loss": 1.4901, "step": 18598 }, { "epoch": 1.46, "learning_rate": 0.00015573968657905086, "loss": 1.5889, "step": 18599 }, { "epoch": 1.46, "learning_rate": 0.000155727335895146, "loss": 1.5716, "step": 18600 }, { "epoch": 1.46, "learning_rate": 0.0001557149851723557, "loss": 1.4895, "step": 18601 }, { "epoch": 1.46, "learning_rate": 0.0001557026344107638, "loss": 1.4913, "step": 18602 }, { "epoch": 1.46, "learning_rate": 0.00015569028361045413, "loss": 1.5669, "step": 18603 }, { "epoch": 1.46, "learning_rate": 0.00015567793277151056, "loss": 1.52, "step": 18604 }, { "epoch": 1.46, "learning_rate": 0.000155665581894017, "loss": 1.4739, "step": 18605 }, { "epoch": 1.46, "learning_rate": 0.00015565323097805727, "loss": 1.4933, "step": 18606 }, { "epoch": 1.46, "learning_rate": 0.00015564088002371524, "loss": 1.5128, "step": 18607 }, { "epoch": 1.46, "learning_rate": 0.0001556285290310747, "loss": 1.5845, "step": 18608 }, { "epoch": 1.46, "learning_rate": 0.00015561617800021957, "loss": 1.5622, "step": 18609 }, { "epoch": 1.46, "learning_rate": 0.0001556038269312337, "loss": 1.5431, "step": 18610 }, { "epoch": 1.46, "learning_rate": 0.0001555914758242009, "loss": 1.4713, "step": 18611 }, { "epoch": 1.46, "learning_rate": 0.00015557912467920512, "loss": 1.5174, "step": 18612 }, { "epoch": 1.46, "learning_rate": 0.00015556677349633013, "loss": 1.4884, "step": 18613 }, { "epoch": 1.46, "learning_rate": 0.00015555442227565983, "loss": 1.5114, "step": 18614 }, { "epoch": 1.46, "learning_rate": 0.00015554207101727807, "loss": 1.5431, "step": 18615 }, { "epoch": 1.46, "learning_rate": 0.00015552971972126873, "loss": 1.4914, "step": 18616 }, { "epoch": 1.46, "learning_rate": 0.00015551736838771558, "loss": 1.5145, "step": 18617 }, { "epoch": 1.46, "learning_rate": 0.0001555050170167026, "loss": 1.5241, "step": 18618 }, { "epoch": 1.46, "learning_rate": 0.0001554926656083136, "loss": 1.4862, "step": 18619 }, { "epoch": 1.47, "learning_rate": 0.00015548031416263235, "loss": 1.5621, "step": 18620 }, { "epoch": 1.47, "learning_rate": 0.0001554679626797429, "loss": 1.5073, "step": 18621 }, { "epoch": 1.47, "learning_rate": 0.0001554556111597289, "loss": 1.5225, "step": 18622 }, { "epoch": 1.47, "learning_rate": 0.00015544325960267435, "loss": 1.4954, "step": 18623 }, { "epoch": 1.47, "learning_rate": 0.00015543090800866313, "loss": 1.5183, "step": 18624 }, { "epoch": 1.47, "learning_rate": 0.00015541855637777897, "loss": 1.4942, "step": 18625 }, { "epoch": 1.47, "learning_rate": 0.00015540620471010582, "loss": 1.4675, "step": 18626 }, { "epoch": 1.47, "learning_rate": 0.00015539385300572753, "loss": 1.5118, "step": 18627 }, { "epoch": 1.47, "learning_rate": 0.00015538150126472795, "loss": 1.5242, "step": 18628 }, { "epoch": 1.47, "learning_rate": 0.00015536914948719095, "loss": 1.5169, "step": 18629 }, { "epoch": 1.47, "learning_rate": 0.00015535679767320035, "loss": 1.4842, "step": 18630 }, { "epoch": 1.47, "learning_rate": 0.00015534444582284015, "loss": 1.4854, "step": 18631 }, { "epoch": 1.47, "learning_rate": 0.000155332093936194, "loss": 1.5372, "step": 18632 }, { "epoch": 1.47, "learning_rate": 0.00015531974201334593, "loss": 1.569, "step": 18633 }, { "epoch": 1.47, "learning_rate": 0.00015530739005437975, "loss": 1.566, "step": 18634 }, { "epoch": 1.47, "learning_rate": 0.0001552950380593793, "loss": 1.4973, "step": 18635 }, { "epoch": 1.47, "learning_rate": 0.00015528268602842848, "loss": 1.5255, "step": 18636 }, { "epoch": 1.47, "learning_rate": 0.0001552703339616111, "loss": 1.4667, "step": 18637 }, { "epoch": 1.47, "learning_rate": 0.00015525798185901112, "loss": 1.5172, "step": 18638 }, { "epoch": 1.47, "learning_rate": 0.00015524562972071232, "loss": 1.5007, "step": 18639 }, { "epoch": 1.47, "learning_rate": 0.00015523327754679857, "loss": 1.4981, "step": 18640 }, { "epoch": 1.47, "learning_rate": 0.00015522092533735377, "loss": 1.4664, "step": 18641 }, { "epoch": 1.47, "learning_rate": 0.00015520857309246177, "loss": 1.479, "step": 18642 }, { "epoch": 1.47, "learning_rate": 0.00015519622081220643, "loss": 1.5245, "step": 18643 }, { "epoch": 1.47, "learning_rate": 0.00015518386849667162, "loss": 1.5344, "step": 18644 }, { "epoch": 1.47, "learning_rate": 0.00015517151614594118, "loss": 1.4651, "step": 18645 }, { "epoch": 1.47, "learning_rate": 0.00015515916376009902, "loss": 1.4933, "step": 18646 }, { "epoch": 1.47, "learning_rate": 0.000155146811339229, "loss": 1.5644, "step": 18647 }, { "epoch": 1.47, "learning_rate": 0.00015513445888341499, "loss": 1.5079, "step": 18648 }, { "epoch": 1.47, "learning_rate": 0.00015512210639274078, "loss": 1.5315, "step": 18649 }, { "epoch": 1.47, "learning_rate": 0.0001551097538672903, "loss": 1.5152, "step": 18650 }, { "epoch": 1.47, "learning_rate": 0.0001550974013071474, "loss": 1.4831, "step": 18651 }, { "epoch": 1.47, "learning_rate": 0.000155085048712396, "loss": 1.5458, "step": 18652 }, { "epoch": 1.47, "learning_rate": 0.00015507269608311996, "loss": 1.5106, "step": 18653 }, { "epoch": 1.47, "learning_rate": 0.00015506034341940305, "loss": 1.531, "step": 18654 }, { "epoch": 1.47, "learning_rate": 0.00015504799072132923, "loss": 1.498, "step": 18655 }, { "epoch": 1.47, "learning_rate": 0.00015503563798898232, "loss": 1.5371, "step": 18656 }, { "epoch": 1.47, "learning_rate": 0.0001550232852224462, "loss": 1.4416, "step": 18657 }, { "epoch": 1.47, "learning_rate": 0.00015501093242180477, "loss": 1.5272, "step": 18658 }, { "epoch": 1.47, "learning_rate": 0.00015499857958714184, "loss": 1.4876, "step": 18659 }, { "epoch": 1.47, "learning_rate": 0.00015498622671854134, "loss": 1.4853, "step": 18660 }, { "epoch": 1.47, "learning_rate": 0.00015497387381608712, "loss": 1.475, "step": 18661 }, { "epoch": 1.47, "learning_rate": 0.00015496152087986301, "loss": 1.5227, "step": 18662 }, { "epoch": 1.47, "learning_rate": 0.00015494916790995293, "loss": 1.5135, "step": 18663 }, { "epoch": 1.47, "learning_rate": 0.00015493681490644074, "loss": 1.5745, "step": 18664 }, { "epoch": 1.47, "learning_rate": 0.0001549244618694103, "loss": 1.5262, "step": 18665 }, { "epoch": 1.47, "learning_rate": 0.0001549121087989455, "loss": 1.5424, "step": 18666 }, { "epoch": 1.47, "learning_rate": 0.00015489975569513015, "loss": 1.512, "step": 18667 }, { "epoch": 1.47, "learning_rate": 0.00015488740255804816, "loss": 1.5418, "step": 18668 }, { "epoch": 1.47, "learning_rate": 0.00015487504938778342, "loss": 1.5175, "step": 18669 }, { "epoch": 1.47, "learning_rate": 0.00015486269618441981, "loss": 1.5158, "step": 18670 }, { "epoch": 1.47, "learning_rate": 0.00015485034294804116, "loss": 1.5153, "step": 18671 }, { "epoch": 1.47, "learning_rate": 0.00015483798967873136, "loss": 1.5335, "step": 18672 }, { "epoch": 1.47, "learning_rate": 0.00015482563637657425, "loss": 1.5227, "step": 18673 }, { "epoch": 1.47, "learning_rate": 0.00015481328304165376, "loss": 1.5509, "step": 18674 }, { "epoch": 1.47, "learning_rate": 0.0001548009296740537, "loss": 1.5293, "step": 18675 }, { "epoch": 1.47, "learning_rate": 0.000154788576273858, "loss": 1.4979, "step": 18676 }, { "epoch": 1.47, "learning_rate": 0.00015477622284115053, "loss": 1.5313, "step": 18677 }, { "epoch": 1.47, "learning_rate": 0.00015476386937601512, "loss": 1.5393, "step": 18678 }, { "epoch": 1.47, "learning_rate": 0.00015475151587853565, "loss": 1.5466, "step": 18679 }, { "epoch": 1.47, "learning_rate": 0.00015473916234879607, "loss": 1.5644, "step": 18680 }, { "epoch": 1.47, "learning_rate": 0.00015472680878688013, "loss": 1.5228, "step": 18681 }, { "epoch": 1.47, "learning_rate": 0.00015471445519287184, "loss": 1.5318, "step": 18682 }, { "epoch": 1.47, "learning_rate": 0.0001547021015668549, "loss": 1.4697, "step": 18683 }, { "epoch": 1.47, "learning_rate": 0.00015468974790891336, "loss": 1.5769, "step": 18684 }, { "epoch": 1.47, "learning_rate": 0.00015467739421913098, "loss": 1.5023, "step": 18685 }, { "epoch": 1.47, "learning_rate": 0.00015466504049759167, "loss": 1.5121, "step": 18686 }, { "epoch": 1.47, "learning_rate": 0.00015465268674437938, "loss": 1.4844, "step": 18687 }, { "epoch": 1.47, "learning_rate": 0.00015464033295957785, "loss": 1.5357, "step": 18688 }, { "epoch": 1.47, "learning_rate": 0.00015462797914327106, "loss": 1.509, "step": 18689 }, { "epoch": 1.47, "learning_rate": 0.0001546156252955428, "loss": 1.5052, "step": 18690 }, { "epoch": 1.47, "learning_rate": 0.000154603271416477, "loss": 1.5093, "step": 18691 }, { "epoch": 1.47, "learning_rate": 0.00015459091750615755, "loss": 1.505, "step": 18692 }, { "epoch": 1.47, "learning_rate": 0.0001545785635646683, "loss": 1.551, "step": 18693 }, { "epoch": 1.47, "learning_rate": 0.00015456620959209314, "loss": 1.518, "step": 18694 }, { "epoch": 1.47, "learning_rate": 0.0001545538555885159, "loss": 1.5318, "step": 18695 }, { "epoch": 1.47, "learning_rate": 0.00015454150155402052, "loss": 1.4931, "step": 18696 }, { "epoch": 1.47, "learning_rate": 0.00015452914748869087, "loss": 1.5311, "step": 18697 }, { "epoch": 1.47, "learning_rate": 0.00015451679339261077, "loss": 1.5501, "step": 18698 }, { "epoch": 1.47, "learning_rate": 0.00015450443926586413, "loss": 1.5472, "step": 18699 }, { "epoch": 1.47, "learning_rate": 0.00015449208510853485, "loss": 1.5511, "step": 18700 }, { "epoch": 1.47, "learning_rate": 0.00015447973092070678, "loss": 1.5199, "step": 18701 }, { "epoch": 1.47, "learning_rate": 0.00015446737670246386, "loss": 1.5515, "step": 18702 }, { "epoch": 1.47, "learning_rate": 0.00015445502245388983, "loss": 1.5, "step": 18703 }, { "epoch": 1.47, "learning_rate": 0.00015444266817506876, "loss": 1.5362, "step": 18704 }, { "epoch": 1.47, "learning_rate": 0.00015443031386608435, "loss": 1.5319, "step": 18705 }, { "epoch": 1.47, "learning_rate": 0.0001544179595270206, "loss": 1.5423, "step": 18706 }, { "epoch": 1.47, "learning_rate": 0.00015440560515796127, "loss": 1.5129, "step": 18707 }, { "epoch": 1.47, "learning_rate": 0.00015439325075899035, "loss": 1.4887, "step": 18708 }, { "epoch": 1.47, "learning_rate": 0.00015438089633019173, "loss": 1.5701, "step": 18709 }, { "epoch": 1.47, "learning_rate": 0.00015436854187164916, "loss": 1.4749, "step": 18710 }, { "epoch": 1.47, "learning_rate": 0.0001543561873834467, "loss": 1.5257, "step": 18711 }, { "epoch": 1.47, "learning_rate": 0.00015434383286566807, "loss": 1.5223, "step": 18712 }, { "epoch": 1.47, "learning_rate": 0.00015433147831839722, "loss": 1.5698, "step": 18713 }, { "epoch": 1.47, "learning_rate": 0.00015431912374171797, "loss": 1.5027, "step": 18714 }, { "epoch": 1.47, "learning_rate": 0.00015430676913571432, "loss": 1.5503, "step": 18715 }, { "epoch": 1.47, "learning_rate": 0.00015429441450047008, "loss": 1.5118, "step": 18716 }, { "epoch": 1.47, "learning_rate": 0.00015428205983606912, "loss": 1.5407, "step": 18717 }, { "epoch": 1.47, "learning_rate": 0.0001542697051425953, "loss": 1.507, "step": 18718 }, { "epoch": 1.47, "learning_rate": 0.00015425735042013262, "loss": 1.5054, "step": 18719 }, { "epoch": 1.47, "learning_rate": 0.00015424499566876485, "loss": 1.4848, "step": 18720 }, { "epoch": 1.47, "learning_rate": 0.0001542326408885759, "loss": 1.4745, "step": 18721 }, { "epoch": 1.47, "learning_rate": 0.0001542202860796496, "loss": 1.5408, "step": 18722 }, { "epoch": 1.47, "learning_rate": 0.00015420793124206996, "loss": 1.5437, "step": 18723 }, { "epoch": 1.47, "learning_rate": 0.00015419557637592074, "loss": 1.5006, "step": 18724 }, { "epoch": 1.47, "learning_rate": 0.00015418322148128588, "loss": 1.5566, "step": 18725 }, { "epoch": 1.47, "learning_rate": 0.00015417086655824928, "loss": 1.4912, "step": 18726 }, { "epoch": 1.47, "learning_rate": 0.00015415851160689478, "loss": 1.5143, "step": 18727 }, { "epoch": 1.47, "learning_rate": 0.00015414615662730634, "loss": 1.5133, "step": 18728 }, { "epoch": 1.47, "learning_rate": 0.00015413380161956766, "loss": 1.4866, "step": 18729 }, { "epoch": 1.47, "learning_rate": 0.00015412144658376282, "loss": 1.5435, "step": 18730 }, { "epoch": 1.47, "learning_rate": 0.00015410909151997564, "loss": 1.5553, "step": 18731 }, { "epoch": 1.47, "learning_rate": 0.00015409673642828998, "loss": 1.512, "step": 18732 }, { "epoch": 1.47, "learning_rate": 0.00015408438130878977, "loss": 1.5068, "step": 18733 }, { "epoch": 1.47, "learning_rate": 0.00015407202616155884, "loss": 1.5389, "step": 18734 }, { "epoch": 1.47, "learning_rate": 0.00015405967098668108, "loss": 1.4694, "step": 18735 }, { "epoch": 1.47, "learning_rate": 0.00015404731578424046, "loss": 1.5331, "step": 18736 }, { "epoch": 1.47, "learning_rate": 0.00015403496055432073, "loss": 1.4915, "step": 18737 }, { "epoch": 1.47, "learning_rate": 0.00015402260529700585, "loss": 1.4881, "step": 18738 }, { "epoch": 1.47, "learning_rate": 0.00015401025001237972, "loss": 1.5502, "step": 18739 }, { "epoch": 1.47, "learning_rate": 0.00015399789470052621, "loss": 1.4938, "step": 18740 }, { "epoch": 1.47, "learning_rate": 0.0001539855393615292, "loss": 1.5229, "step": 18741 }, { "epoch": 1.47, "learning_rate": 0.00015397318399547257, "loss": 1.5251, "step": 18742 }, { "epoch": 1.47, "learning_rate": 0.0001539608286024402, "loss": 1.5404, "step": 18743 }, { "epoch": 1.47, "learning_rate": 0.000153948473182516, "loss": 1.5029, "step": 18744 }, { "epoch": 1.47, "learning_rate": 0.00015393611773578385, "loss": 1.5715, "step": 18745 }, { "epoch": 1.47, "learning_rate": 0.00015392376226232762, "loss": 1.5162, "step": 18746 }, { "epoch": 1.48, "learning_rate": 0.00015391140676223122, "loss": 1.5232, "step": 18747 }, { "epoch": 1.48, "learning_rate": 0.00015389905123557856, "loss": 1.5321, "step": 18748 }, { "epoch": 1.48, "learning_rate": 0.00015388669568245345, "loss": 1.502, "step": 18749 }, { "epoch": 1.48, "learning_rate": 0.00015387434010293987, "loss": 1.5396, "step": 18750 }, { "epoch": 1.48, "learning_rate": 0.00015386198449712158, "loss": 1.5425, "step": 18751 }, { "epoch": 1.48, "learning_rate": 0.0001538496288650826, "loss": 1.5405, "step": 18752 }, { "epoch": 1.48, "learning_rate": 0.00015383727320690676, "loss": 1.4937, "step": 18753 }, { "epoch": 1.48, "learning_rate": 0.00015382491752267792, "loss": 1.5331, "step": 18754 }, { "epoch": 1.48, "learning_rate": 0.00015381256181248005, "loss": 1.5057, "step": 18755 }, { "epoch": 1.48, "learning_rate": 0.00015380020607639694, "loss": 1.5152, "step": 18756 }, { "epoch": 1.48, "learning_rate": 0.00015378785031451258, "loss": 1.4946, "step": 18757 }, { "epoch": 1.48, "learning_rate": 0.00015377549452691078, "loss": 1.499, "step": 18758 }, { "epoch": 1.48, "learning_rate": 0.00015376313871367546, "loss": 1.5454, "step": 18759 }, { "epoch": 1.48, "learning_rate": 0.0001537507828748905, "loss": 1.5292, "step": 18760 }, { "epoch": 1.48, "learning_rate": 0.00015373842701063976, "loss": 1.4765, "step": 18761 }, { "epoch": 1.48, "learning_rate": 0.00015372607112100722, "loss": 1.4846, "step": 18762 }, { "epoch": 1.48, "learning_rate": 0.0001537137152060767, "loss": 1.5723, "step": 18763 }, { "epoch": 1.48, "learning_rate": 0.0001537013592659321, "loss": 1.5154, "step": 18764 }, { "epoch": 1.48, "learning_rate": 0.0001536890033006573, "loss": 1.5288, "step": 18765 }, { "epoch": 1.48, "learning_rate": 0.00015367664731033622, "loss": 1.5391, "step": 18766 }, { "epoch": 1.48, "learning_rate": 0.00015366429129505275, "loss": 1.5238, "step": 18767 }, { "epoch": 1.48, "learning_rate": 0.00015365193525489071, "loss": 1.5834, "step": 18768 }, { "epoch": 1.48, "learning_rate": 0.0001536395791899341, "loss": 1.5027, "step": 18769 }, { "epoch": 1.48, "learning_rate": 0.00015362722310026673, "loss": 1.5088, "step": 18770 }, { "epoch": 1.48, "learning_rate": 0.00015361486698597249, "loss": 1.4959, "step": 18771 }, { "epoch": 1.48, "learning_rate": 0.00015360251084713537, "loss": 1.513, "step": 18772 }, { "epoch": 1.48, "learning_rate": 0.00015359015468383914, "loss": 1.5192, "step": 18773 }, { "epoch": 1.48, "learning_rate": 0.00015357779849616772, "loss": 1.5347, "step": 18774 }, { "epoch": 1.48, "learning_rate": 0.00015356544228420507, "loss": 1.5, "step": 18775 }, { "epoch": 1.48, "learning_rate": 0.000153553086048035, "loss": 1.4913, "step": 18776 }, { "epoch": 1.48, "learning_rate": 0.00015354072978774144, "loss": 1.5776, "step": 18777 }, { "epoch": 1.48, "learning_rate": 0.0001535283735034083, "loss": 1.4522, "step": 18778 }, { "epoch": 1.48, "learning_rate": 0.00015351601719511943, "loss": 1.5955, "step": 18779 }, { "epoch": 1.48, "learning_rate": 0.00015350366086295874, "loss": 1.5522, "step": 18780 }, { "epoch": 1.48, "learning_rate": 0.00015349130450701014, "loss": 1.5428, "step": 18781 }, { "epoch": 1.48, "learning_rate": 0.00015347894812735755, "loss": 1.566, "step": 18782 }, { "epoch": 1.48, "learning_rate": 0.00015346659172408477, "loss": 1.4537, "step": 18783 }, { "epoch": 1.48, "learning_rate": 0.00015345423529727572, "loss": 1.5274, "step": 18784 }, { "epoch": 1.48, "learning_rate": 0.00015344187884701438, "loss": 1.4982, "step": 18785 }, { "epoch": 1.48, "learning_rate": 0.00015342952237338452, "loss": 1.5222, "step": 18786 }, { "epoch": 1.48, "learning_rate": 0.00015341716587647015, "loss": 1.4943, "step": 18787 }, { "epoch": 1.48, "learning_rate": 0.0001534048093563551, "loss": 1.5136, "step": 18788 }, { "epoch": 1.48, "learning_rate": 0.00015339245281312329, "loss": 1.5473, "step": 18789 }, { "epoch": 1.48, "learning_rate": 0.00015338009624685857, "loss": 1.5211, "step": 18790 }, { "epoch": 1.48, "learning_rate": 0.00015336773965764482, "loss": 1.4549, "step": 18791 }, { "epoch": 1.48, "learning_rate": 0.00015335538304556606, "loss": 1.5352, "step": 18792 }, { "epoch": 1.48, "learning_rate": 0.00015334302641070602, "loss": 1.4732, "step": 18793 }, { "epoch": 1.48, "learning_rate": 0.00015333066975314877, "loss": 1.5119, "step": 18794 }, { "epoch": 1.48, "learning_rate": 0.00015331831307297802, "loss": 1.4907, "step": 18795 }, { "epoch": 1.48, "learning_rate": 0.00015330595637027782, "loss": 1.4949, "step": 18796 }, { "epoch": 1.48, "learning_rate": 0.00015329359964513195, "loss": 1.5064, "step": 18797 }, { "epoch": 1.48, "learning_rate": 0.0001532812428976244, "loss": 1.4889, "step": 18798 }, { "epoch": 1.48, "learning_rate": 0.00015326888612783902, "loss": 1.4947, "step": 18799 }, { "epoch": 1.48, "learning_rate": 0.00015325652933585965, "loss": 1.481, "step": 18800 }, { "epoch": 1.48, "learning_rate": 0.00015324417252177028, "loss": 1.5114, "step": 18801 }, { "epoch": 1.48, "learning_rate": 0.00015323181568565475, "loss": 1.4846, "step": 18802 }, { "epoch": 1.48, "learning_rate": 0.00015321945882759702, "loss": 1.5144, "step": 18803 }, { "epoch": 1.48, "learning_rate": 0.00015320710194768091, "loss": 1.5215, "step": 18804 }, { "epoch": 1.48, "learning_rate": 0.00015319474504599037, "loss": 1.537, "step": 18805 }, { "epoch": 1.48, "learning_rate": 0.00015318238812260927, "loss": 1.5812, "step": 18806 }, { "epoch": 1.48, "learning_rate": 0.0001531700311776215, "loss": 1.5279, "step": 18807 }, { "epoch": 1.48, "learning_rate": 0.00015315767421111092, "loss": 1.5649, "step": 18808 }, { "epoch": 1.48, "learning_rate": 0.00015314531722316151, "loss": 1.5196, "step": 18809 }, { "epoch": 1.48, "learning_rate": 0.00015313296021385715, "loss": 1.5287, "step": 18810 }, { "epoch": 1.48, "learning_rate": 0.00015312060318328172, "loss": 1.4942, "step": 18811 }, { "epoch": 1.48, "learning_rate": 0.0001531082461315191, "loss": 1.523, "step": 18812 }, { "epoch": 1.48, "learning_rate": 0.0001530958890586532, "loss": 1.4953, "step": 18813 }, { "epoch": 1.48, "learning_rate": 0.00015308353196476796, "loss": 1.4731, "step": 18814 }, { "epoch": 1.48, "learning_rate": 0.0001530711748499472, "loss": 1.5341, "step": 18815 }, { "epoch": 1.48, "learning_rate": 0.00015305881771427487, "loss": 1.4921, "step": 18816 }, { "epoch": 1.48, "learning_rate": 0.00015304646055783487, "loss": 1.4886, "step": 18817 }, { "epoch": 1.48, "learning_rate": 0.00015303410338071108, "loss": 1.5189, "step": 18818 }, { "epoch": 1.48, "learning_rate": 0.0001530217461829874, "loss": 1.4811, "step": 18819 }, { "epoch": 1.48, "learning_rate": 0.00015300938896474768, "loss": 1.5299, "step": 18820 }, { "epoch": 1.48, "learning_rate": 0.00015299703172607593, "loss": 1.4689, "step": 18821 }, { "epoch": 1.48, "learning_rate": 0.000152984674467056, "loss": 1.5491, "step": 18822 }, { "epoch": 1.48, "learning_rate": 0.00015297231718777176, "loss": 1.4636, "step": 18823 }, { "epoch": 1.48, "learning_rate": 0.00015295995988830706, "loss": 1.541, "step": 18824 }, { "epoch": 1.48, "learning_rate": 0.00015294760256874594, "loss": 1.5524, "step": 18825 }, { "epoch": 1.48, "learning_rate": 0.00015293524522917219, "loss": 1.4928, "step": 18826 }, { "epoch": 1.48, "learning_rate": 0.00015292288786966976, "loss": 1.4907, "step": 18827 }, { "epoch": 1.48, "learning_rate": 0.00015291053049032257, "loss": 1.5266, "step": 18828 }, { "epoch": 1.48, "learning_rate": 0.00015289817309121446, "loss": 1.4845, "step": 18829 }, { "epoch": 1.48, "learning_rate": 0.0001528858156724293, "loss": 1.5212, "step": 18830 }, { "epoch": 1.48, "learning_rate": 0.00015287345823405114, "loss": 1.5156, "step": 18831 }, { "epoch": 1.48, "learning_rate": 0.00015286110077616369, "loss": 1.48, "step": 18832 }, { "epoch": 1.48, "learning_rate": 0.000152848743298851, "loss": 1.4918, "step": 18833 }, { "epoch": 1.48, "learning_rate": 0.0001528363858021969, "loss": 1.4945, "step": 18834 }, { "epoch": 1.48, "learning_rate": 0.00015282402828628531, "loss": 1.4896, "step": 18835 }, { "epoch": 1.48, "learning_rate": 0.00015281167075120014, "loss": 1.5639, "step": 18836 }, { "epoch": 1.48, "learning_rate": 0.00015279931319702527, "loss": 1.5718, "step": 18837 }, { "epoch": 1.48, "learning_rate": 0.00015278695562384457, "loss": 1.5311, "step": 18838 }, { "epoch": 1.48, "learning_rate": 0.00015277459803174205, "loss": 1.5497, "step": 18839 }, { "epoch": 1.48, "learning_rate": 0.00015276224042080146, "loss": 1.5162, "step": 18840 }, { "epoch": 1.48, "learning_rate": 0.00015274988279110683, "loss": 1.4989, "step": 18841 }, { "epoch": 1.48, "learning_rate": 0.000152737525142742, "loss": 1.4681, "step": 18842 }, { "epoch": 1.48, "learning_rate": 0.0001527251674757909, "loss": 1.5568, "step": 18843 }, { "epoch": 1.48, "learning_rate": 0.00015271280979033738, "loss": 1.527, "step": 18844 }, { "epoch": 1.48, "learning_rate": 0.00015270045208646543, "loss": 1.5067, "step": 18845 }, { "epoch": 1.48, "learning_rate": 0.0001526880943642589, "loss": 1.5569, "step": 18846 }, { "epoch": 1.48, "learning_rate": 0.00015267573662380163, "loss": 1.5169, "step": 18847 }, { "epoch": 1.48, "learning_rate": 0.0001526633788651776, "loss": 1.4862, "step": 18848 }, { "epoch": 1.48, "learning_rate": 0.00015265102108847074, "loss": 1.5289, "step": 18849 }, { "epoch": 1.48, "learning_rate": 0.0001526386632937649, "loss": 1.5268, "step": 18850 }, { "epoch": 1.48, "learning_rate": 0.00015262630548114396, "loss": 1.542, "step": 18851 }, { "epoch": 1.48, "learning_rate": 0.0001526139476506919, "loss": 1.4921, "step": 18852 }, { "epoch": 1.48, "learning_rate": 0.00015260158980249256, "loss": 1.4521, "step": 18853 }, { "epoch": 1.48, "learning_rate": 0.00015258923193662983, "loss": 1.4814, "step": 18854 }, { "epoch": 1.48, "learning_rate": 0.0001525768740531877, "loss": 1.5388, "step": 18855 }, { "epoch": 1.48, "learning_rate": 0.00015256451615224993, "loss": 1.5405, "step": 18856 }, { "epoch": 1.48, "learning_rate": 0.0001525521582339006, "loss": 1.5213, "step": 18857 }, { "epoch": 1.48, "learning_rate": 0.00015253980029822348, "loss": 1.5028, "step": 18858 }, { "epoch": 1.48, "learning_rate": 0.00015252744234530254, "loss": 1.5052, "step": 18859 }, { "epoch": 1.48, "learning_rate": 0.00015251508437522164, "loss": 1.549, "step": 18860 }, { "epoch": 1.48, "learning_rate": 0.0001525027263880647, "loss": 1.5042, "step": 18861 }, { "epoch": 1.48, "learning_rate": 0.0001524903683839157, "loss": 1.5726, "step": 18862 }, { "epoch": 1.48, "learning_rate": 0.0001524780103628584, "loss": 1.5506, "step": 18863 }, { "epoch": 1.48, "learning_rate": 0.0001524656523249768, "loss": 1.508, "step": 18864 }, { "epoch": 1.48, "learning_rate": 0.00015245329427035476, "loss": 1.5335, "step": 18865 }, { "epoch": 1.48, "learning_rate": 0.0001524409361990762, "loss": 1.4732, "step": 18866 }, { "epoch": 1.48, "learning_rate": 0.0001524285781112251, "loss": 1.4634, "step": 18867 }, { "epoch": 1.48, "learning_rate": 0.00015241622000688524, "loss": 1.5246, "step": 18868 }, { "epoch": 1.48, "learning_rate": 0.00015240386188614057, "loss": 1.4851, "step": 18869 }, { "epoch": 1.48, "learning_rate": 0.00015239150374907504, "loss": 1.4728, "step": 18870 }, { "epoch": 1.48, "learning_rate": 0.00015237914559577246, "loss": 1.4819, "step": 18871 }, { "epoch": 1.48, "learning_rate": 0.00015236678742631686, "loss": 1.5154, "step": 18872 }, { "epoch": 1.48, "learning_rate": 0.00015235442924079202, "loss": 1.5164, "step": 18873 }, { "epoch": 1.49, "learning_rate": 0.000152342071039282, "loss": 1.4833, "step": 18874 }, { "epoch": 1.49, "learning_rate": 0.00015232971282187052, "loss": 1.5143, "step": 18875 }, { "epoch": 1.49, "learning_rate": 0.00015231735458864158, "loss": 1.5101, "step": 18876 }, { "epoch": 1.49, "learning_rate": 0.00015230499633967916, "loss": 1.5171, "step": 18877 }, { "epoch": 1.49, "learning_rate": 0.00015229263807506698, "loss": 1.523, "step": 18878 }, { "epoch": 1.49, "learning_rate": 0.00015228027979488913, "loss": 1.5197, "step": 18879 }, { "epoch": 1.49, "learning_rate": 0.00015226792149922942, "loss": 1.504, "step": 18880 }, { "epoch": 1.49, "learning_rate": 0.00015225556318817178, "loss": 1.538, "step": 18881 }, { "epoch": 1.49, "learning_rate": 0.0001522432048618001, "loss": 1.527, "step": 18882 }, { "epoch": 1.49, "learning_rate": 0.00015223084652019828, "loss": 1.5743, "step": 18883 }, { "epoch": 1.49, "learning_rate": 0.00015221848816345025, "loss": 1.5521, "step": 18884 }, { "epoch": 1.49, "learning_rate": 0.00015220612979163992, "loss": 1.5308, "step": 18885 }, { "epoch": 1.49, "learning_rate": 0.0001521937714048512, "loss": 1.5629, "step": 18886 }, { "epoch": 1.49, "learning_rate": 0.00015218141300316795, "loss": 1.5847, "step": 18887 }, { "epoch": 1.49, "learning_rate": 0.00015216905458667412, "loss": 1.558, "step": 18888 }, { "epoch": 1.49, "learning_rate": 0.00015215669615545365, "loss": 1.5527, "step": 18889 }, { "epoch": 1.49, "learning_rate": 0.00015214433770959033, "loss": 1.4879, "step": 18890 }, { "epoch": 1.49, "learning_rate": 0.0001521319792491682, "loss": 1.5797, "step": 18891 }, { "epoch": 1.49, "learning_rate": 0.00015211962077427106, "loss": 1.493, "step": 18892 }, { "epoch": 1.49, "learning_rate": 0.0001521072622849829, "loss": 1.5495, "step": 18893 }, { "epoch": 1.49, "learning_rate": 0.00015209490378138762, "loss": 1.4694, "step": 18894 }, { "epoch": 1.49, "learning_rate": 0.000152082545263569, "loss": 1.5198, "step": 18895 }, { "epoch": 1.49, "learning_rate": 0.00015207018673161113, "loss": 1.5058, "step": 18896 }, { "epoch": 1.49, "learning_rate": 0.0001520578281855978, "loss": 1.5034, "step": 18897 }, { "epoch": 1.49, "learning_rate": 0.00015204546962561296, "loss": 1.5348, "step": 18898 }, { "epoch": 1.49, "learning_rate": 0.00015203311105174052, "loss": 1.5272, "step": 18899 }, { "epoch": 1.49, "learning_rate": 0.0001520207524640644, "loss": 1.5116, "step": 18900 }, { "epoch": 1.49, "learning_rate": 0.00015200839386266847, "loss": 1.5168, "step": 18901 }, { "epoch": 1.49, "learning_rate": 0.00015199603524763662, "loss": 1.5071, "step": 18902 }, { "epoch": 1.49, "learning_rate": 0.00015198367661905282, "loss": 1.4791, "step": 18903 }, { "epoch": 1.49, "learning_rate": 0.00015197131797700092, "loss": 1.4887, "step": 18904 }, { "epoch": 1.49, "learning_rate": 0.00015195895932156487, "loss": 1.5082, "step": 18905 }, { "epoch": 1.49, "learning_rate": 0.0001519466006528286, "loss": 1.5403, "step": 18906 }, { "epoch": 1.49, "learning_rate": 0.00015193424197087598, "loss": 1.5118, "step": 18907 }, { "epoch": 1.49, "learning_rate": 0.00015192188327579093, "loss": 1.5523, "step": 18908 }, { "epoch": 1.49, "learning_rate": 0.0001519095245676573, "loss": 1.496, "step": 18909 }, { "epoch": 1.49, "learning_rate": 0.00015189716584655907, "loss": 1.482, "step": 18910 }, { "epoch": 1.49, "learning_rate": 0.00015188480711258016, "loss": 1.4868, "step": 18911 }, { "epoch": 1.49, "learning_rate": 0.00015187244836580442, "loss": 1.5177, "step": 18912 }, { "epoch": 1.49, "learning_rate": 0.00015186008960631586, "loss": 1.4621, "step": 18913 }, { "epoch": 1.49, "learning_rate": 0.0001518477308341982, "loss": 1.5026, "step": 18914 }, { "epoch": 1.49, "learning_rate": 0.00015183537204953556, "loss": 1.4869, "step": 18915 }, { "epoch": 1.49, "learning_rate": 0.00015182301325241174, "loss": 1.5326, "step": 18916 }, { "epoch": 1.49, "learning_rate": 0.00015181065444291064, "loss": 1.5294, "step": 18917 }, { "epoch": 1.49, "learning_rate": 0.00015179829562111624, "loss": 1.5487, "step": 18918 }, { "epoch": 1.49, "learning_rate": 0.00015178593678711233, "loss": 1.5112, "step": 18919 }, { "epoch": 1.49, "learning_rate": 0.00015177357794098295, "loss": 1.4723, "step": 18920 }, { "epoch": 1.49, "learning_rate": 0.00015176121908281196, "loss": 1.5087, "step": 18921 }, { "epoch": 1.49, "learning_rate": 0.00015174886021268323, "loss": 1.5002, "step": 18922 }, { "epoch": 1.49, "learning_rate": 0.00015173650133068074, "loss": 1.5113, "step": 18923 }, { "epoch": 1.49, "learning_rate": 0.00015172414243688835, "loss": 1.5073, "step": 18924 }, { "epoch": 1.49, "learning_rate": 0.00015171178353138993, "loss": 1.5387, "step": 18925 }, { "epoch": 1.49, "learning_rate": 0.0001516994246142695, "loss": 1.5315, "step": 18926 }, { "epoch": 1.49, "learning_rate": 0.0001516870656856109, "loss": 1.5035, "step": 18927 }, { "epoch": 1.49, "learning_rate": 0.0001516747067454981, "loss": 1.5538, "step": 18928 }, { "epoch": 1.49, "learning_rate": 0.00015166234779401494, "loss": 1.5652, "step": 18929 }, { "epoch": 1.49, "learning_rate": 0.00015164998883124536, "loss": 1.5341, "step": 18930 }, { "epoch": 1.49, "learning_rate": 0.00015163762985727323, "loss": 1.5379, "step": 18931 }, { "epoch": 1.49, "learning_rate": 0.00015162527087218253, "loss": 1.5028, "step": 18932 }, { "epoch": 1.49, "learning_rate": 0.0001516129118760571, "loss": 1.5142, "step": 18933 }, { "epoch": 1.49, "learning_rate": 0.0001516005528689809, "loss": 1.5404, "step": 18934 }, { "epoch": 1.49, "learning_rate": 0.0001515881938510379, "loss": 1.5811, "step": 18935 }, { "epoch": 1.49, "learning_rate": 0.00015157583482231185, "loss": 1.4957, "step": 18936 }, { "epoch": 1.49, "learning_rate": 0.00015156347578288682, "loss": 1.447, "step": 18937 }, { "epoch": 1.49, "learning_rate": 0.0001515511167328466, "loss": 1.5872, "step": 18938 }, { "epoch": 1.49, "learning_rate": 0.00015153875767227515, "loss": 1.5817, "step": 18939 }, { "epoch": 1.49, "learning_rate": 0.00015152639860125644, "loss": 1.5095, "step": 18940 }, { "epoch": 1.49, "learning_rate": 0.0001515140395198743, "loss": 1.4815, "step": 18941 }, { "epoch": 1.49, "learning_rate": 0.00015150168042821265, "loss": 1.5278, "step": 18942 }, { "epoch": 1.49, "learning_rate": 0.0001514893213263554, "loss": 1.5138, "step": 18943 }, { "epoch": 1.49, "learning_rate": 0.0001514769622143865, "loss": 1.5037, "step": 18944 }, { "epoch": 1.49, "learning_rate": 0.00015146460309238988, "loss": 1.5074, "step": 18945 }, { "epoch": 1.49, "learning_rate": 0.0001514522439604494, "loss": 1.4646, "step": 18946 }, { "epoch": 1.49, "learning_rate": 0.00015143988481864897, "loss": 1.5085, "step": 18947 }, { "epoch": 1.49, "learning_rate": 0.0001514275256670725, "loss": 1.55, "step": 18948 }, { "epoch": 1.49, "learning_rate": 0.0001514151665058039, "loss": 1.5217, "step": 18949 }, { "epoch": 1.49, "learning_rate": 0.00015140280733492713, "loss": 1.5216, "step": 18950 }, { "epoch": 1.49, "learning_rate": 0.0001513904481545261, "loss": 1.5041, "step": 18951 }, { "epoch": 1.49, "learning_rate": 0.00015137808896468469, "loss": 1.485, "step": 18952 }, { "epoch": 1.49, "learning_rate": 0.00015136572976548677, "loss": 1.5367, "step": 18953 }, { "epoch": 1.49, "learning_rate": 0.0001513533705570163, "loss": 1.5191, "step": 18954 }, { "epoch": 1.49, "learning_rate": 0.00015134101133935726, "loss": 1.5704, "step": 18955 }, { "epoch": 1.49, "learning_rate": 0.00015132865211259342, "loss": 1.4991, "step": 18956 }, { "epoch": 1.49, "learning_rate": 0.00015131629287680882, "loss": 1.5054, "step": 18957 }, { "epoch": 1.49, "learning_rate": 0.00015130393363208726, "loss": 1.506, "step": 18958 }, { "epoch": 1.49, "learning_rate": 0.00015129157437851278, "loss": 1.4986, "step": 18959 }, { "epoch": 1.49, "learning_rate": 0.00015127921511616914, "loss": 1.5231, "step": 18960 }, { "epoch": 1.49, "learning_rate": 0.0001512668558451404, "loss": 1.4824, "step": 18961 }, { "epoch": 1.49, "learning_rate": 0.0001512544965655104, "loss": 1.5252, "step": 18962 }, { "epoch": 1.49, "learning_rate": 0.00015124213727736303, "loss": 1.4634, "step": 18963 }, { "epoch": 1.49, "learning_rate": 0.00015122977798078227, "loss": 1.4874, "step": 18964 }, { "epoch": 1.49, "learning_rate": 0.00015121741867585198, "loss": 1.5231, "step": 18965 }, { "epoch": 1.49, "learning_rate": 0.00015120505936265608, "loss": 1.5015, "step": 18966 }, { "epoch": 1.49, "learning_rate": 0.00015119270004127847, "loss": 1.5545, "step": 18967 }, { "epoch": 1.49, "learning_rate": 0.00015118034071180312, "loss": 1.5378, "step": 18968 }, { "epoch": 1.49, "learning_rate": 0.0001511679813743139, "loss": 1.5439, "step": 18969 }, { "epoch": 1.49, "learning_rate": 0.00015115562202889474, "loss": 1.4786, "step": 18970 }, { "epoch": 1.49, "learning_rate": 0.00015114326267562952, "loss": 1.508, "step": 18971 }, { "epoch": 1.49, "learning_rate": 0.00015113090331460223, "loss": 1.5631, "step": 18972 }, { "epoch": 1.49, "learning_rate": 0.0001511185439458967, "loss": 1.4882, "step": 18973 }, { "epoch": 1.49, "learning_rate": 0.00015110618456959686, "loss": 1.5879, "step": 18974 }, { "epoch": 1.49, "learning_rate": 0.00015109382518578663, "loss": 1.5319, "step": 18975 }, { "epoch": 1.49, "learning_rate": 0.00015108146579454997, "loss": 1.5107, "step": 18976 }, { "epoch": 1.49, "learning_rate": 0.00015106910639597074, "loss": 1.5428, "step": 18977 }, { "epoch": 1.49, "learning_rate": 0.00015105674699013283, "loss": 1.4833, "step": 18978 }, { "epoch": 1.49, "learning_rate": 0.00015104438757712022, "loss": 1.5184, "step": 18979 }, { "epoch": 1.49, "learning_rate": 0.0001510320281570168, "loss": 1.517, "step": 18980 }, { "epoch": 1.49, "learning_rate": 0.00015101966872990648, "loss": 1.4944, "step": 18981 }, { "epoch": 1.49, "learning_rate": 0.00015100730929587313, "loss": 1.5305, "step": 18982 }, { "epoch": 1.49, "learning_rate": 0.00015099494985500075, "loss": 1.4759, "step": 18983 }, { "epoch": 1.49, "learning_rate": 0.00015098259040737322, "loss": 1.5025, "step": 18984 }, { "epoch": 1.49, "learning_rate": 0.0001509702309530744, "loss": 1.5579, "step": 18985 }, { "epoch": 1.49, "learning_rate": 0.00015095787149218832, "loss": 1.5226, "step": 18986 }, { "epoch": 1.49, "learning_rate": 0.00015094551202479874, "loss": 1.5273, "step": 18987 }, { "epoch": 1.49, "learning_rate": 0.00015093315255098968, "loss": 1.4878, "step": 18988 }, { "epoch": 1.49, "learning_rate": 0.00015092079307084502, "loss": 1.4995, "step": 18989 }, { "epoch": 1.49, "learning_rate": 0.00015090843358444867, "loss": 1.4746, "step": 18990 }, { "epoch": 1.49, "learning_rate": 0.00015089607409188465, "loss": 1.5024, "step": 18991 }, { "epoch": 1.49, "learning_rate": 0.0001508837145932367, "loss": 1.5319, "step": 18992 }, { "epoch": 1.49, "learning_rate": 0.00015087135508858886, "loss": 1.5242, "step": 18993 }, { "epoch": 1.49, "learning_rate": 0.00015085899557802497, "loss": 1.528, "step": 18994 }, { "epoch": 1.49, "learning_rate": 0.00015084663606162896, "loss": 1.519, "step": 18995 }, { "epoch": 1.49, "learning_rate": 0.0001508342765394848, "loss": 1.5544, "step": 18996 }, { "epoch": 1.49, "learning_rate": 0.0001508219170116763, "loss": 1.6043, "step": 18997 }, { "epoch": 1.49, "learning_rate": 0.0001508095574782875, "loss": 1.5623, "step": 18998 }, { "epoch": 1.49, "learning_rate": 0.00015079719793940221, "loss": 1.525, "step": 18999 }, { "epoch": 1.49, "learning_rate": 0.0001507848383951044, "loss": 1.5038, "step": 19000 }, { "epoch": 1.5, "learning_rate": 0.00015077247884547797, "loss": 1.5071, "step": 19001 }, { "epoch": 1.5, "learning_rate": 0.00015076011929060683, "loss": 1.5283, "step": 19002 }, { "epoch": 1.5, "learning_rate": 0.00015074775973057493, "loss": 1.4588, "step": 19003 }, { "epoch": 1.5, "learning_rate": 0.00015073540016546612, "loss": 1.5523, "step": 19004 }, { "epoch": 1.5, "learning_rate": 0.00015072304059536435, "loss": 1.5246, "step": 19005 }, { "epoch": 1.5, "learning_rate": 0.00015071068102035355, "loss": 1.5534, "step": 19006 }, { "epoch": 1.5, "learning_rate": 0.0001506983214405176, "loss": 1.4636, "step": 19007 }, { "epoch": 1.5, "learning_rate": 0.00015068596185594047, "loss": 1.5091, "step": 19008 }, { "epoch": 1.5, "learning_rate": 0.000150673602266706, "loss": 1.5022, "step": 19009 }, { "epoch": 1.5, "learning_rate": 0.00015066124267289817, "loss": 1.5276, "step": 19010 }, { "epoch": 1.5, "learning_rate": 0.00015064888307460086, "loss": 1.5316, "step": 19011 }, { "epoch": 1.5, "learning_rate": 0.00015063652347189796, "loss": 1.5045, "step": 19012 }, { "epoch": 1.5, "learning_rate": 0.00015062416386487344, "loss": 1.4937, "step": 19013 }, { "epoch": 1.5, "learning_rate": 0.00015061180425361118, "loss": 1.5083, "step": 19014 }, { "epoch": 1.5, "learning_rate": 0.00015059944463819515, "loss": 1.4937, "step": 19015 }, { "epoch": 1.5, "learning_rate": 0.00015058708501870918, "loss": 1.5263, "step": 19016 }, { "epoch": 1.5, "learning_rate": 0.00015057472539523723, "loss": 1.4435, "step": 19017 }, { "epoch": 1.5, "learning_rate": 0.00015056236576786324, "loss": 1.544, "step": 19018 }, { "epoch": 1.5, "learning_rate": 0.00015055000613667106, "loss": 1.5399, "step": 19019 }, { "epoch": 1.5, "learning_rate": 0.00015053764650174468, "loss": 1.5196, "step": 19020 }, { "epoch": 1.5, "learning_rate": 0.00015052528686316792, "loss": 1.5137, "step": 19021 }, { "epoch": 1.5, "learning_rate": 0.00015051292722102476, "loss": 1.5155, "step": 19022 }, { "epoch": 1.5, "learning_rate": 0.00015050056757539917, "loss": 1.5595, "step": 19023 }, { "epoch": 1.5, "learning_rate": 0.00015048820792637498, "loss": 1.4853, "step": 19024 }, { "epoch": 1.5, "learning_rate": 0.00015047584827403612, "loss": 1.5101, "step": 19025 }, { "epoch": 1.5, "learning_rate": 0.00015046348861846647, "loss": 1.4827, "step": 19026 }, { "epoch": 1.5, "learning_rate": 0.00015045112895975, "loss": 1.5008, "step": 19027 }, { "epoch": 1.5, "learning_rate": 0.00015043876929797068, "loss": 1.4316, "step": 19028 }, { "epoch": 1.5, "learning_rate": 0.0001504264096332123, "loss": 1.4498, "step": 19029 }, { "epoch": 1.5, "learning_rate": 0.00015041404996555887, "loss": 1.5157, "step": 19030 }, { "epoch": 1.5, "learning_rate": 0.00015040169029509424, "loss": 1.5331, "step": 19031 }, { "epoch": 1.5, "learning_rate": 0.0001503893306219024, "loss": 1.5468, "step": 19032 }, { "epoch": 1.5, "learning_rate": 0.00015037697094606717, "loss": 1.5189, "step": 19033 }, { "epoch": 1.5, "learning_rate": 0.00015036461126767252, "loss": 1.476, "step": 19034 }, { "epoch": 1.5, "learning_rate": 0.0001503522515868024, "loss": 1.5774, "step": 19035 }, { "epoch": 1.5, "learning_rate": 0.0001503398919035406, "loss": 1.4961, "step": 19036 }, { "epoch": 1.5, "learning_rate": 0.0001503275322179712, "loss": 1.5175, "step": 19037 }, { "epoch": 1.5, "learning_rate": 0.00015031517253017798, "loss": 1.5397, "step": 19038 }, { "epoch": 1.5, "learning_rate": 0.00015030281284024495, "loss": 1.5105, "step": 19039 }, { "epoch": 1.5, "learning_rate": 0.000150290453148256, "loss": 1.4931, "step": 19040 }, { "epoch": 1.5, "learning_rate": 0.000150278093454295, "loss": 1.4824, "step": 19041 }, { "epoch": 1.5, "learning_rate": 0.00015026573375844597, "loss": 1.4967, "step": 19042 }, { "epoch": 1.5, "learning_rate": 0.0001502533740607927, "loss": 1.4956, "step": 19043 }, { "epoch": 1.5, "learning_rate": 0.00015024101436141916, "loss": 1.5657, "step": 19044 }, { "epoch": 1.5, "learning_rate": 0.00015022865466040924, "loss": 1.5218, "step": 19045 }, { "epoch": 1.5, "learning_rate": 0.0001502162949578469, "loss": 1.5274, "step": 19046 }, { "epoch": 1.5, "learning_rate": 0.00015020393525381608, "loss": 1.5312, "step": 19047 }, { "epoch": 1.5, "learning_rate": 0.00015019157554840062, "loss": 1.5989, "step": 19048 }, { "epoch": 1.5, "learning_rate": 0.00015017921584168446, "loss": 1.566, "step": 19049 }, { "epoch": 1.5, "learning_rate": 0.00015016685613375154, "loss": 1.5108, "step": 19050 }, { "epoch": 1.5, "learning_rate": 0.00015015449642468573, "loss": 1.5426, "step": 19051 }, { "epoch": 1.5, "learning_rate": 0.00015014213671457098, "loss": 1.4715, "step": 19052 }, { "epoch": 1.5, "learning_rate": 0.00015012977700349118, "loss": 1.5303, "step": 19053 }, { "epoch": 1.5, "learning_rate": 0.00015011741729153036, "loss": 1.5107, "step": 19054 }, { "epoch": 1.5, "learning_rate": 0.00015010505757877225, "loss": 1.4993, "step": 19055 }, { "epoch": 1.5, "learning_rate": 0.00015009269786530086, "loss": 1.5484, "step": 19056 }, { "epoch": 1.5, "learning_rate": 0.00015008033815120016, "loss": 1.5363, "step": 19057 }, { "epoch": 1.5, "learning_rate": 0.00015006797843655396, "loss": 1.5065, "step": 19058 }, { "epoch": 1.5, "learning_rate": 0.0001500556187214463, "loss": 1.5283, "step": 19059 }, { "epoch": 1.5, "learning_rate": 0.00015004325900596087, "loss": 1.4938, "step": 19060 }, { "epoch": 1.5, "learning_rate": 0.00015003089929018187, "loss": 1.4865, "step": 19061 }, { "epoch": 1.5, "learning_rate": 0.00015001853957419302, "loss": 1.5632, "step": 19062 }, { "epoch": 1.5, "learning_rate": 0.00015000617985807833, "loss": 1.4762, "step": 19063 }, { "epoch": 1.5, "learning_rate": 0.00014999382014192167, "loss": 1.5393, "step": 19064 }, { "epoch": 1.5, "learning_rate": 0.00014998146042580695, "loss": 1.4436, "step": 19065 }, { "epoch": 1.5, "learning_rate": 0.00014996910070981813, "loss": 1.5043, "step": 19066 }, { "epoch": 1.5, "learning_rate": 0.0001499567409940391, "loss": 1.5417, "step": 19067 }, { "epoch": 1.5, "learning_rate": 0.00014994438127855376, "loss": 1.5541, "step": 19068 }, { "epoch": 1.5, "learning_rate": 0.00014993202156344604, "loss": 1.5034, "step": 19069 }, { "epoch": 1.5, "learning_rate": 0.00014991966184879984, "loss": 1.5224, "step": 19070 }, { "epoch": 1.5, "learning_rate": 0.0001499073021346991, "loss": 1.4906, "step": 19071 }, { "epoch": 1.5, "learning_rate": 0.00014989494242122772, "loss": 1.5738, "step": 19072 }, { "epoch": 1.5, "learning_rate": 0.00014988258270846966, "loss": 1.5579, "step": 19073 }, { "epoch": 1.5, "learning_rate": 0.00014987022299650876, "loss": 1.4705, "step": 19074 }, { "epoch": 1.5, "learning_rate": 0.000149857863285429, "loss": 1.4954, "step": 19075 }, { "epoch": 1.5, "learning_rate": 0.00014984550357531427, "loss": 1.4792, "step": 19076 }, { "epoch": 1.5, "learning_rate": 0.00014983314386624846, "loss": 1.5894, "step": 19077 }, { "epoch": 1.5, "learning_rate": 0.0001498207841583155, "loss": 1.5433, "step": 19078 }, { "epoch": 1.5, "learning_rate": 0.00014980842445159938, "loss": 1.5369, "step": 19079 }, { "epoch": 1.5, "learning_rate": 0.00014979606474618392, "loss": 1.5648, "step": 19080 }, { "epoch": 1.5, "learning_rate": 0.0001497837050421531, "loss": 1.5249, "step": 19081 }, { "epoch": 1.5, "learning_rate": 0.00014977134533959073, "loss": 1.5014, "step": 19082 }, { "epoch": 1.5, "learning_rate": 0.00014975898563858084, "loss": 1.4575, "step": 19083 }, { "epoch": 1.5, "learning_rate": 0.00014974662593920734, "loss": 1.5474, "step": 19084 }, { "epoch": 1.5, "learning_rate": 0.00014973426624155406, "loss": 1.4691, "step": 19085 }, { "epoch": 1.5, "learning_rate": 0.000149721906545705, "loss": 1.5073, "step": 19086 }, { "epoch": 1.5, "learning_rate": 0.000149709546851744, "loss": 1.5603, "step": 19087 }, { "epoch": 1.5, "learning_rate": 0.000149697187159755, "loss": 1.5277, "step": 19088 }, { "epoch": 1.5, "learning_rate": 0.00014968482746982196, "loss": 1.4673, "step": 19089 }, { "epoch": 1.5, "learning_rate": 0.0001496724677820288, "loss": 1.5117, "step": 19090 }, { "epoch": 1.5, "learning_rate": 0.00014966010809645936, "loss": 1.5687, "step": 19091 }, { "epoch": 1.5, "learning_rate": 0.0001496477484131976, "loss": 1.5106, "step": 19092 }, { "epoch": 1.5, "learning_rate": 0.00014963538873232748, "loss": 1.5254, "step": 19093 }, { "epoch": 1.5, "learning_rate": 0.00014962302905393283, "loss": 1.5328, "step": 19094 }, { "epoch": 1.5, "learning_rate": 0.0001496106693780976, "loss": 1.5293, "step": 19095 }, { "epoch": 1.5, "learning_rate": 0.00014959830970490576, "loss": 1.5527, "step": 19096 }, { "epoch": 1.5, "learning_rate": 0.00014958595003444113, "loss": 1.5232, "step": 19097 }, { "epoch": 1.5, "learning_rate": 0.00014957359036678772, "loss": 1.5201, "step": 19098 }, { "epoch": 1.5, "learning_rate": 0.00014956123070202933, "loss": 1.5963, "step": 19099 }, { "epoch": 1.5, "learning_rate": 0.00014954887104024996, "loss": 1.5726, "step": 19100 }, { "epoch": 1.5, "learning_rate": 0.00014953651138153353, "loss": 1.5161, "step": 19101 }, { "epoch": 1.5, "learning_rate": 0.0001495241517259639, "loss": 1.5194, "step": 19102 }, { "epoch": 1.5, "learning_rate": 0.000149511792073625, "loss": 1.5298, "step": 19103 }, { "epoch": 1.5, "learning_rate": 0.0001494994324246008, "loss": 1.4467, "step": 19104 }, { "epoch": 1.5, "learning_rate": 0.0001494870727789752, "loss": 1.5118, "step": 19105 }, { "epoch": 1.5, "learning_rate": 0.00014947471313683203, "loss": 1.5502, "step": 19106 }, { "epoch": 1.5, "learning_rate": 0.0001494623534982553, "loss": 1.5393, "step": 19107 }, { "epoch": 1.5, "learning_rate": 0.00014944999386332891, "loss": 1.5207, "step": 19108 }, { "epoch": 1.5, "learning_rate": 0.00014943763423213677, "loss": 1.5014, "step": 19109 }, { "epoch": 1.5, "learning_rate": 0.00014942527460476277, "loss": 1.5075, "step": 19110 }, { "epoch": 1.5, "learning_rate": 0.00014941291498129082, "loss": 1.4759, "step": 19111 }, { "epoch": 1.5, "learning_rate": 0.00014940055536180486, "loss": 1.52, "step": 19112 }, { "epoch": 1.5, "learning_rate": 0.0001493881957463888, "loss": 1.4968, "step": 19113 }, { "epoch": 1.5, "learning_rate": 0.00014937583613512656, "loss": 1.4925, "step": 19114 }, { "epoch": 1.5, "learning_rate": 0.00014936347652810207, "loss": 1.4879, "step": 19115 }, { "epoch": 1.5, "learning_rate": 0.00014935111692539917, "loss": 1.5341, "step": 19116 }, { "epoch": 1.5, "learning_rate": 0.00014933875732710185, "loss": 1.5129, "step": 19117 }, { "epoch": 1.5, "learning_rate": 0.00014932639773329403, "loss": 1.5083, "step": 19118 }, { "epoch": 1.5, "learning_rate": 0.00014931403814405953, "loss": 1.511, "step": 19119 }, { "epoch": 1.5, "learning_rate": 0.00014930167855948235, "loss": 1.4676, "step": 19120 }, { "epoch": 1.5, "learning_rate": 0.0001492893189796464, "loss": 1.5101, "step": 19121 }, { "epoch": 1.5, "learning_rate": 0.00014927695940463562, "loss": 1.5244, "step": 19122 }, { "epoch": 1.5, "learning_rate": 0.00014926459983453385, "loss": 1.5912, "step": 19123 }, { "epoch": 1.5, "learning_rate": 0.00014925224026942504, "loss": 1.5083, "step": 19124 }, { "epoch": 1.5, "learning_rate": 0.00014923988070939315, "loss": 1.4873, "step": 19125 }, { "epoch": 1.5, "learning_rate": 0.000149227521154522, "loss": 1.4708, "step": 19126 }, { "epoch": 1.5, "learning_rate": 0.0001492151616048956, "loss": 1.4841, "step": 19127 }, { "epoch": 1.51, "learning_rate": 0.0001492028020605978, "loss": 1.4726, "step": 19128 }, { "epoch": 1.51, "learning_rate": 0.0001491904425217125, "loss": 1.5169, "step": 19129 }, { "epoch": 1.51, "learning_rate": 0.0001491780829883237, "loss": 1.5283, "step": 19130 }, { "epoch": 1.51, "learning_rate": 0.00014916572346051522, "loss": 1.5387, "step": 19131 }, { "epoch": 1.51, "learning_rate": 0.00014915336393837107, "loss": 1.4836, "step": 19132 }, { "epoch": 1.51, "learning_rate": 0.00014914100442197506, "loss": 1.4332, "step": 19133 }, { "epoch": 1.51, "learning_rate": 0.00014912864491141117, "loss": 1.5575, "step": 19134 }, { "epoch": 1.51, "learning_rate": 0.00014911628540676327, "loss": 1.533, "step": 19135 }, { "epoch": 1.51, "learning_rate": 0.00014910392590811533, "loss": 1.5375, "step": 19136 }, { "epoch": 1.51, "learning_rate": 0.00014909156641555125, "loss": 1.5596, "step": 19137 }, { "epoch": 1.51, "learning_rate": 0.00014907920692915492, "loss": 1.4701, "step": 19138 }, { "epoch": 1.51, "learning_rate": 0.00014906684744901032, "loss": 1.5552, "step": 19139 }, { "epoch": 1.51, "learning_rate": 0.00014905448797520123, "loss": 1.5314, "step": 19140 }, { "epoch": 1.51, "learning_rate": 0.00014904212850781168, "loss": 1.4894, "step": 19141 }, { "epoch": 1.51, "learning_rate": 0.00014902976904692557, "loss": 1.4592, "step": 19142 }, { "epoch": 1.51, "learning_rate": 0.00014901740959262678, "loss": 1.4919, "step": 19143 }, { "epoch": 1.51, "learning_rate": 0.00014900505014499925, "loss": 1.492, "step": 19144 }, { "epoch": 1.51, "learning_rate": 0.00014899269070412687, "loss": 1.4822, "step": 19145 }, { "epoch": 1.51, "learning_rate": 0.00014898033127009352, "loss": 1.5344, "step": 19146 }, { "epoch": 1.51, "learning_rate": 0.00014896797184298322, "loss": 1.5053, "step": 19147 }, { "epoch": 1.51, "learning_rate": 0.00014895561242287978, "loss": 1.5347, "step": 19148 }, { "epoch": 1.51, "learning_rate": 0.00014894325300986717, "loss": 1.5243, "step": 19149 }, { "epoch": 1.51, "learning_rate": 0.00014893089360402923, "loss": 1.5139, "step": 19150 }, { "epoch": 1.51, "learning_rate": 0.00014891853420545003, "loss": 1.5446, "step": 19151 }, { "epoch": 1.51, "learning_rate": 0.00014890617481421334, "loss": 1.5624, "step": 19152 }, { "epoch": 1.51, "learning_rate": 0.00014889381543040312, "loss": 1.4794, "step": 19153 }, { "epoch": 1.51, "learning_rate": 0.0001488814560541033, "loss": 1.5487, "step": 19154 }, { "epoch": 1.51, "learning_rate": 0.00014886909668539777, "loss": 1.5252, "step": 19155 }, { "epoch": 1.51, "learning_rate": 0.00014885673732437045, "loss": 1.5019, "step": 19156 }, { "epoch": 1.51, "learning_rate": 0.00014884437797110523, "loss": 1.5469, "step": 19157 }, { "epoch": 1.51, "learning_rate": 0.00014883201862568606, "loss": 1.5409, "step": 19158 }, { "epoch": 1.51, "learning_rate": 0.00014881965928819686, "loss": 1.5194, "step": 19159 }, { "epoch": 1.51, "learning_rate": 0.0001488072999587215, "loss": 1.507, "step": 19160 }, { "epoch": 1.51, "learning_rate": 0.00014879494063734392, "loss": 1.5462, "step": 19161 }, { "epoch": 1.51, "learning_rate": 0.00014878258132414803, "loss": 1.5149, "step": 19162 }, { "epoch": 1.51, "learning_rate": 0.00014877022201921776, "loss": 1.577, "step": 19163 }, { "epoch": 1.51, "learning_rate": 0.000148757862722637, "loss": 1.4926, "step": 19164 }, { "epoch": 1.51, "learning_rate": 0.0001487455034344896, "loss": 1.531, "step": 19165 }, { "epoch": 1.51, "learning_rate": 0.00014873314415485959, "loss": 1.4956, "step": 19166 }, { "epoch": 1.51, "learning_rate": 0.0001487207848838308, "loss": 1.5054, "step": 19167 }, { "epoch": 1.51, "learning_rate": 0.00014870842562148725, "loss": 1.5222, "step": 19168 }, { "epoch": 1.51, "learning_rate": 0.0001486960663679127, "loss": 1.5355, "step": 19169 }, { "epoch": 1.51, "learning_rate": 0.00014868370712319118, "loss": 1.5226, "step": 19170 }, { "epoch": 1.51, "learning_rate": 0.00014867134788740656, "loss": 1.5365, "step": 19171 }, { "epoch": 1.51, "learning_rate": 0.00014865898866064275, "loss": 1.5105, "step": 19172 }, { "epoch": 1.51, "learning_rate": 0.00014864662944298368, "loss": 1.5059, "step": 19173 }, { "epoch": 1.51, "learning_rate": 0.00014863427023451323, "loss": 1.4926, "step": 19174 }, { "epoch": 1.51, "learning_rate": 0.00014862191103531532, "loss": 1.5041, "step": 19175 }, { "epoch": 1.51, "learning_rate": 0.00014860955184547393, "loss": 1.5072, "step": 19176 }, { "epoch": 1.51, "learning_rate": 0.00014859719266507285, "loss": 1.5365, "step": 19177 }, { "epoch": 1.51, "learning_rate": 0.00014858483349419608, "loss": 1.4891, "step": 19178 }, { "epoch": 1.51, "learning_rate": 0.00014857247433292754, "loss": 1.5268, "step": 19179 }, { "epoch": 1.51, "learning_rate": 0.00014856011518135106, "loss": 1.4437, "step": 19180 }, { "epoch": 1.51, "learning_rate": 0.00014854775603955067, "loss": 1.5358, "step": 19181 }, { "epoch": 1.51, "learning_rate": 0.0001485353969076101, "loss": 1.4884, "step": 19182 }, { "epoch": 1.51, "learning_rate": 0.00014852303778561347, "loss": 1.4835, "step": 19183 }, { "epoch": 1.51, "learning_rate": 0.00014851067867364454, "loss": 1.5472, "step": 19184 }, { "epoch": 1.51, "learning_rate": 0.00014849831957178735, "loss": 1.5336, "step": 19185 }, { "epoch": 1.51, "learning_rate": 0.0001484859604801257, "loss": 1.4988, "step": 19186 }, { "epoch": 1.51, "learning_rate": 0.00014847360139874354, "loss": 1.4776, "step": 19187 }, { "epoch": 1.51, "learning_rate": 0.00014846124232772482, "loss": 1.493, "step": 19188 }, { "epoch": 1.51, "learning_rate": 0.0001484488832671534, "loss": 1.5501, "step": 19189 }, { "epoch": 1.51, "learning_rate": 0.00014843652421711319, "loss": 1.5174, "step": 19190 }, { "epoch": 1.51, "learning_rate": 0.00014842416517768815, "loss": 1.5283, "step": 19191 }, { "epoch": 1.51, "learning_rate": 0.00014841180614896213, "loss": 1.5175, "step": 19192 }, { "epoch": 1.51, "learning_rate": 0.00014839944713101907, "loss": 1.4995, "step": 19193 }, { "epoch": 1.51, "learning_rate": 0.0001483870881239429, "loss": 1.5643, "step": 19194 }, { "epoch": 1.51, "learning_rate": 0.00014837472912781748, "loss": 1.4743, "step": 19195 }, { "epoch": 1.51, "learning_rate": 0.00014836237014272677, "loss": 1.5414, "step": 19196 }, { "epoch": 1.51, "learning_rate": 0.00014835001116875467, "loss": 1.5139, "step": 19197 }, { "epoch": 1.51, "learning_rate": 0.00014833765220598503, "loss": 1.5306, "step": 19198 }, { "epoch": 1.51, "learning_rate": 0.00014832529325450186, "loss": 1.4989, "step": 19199 }, { "epoch": 1.51, "learning_rate": 0.00014831293431438904, "loss": 1.5241, "step": 19200 }, { "epoch": 1.51, "learning_rate": 0.00014830057538573046, "loss": 1.4655, "step": 19201 }, { "epoch": 1.51, "learning_rate": 0.00014828821646861005, "loss": 1.4918, "step": 19202 }, { "epoch": 1.51, "learning_rate": 0.00014827585756311165, "loss": 1.4984, "step": 19203 }, { "epoch": 1.51, "learning_rate": 0.00014826349866931926, "loss": 1.5195, "step": 19204 }, { "epoch": 1.51, "learning_rate": 0.00014825113978731677, "loss": 1.4935, "step": 19205 }, { "epoch": 1.51, "learning_rate": 0.00014823878091718804, "loss": 1.4868, "step": 19206 }, { "epoch": 1.51, "learning_rate": 0.00014822642205901702, "loss": 1.5009, "step": 19207 }, { "epoch": 1.51, "learning_rate": 0.00014821406321288767, "loss": 1.4405, "step": 19208 }, { "epoch": 1.51, "learning_rate": 0.0001482017043788838, "loss": 1.4808, "step": 19209 }, { "epoch": 1.51, "learning_rate": 0.00014818934555708939, "loss": 1.4688, "step": 19210 }, { "epoch": 1.51, "learning_rate": 0.0001481769867475883, "loss": 1.5277, "step": 19211 }, { "epoch": 1.51, "learning_rate": 0.00014816462795046444, "loss": 1.5727, "step": 19212 }, { "epoch": 1.51, "learning_rate": 0.00014815226916580174, "loss": 1.4937, "step": 19213 }, { "epoch": 1.51, "learning_rate": 0.00014813991039368417, "loss": 1.5568, "step": 19214 }, { "epoch": 1.51, "learning_rate": 0.00014812755163419553, "loss": 1.4794, "step": 19215 }, { "epoch": 1.51, "learning_rate": 0.0001481151928874198, "loss": 1.5165, "step": 19216 }, { "epoch": 1.51, "learning_rate": 0.0001481028341534409, "loss": 1.4444, "step": 19217 }, { "epoch": 1.51, "learning_rate": 0.00014809047543234266, "loss": 1.5378, "step": 19218 }, { "epoch": 1.51, "learning_rate": 0.00014807811672420908, "loss": 1.5018, "step": 19219 }, { "epoch": 1.51, "learning_rate": 0.00014806575802912402, "loss": 1.5448, "step": 19220 }, { "epoch": 1.51, "learning_rate": 0.0001480533993471714, "loss": 1.5247, "step": 19221 }, { "epoch": 1.51, "learning_rate": 0.0001480410406784351, "loss": 1.5079, "step": 19222 }, { "epoch": 1.51, "learning_rate": 0.00014802868202299906, "loss": 1.4962, "step": 19223 }, { "epoch": 1.51, "learning_rate": 0.00014801632338094718, "loss": 1.519, "step": 19224 }, { "epoch": 1.51, "learning_rate": 0.0001480039647523634, "loss": 1.5178, "step": 19225 }, { "epoch": 1.51, "learning_rate": 0.00014799160613733156, "loss": 1.4873, "step": 19226 }, { "epoch": 1.51, "learning_rate": 0.00014797924753593567, "loss": 1.5156, "step": 19227 }, { "epoch": 1.51, "learning_rate": 0.00014796688894825948, "loss": 1.5124, "step": 19228 }, { "epoch": 1.51, "learning_rate": 0.000147954530374387, "loss": 1.5229, "step": 19229 }, { "epoch": 1.51, "learning_rate": 0.00014794217181440214, "loss": 1.4696, "step": 19230 }, { "epoch": 1.51, "learning_rate": 0.00014792981326838887, "loss": 1.4845, "step": 19231 }, { "epoch": 1.51, "learning_rate": 0.00014791745473643095, "loss": 1.5048, "step": 19232 }, { "epoch": 1.51, "learning_rate": 0.00014790509621861238, "loss": 1.5185, "step": 19233 }, { "epoch": 1.51, "learning_rate": 0.00014789273771501708, "loss": 1.5265, "step": 19234 }, { "epoch": 1.51, "learning_rate": 0.00014788037922572892, "loss": 1.5154, "step": 19235 }, { "epoch": 1.51, "learning_rate": 0.0001478680207508318, "loss": 1.4914, "step": 19236 }, { "epoch": 1.51, "learning_rate": 0.00014785566229040965, "loss": 1.5218, "step": 19237 }, { "epoch": 1.51, "learning_rate": 0.00014784330384454638, "loss": 1.498, "step": 19238 }, { "epoch": 1.51, "learning_rate": 0.00014783094541332589, "loss": 1.5644, "step": 19239 }, { "epoch": 1.51, "learning_rate": 0.00014781858699683206, "loss": 1.5206, "step": 19240 }, { "epoch": 1.51, "learning_rate": 0.0001478062285951488, "loss": 1.5163, "step": 19241 }, { "epoch": 1.51, "learning_rate": 0.0001477938702083601, "loss": 1.5009, "step": 19242 }, { "epoch": 1.51, "learning_rate": 0.00014778151183654975, "loss": 1.5026, "step": 19243 }, { "epoch": 1.51, "learning_rate": 0.00014776915347980177, "loss": 1.5052, "step": 19244 }, { "epoch": 1.51, "learning_rate": 0.00014775679513819988, "loss": 1.496, "step": 19245 }, { "epoch": 1.51, "learning_rate": 0.00014774443681182822, "loss": 1.5205, "step": 19246 }, { "epoch": 1.51, "learning_rate": 0.00014773207850077056, "loss": 1.5537, "step": 19247 }, { "epoch": 1.51, "learning_rate": 0.00014771972020511084, "loss": 1.5181, "step": 19248 }, { "epoch": 1.51, "learning_rate": 0.000147707361924933, "loss": 1.5346, "step": 19249 }, { "epoch": 1.51, "learning_rate": 0.00014769500366032084, "loss": 1.4899, "step": 19250 }, { "epoch": 1.51, "learning_rate": 0.0001476826454113584, "loss": 1.459, "step": 19251 }, { "epoch": 1.51, "learning_rate": 0.00014767028717812948, "loss": 1.4946, "step": 19252 }, { "epoch": 1.51, "learning_rate": 0.00014765792896071801, "loss": 1.4695, "step": 19253 }, { "epoch": 1.51, "learning_rate": 0.00014764557075920795, "loss": 1.4942, "step": 19254 }, { "epoch": 1.52, "learning_rate": 0.00014763321257368314, "loss": 1.51, "step": 19255 }, { "epoch": 1.52, "learning_rate": 0.00014762085440422754, "loss": 1.4939, "step": 19256 }, { "epoch": 1.52, "learning_rate": 0.00014760849625092498, "loss": 1.4581, "step": 19257 }, { "epoch": 1.52, "learning_rate": 0.00014759613811385943, "loss": 1.4912, "step": 19258 }, { "epoch": 1.52, "learning_rate": 0.00014758377999311481, "loss": 1.4984, "step": 19259 }, { "epoch": 1.52, "learning_rate": 0.00014757142188877485, "loss": 1.5233, "step": 19260 }, { "epoch": 1.52, "learning_rate": 0.00014755906380092373, "loss": 1.5208, "step": 19261 }, { "epoch": 1.52, "learning_rate": 0.00014754670572964521, "loss": 1.5007, "step": 19262 }, { "epoch": 1.52, "learning_rate": 0.00014753434767502318, "loss": 1.505, "step": 19263 }, { "epoch": 1.52, "learning_rate": 0.0001475219896371416, "loss": 1.5252, "step": 19264 }, { "epoch": 1.52, "learning_rate": 0.0001475096316160843, "loss": 1.546, "step": 19265 }, { "epoch": 1.52, "learning_rate": 0.00014749727361193526, "loss": 1.5275, "step": 19266 }, { "epoch": 1.52, "learning_rate": 0.00014748491562477833, "loss": 1.5313, "step": 19267 }, { "epoch": 1.52, "learning_rate": 0.00014747255765469746, "loss": 1.5362, "step": 19268 }, { "epoch": 1.52, "learning_rate": 0.0001474601997017765, "loss": 1.5168, "step": 19269 }, { "epoch": 1.52, "learning_rate": 0.00014744784176609938, "loss": 1.5132, "step": 19270 }, { "epoch": 1.52, "learning_rate": 0.00014743548384775005, "loss": 1.5989, "step": 19271 }, { "epoch": 1.52, "learning_rate": 0.00014742312594681232, "loss": 1.5675, "step": 19272 }, { "epoch": 1.52, "learning_rate": 0.00014741076806337015, "loss": 1.4883, "step": 19273 }, { "epoch": 1.52, "learning_rate": 0.00014739841019750747, "loss": 1.4992, "step": 19274 }, { "epoch": 1.52, "learning_rate": 0.00014738605234930813, "loss": 1.5505, "step": 19275 }, { "epoch": 1.52, "learning_rate": 0.000147373694518856, "loss": 1.5171, "step": 19276 }, { "epoch": 1.52, "learning_rate": 0.00014736133670623506, "loss": 1.5194, "step": 19277 }, { "epoch": 1.52, "learning_rate": 0.00014734897891152923, "loss": 1.5397, "step": 19278 }, { "epoch": 1.52, "learning_rate": 0.00014733662113482234, "loss": 1.4948, "step": 19279 }, { "epoch": 1.52, "learning_rate": 0.00014732426337619835, "loss": 1.5299, "step": 19280 }, { "epoch": 1.52, "learning_rate": 0.00014731190563574114, "loss": 1.5726, "step": 19281 }, { "epoch": 1.52, "learning_rate": 0.00014729954791353454, "loss": 1.5433, "step": 19282 }, { "epoch": 1.52, "learning_rate": 0.0001472871902096626, "loss": 1.4741, "step": 19283 }, { "epoch": 1.52, "learning_rate": 0.0001472748325242091, "loss": 1.4551, "step": 19284 }, { "epoch": 1.52, "learning_rate": 0.000147262474857258, "loss": 1.5103, "step": 19285 }, { "epoch": 1.52, "learning_rate": 0.00014725011720889317, "loss": 1.5102, "step": 19286 }, { "epoch": 1.52, "learning_rate": 0.00014723775957919852, "loss": 1.5113, "step": 19287 }, { "epoch": 1.52, "learning_rate": 0.000147225401968258, "loss": 1.5138, "step": 19288 }, { "epoch": 1.52, "learning_rate": 0.00014721304437615543, "loss": 1.5266, "step": 19289 }, { "epoch": 1.52, "learning_rate": 0.00014720068680297476, "loss": 1.5156, "step": 19290 }, { "epoch": 1.52, "learning_rate": 0.0001471883292487999, "loss": 1.5229, "step": 19291 }, { "epoch": 1.52, "learning_rate": 0.0001471759717137147, "loss": 1.5307, "step": 19292 }, { "epoch": 1.52, "learning_rate": 0.00014716361419780306, "loss": 1.4993, "step": 19293 }, { "epoch": 1.52, "learning_rate": 0.00014715125670114896, "loss": 1.5122, "step": 19294 }, { "epoch": 1.52, "learning_rate": 0.0001471388992238363, "loss": 1.5311, "step": 19295 }, { "epoch": 1.52, "learning_rate": 0.00014712654176594886, "loss": 1.5254, "step": 19296 }, { "epoch": 1.52, "learning_rate": 0.00014711418432757068, "loss": 1.491, "step": 19297 }, { "epoch": 1.52, "learning_rate": 0.00014710182690878554, "loss": 1.4971, "step": 19298 }, { "epoch": 1.52, "learning_rate": 0.00014708946950967743, "loss": 1.5046, "step": 19299 }, { "epoch": 1.52, "learning_rate": 0.00014707711213033024, "loss": 1.478, "step": 19300 }, { "epoch": 1.52, "learning_rate": 0.0001470647547708278, "loss": 1.5194, "step": 19301 }, { "epoch": 1.52, "learning_rate": 0.00014705239743125406, "loss": 1.5639, "step": 19302 }, { "epoch": 1.52, "learning_rate": 0.00014704004011169294, "loss": 1.5081, "step": 19303 }, { "epoch": 1.52, "learning_rate": 0.00014702768281222827, "loss": 1.5523, "step": 19304 }, { "epoch": 1.52, "learning_rate": 0.00014701532553294404, "loss": 1.4986, "step": 19305 }, { "epoch": 1.52, "learning_rate": 0.00014700296827392407, "loss": 1.5124, "step": 19306 }, { "epoch": 1.52, "learning_rate": 0.0001469906110352523, "loss": 1.4979, "step": 19307 }, { "epoch": 1.52, "learning_rate": 0.00014697825381701257, "loss": 1.4556, "step": 19308 }, { "epoch": 1.52, "learning_rate": 0.00014696589661928892, "loss": 1.5228, "step": 19309 }, { "epoch": 1.52, "learning_rate": 0.0001469535394421651, "loss": 1.4751, "step": 19310 }, { "epoch": 1.52, "learning_rate": 0.00014694118228572508, "loss": 1.4955, "step": 19311 }, { "epoch": 1.52, "learning_rate": 0.00014692882515005278, "loss": 1.5584, "step": 19312 }, { "epoch": 1.52, "learning_rate": 0.00014691646803523202, "loss": 1.4896, "step": 19313 }, { "epoch": 1.52, "learning_rate": 0.00014690411094134677, "loss": 1.4632, "step": 19314 }, { "epoch": 1.52, "learning_rate": 0.00014689175386848087, "loss": 1.5399, "step": 19315 }, { "epoch": 1.52, "learning_rate": 0.00014687939681671825, "loss": 1.54, "step": 19316 }, { "epoch": 1.52, "learning_rate": 0.00014686703978614285, "loss": 1.5021, "step": 19317 }, { "epoch": 1.52, "learning_rate": 0.00014685468277683846, "loss": 1.5261, "step": 19318 }, { "epoch": 1.52, "learning_rate": 0.00014684232578888906, "loss": 1.5416, "step": 19319 }, { "epoch": 1.52, "learning_rate": 0.00014682996882237856, "loss": 1.5642, "step": 19320 }, { "epoch": 1.52, "learning_rate": 0.00014681761187739078, "loss": 1.4934, "step": 19321 }, { "epoch": 1.52, "learning_rate": 0.0001468052549540097, "loss": 1.5684, "step": 19322 }, { "epoch": 1.52, "learning_rate": 0.00014679289805231906, "loss": 1.5028, "step": 19323 }, { "epoch": 1.52, "learning_rate": 0.00014678054117240295, "loss": 1.4795, "step": 19324 }, { "epoch": 1.52, "learning_rate": 0.0001467681843143452, "loss": 1.4773, "step": 19325 }, { "epoch": 1.52, "learning_rate": 0.00014675582747822972, "loss": 1.5175, "step": 19326 }, { "epoch": 1.52, "learning_rate": 0.00014674347066414033, "loss": 1.5307, "step": 19327 }, { "epoch": 1.52, "learning_rate": 0.00014673111387216098, "loss": 1.4626, "step": 19328 }, { "epoch": 1.52, "learning_rate": 0.0001467187571023756, "loss": 1.5125, "step": 19329 }, { "epoch": 1.52, "learning_rate": 0.00014670640035486802, "loss": 1.5055, "step": 19330 }, { "epoch": 1.52, "learning_rate": 0.00014669404362972218, "loss": 1.5252, "step": 19331 }, { "epoch": 1.52, "learning_rate": 0.00014668168692702198, "loss": 1.4882, "step": 19332 }, { "epoch": 1.52, "learning_rate": 0.00014666933024685126, "loss": 1.5149, "step": 19333 }, { "epoch": 1.52, "learning_rate": 0.00014665697358929396, "loss": 1.5285, "step": 19334 }, { "epoch": 1.52, "learning_rate": 0.00014664461695443397, "loss": 1.4891, "step": 19335 }, { "epoch": 1.52, "learning_rate": 0.00014663226034235515, "loss": 1.5544, "step": 19336 }, { "epoch": 1.52, "learning_rate": 0.00014661990375314148, "loss": 1.4946, "step": 19337 }, { "epoch": 1.52, "learning_rate": 0.00014660754718687674, "loss": 1.5204, "step": 19338 }, { "epoch": 1.52, "learning_rate": 0.00014659519064364487, "loss": 1.5391, "step": 19339 }, { "epoch": 1.52, "learning_rate": 0.0001465828341235298, "loss": 1.5304, "step": 19340 }, { "epoch": 1.52, "learning_rate": 0.00014657047762661542, "loss": 1.5734, "step": 19341 }, { "epoch": 1.52, "learning_rate": 0.0001465581211529856, "loss": 1.4996, "step": 19342 }, { "epoch": 1.52, "learning_rate": 0.00014654576470272425, "loss": 1.5212, "step": 19343 }, { "epoch": 1.52, "learning_rate": 0.00014653340827591523, "loss": 1.5265, "step": 19344 }, { "epoch": 1.52, "learning_rate": 0.00014652105187264245, "loss": 1.5134, "step": 19345 }, { "epoch": 1.52, "learning_rate": 0.00014650869549298983, "loss": 1.5314, "step": 19346 }, { "epoch": 1.52, "learning_rate": 0.00014649633913704123, "loss": 1.5408, "step": 19347 }, { "epoch": 1.52, "learning_rate": 0.00014648398280488054, "loss": 1.4926, "step": 19348 }, { "epoch": 1.52, "learning_rate": 0.0001464716264965917, "loss": 1.5472, "step": 19349 }, { "epoch": 1.52, "learning_rate": 0.00014645927021225856, "loss": 1.5159, "step": 19350 }, { "epoch": 1.52, "learning_rate": 0.00014644691395196503, "loss": 1.5199, "step": 19351 }, { "epoch": 1.52, "learning_rate": 0.00014643455771579496, "loss": 1.618, "step": 19352 }, { "epoch": 1.52, "learning_rate": 0.00014642220150383229, "loss": 1.4983, "step": 19353 }, { "epoch": 1.52, "learning_rate": 0.00014640984531616091, "loss": 1.5274, "step": 19354 }, { "epoch": 1.52, "learning_rate": 0.00014639748915286463, "loss": 1.5445, "step": 19355 }, { "epoch": 1.52, "learning_rate": 0.00014638513301402746, "loss": 1.4645, "step": 19356 }, { "epoch": 1.52, "learning_rate": 0.00014637277689973324, "loss": 1.5673, "step": 19357 }, { "epoch": 1.52, "learning_rate": 0.00014636042081006589, "loss": 1.4919, "step": 19358 }, { "epoch": 1.52, "learning_rate": 0.00014634806474510926, "loss": 1.5069, "step": 19359 }, { "epoch": 1.52, "learning_rate": 0.00014633570870494723, "loss": 1.5499, "step": 19360 }, { "epoch": 1.52, "learning_rate": 0.00014632335268966376, "loss": 1.5259, "step": 19361 }, { "epoch": 1.52, "learning_rate": 0.00014631099669934266, "loss": 1.4573, "step": 19362 }, { "epoch": 1.52, "learning_rate": 0.0001462986407340679, "loss": 1.505, "step": 19363 }, { "epoch": 1.52, "learning_rate": 0.00014628628479392328, "loss": 1.4669, "step": 19364 }, { "epoch": 1.52, "learning_rate": 0.00014627392887899275, "loss": 1.4977, "step": 19365 }, { "epoch": 1.52, "learning_rate": 0.0001462615729893602, "loss": 1.5501, "step": 19366 }, { "epoch": 1.52, "learning_rate": 0.0001462492171251095, "loss": 1.5148, "step": 19367 }, { "epoch": 1.52, "learning_rate": 0.00014623686128632457, "loss": 1.524, "step": 19368 }, { "epoch": 1.52, "learning_rate": 0.00014622450547308922, "loss": 1.5084, "step": 19369 }, { "epoch": 1.52, "learning_rate": 0.0001462121496854874, "loss": 1.485, "step": 19370 }, { "epoch": 1.52, "learning_rate": 0.00014619979392360298, "loss": 1.4842, "step": 19371 }, { "epoch": 1.52, "learning_rate": 0.0001461874381875199, "loss": 1.5668, "step": 19372 }, { "epoch": 1.52, "learning_rate": 0.00014617508247732203, "loss": 1.4685, "step": 19373 }, { "epoch": 1.52, "learning_rate": 0.0001461627267930932, "loss": 1.4755, "step": 19374 }, { "epoch": 1.52, "learning_rate": 0.0001461503711349174, "loss": 1.4851, "step": 19375 }, { "epoch": 1.52, "learning_rate": 0.0001461380155028784, "loss": 1.489, "step": 19376 }, { "epoch": 1.52, "learning_rate": 0.00014612565989706013, "loss": 1.5194, "step": 19377 }, { "epoch": 1.52, "learning_rate": 0.00014611330431754655, "loss": 1.5211, "step": 19378 }, { "epoch": 1.52, "learning_rate": 0.00014610094876442144, "loss": 1.5376, "step": 19379 }, { "epoch": 1.52, "learning_rate": 0.00014608859323776875, "loss": 1.56, "step": 19380 }, { "epoch": 1.52, "learning_rate": 0.00014607623773767235, "loss": 1.5038, "step": 19381 }, { "epoch": 1.53, "learning_rate": 0.00014606388226421615, "loss": 1.5149, "step": 19382 }, { "epoch": 1.53, "learning_rate": 0.00014605152681748402, "loss": 1.4958, "step": 19383 }, { "epoch": 1.53, "learning_rate": 0.00014603917139755982, "loss": 1.4601, "step": 19384 }, { "epoch": 1.53, "learning_rate": 0.00014602681600452746, "loss": 1.5464, "step": 19385 }, { "epoch": 1.53, "learning_rate": 0.00014601446063847078, "loss": 1.5338, "step": 19386 }, { "epoch": 1.53, "learning_rate": 0.0001460021052994738, "loss": 1.5711, "step": 19387 }, { "epoch": 1.53, "learning_rate": 0.00014598974998762025, "loss": 1.4817, "step": 19388 }, { "epoch": 1.53, "learning_rate": 0.00014597739470299413, "loss": 1.5122, "step": 19389 }, { "epoch": 1.53, "learning_rate": 0.00014596503944567927, "loss": 1.5668, "step": 19390 }, { "epoch": 1.53, "learning_rate": 0.00014595268421575957, "loss": 1.5493, "step": 19391 }, { "epoch": 1.53, "learning_rate": 0.00014594032901331892, "loss": 1.5447, "step": 19392 }, { "epoch": 1.53, "learning_rate": 0.00014592797383844116, "loss": 1.4873, "step": 19393 }, { "epoch": 1.53, "learning_rate": 0.00014591561869121023, "loss": 1.5465, "step": 19394 }, { "epoch": 1.53, "learning_rate": 0.00014590326357171002, "loss": 1.5707, "step": 19395 }, { "epoch": 1.53, "learning_rate": 0.00014589090848002434, "loss": 1.5484, "step": 19396 }, { "epoch": 1.53, "learning_rate": 0.00014587855341623718, "loss": 1.5795, "step": 19397 }, { "epoch": 1.53, "learning_rate": 0.00014586619838043234, "loss": 1.4819, "step": 19398 }, { "epoch": 1.53, "learning_rate": 0.00014585384337269372, "loss": 1.5595, "step": 19399 }, { "epoch": 1.53, "learning_rate": 0.00014584148839310524, "loss": 1.5355, "step": 19400 }, { "epoch": 1.53, "learning_rate": 0.00014582913344175075, "loss": 1.4462, "step": 19401 }, { "epoch": 1.53, "learning_rate": 0.0001458167785187141, "loss": 1.5831, "step": 19402 }, { "epoch": 1.53, "learning_rate": 0.00014580442362407923, "loss": 1.4851, "step": 19403 }, { "epoch": 1.53, "learning_rate": 0.00014579206875793004, "loss": 1.4435, "step": 19404 }, { "epoch": 1.53, "learning_rate": 0.00014577971392035037, "loss": 1.5055, "step": 19405 }, { "epoch": 1.53, "learning_rate": 0.0001457673591114241, "loss": 1.4851, "step": 19406 }, { "epoch": 1.53, "learning_rate": 0.00014575500433123515, "loss": 1.533, "step": 19407 }, { "epoch": 1.53, "learning_rate": 0.00014574264957986735, "loss": 1.4826, "step": 19408 }, { "epoch": 1.53, "learning_rate": 0.00014573029485740466, "loss": 1.557, "step": 19409 }, { "epoch": 1.53, "learning_rate": 0.00014571794016393088, "loss": 1.5149, "step": 19410 }, { "epoch": 1.53, "learning_rate": 0.00014570558549952992, "loss": 1.4848, "step": 19411 }, { "epoch": 1.53, "learning_rate": 0.00014569323086428569, "loss": 1.5023, "step": 19412 }, { "epoch": 1.53, "learning_rate": 0.000145680876258282, "loss": 1.506, "step": 19413 }, { "epoch": 1.53, "learning_rate": 0.0001456685216816028, "loss": 1.4849, "step": 19414 }, { "epoch": 1.53, "learning_rate": 0.00014565616713433196, "loss": 1.4276, "step": 19415 }, { "epoch": 1.53, "learning_rate": 0.00014564381261655333, "loss": 1.4888, "step": 19416 }, { "epoch": 1.53, "learning_rate": 0.00014563145812835084, "loss": 1.545, "step": 19417 }, { "epoch": 1.53, "learning_rate": 0.00014561910366980824, "loss": 1.5595, "step": 19418 }, { "epoch": 1.53, "learning_rate": 0.0001456067492410096, "loss": 1.5172, "step": 19419 }, { "epoch": 1.53, "learning_rate": 0.00014559439484203868, "loss": 1.496, "step": 19420 }, { "epoch": 1.53, "learning_rate": 0.0001455820404729794, "loss": 1.5337, "step": 19421 }, { "epoch": 1.53, "learning_rate": 0.00014556968613391565, "loss": 1.4929, "step": 19422 }, { "epoch": 1.53, "learning_rate": 0.00014555733182493124, "loss": 1.5428, "step": 19423 }, { "epoch": 1.53, "learning_rate": 0.00014554497754611014, "loss": 1.5452, "step": 19424 }, { "epoch": 1.53, "learning_rate": 0.00014553262329753614, "loss": 1.5145, "step": 19425 }, { "epoch": 1.53, "learning_rate": 0.00014552026907929322, "loss": 1.5515, "step": 19426 }, { "epoch": 1.53, "learning_rate": 0.00014550791489146515, "loss": 1.544, "step": 19427 }, { "epoch": 1.53, "learning_rate": 0.00014549556073413587, "loss": 1.5324, "step": 19428 }, { "epoch": 1.53, "learning_rate": 0.00014548320660738925, "loss": 1.4834, "step": 19429 }, { "epoch": 1.53, "learning_rate": 0.00014547085251130916, "loss": 1.5007, "step": 19430 }, { "epoch": 1.53, "learning_rate": 0.00014545849844597948, "loss": 1.4805, "step": 19431 }, { "epoch": 1.53, "learning_rate": 0.00014544614441148413, "loss": 1.4888, "step": 19432 }, { "epoch": 1.53, "learning_rate": 0.00014543379040790687, "loss": 1.4802, "step": 19433 }, { "epoch": 1.53, "learning_rate": 0.00014542143643533168, "loss": 1.4789, "step": 19434 }, { "epoch": 1.53, "learning_rate": 0.0001454090824938424, "loss": 1.4974, "step": 19435 }, { "epoch": 1.53, "learning_rate": 0.00014539672858352297, "loss": 1.5679, "step": 19436 }, { "epoch": 1.53, "learning_rate": 0.00014538437470445716, "loss": 1.48, "step": 19437 }, { "epoch": 1.53, "learning_rate": 0.00014537202085672894, "loss": 1.4508, "step": 19438 }, { "epoch": 1.53, "learning_rate": 0.00014535966704042213, "loss": 1.5347, "step": 19439 }, { "epoch": 1.53, "learning_rate": 0.0001453473132556206, "loss": 1.5714, "step": 19440 }, { "epoch": 1.53, "learning_rate": 0.0001453349595024083, "loss": 1.5006, "step": 19441 }, { "epoch": 1.53, "learning_rate": 0.000145322605780869, "loss": 1.5225, "step": 19442 }, { "epoch": 1.53, "learning_rate": 0.00014531025209108662, "loss": 1.5042, "step": 19443 }, { "epoch": 1.53, "learning_rate": 0.0001452978984331451, "loss": 1.535, "step": 19444 }, { "epoch": 1.53, "learning_rate": 0.0001452855448071282, "loss": 1.5077, "step": 19445 }, { "epoch": 1.53, "learning_rate": 0.00014527319121311987, "loss": 1.5488, "step": 19446 }, { "epoch": 1.53, "learning_rate": 0.00014526083765120394, "loss": 1.4865, "step": 19447 }, { "epoch": 1.53, "learning_rate": 0.00014524848412146433, "loss": 1.5136, "step": 19448 }, { "epoch": 1.53, "learning_rate": 0.00014523613062398483, "loss": 1.5294, "step": 19449 }, { "epoch": 1.53, "learning_rate": 0.00014522377715884947, "loss": 1.5116, "step": 19450 }, { "epoch": 1.53, "learning_rate": 0.00014521142372614197, "loss": 1.4962, "step": 19451 }, { "epoch": 1.53, "learning_rate": 0.00014519907032594626, "loss": 1.5258, "step": 19452 }, { "epoch": 1.53, "learning_rate": 0.00014518671695834624, "loss": 1.4995, "step": 19453 }, { "epoch": 1.53, "learning_rate": 0.00014517436362342572, "loss": 1.5302, "step": 19454 }, { "epoch": 1.53, "learning_rate": 0.00014516201032126864, "loss": 1.4823, "step": 19455 }, { "epoch": 1.53, "learning_rate": 0.00014514965705195886, "loss": 1.5216, "step": 19456 }, { "epoch": 1.53, "learning_rate": 0.0001451373038155802, "loss": 1.5033, "step": 19457 }, { "epoch": 1.53, "learning_rate": 0.00014512495061221658, "loss": 1.5228, "step": 19458 }, { "epoch": 1.53, "learning_rate": 0.00014511259744195184, "loss": 1.535, "step": 19459 }, { "epoch": 1.53, "learning_rate": 0.00014510024430486985, "loss": 1.5845, "step": 19460 }, { "epoch": 1.53, "learning_rate": 0.00014508789120105454, "loss": 1.5116, "step": 19461 }, { "epoch": 1.53, "learning_rate": 0.0001450755381305897, "loss": 1.4998, "step": 19462 }, { "epoch": 1.53, "learning_rate": 0.00014506318509355928, "loss": 1.5303, "step": 19463 }, { "epoch": 1.53, "learning_rate": 0.00014505083209004707, "loss": 1.462, "step": 19464 }, { "epoch": 1.53, "learning_rate": 0.00014503847912013696, "loss": 1.5006, "step": 19465 }, { "epoch": 1.53, "learning_rate": 0.00014502612618391285, "loss": 1.5174, "step": 19466 }, { "epoch": 1.53, "learning_rate": 0.00014501377328145863, "loss": 1.5292, "step": 19467 }, { "epoch": 1.53, "learning_rate": 0.00014500142041285813, "loss": 1.5187, "step": 19468 }, { "epoch": 1.53, "learning_rate": 0.0001449890675781952, "loss": 1.504, "step": 19469 }, { "epoch": 1.53, "learning_rate": 0.0001449767147775538, "loss": 1.517, "step": 19470 }, { "epoch": 1.53, "learning_rate": 0.00014496436201101768, "loss": 1.4732, "step": 19471 }, { "epoch": 1.53, "learning_rate": 0.00014495200927867074, "loss": 1.533, "step": 19472 }, { "epoch": 1.53, "learning_rate": 0.00014493965658059696, "loss": 1.5061, "step": 19473 }, { "epoch": 1.53, "learning_rate": 0.00014492730391688004, "loss": 1.5205, "step": 19474 }, { "epoch": 1.53, "learning_rate": 0.00014491495128760398, "loss": 1.4943, "step": 19475 }, { "epoch": 1.53, "learning_rate": 0.00014490259869285257, "loss": 1.4927, "step": 19476 }, { "epoch": 1.53, "learning_rate": 0.00014489024613270968, "loss": 1.4844, "step": 19477 }, { "epoch": 1.53, "learning_rate": 0.00014487789360725925, "loss": 1.5692, "step": 19478 }, { "epoch": 1.53, "learning_rate": 0.00014486554111658507, "loss": 1.5528, "step": 19479 }, { "epoch": 1.53, "learning_rate": 0.00014485318866077097, "loss": 1.5094, "step": 19480 }, { "epoch": 1.53, "learning_rate": 0.00014484083623990092, "loss": 1.5056, "step": 19481 }, { "epoch": 1.53, "learning_rate": 0.0001448284838540588, "loss": 1.5089, "step": 19482 }, { "epoch": 1.53, "learning_rate": 0.00014481613150332836, "loss": 1.5389, "step": 19483 }, { "epoch": 1.53, "learning_rate": 0.00014480377918779354, "loss": 1.4538, "step": 19484 }, { "epoch": 1.53, "learning_rate": 0.00014479142690753823, "loss": 1.5655, "step": 19485 }, { "epoch": 1.53, "learning_rate": 0.0001447790746626462, "loss": 1.5235, "step": 19486 }, { "epoch": 1.53, "learning_rate": 0.00014476672245320143, "loss": 1.5039, "step": 19487 }, { "epoch": 1.53, "learning_rate": 0.0001447543702792877, "loss": 1.4414, "step": 19488 }, { "epoch": 1.53, "learning_rate": 0.00014474201814098888, "loss": 1.525, "step": 19489 }, { "epoch": 1.53, "learning_rate": 0.00014472966603838887, "loss": 1.4997, "step": 19490 }, { "epoch": 1.53, "learning_rate": 0.00014471731397157152, "loss": 1.5147, "step": 19491 }, { "epoch": 1.53, "learning_rate": 0.00014470496194062072, "loss": 1.5129, "step": 19492 }, { "epoch": 1.53, "learning_rate": 0.00014469260994562027, "loss": 1.5829, "step": 19493 }, { "epoch": 1.53, "learning_rate": 0.00014468025798665407, "loss": 1.5244, "step": 19494 }, { "epoch": 1.53, "learning_rate": 0.00014466790606380603, "loss": 1.4833, "step": 19495 }, { "epoch": 1.53, "learning_rate": 0.00014465555417715988, "loss": 1.4729, "step": 19496 }, { "epoch": 1.53, "learning_rate": 0.0001446432023267996, "loss": 1.5599, "step": 19497 }, { "epoch": 1.53, "learning_rate": 0.00014463085051280903, "loss": 1.5283, "step": 19498 }, { "epoch": 1.53, "learning_rate": 0.00014461849873527205, "loss": 1.4774, "step": 19499 }, { "epoch": 1.53, "learning_rate": 0.00014460614699427247, "loss": 1.5233, "step": 19500 }, { "epoch": 1.53, "learning_rate": 0.00014459379528989415, "loss": 1.538, "step": 19501 }, { "epoch": 1.53, "learning_rate": 0.00014458144362222103, "loss": 1.5403, "step": 19502 }, { "epoch": 1.53, "learning_rate": 0.00014456909199133688, "loss": 1.4873, "step": 19503 }, { "epoch": 1.53, "learning_rate": 0.00014455674039732562, "loss": 1.5162, "step": 19504 }, { "epoch": 1.53, "learning_rate": 0.00014454438884027107, "loss": 1.5135, "step": 19505 }, { "epoch": 1.53, "learning_rate": 0.00014453203732025713, "loss": 1.4816, "step": 19506 }, { "epoch": 1.53, "learning_rate": 0.00014451968583736763, "loss": 1.5198, "step": 19507 }, { "epoch": 1.53, "learning_rate": 0.00014450733439168642, "loss": 1.4883, "step": 19508 }, { "epoch": 1.53, "learning_rate": 0.00014449498298329744, "loss": 1.473, "step": 19509 }, { "epoch": 1.54, "learning_rate": 0.00014448263161228442, "loss": 1.4953, "step": 19510 }, { "epoch": 1.54, "learning_rate": 0.0001444702802787313, "loss": 1.5208, "step": 19511 }, { "epoch": 1.54, "learning_rate": 0.0001444579289827219, "loss": 1.5018, "step": 19512 }, { "epoch": 1.54, "learning_rate": 0.00014444557772434012, "loss": 1.5043, "step": 19513 }, { "epoch": 1.54, "learning_rate": 0.00014443322650366984, "loss": 1.5062, "step": 19514 }, { "epoch": 1.54, "learning_rate": 0.00014442087532079485, "loss": 1.4715, "step": 19515 }, { "epoch": 1.54, "learning_rate": 0.00014440852417579907, "loss": 1.4909, "step": 19516 }, { "epoch": 1.54, "learning_rate": 0.0001443961730687663, "loss": 1.4576, "step": 19517 }, { "epoch": 1.54, "learning_rate": 0.0001443838219997804, "loss": 1.5188, "step": 19518 }, { "epoch": 1.54, "learning_rate": 0.0001443714709689253, "loss": 1.5605, "step": 19519 }, { "epoch": 1.54, "learning_rate": 0.00014435911997628478, "loss": 1.4794, "step": 19520 }, { "epoch": 1.54, "learning_rate": 0.00014434676902194275, "loss": 1.5352, "step": 19521 }, { "epoch": 1.54, "learning_rate": 0.000144334418105983, "loss": 1.539, "step": 19522 }, { "epoch": 1.54, "learning_rate": 0.0001443220672284894, "loss": 1.524, "step": 19523 }, { "epoch": 1.54, "learning_rate": 0.0001443097163895459, "loss": 1.5138, "step": 19524 }, { "epoch": 1.54, "learning_rate": 0.00014429736558923626, "loss": 1.4806, "step": 19525 }, { "epoch": 1.54, "learning_rate": 0.00014428501482764434, "loss": 1.5132, "step": 19526 }, { "epoch": 1.54, "learning_rate": 0.00014427266410485404, "loss": 1.5086, "step": 19527 }, { "epoch": 1.54, "learning_rate": 0.00014426031342094914, "loss": 1.5171, "step": 19528 }, { "epoch": 1.54, "learning_rate": 0.00014424796277601355, "loss": 1.508, "step": 19529 }, { "epoch": 1.54, "learning_rate": 0.00014423561217013115, "loss": 1.5165, "step": 19530 }, { "epoch": 1.54, "learning_rate": 0.0001442232616033858, "loss": 1.4616, "step": 19531 }, { "epoch": 1.54, "learning_rate": 0.00014421091107586127, "loss": 1.5491, "step": 19532 }, { "epoch": 1.54, "learning_rate": 0.0001441985605876415, "loss": 1.4918, "step": 19533 }, { "epoch": 1.54, "learning_rate": 0.00014418621013881025, "loss": 1.5499, "step": 19534 }, { "epoch": 1.54, "learning_rate": 0.00014417385972945144, "loss": 1.5382, "step": 19535 }, { "epoch": 1.54, "learning_rate": 0.00014416150935964893, "loss": 1.517, "step": 19536 }, { "epoch": 1.54, "learning_rate": 0.0001441491590294865, "loss": 1.5244, "step": 19537 }, { "epoch": 1.54, "learning_rate": 0.0001441368087390481, "loss": 1.4942, "step": 19538 }, { "epoch": 1.54, "learning_rate": 0.00014412445848841754, "loss": 1.5268, "step": 19539 }, { "epoch": 1.54, "learning_rate": 0.00014411210827767863, "loss": 1.5047, "step": 19540 }, { "epoch": 1.54, "learning_rate": 0.0001440997581069153, "loss": 1.5215, "step": 19541 }, { "epoch": 1.54, "learning_rate": 0.0001440874079762113, "loss": 1.4872, "step": 19542 }, { "epoch": 1.54, "learning_rate": 0.0001440750578856505, "loss": 1.456, "step": 19543 }, { "epoch": 1.54, "learning_rate": 0.00014406270783531684, "loss": 1.5648, "step": 19544 }, { "epoch": 1.54, "learning_rate": 0.00014405035782529417, "loss": 1.4804, "step": 19545 }, { "epoch": 1.54, "learning_rate": 0.0001440380078556662, "loss": 1.4508, "step": 19546 }, { "epoch": 1.54, "learning_rate": 0.00014402565792651691, "loss": 1.5486, "step": 19547 }, { "epoch": 1.54, "learning_rate": 0.00014401330803793014, "loss": 1.5277, "step": 19548 }, { "epoch": 1.54, "learning_rate": 0.00014400095818998965, "loss": 1.4356, "step": 19549 }, { "epoch": 1.54, "learning_rate": 0.00014398860838277938, "loss": 1.4842, "step": 19550 }, { "epoch": 1.54, "learning_rate": 0.00014397625861638312, "loss": 1.533, "step": 19551 }, { "epoch": 1.54, "learning_rate": 0.00014396390889088472, "loss": 1.4756, "step": 19552 }, { "epoch": 1.54, "learning_rate": 0.0001439515592063681, "loss": 1.5471, "step": 19553 }, { "epoch": 1.54, "learning_rate": 0.000143939209562917, "loss": 1.5001, "step": 19554 }, { "epoch": 1.54, "learning_rate": 0.00014392685996061536, "loss": 1.5208, "step": 19555 }, { "epoch": 1.54, "learning_rate": 0.00014391451039954699, "loss": 1.53, "step": 19556 }, { "epoch": 1.54, "learning_rate": 0.00014390216087979574, "loss": 1.4962, "step": 19557 }, { "epoch": 1.54, "learning_rate": 0.00014388981140144543, "loss": 1.5134, "step": 19558 }, { "epoch": 1.54, "learning_rate": 0.00014387746196457986, "loss": 1.4644, "step": 19559 }, { "epoch": 1.54, "learning_rate": 0.00014386511256928307, "loss": 1.5006, "step": 19560 }, { "epoch": 1.54, "learning_rate": 0.0001438527632156387, "loss": 1.508, "step": 19561 }, { "epoch": 1.54, "learning_rate": 0.00014384041390373074, "loss": 1.5075, "step": 19562 }, { "epoch": 1.54, "learning_rate": 0.00014382806463364293, "loss": 1.5516, "step": 19563 }, { "epoch": 1.54, "learning_rate": 0.00014381571540545915, "loss": 1.4862, "step": 19564 }, { "epoch": 1.54, "learning_rate": 0.00014380336621926327, "loss": 1.5658, "step": 19565 }, { "epoch": 1.54, "learning_rate": 0.0001437910170751391, "loss": 1.5114, "step": 19566 }, { "epoch": 1.54, "learning_rate": 0.00014377866797317051, "loss": 1.4733, "step": 19567 }, { "epoch": 1.54, "learning_rate": 0.00014376631891344134, "loss": 1.4561, "step": 19568 }, { "epoch": 1.54, "learning_rate": 0.00014375396989603538, "loss": 1.4609, "step": 19569 }, { "epoch": 1.54, "learning_rate": 0.00014374162092103658, "loss": 1.5535, "step": 19570 }, { "epoch": 1.54, "learning_rate": 0.00014372927198852867, "loss": 1.4637, "step": 19571 }, { "epoch": 1.54, "learning_rate": 0.00014371692309859556, "loss": 1.4544, "step": 19572 }, { "epoch": 1.54, "learning_rate": 0.0001437045742513211, "loss": 1.5215, "step": 19573 }, { "epoch": 1.54, "learning_rate": 0.00014369222544678906, "loss": 1.5337, "step": 19574 }, { "epoch": 1.54, "learning_rate": 0.0001436798766850833, "loss": 1.5464, "step": 19575 }, { "epoch": 1.54, "learning_rate": 0.00014366752796628773, "loss": 1.5085, "step": 19576 }, { "epoch": 1.54, "learning_rate": 0.00014365517929048618, "loss": 1.5199, "step": 19577 }, { "epoch": 1.54, "learning_rate": 0.00014364283065776244, "loss": 1.5274, "step": 19578 }, { "epoch": 1.54, "learning_rate": 0.00014363048206820039, "loss": 1.4823, "step": 19579 }, { "epoch": 1.54, "learning_rate": 0.00014361813352188382, "loss": 1.5037, "step": 19580 }, { "epoch": 1.54, "learning_rate": 0.0001436057850188966, "loss": 1.5289, "step": 19581 }, { "epoch": 1.54, "learning_rate": 0.00014359343655932262, "loss": 1.535, "step": 19582 }, { "epoch": 1.54, "learning_rate": 0.00014358108814324562, "loss": 1.4872, "step": 19583 }, { "epoch": 1.54, "learning_rate": 0.00014356873977074952, "loss": 1.4727, "step": 19584 }, { "epoch": 1.54, "learning_rate": 0.0001435563914419181, "loss": 1.5339, "step": 19585 }, { "epoch": 1.54, "learning_rate": 0.00014354404315683524, "loss": 1.564, "step": 19586 }, { "epoch": 1.54, "learning_rate": 0.0001435316949155848, "loss": 1.5816, "step": 19587 }, { "epoch": 1.54, "learning_rate": 0.00014351934671825054, "loss": 1.4402, "step": 19588 }, { "epoch": 1.54, "learning_rate": 0.00014350699856491633, "loss": 1.52, "step": 19589 }, { "epoch": 1.54, "learning_rate": 0.000143494650455666, "loss": 1.5399, "step": 19590 }, { "epoch": 1.54, "learning_rate": 0.00014348230239058345, "loss": 1.5321, "step": 19591 }, { "epoch": 1.54, "learning_rate": 0.00014346995436975243, "loss": 1.4574, "step": 19592 }, { "epoch": 1.54, "learning_rate": 0.00014345760639325683, "loss": 1.5582, "step": 19593 }, { "epoch": 1.54, "learning_rate": 0.0001434452584611805, "loss": 1.492, "step": 19594 }, { "epoch": 1.54, "learning_rate": 0.00014343291057360724, "loss": 1.4939, "step": 19595 }, { "epoch": 1.54, "learning_rate": 0.00014342056273062087, "loss": 1.5437, "step": 19596 }, { "epoch": 1.54, "learning_rate": 0.00014340821493230528, "loss": 1.5022, "step": 19597 }, { "epoch": 1.54, "learning_rate": 0.00014339586717874425, "loss": 1.5074, "step": 19598 }, { "epoch": 1.54, "learning_rate": 0.00014338351947002168, "loss": 1.5133, "step": 19599 }, { "epoch": 1.54, "learning_rate": 0.00014337117180622132, "loss": 1.5133, "step": 19600 }, { "epoch": 1.54, "learning_rate": 0.00014335882418742703, "loss": 1.4646, "step": 19601 }, { "epoch": 1.54, "learning_rate": 0.0001433464766137227, "loss": 1.5025, "step": 19602 }, { "epoch": 1.54, "learning_rate": 0.00014333412908519211, "loss": 1.5304, "step": 19603 }, { "epoch": 1.54, "learning_rate": 0.0001433217816019191, "loss": 1.5283, "step": 19604 }, { "epoch": 1.54, "learning_rate": 0.0001433094341639875, "loss": 1.5248, "step": 19605 }, { "epoch": 1.54, "learning_rate": 0.0001432970867714811, "loss": 1.5369, "step": 19606 }, { "epoch": 1.54, "learning_rate": 0.00014328473942448383, "loss": 1.4667, "step": 19607 }, { "epoch": 1.54, "learning_rate": 0.0001432723921230795, "loss": 1.5183, "step": 19608 }, { "epoch": 1.54, "learning_rate": 0.0001432600448673519, "loss": 1.507, "step": 19609 }, { "epoch": 1.54, "learning_rate": 0.00014324769765738484, "loss": 1.5426, "step": 19610 }, { "epoch": 1.54, "learning_rate": 0.00014323535049326225, "loss": 1.5747, "step": 19611 }, { "epoch": 1.54, "learning_rate": 0.00014322300337506785, "loss": 1.5283, "step": 19612 }, { "epoch": 1.54, "learning_rate": 0.00014321065630288552, "loss": 1.4997, "step": 19613 }, { "epoch": 1.54, "learning_rate": 0.00014319830927679914, "loss": 1.5409, "step": 19614 }, { "epoch": 1.54, "learning_rate": 0.00014318596229689242, "loss": 1.5563, "step": 19615 }, { "epoch": 1.54, "learning_rate": 0.0001431736153632493, "loss": 1.5291, "step": 19616 }, { "epoch": 1.54, "learning_rate": 0.00014316126847595354, "loss": 1.5319, "step": 19617 }, { "epoch": 1.54, "learning_rate": 0.000143148921635089, "loss": 1.5385, "step": 19618 }, { "epoch": 1.54, "learning_rate": 0.00014313657484073952, "loss": 1.4553, "step": 19619 }, { "epoch": 1.54, "learning_rate": 0.00014312422809298887, "loss": 1.5228, "step": 19620 }, { "epoch": 1.54, "learning_rate": 0.00014311188139192095, "loss": 1.5213, "step": 19621 }, { "epoch": 1.54, "learning_rate": 0.00014309953473761947, "loss": 1.4918, "step": 19622 }, { "epoch": 1.54, "learning_rate": 0.00014308718813016845, "loss": 1.5566, "step": 19623 }, { "epoch": 1.54, "learning_rate": 0.00014307484156965154, "loss": 1.4818, "step": 19624 }, { "epoch": 1.54, "learning_rate": 0.00014306249505615265, "loss": 1.5151, "step": 19625 }, { "epoch": 1.54, "learning_rate": 0.00014305014858975563, "loss": 1.4728, "step": 19626 }, { "epoch": 1.54, "learning_rate": 0.00014303780217054423, "loss": 1.421, "step": 19627 }, { "epoch": 1.54, "learning_rate": 0.00014302545579860236, "loss": 1.4676, "step": 19628 }, { "epoch": 1.54, "learning_rate": 0.00014301310947401372, "loss": 1.5154, "step": 19629 }, { "epoch": 1.54, "learning_rate": 0.00014300076319686224, "loss": 1.4935, "step": 19630 }, { "epoch": 1.54, "learning_rate": 0.00014298841696723175, "loss": 1.4961, "step": 19631 }, { "epoch": 1.54, "learning_rate": 0.00014297607078520602, "loss": 1.5334, "step": 19632 }, { "epoch": 1.54, "learning_rate": 0.0001429637246508689, "loss": 1.5388, "step": 19633 }, { "epoch": 1.54, "learning_rate": 0.00014295137856430417, "loss": 1.55, "step": 19634 }, { "epoch": 1.54, "learning_rate": 0.0001429390325255957, "loss": 1.4931, "step": 19635 }, { "epoch": 1.54, "learning_rate": 0.00014292668653482734, "loss": 1.5064, "step": 19636 }, { "epoch": 1.55, "learning_rate": 0.00014291434059208284, "loss": 1.5263, "step": 19637 }, { "epoch": 1.55, "learning_rate": 0.00014290199469744604, "loss": 1.5173, "step": 19638 }, { "epoch": 1.55, "learning_rate": 0.00014288964885100078, "loss": 1.4632, "step": 19639 }, { "epoch": 1.55, "learning_rate": 0.00014287730305283093, "loss": 1.5585, "step": 19640 }, { "epoch": 1.55, "learning_rate": 0.00014286495730302023, "loss": 1.5214, "step": 19641 }, { "epoch": 1.55, "learning_rate": 0.00014285261160165255, "loss": 1.542, "step": 19642 }, { "epoch": 1.55, "learning_rate": 0.0001428402659488117, "loss": 1.4545, "step": 19643 }, { "epoch": 1.55, "learning_rate": 0.00014282792034458146, "loss": 1.525, "step": 19644 }, { "epoch": 1.55, "learning_rate": 0.00014281557478904573, "loss": 1.501, "step": 19645 }, { "epoch": 1.55, "learning_rate": 0.00014280322928228825, "loss": 1.5233, "step": 19646 }, { "epoch": 1.55, "learning_rate": 0.00014279088382439286, "loss": 1.5014, "step": 19647 }, { "epoch": 1.55, "learning_rate": 0.00014277853841544342, "loss": 1.4633, "step": 19648 }, { "epoch": 1.55, "learning_rate": 0.0001427661930555237, "loss": 1.5081, "step": 19649 }, { "epoch": 1.55, "learning_rate": 0.00014275384774471752, "loss": 1.4671, "step": 19650 }, { "epoch": 1.55, "learning_rate": 0.00014274150248310875, "loss": 1.5331, "step": 19651 }, { "epoch": 1.55, "learning_rate": 0.00014272915727078114, "loss": 1.4533, "step": 19652 }, { "epoch": 1.55, "learning_rate": 0.00014271681210781853, "loss": 1.505, "step": 19653 }, { "epoch": 1.55, "learning_rate": 0.00014270446699430475, "loss": 1.4908, "step": 19654 }, { "epoch": 1.55, "learning_rate": 0.00014269212193032368, "loss": 1.5237, "step": 19655 }, { "epoch": 1.55, "learning_rate": 0.000142679776915959, "loss": 1.5032, "step": 19656 }, { "epoch": 1.55, "learning_rate": 0.00014266743195129466, "loss": 1.5659, "step": 19657 }, { "epoch": 1.55, "learning_rate": 0.00014265508703641437, "loss": 1.5154, "step": 19658 }, { "epoch": 1.55, "learning_rate": 0.00014264274217140195, "loss": 1.5273, "step": 19659 }, { "epoch": 1.55, "learning_rate": 0.00014263039735634133, "loss": 1.5531, "step": 19660 }, { "epoch": 1.55, "learning_rate": 0.00014261805259131619, "loss": 1.497, "step": 19661 }, { "epoch": 1.55, "learning_rate": 0.00014260570787641045, "loss": 1.557, "step": 19662 }, { "epoch": 1.55, "learning_rate": 0.00014259336321170783, "loss": 1.5064, "step": 19663 }, { "epoch": 1.55, "learning_rate": 0.00014258101859729216, "loss": 1.4892, "step": 19664 }, { "epoch": 1.55, "learning_rate": 0.00014256867403324736, "loss": 1.4964, "step": 19665 }, { "epoch": 1.55, "learning_rate": 0.0001425563295196571, "loss": 1.5112, "step": 19666 }, { "epoch": 1.55, "learning_rate": 0.00014254398505660523, "loss": 1.4873, "step": 19667 }, { "epoch": 1.55, "learning_rate": 0.00014253164064417567, "loss": 1.4918, "step": 19668 }, { "epoch": 1.55, "learning_rate": 0.00014251929628245207, "loss": 1.5319, "step": 19669 }, { "epoch": 1.55, "learning_rate": 0.00014250695197151833, "loss": 1.5049, "step": 19670 }, { "epoch": 1.55, "learning_rate": 0.00014249460771145826, "loss": 1.5729, "step": 19671 }, { "epoch": 1.55, "learning_rate": 0.0001424822635023557, "loss": 1.5009, "step": 19672 }, { "epoch": 1.55, "learning_rate": 0.0001424699193442944, "loss": 1.4975, "step": 19673 }, { "epoch": 1.55, "learning_rate": 0.0001424575752373582, "loss": 1.5057, "step": 19674 }, { "epoch": 1.55, "learning_rate": 0.00014244523118163088, "loss": 1.5684, "step": 19675 }, { "epoch": 1.55, "learning_rate": 0.0001424328871771963, "loss": 1.4683, "step": 19676 }, { "epoch": 1.55, "learning_rate": 0.00014242054322413823, "loss": 1.4989, "step": 19677 }, { "epoch": 1.55, "learning_rate": 0.0001424081993225405, "loss": 1.5092, "step": 19678 }, { "epoch": 1.55, "learning_rate": 0.00014239585547248687, "loss": 1.5183, "step": 19679 }, { "epoch": 1.55, "learning_rate": 0.00014238351167406124, "loss": 1.5114, "step": 19680 }, { "epoch": 1.55, "learning_rate": 0.00014237116792734732, "loss": 1.4963, "step": 19681 }, { "epoch": 1.55, "learning_rate": 0.00014235882423242898, "loss": 1.5385, "step": 19682 }, { "epoch": 1.55, "learning_rate": 0.00014234648058939, "loss": 1.482, "step": 19683 }, { "epoch": 1.55, "learning_rate": 0.00014233413699831418, "loss": 1.5263, "step": 19684 }, { "epoch": 1.55, "learning_rate": 0.00014232179345928528, "loss": 1.5334, "step": 19685 }, { "epoch": 1.55, "learning_rate": 0.00014230944997238725, "loss": 1.5039, "step": 19686 }, { "epoch": 1.55, "learning_rate": 0.00014229710653770379, "loss": 1.4607, "step": 19687 }, { "epoch": 1.55, "learning_rate": 0.00014228476315531873, "loss": 1.4867, "step": 19688 }, { "epoch": 1.55, "learning_rate": 0.0001422724198253159, "loss": 1.4858, "step": 19689 }, { "epoch": 1.55, "learning_rate": 0.00014226007654777903, "loss": 1.5791, "step": 19690 }, { "epoch": 1.55, "learning_rate": 0.000142247733322792, "loss": 1.5312, "step": 19691 }, { "epoch": 1.55, "learning_rate": 0.00014223539015043856, "loss": 1.4916, "step": 19692 }, { "epoch": 1.55, "learning_rate": 0.00014222304703080253, "loss": 1.547, "step": 19693 }, { "epoch": 1.55, "learning_rate": 0.00014221070396396778, "loss": 1.4892, "step": 19694 }, { "epoch": 1.55, "learning_rate": 0.00014219836095001799, "loss": 1.4764, "step": 19695 }, { "epoch": 1.55, "learning_rate": 0.00014218601798903703, "loss": 1.5752, "step": 19696 }, { "epoch": 1.55, "learning_rate": 0.0001421736750811087, "loss": 1.5322, "step": 19697 }, { "epoch": 1.55, "learning_rate": 0.0001421613322263168, "loss": 1.4856, "step": 19698 }, { "epoch": 1.55, "learning_rate": 0.00014214898942474513, "loss": 1.5291, "step": 19699 }, { "epoch": 1.55, "learning_rate": 0.00014213664667647743, "loss": 1.4905, "step": 19700 }, { "epoch": 1.55, "learning_rate": 0.00014212430398159763, "loss": 1.4293, "step": 19701 }, { "epoch": 1.55, "learning_rate": 0.00014211196134018944, "loss": 1.4661, "step": 19702 }, { "epoch": 1.55, "learning_rate": 0.00014209961875233672, "loss": 1.4761, "step": 19703 }, { "epoch": 1.55, "learning_rate": 0.00014208727621812319, "loss": 1.5156, "step": 19704 }, { "epoch": 1.55, "learning_rate": 0.0001420749337376327, "loss": 1.5225, "step": 19705 }, { "epoch": 1.55, "learning_rate": 0.00014206259131094903, "loss": 1.4922, "step": 19706 }, { "epoch": 1.55, "learning_rate": 0.000142050248938156, "loss": 1.4741, "step": 19707 }, { "epoch": 1.55, "learning_rate": 0.00014203790661933735, "loss": 1.5295, "step": 19708 }, { "epoch": 1.55, "learning_rate": 0.00014202556435457698, "loss": 1.5719, "step": 19709 }, { "epoch": 1.55, "learning_rate": 0.00014201322214395858, "loss": 1.5021, "step": 19710 }, { "epoch": 1.55, "learning_rate": 0.00014200087998756603, "loss": 1.4928, "step": 19711 }, { "epoch": 1.55, "learning_rate": 0.00014198853788548307, "loss": 1.5088, "step": 19712 }, { "epoch": 1.55, "learning_rate": 0.0001419761958377935, "loss": 1.5138, "step": 19713 }, { "epoch": 1.55, "learning_rate": 0.00014196385384458116, "loss": 1.5597, "step": 19714 }, { "epoch": 1.55, "learning_rate": 0.0001419515119059298, "loss": 1.5253, "step": 19715 }, { "epoch": 1.55, "learning_rate": 0.00014193917002192321, "loss": 1.4945, "step": 19716 }, { "epoch": 1.55, "learning_rate": 0.00014192682819264522, "loss": 1.5414, "step": 19717 }, { "epoch": 1.55, "learning_rate": 0.00014191448641817964, "loss": 1.5105, "step": 19718 }, { "epoch": 1.55, "learning_rate": 0.00014190214469861023, "loss": 1.536, "step": 19719 }, { "epoch": 1.55, "learning_rate": 0.00014188980303402081, "loss": 1.518, "step": 19720 }, { "epoch": 1.55, "learning_rate": 0.0001418774614244951, "loss": 1.5687, "step": 19721 }, { "epoch": 1.55, "learning_rate": 0.00014186511987011698, "loss": 1.5023, "step": 19722 }, { "epoch": 1.55, "learning_rate": 0.0001418527783709702, "loss": 1.5342, "step": 19723 }, { "epoch": 1.55, "learning_rate": 0.00014184043692713855, "loss": 1.4956, "step": 19724 }, { "epoch": 1.55, "learning_rate": 0.0001418280955387058, "loss": 1.5767, "step": 19725 }, { "epoch": 1.55, "learning_rate": 0.00014181575420575584, "loss": 1.527, "step": 19726 }, { "epoch": 1.55, "learning_rate": 0.00014180341292837235, "loss": 1.4887, "step": 19727 }, { "epoch": 1.55, "learning_rate": 0.00014179107170663921, "loss": 1.4859, "step": 19728 }, { "epoch": 1.55, "learning_rate": 0.00014177873054064012, "loss": 1.5247, "step": 19729 }, { "epoch": 1.55, "learning_rate": 0.0001417663894304589, "loss": 1.5303, "step": 19730 }, { "epoch": 1.55, "learning_rate": 0.00014175404837617938, "loss": 1.479, "step": 19731 }, { "epoch": 1.55, "learning_rate": 0.00014174170737788527, "loss": 1.5309, "step": 19732 }, { "epoch": 1.55, "learning_rate": 0.00014172936643566043, "loss": 1.53, "step": 19733 }, { "epoch": 1.55, "learning_rate": 0.00014171702554958865, "loss": 1.5433, "step": 19734 }, { "epoch": 1.55, "learning_rate": 0.00014170468471975373, "loss": 1.5543, "step": 19735 }, { "epoch": 1.55, "learning_rate": 0.00014169234394623937, "loss": 1.5231, "step": 19736 }, { "epoch": 1.55, "learning_rate": 0.0001416800032291294, "loss": 1.4594, "step": 19737 }, { "epoch": 1.55, "learning_rate": 0.00014166766256850768, "loss": 1.4823, "step": 19738 }, { "epoch": 1.55, "learning_rate": 0.0001416553219644579, "loss": 1.5472, "step": 19739 }, { "epoch": 1.55, "learning_rate": 0.0001416429814170639, "loss": 1.4767, "step": 19740 }, { "epoch": 1.55, "learning_rate": 0.0001416306409264094, "loss": 1.4938, "step": 19741 }, { "epoch": 1.55, "learning_rate": 0.00014161830049257823, "loss": 1.4995, "step": 19742 }, { "epoch": 1.55, "learning_rate": 0.00014160596011565421, "loss": 1.5164, "step": 19743 }, { "epoch": 1.55, "learning_rate": 0.0001415936197957211, "loss": 1.4757, "step": 19744 }, { "epoch": 1.55, "learning_rate": 0.00014158127953286265, "loss": 1.5439, "step": 19745 }, { "epoch": 1.55, "learning_rate": 0.00014156893932716267, "loss": 1.5303, "step": 19746 }, { "epoch": 1.55, "learning_rate": 0.0001415565991787049, "loss": 1.5695, "step": 19747 }, { "epoch": 1.55, "learning_rate": 0.00014154425908757313, "loss": 1.5108, "step": 19748 }, { "epoch": 1.55, "learning_rate": 0.00014153191905385125, "loss": 1.5224, "step": 19749 }, { "epoch": 1.55, "learning_rate": 0.00014151957907762298, "loss": 1.5206, "step": 19750 }, { "epoch": 1.55, "learning_rate": 0.00014150723915897206, "loss": 1.5065, "step": 19751 }, { "epoch": 1.55, "learning_rate": 0.0001414948992979823, "loss": 1.5211, "step": 19752 }, { "epoch": 1.55, "learning_rate": 0.00014148255949473747, "loss": 1.4639, "step": 19753 }, { "epoch": 1.55, "learning_rate": 0.00014147021974932137, "loss": 1.5433, "step": 19754 }, { "epoch": 1.55, "learning_rate": 0.0001414578800618178, "loss": 1.5297, "step": 19755 }, { "epoch": 1.55, "learning_rate": 0.00014144554043231047, "loss": 1.5612, "step": 19756 }, { "epoch": 1.55, "learning_rate": 0.00014143320086088324, "loss": 1.5088, "step": 19757 }, { "epoch": 1.55, "learning_rate": 0.00014142086134761981, "loss": 1.5027, "step": 19758 }, { "epoch": 1.55, "learning_rate": 0.00014140852189260401, "loss": 1.5243, "step": 19759 }, { "epoch": 1.55, "learning_rate": 0.00014139618249591962, "loss": 1.5034, "step": 19760 }, { "epoch": 1.55, "learning_rate": 0.00014138384315765039, "loss": 1.4949, "step": 19761 }, { "epoch": 1.55, "learning_rate": 0.0001413715038778801, "loss": 1.5073, "step": 19762 }, { "epoch": 1.55, "learning_rate": 0.00014135916465669247, "loss": 1.5226, "step": 19763 }, { "epoch": 1.56, "learning_rate": 0.00014134682549417146, "loss": 1.4705, "step": 19764 }, { "epoch": 1.56, "learning_rate": 0.00014133448639040068, "loss": 1.4885, "step": 19765 }, { "epoch": 1.56, "learning_rate": 0.00014132214734546394, "loss": 1.5278, "step": 19766 }, { "epoch": 1.56, "learning_rate": 0.00014130980835944508, "loss": 1.586, "step": 19767 }, { "epoch": 1.56, "learning_rate": 0.0001412974694324278, "loss": 1.4953, "step": 19768 }, { "epoch": 1.56, "learning_rate": 0.0001412851305644959, "loss": 1.5431, "step": 19769 }, { "epoch": 1.56, "learning_rate": 0.00014127279175573315, "loss": 1.5378, "step": 19770 }, { "epoch": 1.56, "learning_rate": 0.0001412604530062233, "loss": 1.5307, "step": 19771 }, { "epoch": 1.56, "learning_rate": 0.00014124811431605024, "loss": 1.5088, "step": 19772 }, { "epoch": 1.56, "learning_rate": 0.00014123577568529757, "loss": 1.5208, "step": 19773 }, { "epoch": 1.56, "learning_rate": 0.0001412234371140492, "loss": 1.5453, "step": 19774 }, { "epoch": 1.56, "learning_rate": 0.00014121109860238881, "loss": 1.481, "step": 19775 }, { "epoch": 1.56, "learning_rate": 0.0001411987601504002, "loss": 1.4916, "step": 19776 }, { "epoch": 1.56, "learning_rate": 0.0001411864217581672, "loss": 1.4905, "step": 19777 }, { "epoch": 1.56, "learning_rate": 0.00014117408342577352, "loss": 1.4696, "step": 19778 }, { "epoch": 1.56, "learning_rate": 0.00014116174515330288, "loss": 1.5158, "step": 19779 }, { "epoch": 1.56, "learning_rate": 0.00014114940694083915, "loss": 1.5699, "step": 19780 }, { "epoch": 1.56, "learning_rate": 0.0001411370687884661, "loss": 1.4689, "step": 19781 }, { "epoch": 1.56, "learning_rate": 0.00014112473069626742, "loss": 1.4631, "step": 19782 }, { "epoch": 1.56, "learning_rate": 0.00014111239266432693, "loss": 1.5724, "step": 19783 }, { "epoch": 1.56, "learning_rate": 0.00014110005469272842, "loss": 1.4976, "step": 19784 }, { "epoch": 1.56, "learning_rate": 0.0001410877167815556, "loss": 1.5259, "step": 19785 }, { "epoch": 1.56, "learning_rate": 0.00014107537893089228, "loss": 1.5101, "step": 19786 }, { "epoch": 1.56, "learning_rate": 0.0001410630411408222, "loss": 1.5275, "step": 19787 }, { "epoch": 1.56, "learning_rate": 0.00014105070341142913, "loss": 1.5373, "step": 19788 }, { "epoch": 1.56, "learning_rate": 0.00014103836574279688, "loss": 1.5051, "step": 19789 }, { "epoch": 1.56, "learning_rate": 0.00014102602813500915, "loss": 1.5217, "step": 19790 }, { "epoch": 1.56, "learning_rate": 0.00014101369058814973, "loss": 1.4891, "step": 19791 }, { "epoch": 1.56, "learning_rate": 0.00014100135310230244, "loss": 1.5058, "step": 19792 }, { "epoch": 1.56, "learning_rate": 0.00014098901567755092, "loss": 1.5013, "step": 19793 }, { "epoch": 1.56, "learning_rate": 0.00014097667831397908, "loss": 1.4667, "step": 19794 }, { "epoch": 1.56, "learning_rate": 0.00014096434101167052, "loss": 1.4393, "step": 19795 }, { "epoch": 1.56, "learning_rate": 0.00014095200377070918, "loss": 1.5544, "step": 19796 }, { "epoch": 1.56, "learning_rate": 0.00014093966659117874, "loss": 1.4662, "step": 19797 }, { "epoch": 1.56, "learning_rate": 0.00014092732947316297, "loss": 1.5085, "step": 19798 }, { "epoch": 1.56, "learning_rate": 0.0001409149924167456, "loss": 1.5251, "step": 19799 }, { "epoch": 1.56, "learning_rate": 0.0001409026554220104, "loss": 1.4688, "step": 19800 }, { "epoch": 1.56, "learning_rate": 0.0001408903184890412, "loss": 1.5443, "step": 19801 }, { "epoch": 1.56, "learning_rate": 0.00014087798161792169, "loss": 1.468, "step": 19802 }, { "epoch": 1.56, "learning_rate": 0.00014086564480873565, "loss": 1.5475, "step": 19803 }, { "epoch": 1.56, "learning_rate": 0.00014085330806156684, "loss": 1.475, "step": 19804 }, { "epoch": 1.56, "learning_rate": 0.000140840971376499, "loss": 1.49, "step": 19805 }, { "epoch": 1.56, "learning_rate": 0.00014082863475361595, "loss": 1.5007, "step": 19806 }, { "epoch": 1.56, "learning_rate": 0.0001408162981930014, "loss": 1.4837, "step": 19807 }, { "epoch": 1.56, "learning_rate": 0.00014080396169473906, "loss": 1.5176, "step": 19808 }, { "epoch": 1.56, "learning_rate": 0.00014079162525891282, "loss": 1.5689, "step": 19809 }, { "epoch": 1.56, "learning_rate": 0.00014077928888560633, "loss": 1.4885, "step": 19810 }, { "epoch": 1.56, "learning_rate": 0.00014076695257490333, "loss": 1.5534, "step": 19811 }, { "epoch": 1.56, "learning_rate": 0.00014075461632688768, "loss": 1.4764, "step": 19812 }, { "epoch": 1.56, "learning_rate": 0.00014074228014164308, "loss": 1.5006, "step": 19813 }, { "epoch": 1.56, "learning_rate": 0.00014072994401925329, "loss": 1.4822, "step": 19814 }, { "epoch": 1.56, "learning_rate": 0.0001407176079598021, "loss": 1.5183, "step": 19815 }, { "epoch": 1.56, "learning_rate": 0.00014070527196337318, "loss": 1.5107, "step": 19816 }, { "epoch": 1.56, "learning_rate": 0.00014069293603005033, "loss": 1.5223, "step": 19817 }, { "epoch": 1.56, "learning_rate": 0.00014068060015991736, "loss": 1.5369, "step": 19818 }, { "epoch": 1.56, "learning_rate": 0.00014066826435305793, "loss": 1.5356, "step": 19819 }, { "epoch": 1.56, "learning_rate": 0.00014065592860955584, "loss": 1.5391, "step": 19820 }, { "epoch": 1.56, "learning_rate": 0.00014064359292949487, "loss": 1.5264, "step": 19821 }, { "epoch": 1.56, "learning_rate": 0.00014063125731295868, "loss": 1.5219, "step": 19822 }, { "epoch": 1.56, "learning_rate": 0.00014061892176003114, "loss": 1.5439, "step": 19823 }, { "epoch": 1.56, "learning_rate": 0.00014060658627079592, "loss": 1.5062, "step": 19824 }, { "epoch": 1.56, "learning_rate": 0.0001405942508453368, "loss": 1.5006, "step": 19825 }, { "epoch": 1.56, "learning_rate": 0.00014058191548373746, "loss": 1.5406, "step": 19826 }, { "epoch": 1.56, "learning_rate": 0.0001405695801860818, "loss": 1.5227, "step": 19827 }, { "epoch": 1.56, "learning_rate": 0.00014055724495245345, "loss": 1.5437, "step": 19828 }, { "epoch": 1.56, "learning_rate": 0.0001405449097829362, "loss": 1.5361, "step": 19829 }, { "epoch": 1.56, "learning_rate": 0.00014053257467761383, "loss": 1.4856, "step": 19830 }, { "epoch": 1.56, "learning_rate": 0.00014052023963657002, "loss": 1.5208, "step": 19831 }, { "epoch": 1.56, "learning_rate": 0.00014050790465988856, "loss": 1.5505, "step": 19832 }, { "epoch": 1.56, "learning_rate": 0.00014049556974765322, "loss": 1.4981, "step": 19833 }, { "epoch": 1.56, "learning_rate": 0.00014048323489994767, "loss": 1.5334, "step": 19834 }, { "epoch": 1.56, "learning_rate": 0.00014047090011685574, "loss": 1.4661, "step": 19835 }, { "epoch": 1.56, "learning_rate": 0.0001404585653984611, "loss": 1.4656, "step": 19836 }, { "epoch": 1.56, "learning_rate": 0.00014044623074484754, "loss": 1.501, "step": 19837 }, { "epoch": 1.56, "learning_rate": 0.00014043389615609885, "loss": 1.5369, "step": 19838 }, { "epoch": 1.56, "learning_rate": 0.0001404215616322987, "loss": 1.5136, "step": 19839 }, { "epoch": 1.56, "learning_rate": 0.00014040922717353086, "loss": 1.4846, "step": 19840 }, { "epoch": 1.56, "learning_rate": 0.00014039689277987907, "loss": 1.5485, "step": 19841 }, { "epoch": 1.56, "learning_rate": 0.00014038455845142702, "loss": 1.4861, "step": 19842 }, { "epoch": 1.56, "learning_rate": 0.00014037222418825855, "loss": 1.486, "step": 19843 }, { "epoch": 1.56, "learning_rate": 0.00014035988999045742, "loss": 1.4935, "step": 19844 }, { "epoch": 1.56, "learning_rate": 0.00014034755585810727, "loss": 1.461, "step": 19845 }, { "epoch": 1.56, "learning_rate": 0.00014033522179129188, "loss": 1.5292, "step": 19846 }, { "epoch": 1.56, "learning_rate": 0.00014032288779009504, "loss": 1.5483, "step": 19847 }, { "epoch": 1.56, "learning_rate": 0.0001403105538546004, "loss": 1.5473, "step": 19848 }, { "epoch": 1.56, "learning_rate": 0.00014029821998489178, "loss": 1.5016, "step": 19849 }, { "epoch": 1.56, "learning_rate": 0.00014028588618105294, "loss": 1.5017, "step": 19850 }, { "epoch": 1.56, "learning_rate": 0.0001402735524431675, "loss": 1.5455, "step": 19851 }, { "epoch": 1.56, "learning_rate": 0.00014026121877131932, "loss": 1.5646, "step": 19852 }, { "epoch": 1.56, "learning_rate": 0.00014024888516559207, "loss": 1.5168, "step": 19853 }, { "epoch": 1.56, "learning_rate": 0.0001402365516260695, "loss": 1.531, "step": 19854 }, { "epoch": 1.56, "learning_rate": 0.0001402242181528354, "loss": 1.4858, "step": 19855 }, { "epoch": 1.56, "learning_rate": 0.0001402118847459734, "loss": 1.5306, "step": 19856 }, { "epoch": 1.56, "learning_rate": 0.00014019955140556737, "loss": 1.516, "step": 19857 }, { "epoch": 1.56, "learning_rate": 0.00014018721813170086, "loss": 1.4886, "step": 19858 }, { "epoch": 1.56, "learning_rate": 0.0001401748849244578, "loss": 1.5624, "step": 19859 }, { "epoch": 1.56, "learning_rate": 0.00014016255178392185, "loss": 1.5636, "step": 19860 }, { "epoch": 1.56, "learning_rate": 0.00014015021871017675, "loss": 1.5292, "step": 19861 }, { "epoch": 1.56, "learning_rate": 0.00014013788570330625, "loss": 1.4898, "step": 19862 }, { "epoch": 1.56, "learning_rate": 0.000140125552763394, "loss": 1.4399, "step": 19863 }, { "epoch": 1.56, "learning_rate": 0.00014011321989052387, "loss": 1.4787, "step": 19864 }, { "epoch": 1.56, "learning_rate": 0.00014010088708477948, "loss": 1.4874, "step": 19865 }, { "epoch": 1.56, "learning_rate": 0.0001400885543462446, "loss": 1.5511, "step": 19866 }, { "epoch": 1.56, "learning_rate": 0.000140076221675003, "loss": 1.4906, "step": 19867 }, { "epoch": 1.56, "learning_rate": 0.00014006388907113836, "loss": 1.5222, "step": 19868 }, { "epoch": 1.56, "learning_rate": 0.00014005155653473443, "loss": 1.5003, "step": 19869 }, { "epoch": 1.56, "learning_rate": 0.00014003922406587494, "loss": 1.5007, "step": 19870 }, { "epoch": 1.56, "learning_rate": 0.0001400268916646436, "loss": 1.5332, "step": 19871 }, { "epoch": 1.56, "learning_rate": 0.0001400145593311242, "loss": 1.4357, "step": 19872 }, { "epoch": 1.56, "learning_rate": 0.00014000222706540036, "loss": 1.5496, "step": 19873 }, { "epoch": 1.56, "learning_rate": 0.00013998989486755593, "loss": 1.5037, "step": 19874 }, { "epoch": 1.56, "learning_rate": 0.00013997756273767458, "loss": 1.432, "step": 19875 }, { "epoch": 1.56, "learning_rate": 0.0001399652306758401, "loss": 1.5277, "step": 19876 }, { "epoch": 1.56, "learning_rate": 0.0001399528986821361, "loss": 1.5258, "step": 19877 }, { "epoch": 1.56, "learning_rate": 0.0001399405667566464, "loss": 1.4605, "step": 19878 }, { "epoch": 1.56, "learning_rate": 0.00013992823489945472, "loss": 1.5227, "step": 19879 }, { "epoch": 1.56, "learning_rate": 0.00013991590311064473, "loss": 1.5083, "step": 19880 }, { "epoch": 1.56, "learning_rate": 0.00013990357139030023, "loss": 1.4753, "step": 19881 }, { "epoch": 1.56, "learning_rate": 0.00013989123973850488, "loss": 1.5053, "step": 19882 }, { "epoch": 1.56, "learning_rate": 0.00013987890815534245, "loss": 1.5112, "step": 19883 }, { "epoch": 1.56, "learning_rate": 0.00013986657664089667, "loss": 1.4909, "step": 19884 }, { "epoch": 1.56, "learning_rate": 0.0001398542451952512, "loss": 1.4978, "step": 19885 }, { "epoch": 1.56, "learning_rate": 0.00013984191381848985, "loss": 1.4764, "step": 19886 }, { "epoch": 1.56, "learning_rate": 0.00013982958251069626, "loss": 1.5264, "step": 19887 }, { "epoch": 1.56, "learning_rate": 0.00013981725127195418, "loss": 1.5129, "step": 19888 }, { "epoch": 1.56, "learning_rate": 0.0001398049201023473, "loss": 1.5093, "step": 19889 }, { "epoch": 1.56, "learning_rate": 0.00013979258900195948, "loss": 1.528, "step": 19890 }, { "epoch": 1.57, "learning_rate": 0.00013978025797087434, "loss": 1.5254, "step": 19891 }, { "epoch": 1.57, "learning_rate": 0.00013976792700917556, "loss": 1.5219, "step": 19892 }, { "epoch": 1.57, "learning_rate": 0.00013975559611694696, "loss": 1.4738, "step": 19893 }, { "epoch": 1.57, "learning_rate": 0.00013974326529427218, "loss": 1.4937, "step": 19894 }, { "epoch": 1.57, "learning_rate": 0.00013973093454123497, "loss": 1.5084, "step": 19895 }, { "epoch": 1.57, "learning_rate": 0.00013971860385791906, "loss": 1.4874, "step": 19896 }, { "epoch": 1.57, "learning_rate": 0.00013970627324440816, "loss": 1.5153, "step": 19897 }, { "epoch": 1.57, "learning_rate": 0.00013969394270078598, "loss": 1.5037, "step": 19898 }, { "epoch": 1.57, "learning_rate": 0.00013968161222713624, "loss": 1.4771, "step": 19899 }, { "epoch": 1.57, "learning_rate": 0.00013966928182354265, "loss": 1.5521, "step": 19900 }, { "epoch": 1.57, "learning_rate": 0.00013965695149008894, "loss": 1.5165, "step": 19901 }, { "epoch": 1.57, "learning_rate": 0.00013964462122685882, "loss": 1.5073, "step": 19902 }, { "epoch": 1.57, "learning_rate": 0.000139632291033936, "loss": 1.5276, "step": 19903 }, { "epoch": 1.57, "learning_rate": 0.00013961996091140424, "loss": 1.5173, "step": 19904 }, { "epoch": 1.57, "learning_rate": 0.00013960763085934714, "loss": 1.4964, "step": 19905 }, { "epoch": 1.57, "learning_rate": 0.00013959530087784855, "loss": 1.5, "step": 19906 }, { "epoch": 1.57, "learning_rate": 0.0001395829709669921, "loss": 1.5042, "step": 19907 }, { "epoch": 1.57, "learning_rate": 0.00013957064112686155, "loss": 1.5055, "step": 19908 }, { "epoch": 1.57, "learning_rate": 0.0001395583113575406, "loss": 1.4993, "step": 19909 }, { "epoch": 1.57, "learning_rate": 0.00013954598165911294, "loss": 1.5841, "step": 19910 }, { "epoch": 1.57, "learning_rate": 0.00013953365203166229, "loss": 1.559, "step": 19911 }, { "epoch": 1.57, "learning_rate": 0.00013952132247527238, "loss": 1.5258, "step": 19912 }, { "epoch": 1.57, "learning_rate": 0.0001395089929900269, "loss": 1.5192, "step": 19913 }, { "epoch": 1.57, "learning_rate": 0.00013949666357600956, "loss": 1.5448, "step": 19914 }, { "epoch": 1.57, "learning_rate": 0.0001394843342333041, "loss": 1.5065, "step": 19915 }, { "epoch": 1.57, "learning_rate": 0.0001394720049619942, "loss": 1.5253, "step": 19916 }, { "epoch": 1.57, "learning_rate": 0.00013945967576216355, "loss": 1.5802, "step": 19917 }, { "epoch": 1.57, "learning_rate": 0.00013944734663389594, "loss": 1.4965, "step": 19918 }, { "epoch": 1.57, "learning_rate": 0.00013943501757727496, "loss": 1.4608, "step": 19919 }, { "epoch": 1.57, "learning_rate": 0.0001394226885923844, "loss": 1.5305, "step": 19920 }, { "epoch": 1.57, "learning_rate": 0.0001394103596793079, "loss": 1.5217, "step": 19921 }, { "epoch": 1.57, "learning_rate": 0.0001393980308381293, "loss": 1.5465, "step": 19922 }, { "epoch": 1.57, "learning_rate": 0.0001393857020689322, "loss": 1.5178, "step": 19923 }, { "epoch": 1.57, "learning_rate": 0.00013937337337180028, "loss": 1.5236, "step": 19924 }, { "epoch": 1.57, "learning_rate": 0.00013936104474681735, "loss": 1.5034, "step": 19925 }, { "epoch": 1.57, "learning_rate": 0.00013934871619406705, "loss": 1.5581, "step": 19926 }, { "epoch": 1.57, "learning_rate": 0.00013933638771363306, "loss": 1.5159, "step": 19927 }, { "epoch": 1.57, "learning_rate": 0.0001393240593055991, "loss": 1.5026, "step": 19928 }, { "epoch": 1.57, "learning_rate": 0.0001393117309700489, "loss": 1.4631, "step": 19929 }, { "epoch": 1.57, "learning_rate": 0.00013929940270706622, "loss": 1.5392, "step": 19930 }, { "epoch": 1.57, "learning_rate": 0.0001392870745167346, "loss": 1.6033, "step": 19931 }, { "epoch": 1.57, "learning_rate": 0.00013927474639913783, "loss": 1.5565, "step": 19932 }, { "epoch": 1.57, "learning_rate": 0.00013926241835435967, "loss": 1.4617, "step": 19933 }, { "epoch": 1.57, "learning_rate": 0.00013925009038248375, "loss": 1.5481, "step": 19934 }, { "epoch": 1.57, "learning_rate": 0.0001392377624835938, "loss": 1.4626, "step": 19935 }, { "epoch": 1.57, "learning_rate": 0.00013922543465777338, "loss": 1.4972, "step": 19936 }, { "epoch": 1.57, "learning_rate": 0.00013921310690510644, "loss": 1.5276, "step": 19937 }, { "epoch": 1.57, "learning_rate": 0.0001392007792256765, "loss": 1.4261, "step": 19938 }, { "epoch": 1.57, "learning_rate": 0.00013918845161956734, "loss": 1.5189, "step": 19939 }, { "epoch": 1.57, "learning_rate": 0.0001391761240868626, "loss": 1.5081, "step": 19940 }, { "epoch": 1.57, "learning_rate": 0.00013916379662764602, "loss": 1.4815, "step": 19941 }, { "epoch": 1.57, "learning_rate": 0.0001391514692420013, "loss": 1.5456, "step": 19942 }, { "epoch": 1.57, "learning_rate": 0.00013913914193001208, "loss": 1.5652, "step": 19943 }, { "epoch": 1.57, "learning_rate": 0.0001391268146917621, "loss": 1.4849, "step": 19944 }, { "epoch": 1.57, "learning_rate": 0.0001391144875273351, "loss": 1.5308, "step": 19945 }, { "epoch": 1.57, "learning_rate": 0.00013910216043681466, "loss": 1.5293, "step": 19946 }, { "epoch": 1.57, "learning_rate": 0.0001390898334202846, "loss": 1.5136, "step": 19947 }, { "epoch": 1.57, "learning_rate": 0.0001390775064778285, "loss": 1.5898, "step": 19948 }, { "epoch": 1.57, "learning_rate": 0.0001390651796095301, "loss": 1.5036, "step": 19949 }, { "epoch": 1.57, "learning_rate": 0.0001390528528154731, "loss": 1.5581, "step": 19950 }, { "epoch": 1.57, "learning_rate": 0.0001390405260957412, "loss": 1.5217, "step": 19951 }, { "epoch": 1.57, "learning_rate": 0.00013902819945041804, "loss": 1.4898, "step": 19952 }, { "epoch": 1.57, "learning_rate": 0.00013901587287958736, "loss": 1.5517, "step": 19953 }, { "epoch": 1.57, "learning_rate": 0.0001390035463833329, "loss": 1.5431, "step": 19954 }, { "epoch": 1.57, "learning_rate": 0.00013899121996173823, "loss": 1.4703, "step": 19955 }, { "epoch": 1.57, "learning_rate": 0.00013897889361488716, "loss": 1.5774, "step": 19956 }, { "epoch": 1.57, "learning_rate": 0.00013896656734286328, "loss": 1.5076, "step": 19957 }, { "epoch": 1.57, "learning_rate": 0.00013895424114575034, "loss": 1.5309, "step": 19958 }, { "epoch": 1.57, "learning_rate": 0.00013894191502363202, "loss": 1.4981, "step": 19959 }, { "epoch": 1.57, "learning_rate": 0.00013892958897659196, "loss": 1.546, "step": 19960 }, { "epoch": 1.57, "learning_rate": 0.00013891726300471386, "loss": 1.4556, "step": 19961 }, { "epoch": 1.57, "learning_rate": 0.0001389049371080815, "loss": 1.4888, "step": 19962 }, { "epoch": 1.57, "learning_rate": 0.00013889261128677844, "loss": 1.5075, "step": 19963 }, { "epoch": 1.57, "learning_rate": 0.00013888028554088846, "loss": 1.4914, "step": 19964 }, { "epoch": 1.57, "learning_rate": 0.00013886795987049516, "loss": 1.5043, "step": 19965 }, { "epoch": 1.57, "learning_rate": 0.00013885563427568228, "loss": 1.5071, "step": 19966 }, { "epoch": 1.57, "learning_rate": 0.00013884330875653354, "loss": 1.5177, "step": 19967 }, { "epoch": 1.57, "learning_rate": 0.0001388309833131325, "loss": 1.4988, "step": 19968 }, { "epoch": 1.57, "learning_rate": 0.00013881865794556294, "loss": 1.4815, "step": 19969 }, { "epoch": 1.57, "learning_rate": 0.00013880633265390854, "loss": 1.4934, "step": 19970 }, { "epoch": 1.57, "learning_rate": 0.00013879400743825298, "loss": 1.4802, "step": 19971 }, { "epoch": 1.57, "learning_rate": 0.00013878168229867991, "loss": 1.4948, "step": 19972 }, { "epoch": 1.57, "learning_rate": 0.000138769357235273, "loss": 1.4631, "step": 19973 }, { "epoch": 1.57, "learning_rate": 0.00013875703224811603, "loss": 1.4851, "step": 19974 }, { "epoch": 1.57, "learning_rate": 0.00013874470733729255, "loss": 1.5138, "step": 19975 }, { "epoch": 1.57, "learning_rate": 0.00013873238250288632, "loss": 1.5377, "step": 19976 }, { "epoch": 1.57, "learning_rate": 0.00013872005774498097, "loss": 1.5132, "step": 19977 }, { "epoch": 1.57, "learning_rate": 0.00013870773306366022, "loss": 1.465, "step": 19978 }, { "epoch": 1.57, "learning_rate": 0.00013869540845900773, "loss": 1.5251, "step": 19979 }, { "epoch": 1.57, "learning_rate": 0.00013868308393110717, "loss": 1.5691, "step": 19980 }, { "epoch": 1.57, "learning_rate": 0.00013867075948004225, "loss": 1.512, "step": 19981 }, { "epoch": 1.57, "learning_rate": 0.0001386584351058966, "loss": 1.533, "step": 19982 }, { "epoch": 1.57, "learning_rate": 0.00013864611080875386, "loss": 1.5256, "step": 19983 }, { "epoch": 1.57, "learning_rate": 0.0001386337865886978, "loss": 1.5179, "step": 19984 }, { "epoch": 1.57, "learning_rate": 0.00013862146244581213, "loss": 1.5007, "step": 19985 }, { "epoch": 1.57, "learning_rate": 0.00013860913838018038, "loss": 1.4624, "step": 19986 }, { "epoch": 1.57, "learning_rate": 0.00013859681439188628, "loss": 1.5861, "step": 19987 }, { "epoch": 1.57, "learning_rate": 0.0001385844904810136, "loss": 1.456, "step": 19988 }, { "epoch": 1.57, "learning_rate": 0.00013857216664764585, "loss": 1.4736, "step": 19989 }, { "epoch": 1.57, "learning_rate": 0.0001385598428918668, "loss": 1.4931, "step": 19990 }, { "epoch": 1.57, "learning_rate": 0.00013854751921376016, "loss": 1.5306, "step": 19991 }, { "epoch": 1.57, "learning_rate": 0.00013853519561340946, "loss": 1.5204, "step": 19992 }, { "epoch": 1.57, "learning_rate": 0.00013852287209089852, "loss": 1.5393, "step": 19993 }, { "epoch": 1.57, "learning_rate": 0.00013851054864631092, "loss": 1.5026, "step": 19994 }, { "epoch": 1.57, "learning_rate": 0.00013849822527973034, "loss": 1.4899, "step": 19995 }, { "epoch": 1.57, "learning_rate": 0.0001384859019912405, "loss": 1.4731, "step": 19996 }, { "epoch": 1.57, "learning_rate": 0.000138473578780925, "loss": 1.5333, "step": 19997 }, { "epoch": 1.57, "learning_rate": 0.00013846125564886754, "loss": 1.4772, "step": 19998 }, { "epoch": 1.57, "learning_rate": 0.00013844893259515174, "loss": 1.5269, "step": 19999 }, { "epoch": 1.57, "learning_rate": 0.0001384366096198614, "loss": 1.4998, "step": 20000 }, { "epoch": 1.57, "learning_rate": 0.00013842428672308004, "loss": 1.5544, "step": 20001 }, { "epoch": 1.57, "learning_rate": 0.0001384119639048914, "loss": 1.5374, "step": 20002 }, { "epoch": 1.57, "learning_rate": 0.00013839964116537919, "loss": 1.4641, "step": 20003 }, { "epoch": 1.57, "learning_rate": 0.00013838731850462696, "loss": 1.491, "step": 20004 }, { "epoch": 1.57, "learning_rate": 0.00013837499592271845, "loss": 1.512, "step": 20005 }, { "epoch": 1.57, "learning_rate": 0.00013836267341973727, "loss": 1.5049, "step": 20006 }, { "epoch": 1.57, "learning_rate": 0.00013835035099576712, "loss": 1.4766, "step": 20007 }, { "epoch": 1.57, "learning_rate": 0.0001383380286508917, "loss": 1.4777, "step": 20008 }, { "epoch": 1.57, "learning_rate": 0.0001383257063851946, "loss": 1.4473, "step": 20009 }, { "epoch": 1.57, "learning_rate": 0.00013831338419875955, "loss": 1.5324, "step": 20010 }, { "epoch": 1.57, "learning_rate": 0.00013830106209167012, "loss": 1.5036, "step": 20011 }, { "epoch": 1.57, "learning_rate": 0.00013828874006401, "loss": 1.5278, "step": 20012 }, { "epoch": 1.57, "learning_rate": 0.00013827641811586293, "loss": 1.5292, "step": 20013 }, { "epoch": 1.57, "learning_rate": 0.0001382640962473125, "loss": 1.5714, "step": 20014 }, { "epoch": 1.57, "learning_rate": 0.00013825177445844232, "loss": 1.5439, "step": 20015 }, { "epoch": 1.57, "learning_rate": 0.00013823945274933614, "loss": 1.4567, "step": 20016 }, { "epoch": 1.57, "learning_rate": 0.00013822713112007762, "loss": 1.5504, "step": 20017 }, { "epoch": 1.58, "learning_rate": 0.00013821480957075036, "loss": 1.5502, "step": 20018 }, { "epoch": 1.58, "learning_rate": 0.00013820248810143804, "loss": 1.551, "step": 20019 }, { "epoch": 1.58, "learning_rate": 0.00013819016671222435, "loss": 1.5131, "step": 20020 }, { "epoch": 1.58, "learning_rate": 0.00013817784540319286, "loss": 1.5611, "step": 20021 }, { "epoch": 1.58, "learning_rate": 0.00013816552417442735, "loss": 1.528, "step": 20022 }, { "epoch": 1.58, "learning_rate": 0.00013815320302601133, "loss": 1.5035, "step": 20023 }, { "epoch": 1.58, "learning_rate": 0.00013814088195802853, "loss": 1.5258, "step": 20024 }, { "epoch": 1.58, "learning_rate": 0.00013812856097056265, "loss": 1.5553, "step": 20025 }, { "epoch": 1.58, "learning_rate": 0.00013811624006369722, "loss": 1.4784, "step": 20026 }, { "epoch": 1.58, "learning_rate": 0.00013810391923751598, "loss": 1.5193, "step": 20027 }, { "epoch": 1.58, "learning_rate": 0.0001380915984921026, "loss": 1.4537, "step": 20028 }, { "epoch": 1.58, "learning_rate": 0.00013807927782754067, "loss": 1.458, "step": 20029 }, { "epoch": 1.58, "learning_rate": 0.00013806695724391388, "loss": 1.5254, "step": 20030 }, { "epoch": 1.58, "learning_rate": 0.0001380546367413058, "loss": 1.4867, "step": 20031 }, { "epoch": 1.58, "learning_rate": 0.0001380423163198002, "loss": 1.5246, "step": 20032 }, { "epoch": 1.58, "learning_rate": 0.00013802999597948065, "loss": 1.4774, "step": 20033 }, { "epoch": 1.58, "learning_rate": 0.00013801767572043085, "loss": 1.4977, "step": 20034 }, { "epoch": 1.58, "learning_rate": 0.0001380053555427344, "loss": 1.5297, "step": 20035 }, { "epoch": 1.58, "learning_rate": 0.00013799303544647498, "loss": 1.4892, "step": 20036 }, { "epoch": 1.58, "learning_rate": 0.00013798071543173624, "loss": 1.5752, "step": 20037 }, { "epoch": 1.58, "learning_rate": 0.00013796839549860178, "loss": 1.5224, "step": 20038 }, { "epoch": 1.58, "learning_rate": 0.00013795607564715532, "loss": 1.5427, "step": 20039 }, { "epoch": 1.58, "learning_rate": 0.0001379437558774804, "loss": 1.5424, "step": 20040 }, { "epoch": 1.58, "learning_rate": 0.00013793143618966074, "loss": 1.4934, "step": 20041 }, { "epoch": 1.58, "learning_rate": 0.00013791911658378, "loss": 1.5355, "step": 20042 }, { "epoch": 1.58, "learning_rate": 0.00013790679705992176, "loss": 1.5037, "step": 20043 }, { "epoch": 1.58, "learning_rate": 0.00013789447761816968, "loss": 1.5126, "step": 20044 }, { "epoch": 1.58, "learning_rate": 0.00013788215825860748, "loss": 1.4894, "step": 20045 }, { "epoch": 1.58, "learning_rate": 0.00013786983898131863, "loss": 1.4777, "step": 20046 }, { "epoch": 1.58, "learning_rate": 0.00013785751978638697, "loss": 1.5555, "step": 20047 }, { "epoch": 1.58, "learning_rate": 0.000137845200673896, "loss": 1.5172, "step": 20048 }, { "epoch": 1.58, "learning_rate": 0.00013783288164392944, "loss": 1.589, "step": 20049 }, { "epoch": 1.58, "learning_rate": 0.0001378205626965709, "loss": 1.494, "step": 20050 }, { "epoch": 1.58, "learning_rate": 0.00013780824383190403, "loss": 1.5343, "step": 20051 }, { "epoch": 1.58, "learning_rate": 0.00013779592505001244, "loss": 1.497, "step": 20052 }, { "epoch": 1.58, "learning_rate": 0.00013778360635097975, "loss": 1.5209, "step": 20053 }, { "epoch": 1.58, "learning_rate": 0.0001377712877348897, "loss": 1.5265, "step": 20054 }, { "epoch": 1.58, "learning_rate": 0.00013775896920182582, "loss": 1.5503, "step": 20055 }, { "epoch": 1.58, "learning_rate": 0.00013774665075187177, "loss": 1.5346, "step": 20056 }, { "epoch": 1.58, "learning_rate": 0.00013773433238511125, "loss": 1.5093, "step": 20057 }, { "epoch": 1.58, "learning_rate": 0.0001377220141016278, "loss": 1.5039, "step": 20058 }, { "epoch": 1.58, "learning_rate": 0.00013770969590150511, "loss": 1.5076, "step": 20059 }, { "epoch": 1.58, "learning_rate": 0.00013769737778482682, "loss": 1.4595, "step": 20060 }, { "epoch": 1.58, "learning_rate": 0.00013768505975167653, "loss": 1.4667, "step": 20061 }, { "epoch": 1.58, "learning_rate": 0.00013767274180213782, "loss": 1.4997, "step": 20062 }, { "epoch": 1.58, "learning_rate": 0.0001376604239362945, "loss": 1.5088, "step": 20063 }, { "epoch": 1.58, "learning_rate": 0.00013764810615423003, "loss": 1.5242, "step": 20064 }, { "epoch": 1.58, "learning_rate": 0.0001376357884560281, "loss": 1.477, "step": 20065 }, { "epoch": 1.58, "learning_rate": 0.00013762347084177238, "loss": 1.547, "step": 20066 }, { "epoch": 1.58, "learning_rate": 0.00013761115331154645, "loss": 1.5199, "step": 20067 }, { "epoch": 1.58, "learning_rate": 0.00013759883586543398, "loss": 1.4988, "step": 20068 }, { "epoch": 1.58, "learning_rate": 0.00013758651850351853, "loss": 1.521, "step": 20069 }, { "epoch": 1.58, "learning_rate": 0.00013757420122588378, "loss": 1.4457, "step": 20070 }, { "epoch": 1.58, "learning_rate": 0.00013756188403261335, "loss": 1.4913, "step": 20071 }, { "epoch": 1.58, "learning_rate": 0.00013754956692379084, "loss": 1.4681, "step": 20072 }, { "epoch": 1.58, "learning_rate": 0.0001375372498994999, "loss": 1.5348, "step": 20073 }, { "epoch": 1.58, "learning_rate": 0.00013752493295982423, "loss": 1.4427, "step": 20074 }, { "epoch": 1.58, "learning_rate": 0.00013751261610484732, "loss": 1.491, "step": 20075 }, { "epoch": 1.58, "learning_rate": 0.00013750029933465288, "loss": 1.5047, "step": 20076 }, { "epoch": 1.58, "learning_rate": 0.00013748798264932448, "loss": 1.4605, "step": 20077 }, { "epoch": 1.58, "learning_rate": 0.00013747566604894573, "loss": 1.4746, "step": 20078 }, { "epoch": 1.58, "learning_rate": 0.00013746334953360035, "loss": 1.5238, "step": 20079 }, { "epoch": 1.58, "learning_rate": 0.00013745103310337193, "loss": 1.5121, "step": 20080 }, { "epoch": 1.58, "learning_rate": 0.00013743871675834404, "loss": 1.5404, "step": 20081 }, { "epoch": 1.58, "learning_rate": 0.00013742640049860033, "loss": 1.507, "step": 20082 }, { "epoch": 1.58, "learning_rate": 0.00013741408432422445, "loss": 1.5156, "step": 20083 }, { "epoch": 1.58, "learning_rate": 0.00013740176823529997, "loss": 1.5321, "step": 20084 }, { "epoch": 1.58, "learning_rate": 0.00013738945223191052, "loss": 1.463, "step": 20085 }, { "epoch": 1.58, "learning_rate": 0.00013737713631413977, "loss": 1.5095, "step": 20086 }, { "epoch": 1.58, "learning_rate": 0.00013736482048207126, "loss": 1.5016, "step": 20087 }, { "epoch": 1.58, "learning_rate": 0.00013735250473578868, "loss": 1.541, "step": 20088 }, { "epoch": 1.58, "learning_rate": 0.00013734018907537562, "loss": 1.4739, "step": 20089 }, { "epoch": 1.58, "learning_rate": 0.00013732787350091564, "loss": 1.5181, "step": 20090 }, { "epoch": 1.58, "learning_rate": 0.00013731555801249244, "loss": 1.5884, "step": 20091 }, { "epoch": 1.58, "learning_rate": 0.00013730324261018958, "loss": 1.4833, "step": 20092 }, { "epoch": 1.58, "learning_rate": 0.00013729092729409067, "loss": 1.5135, "step": 20093 }, { "epoch": 1.58, "learning_rate": 0.0001372786120642794, "loss": 1.4812, "step": 20094 }, { "epoch": 1.58, "learning_rate": 0.00013726629692083933, "loss": 1.5356, "step": 20095 }, { "epoch": 1.58, "learning_rate": 0.00013725398186385405, "loss": 1.6071, "step": 20096 }, { "epoch": 1.58, "learning_rate": 0.00013724166689340725, "loss": 1.4319, "step": 20097 }, { "epoch": 1.58, "learning_rate": 0.00013722935200958245, "loss": 1.5188, "step": 20098 }, { "epoch": 1.58, "learning_rate": 0.00013721703721246328, "loss": 1.4454, "step": 20099 }, { "epoch": 1.58, "learning_rate": 0.00013720472250213343, "loss": 1.4727, "step": 20100 }, { "epoch": 1.58, "learning_rate": 0.00013719240787867643, "loss": 1.5238, "step": 20101 }, { "epoch": 1.58, "learning_rate": 0.0001371800933421759, "loss": 1.5203, "step": 20102 }, { "epoch": 1.58, "learning_rate": 0.00013716777889271549, "loss": 1.4912, "step": 20103 }, { "epoch": 1.58, "learning_rate": 0.00013715546453037876, "loss": 1.5386, "step": 20104 }, { "epoch": 1.58, "learning_rate": 0.00013714315025524938, "loss": 1.5067, "step": 20105 }, { "epoch": 1.58, "learning_rate": 0.00013713083606741084, "loss": 1.4938, "step": 20106 }, { "epoch": 1.58, "learning_rate": 0.00013711852196694684, "loss": 1.5084, "step": 20107 }, { "epoch": 1.58, "learning_rate": 0.00013710620795394103, "loss": 1.4439, "step": 20108 }, { "epoch": 1.58, "learning_rate": 0.00013709389402847684, "loss": 1.5333, "step": 20109 }, { "epoch": 1.58, "learning_rate": 0.00013708158019063804, "loss": 1.5317, "step": 20110 }, { "epoch": 1.58, "learning_rate": 0.0001370692664405082, "loss": 1.592, "step": 20111 }, { "epoch": 1.58, "learning_rate": 0.0001370569527781709, "loss": 1.5185, "step": 20112 }, { "epoch": 1.58, "learning_rate": 0.00013704463920370975, "loss": 1.4867, "step": 20113 }, { "epoch": 1.58, "learning_rate": 0.00013703232571720834, "loss": 1.55, "step": 20114 }, { "epoch": 1.58, "learning_rate": 0.00013702001231875033, "loss": 1.5246, "step": 20115 }, { "epoch": 1.58, "learning_rate": 0.0001370076990084192, "loss": 1.4997, "step": 20116 }, { "epoch": 1.58, "learning_rate": 0.00013699538578629868, "loss": 1.5017, "step": 20117 }, { "epoch": 1.58, "learning_rate": 0.0001369830726524723, "loss": 1.4847, "step": 20118 }, { "epoch": 1.58, "learning_rate": 0.00013697075960702364, "loss": 1.5627, "step": 20119 }, { "epoch": 1.58, "learning_rate": 0.00013695844665003639, "loss": 1.5376, "step": 20120 }, { "epoch": 1.58, "learning_rate": 0.00013694613378159402, "loss": 1.5395, "step": 20121 }, { "epoch": 1.58, "learning_rate": 0.00013693382100178028, "loss": 1.502, "step": 20122 }, { "epoch": 1.58, "learning_rate": 0.00013692150831067862, "loss": 1.594, "step": 20123 }, { "epoch": 1.58, "learning_rate": 0.0001369091957083727, "loss": 1.4797, "step": 20124 }, { "epoch": 1.58, "learning_rate": 0.00013689688319494612, "loss": 1.534, "step": 20125 }, { "epoch": 1.58, "learning_rate": 0.00013688457077048246, "loss": 1.4709, "step": 20126 }, { "epoch": 1.58, "learning_rate": 0.0001368722584350654, "loss": 1.4951, "step": 20127 }, { "epoch": 1.58, "learning_rate": 0.0001368599461887784, "loss": 1.5206, "step": 20128 }, { "epoch": 1.58, "learning_rate": 0.00013684763403170515, "loss": 1.4611, "step": 20129 }, { "epoch": 1.58, "learning_rate": 0.00013683532196392918, "loss": 1.5094, "step": 20130 }, { "epoch": 1.58, "learning_rate": 0.00013682300998553413, "loss": 1.4788, "step": 20131 }, { "epoch": 1.58, "learning_rate": 0.00013681069809660357, "loss": 1.52, "step": 20132 }, { "epoch": 1.58, "learning_rate": 0.00013679838629722109, "loss": 1.5786, "step": 20133 }, { "epoch": 1.58, "learning_rate": 0.00013678607458747028, "loss": 1.4645, "step": 20134 }, { "epoch": 1.58, "learning_rate": 0.0001367737629674347, "loss": 1.4654, "step": 20135 }, { "epoch": 1.58, "learning_rate": 0.00013676145143719798, "loss": 1.5074, "step": 20136 }, { "epoch": 1.58, "learning_rate": 0.00013674913999684374, "loss": 1.4497, "step": 20137 }, { "epoch": 1.58, "learning_rate": 0.0001367368286464555, "loss": 1.5244, "step": 20138 }, { "epoch": 1.58, "learning_rate": 0.00013672451738611687, "loss": 1.5213, "step": 20139 }, { "epoch": 1.58, "learning_rate": 0.00013671220621591147, "loss": 1.5459, "step": 20140 }, { "epoch": 1.58, "learning_rate": 0.00013669989513592277, "loss": 1.54, "step": 20141 }, { "epoch": 1.58, "learning_rate": 0.0001366875841462345, "loss": 1.4847, "step": 20142 }, { "epoch": 1.58, "learning_rate": 0.00013667527324693018, "loss": 1.4372, "step": 20143 }, { "epoch": 1.58, "learning_rate": 0.00013666296243809346, "loss": 1.4852, "step": 20144 }, { "epoch": 1.59, "learning_rate": 0.0001366506517198078, "loss": 1.4399, "step": 20145 }, { "epoch": 1.59, "learning_rate": 0.0001366383410921569, "loss": 1.4999, "step": 20146 }, { "epoch": 1.59, "learning_rate": 0.00013662603055522422, "loss": 1.5246, "step": 20147 }, { "epoch": 1.59, "learning_rate": 0.00013661372010909345, "loss": 1.479, "step": 20148 }, { "epoch": 1.59, "learning_rate": 0.00013660140975384815, "loss": 1.5485, "step": 20149 }, { "epoch": 1.59, "learning_rate": 0.00013658909948957186, "loss": 1.5081, "step": 20150 }, { "epoch": 1.59, "learning_rate": 0.00013657678931634822, "loss": 1.5027, "step": 20151 }, { "epoch": 1.59, "learning_rate": 0.00013656447923426072, "loss": 1.5481, "step": 20152 }, { "epoch": 1.59, "learning_rate": 0.00013655216924339303, "loss": 1.5341, "step": 20153 }, { "epoch": 1.59, "learning_rate": 0.00013653985934382868, "loss": 1.4994, "step": 20154 }, { "epoch": 1.59, "learning_rate": 0.00013652754953565123, "loss": 1.4655, "step": 20155 }, { "epoch": 1.59, "learning_rate": 0.00013651523981894427, "loss": 1.5505, "step": 20156 }, { "epoch": 1.59, "learning_rate": 0.00013650293019379142, "loss": 1.523, "step": 20157 }, { "epoch": 1.59, "learning_rate": 0.00013649062066027626, "loss": 1.55, "step": 20158 }, { "epoch": 1.59, "learning_rate": 0.0001364783112184823, "loss": 1.5394, "step": 20159 }, { "epoch": 1.59, "learning_rate": 0.00013646600186849312, "loss": 1.4749, "step": 20160 }, { "epoch": 1.59, "learning_rate": 0.00013645369261039238, "loss": 1.5349, "step": 20161 }, { "epoch": 1.59, "learning_rate": 0.00013644138344426354, "loss": 1.5237, "step": 20162 }, { "epoch": 1.59, "learning_rate": 0.00013642907437019024, "loss": 1.5044, "step": 20163 }, { "epoch": 1.59, "learning_rate": 0.00013641676538825605, "loss": 1.4957, "step": 20164 }, { "epoch": 1.59, "learning_rate": 0.0001364044564985445, "loss": 1.5243, "step": 20165 }, { "epoch": 1.59, "learning_rate": 0.00013639214770113923, "loss": 1.5245, "step": 20166 }, { "epoch": 1.59, "learning_rate": 0.00013637983899612372, "loss": 1.5074, "step": 20167 }, { "epoch": 1.59, "learning_rate": 0.0001363675303835816, "loss": 1.4888, "step": 20168 }, { "epoch": 1.59, "learning_rate": 0.00013635522186359646, "loss": 1.5253, "step": 20169 }, { "epoch": 1.59, "learning_rate": 0.00013634291343625178, "loss": 1.5057, "step": 20170 }, { "epoch": 1.59, "learning_rate": 0.00013633060510163125, "loss": 1.465, "step": 20171 }, { "epoch": 1.59, "learning_rate": 0.00013631829685981824, "loss": 1.5175, "step": 20172 }, { "epoch": 1.59, "learning_rate": 0.00013630598871089655, "loss": 1.4737, "step": 20173 }, { "epoch": 1.59, "learning_rate": 0.00013629368065494962, "loss": 1.516, "step": 20174 }, { "epoch": 1.59, "learning_rate": 0.00013628137269206106, "loss": 1.487, "step": 20175 }, { "epoch": 1.59, "learning_rate": 0.00013626906482231435, "loss": 1.4825, "step": 20176 }, { "epoch": 1.59, "learning_rate": 0.00013625675704579315, "loss": 1.5055, "step": 20177 }, { "epoch": 1.59, "learning_rate": 0.00013624444936258102, "loss": 1.4994, "step": 20178 }, { "epoch": 1.59, "learning_rate": 0.0001362321417727614, "loss": 1.5507, "step": 20179 }, { "epoch": 1.59, "learning_rate": 0.00013621983427641803, "loss": 1.5156, "step": 20180 }, { "epoch": 1.59, "learning_rate": 0.00013620752687363433, "loss": 1.4938, "step": 20181 }, { "epoch": 1.59, "learning_rate": 0.00013619521956449393, "loss": 1.522, "step": 20182 }, { "epoch": 1.59, "learning_rate": 0.00013618291234908036, "loss": 1.5327, "step": 20183 }, { "epoch": 1.59, "learning_rate": 0.00013617060522747718, "loss": 1.4736, "step": 20184 }, { "epoch": 1.59, "learning_rate": 0.00013615829819976796, "loss": 1.4883, "step": 20185 }, { "epoch": 1.59, "learning_rate": 0.0001361459912660363, "loss": 1.4989, "step": 20186 }, { "epoch": 1.59, "learning_rate": 0.00013613368442636566, "loss": 1.4714, "step": 20187 }, { "epoch": 1.59, "learning_rate": 0.00013612137768083963, "loss": 1.5382, "step": 20188 }, { "epoch": 1.59, "learning_rate": 0.00013610907102954182, "loss": 1.5072, "step": 20189 }, { "epoch": 1.59, "learning_rate": 0.00013609676447255578, "loss": 1.4742, "step": 20190 }, { "epoch": 1.59, "learning_rate": 0.00013608445800996502, "loss": 1.5137, "step": 20191 }, { "epoch": 1.59, "learning_rate": 0.00013607215164185312, "loss": 1.5171, "step": 20192 }, { "epoch": 1.59, "learning_rate": 0.0001360598453683036, "loss": 1.52, "step": 20193 }, { "epoch": 1.59, "learning_rate": 0.00013604753918940006, "loss": 1.4927, "step": 20194 }, { "epoch": 1.59, "learning_rate": 0.00013603523310522602, "loss": 1.5349, "step": 20195 }, { "epoch": 1.59, "learning_rate": 0.00013602292711586503, "loss": 1.5386, "step": 20196 }, { "epoch": 1.59, "learning_rate": 0.00013601062122140065, "loss": 1.534, "step": 20197 }, { "epoch": 1.59, "learning_rate": 0.00013599831542191647, "loss": 1.5014, "step": 20198 }, { "epoch": 1.59, "learning_rate": 0.00013598600971749595, "loss": 1.4794, "step": 20199 }, { "epoch": 1.59, "learning_rate": 0.00013597370410822277, "loss": 1.4526, "step": 20200 }, { "epoch": 1.59, "learning_rate": 0.00013596139859418032, "loss": 1.4792, "step": 20201 }, { "epoch": 1.59, "learning_rate": 0.00013594909317545225, "loss": 1.4897, "step": 20202 }, { "epoch": 1.59, "learning_rate": 0.00013593678785212202, "loss": 1.5052, "step": 20203 }, { "epoch": 1.59, "learning_rate": 0.00013592448262427336, "loss": 1.5789, "step": 20204 }, { "epoch": 1.59, "learning_rate": 0.0001359121774919896, "loss": 1.5171, "step": 20205 }, { "epoch": 1.59, "learning_rate": 0.00013589987245535442, "loss": 1.5611, "step": 20206 }, { "epoch": 1.59, "learning_rate": 0.00013588756751445135, "loss": 1.5044, "step": 20207 }, { "epoch": 1.59, "learning_rate": 0.00013587526266936386, "loss": 1.5364, "step": 20208 }, { "epoch": 1.59, "learning_rate": 0.00013586295792017555, "loss": 1.5361, "step": 20209 }, { "epoch": 1.59, "learning_rate": 0.00013585065326697, "loss": 1.5091, "step": 20210 }, { "epoch": 1.59, "learning_rate": 0.00013583834870983067, "loss": 1.524, "step": 20211 }, { "epoch": 1.59, "learning_rate": 0.00013582604424884116, "loss": 1.444, "step": 20212 }, { "epoch": 1.59, "learning_rate": 0.00013581373988408497, "loss": 1.4891, "step": 20213 }, { "epoch": 1.59, "learning_rate": 0.00013580143561564564, "loss": 1.5714, "step": 20214 }, { "epoch": 1.59, "learning_rate": 0.00013578913144360677, "loss": 1.4947, "step": 20215 }, { "epoch": 1.59, "learning_rate": 0.0001357768273680518, "loss": 1.5416, "step": 20216 }, { "epoch": 1.59, "learning_rate": 0.0001357645233890644, "loss": 1.5265, "step": 20217 }, { "epoch": 1.59, "learning_rate": 0.00013575221950672798, "loss": 1.5373, "step": 20218 }, { "epoch": 1.59, "learning_rate": 0.00013573991572112608, "loss": 1.4891, "step": 20219 }, { "epoch": 1.59, "learning_rate": 0.00013572761203234232, "loss": 1.4997, "step": 20220 }, { "epoch": 1.59, "learning_rate": 0.00013571530844046022, "loss": 1.4879, "step": 20221 }, { "epoch": 1.59, "learning_rate": 0.00013570300494556328, "loss": 1.5023, "step": 20222 }, { "epoch": 1.59, "learning_rate": 0.00013569070154773505, "loss": 1.5475, "step": 20223 }, { "epoch": 1.59, "learning_rate": 0.00013567839824705908, "loss": 1.505, "step": 20224 }, { "epoch": 1.59, "learning_rate": 0.00013566609504361886, "loss": 1.4703, "step": 20225 }, { "epoch": 1.59, "learning_rate": 0.00013565379193749793, "loss": 1.4899, "step": 20226 }, { "epoch": 1.59, "learning_rate": 0.00013564148892877988, "loss": 1.5053, "step": 20227 }, { "epoch": 1.59, "learning_rate": 0.00013562918601754817, "loss": 1.5104, "step": 20228 }, { "epoch": 1.59, "learning_rate": 0.00013561688320388638, "loss": 1.4796, "step": 20229 }, { "epoch": 1.59, "learning_rate": 0.00013560458048787798, "loss": 1.4553, "step": 20230 }, { "epoch": 1.59, "learning_rate": 0.00013559227786960653, "loss": 1.474, "step": 20231 }, { "epoch": 1.59, "learning_rate": 0.00013557997534915562, "loss": 1.477, "step": 20232 }, { "epoch": 1.59, "learning_rate": 0.00013556767292660865, "loss": 1.5818, "step": 20233 }, { "epoch": 1.59, "learning_rate": 0.00013555537060204925, "loss": 1.5021, "step": 20234 }, { "epoch": 1.59, "learning_rate": 0.00013554306837556084, "loss": 1.5108, "step": 20235 }, { "epoch": 1.59, "learning_rate": 0.00013553076624722713, "loss": 1.5081, "step": 20236 }, { "epoch": 1.59, "learning_rate": 0.00013551846421713148, "loss": 1.4822, "step": 20237 }, { "epoch": 1.59, "learning_rate": 0.00013550616228535743, "loss": 1.5389, "step": 20238 }, { "epoch": 1.59, "learning_rate": 0.00013549386045198864, "loss": 1.525, "step": 20239 }, { "epoch": 1.59, "learning_rate": 0.00013548155871710845, "loss": 1.5017, "step": 20240 }, { "epoch": 1.59, "learning_rate": 0.00013546925708080054, "loss": 1.5565, "step": 20241 }, { "epoch": 1.59, "learning_rate": 0.00013545695554314827, "loss": 1.498, "step": 20242 }, { "epoch": 1.59, "learning_rate": 0.00013544465410423527, "loss": 1.5239, "step": 20243 }, { "epoch": 1.59, "learning_rate": 0.0001354323527641451, "loss": 1.4863, "step": 20244 }, { "epoch": 1.59, "learning_rate": 0.00013542005152296114, "loss": 1.484, "step": 20245 }, { "epoch": 1.59, "learning_rate": 0.00013540775038076703, "loss": 1.5263, "step": 20246 }, { "epoch": 1.59, "learning_rate": 0.0001353954493376462, "loss": 1.4647, "step": 20247 }, { "epoch": 1.59, "learning_rate": 0.00013538314839368223, "loss": 1.5547, "step": 20248 }, { "epoch": 1.59, "learning_rate": 0.00013537084754895864, "loss": 1.5202, "step": 20249 }, { "epoch": 1.59, "learning_rate": 0.0001353585468035589, "loss": 1.5005, "step": 20250 }, { "epoch": 1.59, "learning_rate": 0.0001353462461575665, "loss": 1.4579, "step": 20251 }, { "epoch": 1.59, "learning_rate": 0.00013533394561106505, "loss": 1.5178, "step": 20252 }, { "epoch": 1.59, "learning_rate": 0.00013532164516413803, "loss": 1.563, "step": 20253 }, { "epoch": 1.59, "learning_rate": 0.00013530934481686892, "loss": 1.4895, "step": 20254 }, { "epoch": 1.59, "learning_rate": 0.00013529704456934123, "loss": 1.5513, "step": 20255 }, { "epoch": 1.59, "learning_rate": 0.00013528474442163854, "loss": 1.512, "step": 20256 }, { "epoch": 1.59, "learning_rate": 0.00013527244437384428, "loss": 1.5263, "step": 20257 }, { "epoch": 1.59, "learning_rate": 0.00013526014442604204, "loss": 1.52, "step": 20258 }, { "epoch": 1.59, "learning_rate": 0.00013524784457831526, "loss": 1.5247, "step": 20259 }, { "epoch": 1.59, "learning_rate": 0.00013523554483074745, "loss": 1.4563, "step": 20260 }, { "epoch": 1.59, "learning_rate": 0.00013522324518342217, "loss": 1.4799, "step": 20261 }, { "epoch": 1.59, "learning_rate": 0.00013521094563642287, "loss": 1.5086, "step": 20262 }, { "epoch": 1.59, "learning_rate": 0.00013519864618983314, "loss": 1.4934, "step": 20263 }, { "epoch": 1.59, "learning_rate": 0.0001351863468437364, "loss": 1.5448, "step": 20264 }, { "epoch": 1.59, "learning_rate": 0.00013517404759821617, "loss": 1.4388, "step": 20265 }, { "epoch": 1.59, "learning_rate": 0.00013516174845335598, "loss": 1.5099, "step": 20266 }, { "epoch": 1.59, "learning_rate": 0.00013514944940923933, "loss": 1.5241, "step": 20267 }, { "epoch": 1.59, "learning_rate": 0.00013513715046594978, "loss": 1.4608, "step": 20268 }, { "epoch": 1.59, "learning_rate": 0.0001351248516235707, "loss": 1.4341, "step": 20269 }, { "epoch": 1.59, "learning_rate": 0.00013511255288218576, "loss": 1.5296, "step": 20270 }, { "epoch": 1.59, "learning_rate": 0.0001351002542418783, "loss": 1.5151, "step": 20271 }, { "epoch": 1.6, "learning_rate": 0.0001350879557027319, "loss": 1.5172, "step": 20272 }, { "epoch": 1.6, "learning_rate": 0.0001350756572648301, "loss": 1.5292, "step": 20273 }, { "epoch": 1.6, "learning_rate": 0.00013506335892825628, "loss": 1.4729, "step": 20274 }, { "epoch": 1.6, "learning_rate": 0.00013505106069309407, "loss": 1.531, "step": 20275 }, { "epoch": 1.6, "learning_rate": 0.00013503876255942688, "loss": 1.4994, "step": 20276 }, { "epoch": 1.6, "learning_rate": 0.00013502646452733823, "loss": 1.4935, "step": 20277 }, { "epoch": 1.6, "learning_rate": 0.00013501416659691165, "loss": 1.5136, "step": 20278 }, { "epoch": 1.6, "learning_rate": 0.00013500186876823058, "loss": 1.5178, "step": 20279 }, { "epoch": 1.6, "learning_rate": 0.00013498957104137854, "loss": 1.522, "step": 20280 }, { "epoch": 1.6, "learning_rate": 0.00013497727341643906, "loss": 1.4833, "step": 20281 }, { "epoch": 1.6, "learning_rate": 0.00013496497589349555, "loss": 1.4914, "step": 20282 }, { "epoch": 1.6, "learning_rate": 0.00013495267847263157, "loss": 1.5221, "step": 20283 }, { "epoch": 1.6, "learning_rate": 0.0001349403811539306, "loss": 1.487, "step": 20284 }, { "epoch": 1.6, "learning_rate": 0.0001349280839374762, "loss": 1.5665, "step": 20285 }, { "epoch": 1.6, "learning_rate": 0.00013491578682335172, "loss": 1.5458, "step": 20286 }, { "epoch": 1.6, "learning_rate": 0.00013490348981164078, "loss": 1.5223, "step": 20287 }, { "epoch": 1.6, "learning_rate": 0.00013489119290242677, "loss": 1.5478, "step": 20288 }, { "epoch": 1.6, "learning_rate": 0.00013487889609579322, "loss": 1.5165, "step": 20289 }, { "epoch": 1.6, "learning_rate": 0.00013486659939182367, "loss": 1.5209, "step": 20290 }, { "epoch": 1.6, "learning_rate": 0.00013485430279060152, "loss": 1.5295, "step": 20291 }, { "epoch": 1.6, "learning_rate": 0.00013484200629221028, "loss": 1.4568, "step": 20292 }, { "epoch": 1.6, "learning_rate": 0.0001348297098967335, "loss": 1.4755, "step": 20293 }, { "epoch": 1.6, "learning_rate": 0.00013481741360425457, "loss": 1.5107, "step": 20294 }, { "epoch": 1.6, "learning_rate": 0.00013480511741485707, "loss": 1.5039, "step": 20295 }, { "epoch": 1.6, "learning_rate": 0.0001347928213286244, "loss": 1.5132, "step": 20296 }, { "epoch": 1.6, "learning_rate": 0.0001347805253456401, "loss": 1.5393, "step": 20297 }, { "epoch": 1.6, "learning_rate": 0.00013476822946598756, "loss": 1.5013, "step": 20298 }, { "epoch": 1.6, "learning_rate": 0.00013475593368975043, "loss": 1.508, "step": 20299 }, { "epoch": 1.6, "learning_rate": 0.00013474363801701207, "loss": 1.5286, "step": 20300 }, { "epoch": 1.6, "learning_rate": 0.00013473134244785598, "loss": 1.4986, "step": 20301 }, { "epoch": 1.6, "learning_rate": 0.0001347190469823657, "loss": 1.4826, "step": 20302 }, { "epoch": 1.6, "learning_rate": 0.00013470675162062458, "loss": 1.5666, "step": 20303 }, { "epoch": 1.6, "learning_rate": 0.00013469445636271626, "loss": 1.468, "step": 20304 }, { "epoch": 1.6, "learning_rate": 0.00013468216120872406, "loss": 1.5207, "step": 20305 }, { "epoch": 1.6, "learning_rate": 0.00013466986615873157, "loss": 1.5489, "step": 20306 }, { "epoch": 1.6, "learning_rate": 0.00013465757121282224, "loss": 1.4843, "step": 20307 }, { "epoch": 1.6, "learning_rate": 0.00013464527637107947, "loss": 1.5601, "step": 20308 }, { "epoch": 1.6, "learning_rate": 0.00013463298163358687, "loss": 1.5315, "step": 20309 }, { "epoch": 1.6, "learning_rate": 0.00013462068700042783, "loss": 1.4437, "step": 20310 }, { "epoch": 1.6, "learning_rate": 0.00013460839247168583, "loss": 1.5685, "step": 20311 }, { "epoch": 1.6, "learning_rate": 0.00013459609804744436, "loss": 1.5703, "step": 20312 }, { "epoch": 1.6, "learning_rate": 0.0001345838037277868, "loss": 1.5057, "step": 20313 }, { "epoch": 1.6, "learning_rate": 0.0001345715095127968, "loss": 1.5014, "step": 20314 }, { "epoch": 1.6, "learning_rate": 0.0001345592154025577, "loss": 1.4878, "step": 20315 }, { "epoch": 1.6, "learning_rate": 0.00013454692139715303, "loss": 1.5056, "step": 20316 }, { "epoch": 1.6, "learning_rate": 0.00013453462749666624, "loss": 1.5197, "step": 20317 }, { "epoch": 1.6, "learning_rate": 0.00013452233370118077, "loss": 1.5381, "step": 20318 }, { "epoch": 1.6, "learning_rate": 0.00013451004001078013, "loss": 1.5382, "step": 20319 }, { "epoch": 1.6, "learning_rate": 0.00013449774642554778, "loss": 1.5549, "step": 20320 }, { "epoch": 1.6, "learning_rate": 0.00013448545294556715, "loss": 1.5151, "step": 20321 }, { "epoch": 1.6, "learning_rate": 0.00013447315957092177, "loss": 1.5375, "step": 20322 }, { "epoch": 1.6, "learning_rate": 0.00013446086630169502, "loss": 1.4846, "step": 20323 }, { "epoch": 1.6, "learning_rate": 0.00013444857313797044, "loss": 1.5481, "step": 20324 }, { "epoch": 1.6, "learning_rate": 0.00013443628007983146, "loss": 1.4613, "step": 20325 }, { "epoch": 1.6, "learning_rate": 0.00013442398712736154, "loss": 1.5137, "step": 20326 }, { "epoch": 1.6, "learning_rate": 0.00013441169428064418, "loss": 1.5386, "step": 20327 }, { "epoch": 1.6, "learning_rate": 0.0001343994015397628, "loss": 1.5367, "step": 20328 }, { "epoch": 1.6, "learning_rate": 0.00013438710890480084, "loss": 1.496, "step": 20329 }, { "epoch": 1.6, "learning_rate": 0.0001343748163758418, "loss": 1.5233, "step": 20330 }, { "epoch": 1.6, "learning_rate": 0.00013436252395296919, "loss": 1.5818, "step": 20331 }, { "epoch": 1.6, "learning_rate": 0.00013435023163626636, "loss": 1.5034, "step": 20332 }, { "epoch": 1.6, "learning_rate": 0.00013433793942581687, "loss": 1.479, "step": 20333 }, { "epoch": 1.6, "learning_rate": 0.00013432564732170408, "loss": 1.5003, "step": 20334 }, { "epoch": 1.6, "learning_rate": 0.0001343133553240115, "loss": 1.5257, "step": 20335 }, { "epoch": 1.6, "learning_rate": 0.00013430106343282263, "loss": 1.5353, "step": 20336 }, { "epoch": 1.6, "learning_rate": 0.00013428877164822084, "loss": 1.5116, "step": 20337 }, { "epoch": 1.6, "learning_rate": 0.00013427647997028963, "loss": 1.5062, "step": 20338 }, { "epoch": 1.6, "learning_rate": 0.00013426418839911243, "loss": 1.479, "step": 20339 }, { "epoch": 1.6, "learning_rate": 0.0001342518969347727, "loss": 1.4882, "step": 20340 }, { "epoch": 1.6, "learning_rate": 0.00013423960557735397, "loss": 1.4976, "step": 20341 }, { "epoch": 1.6, "learning_rate": 0.00013422731432693956, "loss": 1.5487, "step": 20342 }, { "epoch": 1.6, "learning_rate": 0.00013421502318361296, "loss": 1.5227, "step": 20343 }, { "epoch": 1.6, "learning_rate": 0.0001342027321474577, "loss": 1.4565, "step": 20344 }, { "epoch": 1.6, "learning_rate": 0.0001341904412185571, "loss": 1.5364, "step": 20345 }, { "epoch": 1.6, "learning_rate": 0.0001341781503969947, "loss": 1.4695, "step": 20346 }, { "epoch": 1.6, "learning_rate": 0.00013416585968285393, "loss": 1.4881, "step": 20347 }, { "epoch": 1.6, "learning_rate": 0.00013415356907621828, "loss": 1.509, "step": 20348 }, { "epoch": 1.6, "learning_rate": 0.0001341412785771711, "loss": 1.4907, "step": 20349 }, { "epoch": 1.6, "learning_rate": 0.00013412898818579593, "loss": 1.499, "step": 20350 }, { "epoch": 1.6, "learning_rate": 0.00013411669790217617, "loss": 1.5189, "step": 20351 }, { "epoch": 1.6, "learning_rate": 0.00013410440772639522, "loss": 1.5551, "step": 20352 }, { "epoch": 1.6, "learning_rate": 0.00013409211765853663, "loss": 1.4816, "step": 20353 }, { "epoch": 1.6, "learning_rate": 0.00013407982769868374, "loss": 1.5271, "step": 20354 }, { "epoch": 1.6, "learning_rate": 0.00013406753784692003, "loss": 1.5162, "step": 20355 }, { "epoch": 1.6, "learning_rate": 0.00013405524810332898, "loss": 1.5438, "step": 20356 }, { "epoch": 1.6, "learning_rate": 0.00013404295846799398, "loss": 1.452, "step": 20357 }, { "epoch": 1.6, "learning_rate": 0.0001340306689409985, "loss": 1.4985, "step": 20358 }, { "epoch": 1.6, "learning_rate": 0.00013401837952242593, "loss": 1.5011, "step": 20359 }, { "epoch": 1.6, "learning_rate": 0.00013400609021235974, "loss": 1.4968, "step": 20360 }, { "epoch": 1.6, "learning_rate": 0.00013399380101088336, "loss": 1.4815, "step": 20361 }, { "epoch": 1.6, "learning_rate": 0.00013398151191808028, "loss": 1.5239, "step": 20362 }, { "epoch": 1.6, "learning_rate": 0.0001339692229340339, "loss": 1.5073, "step": 20363 }, { "epoch": 1.6, "learning_rate": 0.00013395693405882762, "loss": 1.5087, "step": 20364 }, { "epoch": 1.6, "learning_rate": 0.00013394464529254492, "loss": 1.4706, "step": 20365 }, { "epoch": 1.6, "learning_rate": 0.0001339323566352692, "loss": 1.5349, "step": 20366 }, { "epoch": 1.6, "learning_rate": 0.00013392006808708392, "loss": 1.5449, "step": 20367 }, { "epoch": 1.6, "learning_rate": 0.00013390777964807253, "loss": 1.4699, "step": 20368 }, { "epoch": 1.6, "learning_rate": 0.00013389549131831842, "loss": 1.5282, "step": 20369 }, { "epoch": 1.6, "learning_rate": 0.00013388320309790506, "loss": 1.4879, "step": 20370 }, { "epoch": 1.6, "learning_rate": 0.00013387091498691584, "loss": 1.5278, "step": 20371 }, { "epoch": 1.6, "learning_rate": 0.00013385862698543418, "loss": 1.4788, "step": 20372 }, { "epoch": 1.6, "learning_rate": 0.00013384633909354357, "loss": 1.5726, "step": 20373 }, { "epoch": 1.6, "learning_rate": 0.00013383405131132739, "loss": 1.4838, "step": 20374 }, { "epoch": 1.6, "learning_rate": 0.00013382176363886908, "loss": 1.5621, "step": 20375 }, { "epoch": 1.6, "learning_rate": 0.000133809476076252, "loss": 1.4467, "step": 20376 }, { "epoch": 1.6, "learning_rate": 0.00013379718862355973, "loss": 1.503, "step": 20377 }, { "epoch": 1.6, "learning_rate": 0.00013378490128087558, "loss": 1.4803, "step": 20378 }, { "epoch": 1.6, "learning_rate": 0.000133772614048283, "loss": 1.5404, "step": 20379 }, { "epoch": 1.6, "learning_rate": 0.00013376032692586544, "loss": 1.4766, "step": 20380 }, { "epoch": 1.6, "learning_rate": 0.00013374803991370629, "loss": 1.4931, "step": 20381 }, { "epoch": 1.6, "learning_rate": 0.000133735753011889, "loss": 1.4971, "step": 20382 }, { "epoch": 1.6, "learning_rate": 0.00013372346622049692, "loss": 1.505, "step": 20383 }, { "epoch": 1.6, "learning_rate": 0.00013371117953961354, "loss": 1.5115, "step": 20384 }, { "epoch": 1.6, "learning_rate": 0.00013369889296932229, "loss": 1.4854, "step": 20385 }, { "epoch": 1.6, "learning_rate": 0.00013368660650970652, "loss": 1.4961, "step": 20386 }, { "epoch": 1.6, "learning_rate": 0.00013367432016084973, "loss": 1.4919, "step": 20387 }, { "epoch": 1.6, "learning_rate": 0.00013366203392283527, "loss": 1.4693, "step": 20388 }, { "epoch": 1.6, "learning_rate": 0.00013364974779574658, "loss": 1.5126, "step": 20389 }, { "epoch": 1.6, "learning_rate": 0.0001336374617796671, "loss": 1.4486, "step": 20390 }, { "epoch": 1.6, "learning_rate": 0.00013362517587468023, "loss": 1.4843, "step": 20391 }, { "epoch": 1.6, "learning_rate": 0.0001336128900808693, "loss": 1.5067, "step": 20392 }, { "epoch": 1.6, "learning_rate": 0.00013360060439831785, "loss": 1.5117, "step": 20393 }, { "epoch": 1.6, "learning_rate": 0.0001335883188271093, "loss": 1.4951, "step": 20394 }, { "epoch": 1.6, "learning_rate": 0.00013357603336732694, "loss": 1.4696, "step": 20395 }, { "epoch": 1.6, "learning_rate": 0.00013356374801905429, "loss": 1.5101, "step": 20396 }, { "epoch": 1.6, "learning_rate": 0.00013355146278237474, "loss": 1.5315, "step": 20397 }, { "epoch": 1.6, "learning_rate": 0.00013353917765737163, "loss": 1.4699, "step": 20398 }, { "epoch": 1.61, "learning_rate": 0.00013352689264412845, "loss": 1.5239, "step": 20399 }, { "epoch": 1.61, "learning_rate": 0.00013351460774272856, "loss": 1.5149, "step": 20400 }, { "epoch": 1.61, "learning_rate": 0.0001335023229532554, "loss": 1.4676, "step": 20401 }, { "epoch": 1.61, "learning_rate": 0.00013349003827579236, "loss": 1.5279, "step": 20402 }, { "epoch": 1.61, "learning_rate": 0.00013347775371042286, "loss": 1.4937, "step": 20403 }, { "epoch": 1.61, "learning_rate": 0.00013346546925723028, "loss": 1.4925, "step": 20404 }, { "epoch": 1.61, "learning_rate": 0.00013345318491629805, "loss": 1.5406, "step": 20405 }, { "epoch": 1.61, "learning_rate": 0.00013344090068770955, "loss": 1.5307, "step": 20406 }, { "epoch": 1.61, "learning_rate": 0.0001334286165715482, "loss": 1.487, "step": 20407 }, { "epoch": 1.61, "learning_rate": 0.00013341633256789735, "loss": 1.4442, "step": 20408 }, { "epoch": 1.61, "learning_rate": 0.00013340404867684052, "loss": 1.5029, "step": 20409 }, { "epoch": 1.61, "learning_rate": 0.00013339176489846101, "loss": 1.4927, "step": 20410 }, { "epoch": 1.61, "learning_rate": 0.0001333794812328423, "loss": 1.5593, "step": 20411 }, { "epoch": 1.61, "learning_rate": 0.0001333671976800677, "loss": 1.5502, "step": 20412 }, { "epoch": 1.61, "learning_rate": 0.00013335491424022064, "loss": 1.5452, "step": 20413 }, { "epoch": 1.61, "learning_rate": 0.00013334263091338455, "loss": 1.5532, "step": 20414 }, { "epoch": 1.61, "learning_rate": 0.00013333034769964276, "loss": 1.5186, "step": 20415 }, { "epoch": 1.61, "learning_rate": 0.00013331806459907877, "loss": 1.5204, "step": 20416 }, { "epoch": 1.61, "learning_rate": 0.00013330578161177588, "loss": 1.4647, "step": 20417 }, { "epoch": 1.61, "learning_rate": 0.00013329349873781752, "loss": 1.5052, "step": 20418 }, { "epoch": 1.61, "learning_rate": 0.00013328121597728712, "loss": 1.5043, "step": 20419 }, { "epoch": 1.61, "learning_rate": 0.000133268933330268, "loss": 1.5222, "step": 20420 }, { "epoch": 1.61, "learning_rate": 0.00013325665079684358, "loss": 1.4711, "step": 20421 }, { "epoch": 1.61, "learning_rate": 0.00013324436837709733, "loss": 1.5061, "step": 20422 }, { "epoch": 1.61, "learning_rate": 0.00013323208607111248, "loss": 1.508, "step": 20423 }, { "epoch": 1.61, "learning_rate": 0.00013321980387897254, "loss": 1.497, "step": 20424 }, { "epoch": 1.61, "learning_rate": 0.00013320752180076087, "loss": 1.5778, "step": 20425 }, { "epoch": 1.61, "learning_rate": 0.0001331952398365609, "loss": 1.5328, "step": 20426 }, { "epoch": 1.61, "learning_rate": 0.00013318295798645595, "loss": 1.4575, "step": 20427 }, { "epoch": 1.61, "learning_rate": 0.00013317067625052945, "loss": 1.4943, "step": 20428 }, { "epoch": 1.61, "learning_rate": 0.00013315839462886474, "loss": 1.4828, "step": 20429 }, { "epoch": 1.61, "learning_rate": 0.00013314611312154525, "loss": 1.4555, "step": 20430 }, { "epoch": 1.61, "learning_rate": 0.0001331338317286544, "loss": 1.4975, "step": 20431 }, { "epoch": 1.61, "learning_rate": 0.00013312155045027546, "loss": 1.5701, "step": 20432 }, { "epoch": 1.61, "learning_rate": 0.0001331092692864919, "loss": 1.4961, "step": 20433 }, { "epoch": 1.61, "learning_rate": 0.0001330969882373871, "loss": 1.5192, "step": 20434 }, { "epoch": 1.61, "learning_rate": 0.0001330847073030444, "loss": 1.5318, "step": 20435 }, { "epoch": 1.61, "learning_rate": 0.00013307242648354724, "loss": 1.4979, "step": 20436 }, { "epoch": 1.61, "learning_rate": 0.0001330601457789789, "loss": 1.4981, "step": 20437 }, { "epoch": 1.61, "learning_rate": 0.00013304786518942286, "loss": 1.458, "step": 20438 }, { "epoch": 1.61, "learning_rate": 0.00013303558471496242, "loss": 1.5021, "step": 20439 }, { "epoch": 1.61, "learning_rate": 0.00013302330435568103, "loss": 1.4848, "step": 20440 }, { "epoch": 1.61, "learning_rate": 0.00013301102411166204, "loss": 1.4912, "step": 20441 }, { "epoch": 1.61, "learning_rate": 0.0001329987439829888, "loss": 1.5101, "step": 20442 }, { "epoch": 1.61, "learning_rate": 0.00013298646396974473, "loss": 1.5011, "step": 20443 }, { "epoch": 1.61, "learning_rate": 0.00013297418407201317, "loss": 1.5129, "step": 20444 }, { "epoch": 1.61, "learning_rate": 0.00013296190428987753, "loss": 1.4429, "step": 20445 }, { "epoch": 1.61, "learning_rate": 0.00013294962462342112, "loss": 1.5352, "step": 20446 }, { "epoch": 1.61, "learning_rate": 0.00013293734507272738, "loss": 1.5284, "step": 20447 }, { "epoch": 1.61, "learning_rate": 0.00013292506563787964, "loss": 1.4904, "step": 20448 }, { "epoch": 1.61, "learning_rate": 0.00013291278631896128, "loss": 1.4739, "step": 20449 }, { "epoch": 1.61, "learning_rate": 0.00013290050711605564, "loss": 1.5073, "step": 20450 }, { "epoch": 1.61, "learning_rate": 0.00013288822802924618, "loss": 1.4637, "step": 20451 }, { "epoch": 1.61, "learning_rate": 0.00013287594905861616, "loss": 1.5609, "step": 20452 }, { "epoch": 1.61, "learning_rate": 0.00013286367020424905, "loss": 1.4938, "step": 20453 }, { "epoch": 1.61, "learning_rate": 0.0001328513914662281, "loss": 1.547, "step": 20454 }, { "epoch": 1.61, "learning_rate": 0.00013283911284463673, "loss": 1.5346, "step": 20455 }, { "epoch": 1.61, "learning_rate": 0.00013282683433955836, "loss": 1.4809, "step": 20456 }, { "epoch": 1.61, "learning_rate": 0.0001328145559510763, "loss": 1.4952, "step": 20457 }, { "epoch": 1.61, "learning_rate": 0.0001328022776792739, "loss": 1.5049, "step": 20458 }, { "epoch": 1.61, "learning_rate": 0.00013278999952423456, "loss": 1.5244, "step": 20459 }, { "epoch": 1.61, "learning_rate": 0.00013277772148604167, "loss": 1.4631, "step": 20460 }, { "epoch": 1.61, "learning_rate": 0.0001327654435647785, "loss": 1.5093, "step": 20461 }, { "epoch": 1.61, "learning_rate": 0.00013275316576052843, "loss": 1.4791, "step": 20462 }, { "epoch": 1.61, "learning_rate": 0.0001327408880733749, "loss": 1.5169, "step": 20463 }, { "epoch": 1.61, "learning_rate": 0.0001327286105034012, "loss": 1.4896, "step": 20464 }, { "epoch": 1.61, "learning_rate": 0.0001327163330506907, "loss": 1.5095, "step": 20465 }, { "epoch": 1.61, "learning_rate": 0.00013270405571532676, "loss": 1.5483, "step": 20466 }, { "epoch": 1.61, "learning_rate": 0.0001326917784973927, "loss": 1.5154, "step": 20467 }, { "epoch": 1.61, "learning_rate": 0.000132679501396972, "loss": 1.5143, "step": 20468 }, { "epoch": 1.61, "learning_rate": 0.00013266722441414785, "loss": 1.4992, "step": 20469 }, { "epoch": 1.61, "learning_rate": 0.00013265494754900376, "loss": 1.533, "step": 20470 }, { "epoch": 1.61, "learning_rate": 0.00013264267080162286, "loss": 1.5055, "step": 20471 }, { "epoch": 1.61, "learning_rate": 0.00013263039417208878, "loss": 1.4789, "step": 20472 }, { "epoch": 1.61, "learning_rate": 0.0001326181176604847, "loss": 1.5, "step": 20473 }, { "epoch": 1.61, "learning_rate": 0.000132605841266894, "loss": 1.4974, "step": 20474 }, { "epoch": 1.61, "learning_rate": 0.00013259356499140001, "loss": 1.4971, "step": 20475 }, { "epoch": 1.61, "learning_rate": 0.00013258128883408618, "loss": 1.5117, "step": 20476 }, { "epoch": 1.61, "learning_rate": 0.00013256901279503575, "loss": 1.5582, "step": 20477 }, { "epoch": 1.61, "learning_rate": 0.0001325567368743321, "loss": 1.5215, "step": 20478 }, { "epoch": 1.61, "learning_rate": 0.00013254446107205858, "loss": 1.4764, "step": 20479 }, { "epoch": 1.61, "learning_rate": 0.00013253218538829853, "loss": 1.5552, "step": 20480 }, { "epoch": 1.61, "learning_rate": 0.0001325199098231353, "loss": 1.5506, "step": 20481 }, { "epoch": 1.61, "learning_rate": 0.00013250763437665228, "loss": 1.5052, "step": 20482 }, { "epoch": 1.61, "learning_rate": 0.00013249535904893273, "loss": 1.5554, "step": 20483 }, { "epoch": 1.61, "learning_rate": 0.00013248308384006003, "loss": 1.5495, "step": 20484 }, { "epoch": 1.61, "learning_rate": 0.00013247080875011756, "loss": 1.5631, "step": 20485 }, { "epoch": 1.61, "learning_rate": 0.00013245853377918856, "loss": 1.5014, "step": 20486 }, { "epoch": 1.61, "learning_rate": 0.00013244625892735646, "loss": 1.4921, "step": 20487 }, { "epoch": 1.61, "learning_rate": 0.00013243398419470457, "loss": 1.589, "step": 20488 }, { "epoch": 1.61, "learning_rate": 0.00013242170958131628, "loss": 1.554, "step": 20489 }, { "epoch": 1.61, "learning_rate": 0.00013240943508727486, "loss": 1.5016, "step": 20490 }, { "epoch": 1.61, "learning_rate": 0.00013239716071266364, "loss": 1.4586, "step": 20491 }, { "epoch": 1.61, "learning_rate": 0.00013238488645756605, "loss": 1.5262, "step": 20492 }, { "epoch": 1.61, "learning_rate": 0.0001323726123220653, "loss": 1.5285, "step": 20493 }, { "epoch": 1.61, "learning_rate": 0.00013236033830624482, "loss": 1.5175, "step": 20494 }, { "epoch": 1.61, "learning_rate": 0.00013234806441018786, "loss": 1.508, "step": 20495 }, { "epoch": 1.61, "learning_rate": 0.00013233579063397783, "loss": 1.476, "step": 20496 }, { "epoch": 1.61, "learning_rate": 0.00013232351697769806, "loss": 1.4827, "step": 20497 }, { "epoch": 1.61, "learning_rate": 0.00013231124344143184, "loss": 1.5303, "step": 20498 }, { "epoch": 1.61, "learning_rate": 0.00013229897002526252, "loss": 1.5045, "step": 20499 }, { "epoch": 1.61, "learning_rate": 0.0001322866967292734, "loss": 1.5453, "step": 20500 }, { "epoch": 1.61, "learning_rate": 0.00013227442355354783, "loss": 1.542, "step": 20501 }, { "epoch": 1.61, "learning_rate": 0.00013226215049816912, "loss": 1.5094, "step": 20502 }, { "epoch": 1.61, "learning_rate": 0.00013224987756322066, "loss": 1.4968, "step": 20503 }, { "epoch": 1.61, "learning_rate": 0.00013223760474878574, "loss": 1.5106, "step": 20504 }, { "epoch": 1.61, "learning_rate": 0.00013222533205494767, "loss": 1.4636, "step": 20505 }, { "epoch": 1.61, "learning_rate": 0.0001322130594817898, "loss": 1.5307, "step": 20506 }, { "epoch": 1.61, "learning_rate": 0.00013220078702939545, "loss": 1.454, "step": 20507 }, { "epoch": 1.61, "learning_rate": 0.0001321885146978479, "loss": 1.5118, "step": 20508 }, { "epoch": 1.61, "learning_rate": 0.00013217624248723053, "loss": 1.4582, "step": 20509 }, { "epoch": 1.61, "learning_rate": 0.00013216397039762662, "loss": 1.4519, "step": 20510 }, { "epoch": 1.61, "learning_rate": 0.00013215169842911955, "loss": 1.5359, "step": 20511 }, { "epoch": 1.61, "learning_rate": 0.00013213942658179254, "loss": 1.5546, "step": 20512 }, { "epoch": 1.61, "learning_rate": 0.000132127154855729, "loss": 1.5124, "step": 20513 }, { "epoch": 1.61, "learning_rate": 0.00013211488325101222, "loss": 1.4974, "step": 20514 }, { "epoch": 1.61, "learning_rate": 0.0001321026117677255, "loss": 1.4694, "step": 20515 }, { "epoch": 1.61, "learning_rate": 0.00013209034040595214, "loss": 1.5241, "step": 20516 }, { "epoch": 1.61, "learning_rate": 0.00013207806916577556, "loss": 1.5283, "step": 20517 }, { "epoch": 1.61, "learning_rate": 0.0001320657980472789, "loss": 1.4653, "step": 20518 }, { "epoch": 1.61, "learning_rate": 0.00013205352705054563, "loss": 1.5205, "step": 20519 }, { "epoch": 1.61, "learning_rate": 0.000132041256175659, "loss": 1.4989, "step": 20520 }, { "epoch": 1.61, "learning_rate": 0.00013202898542270236, "loss": 1.4633, "step": 20521 }, { "epoch": 1.61, "learning_rate": 0.00013201671479175895, "loss": 1.5146, "step": 20522 }, { "epoch": 1.61, "learning_rate": 0.00013200444428291218, "loss": 1.4956, "step": 20523 }, { "epoch": 1.61, "learning_rate": 0.00013199217389624527, "loss": 1.5107, "step": 20524 }, { "epoch": 1.61, "learning_rate": 0.00013197990363184153, "loss": 1.5309, "step": 20525 }, { "epoch": 1.62, "learning_rate": 0.00013196763348978434, "loss": 1.471, "step": 20526 }, { "epoch": 1.62, "learning_rate": 0.00013195536347015697, "loss": 1.5325, "step": 20527 }, { "epoch": 1.62, "learning_rate": 0.0001319430935730427, "loss": 1.4645, "step": 20528 }, { "epoch": 1.62, "learning_rate": 0.00013193082379852489, "loss": 1.4787, "step": 20529 }, { "epoch": 1.62, "learning_rate": 0.00013191855414668678, "loss": 1.4947, "step": 20530 }, { "epoch": 1.62, "learning_rate": 0.00013190628461761173, "loss": 1.4786, "step": 20531 }, { "epoch": 1.62, "learning_rate": 0.000131894015211383, "loss": 1.5111, "step": 20532 }, { "epoch": 1.62, "learning_rate": 0.0001318817459280839, "loss": 1.5323, "step": 20533 }, { "epoch": 1.62, "learning_rate": 0.00013186947676779777, "loss": 1.4699, "step": 20534 }, { "epoch": 1.62, "learning_rate": 0.00013185720773060792, "loss": 1.4665, "step": 20535 }, { "epoch": 1.62, "learning_rate": 0.0001318449388165976, "loss": 1.4901, "step": 20536 }, { "epoch": 1.62, "learning_rate": 0.0001318326700258501, "loss": 1.4579, "step": 20537 }, { "epoch": 1.62, "learning_rate": 0.00013182040135844878, "loss": 1.4864, "step": 20538 }, { "epoch": 1.62, "learning_rate": 0.0001318081328144769, "loss": 1.47, "step": 20539 }, { "epoch": 1.62, "learning_rate": 0.00013179586439401774, "loss": 1.5123, "step": 20540 }, { "epoch": 1.62, "learning_rate": 0.0001317835960971546, "loss": 1.4549, "step": 20541 }, { "epoch": 1.62, "learning_rate": 0.0001317713279239708, "loss": 1.4728, "step": 20542 }, { "epoch": 1.62, "learning_rate": 0.00013175905987454966, "loss": 1.5168, "step": 20543 }, { "epoch": 1.62, "learning_rate": 0.0001317467919489744, "loss": 1.5244, "step": 20544 }, { "epoch": 1.62, "learning_rate": 0.00013173452414732837, "loss": 1.5006, "step": 20545 }, { "epoch": 1.62, "learning_rate": 0.00013172225646969484, "loss": 1.5187, "step": 20546 }, { "epoch": 1.62, "learning_rate": 0.0001317099889161571, "loss": 1.5103, "step": 20547 }, { "epoch": 1.62, "learning_rate": 0.00013169772148679846, "loss": 1.5107, "step": 20548 }, { "epoch": 1.62, "learning_rate": 0.00013168545418170208, "loss": 1.5296, "step": 20549 }, { "epoch": 1.62, "learning_rate": 0.00013167318700095146, "loss": 1.4712, "step": 20550 }, { "epoch": 1.62, "learning_rate": 0.00013166091994462977, "loss": 1.5238, "step": 20551 }, { "epoch": 1.62, "learning_rate": 0.00013164865301282036, "loss": 1.4975, "step": 20552 }, { "epoch": 1.62, "learning_rate": 0.00013163638620560642, "loss": 1.5645, "step": 20553 }, { "epoch": 1.62, "learning_rate": 0.00013162411952307126, "loss": 1.5504, "step": 20554 }, { "epoch": 1.62, "learning_rate": 0.00013161185296529826, "loss": 1.4981, "step": 20555 }, { "epoch": 1.62, "learning_rate": 0.00013159958653237056, "loss": 1.5108, "step": 20556 }, { "epoch": 1.62, "learning_rate": 0.00013158732022437155, "loss": 1.4786, "step": 20557 }, { "epoch": 1.62, "learning_rate": 0.00013157505404138447, "loss": 1.4833, "step": 20558 }, { "epoch": 1.62, "learning_rate": 0.00013156278798349258, "loss": 1.4699, "step": 20559 }, { "epoch": 1.62, "learning_rate": 0.00013155052205077923, "loss": 1.539, "step": 20560 }, { "epoch": 1.62, "learning_rate": 0.00013153825624332764, "loss": 1.5071, "step": 20561 }, { "epoch": 1.62, "learning_rate": 0.00013152599056122106, "loss": 1.5011, "step": 20562 }, { "epoch": 1.62, "learning_rate": 0.00013151372500454288, "loss": 1.5714, "step": 20563 }, { "epoch": 1.62, "learning_rate": 0.00013150145957337625, "loss": 1.4975, "step": 20564 }, { "epoch": 1.62, "learning_rate": 0.0001314891942678045, "loss": 1.5063, "step": 20565 }, { "epoch": 1.62, "learning_rate": 0.0001314769290879109, "loss": 1.5336, "step": 20566 }, { "epoch": 1.62, "learning_rate": 0.00013146466403377878, "loss": 1.5494, "step": 20567 }, { "epoch": 1.62, "learning_rate": 0.00013145239910549133, "loss": 1.4788, "step": 20568 }, { "epoch": 1.62, "learning_rate": 0.00013144013430313188, "loss": 1.558, "step": 20569 }, { "epoch": 1.62, "learning_rate": 0.00013142786962678366, "loss": 1.5142, "step": 20570 }, { "epoch": 1.62, "learning_rate": 0.00013141560507652994, "loss": 1.4681, "step": 20571 }, { "epoch": 1.62, "learning_rate": 0.00013140334065245404, "loss": 1.4632, "step": 20572 }, { "epoch": 1.62, "learning_rate": 0.00013139107635463915, "loss": 1.5309, "step": 20573 }, { "epoch": 1.62, "learning_rate": 0.00013137881218316862, "loss": 1.525, "step": 20574 }, { "epoch": 1.62, "learning_rate": 0.00013136654813812568, "loss": 1.4622, "step": 20575 }, { "epoch": 1.62, "learning_rate": 0.00013135428421959356, "loss": 1.5008, "step": 20576 }, { "epoch": 1.62, "learning_rate": 0.0001313420204276556, "loss": 1.5084, "step": 20577 }, { "epoch": 1.62, "learning_rate": 0.000131329756762395, "loss": 1.4963, "step": 20578 }, { "epoch": 1.62, "learning_rate": 0.00013131749322389507, "loss": 1.5415, "step": 20579 }, { "epoch": 1.62, "learning_rate": 0.00013130522981223903, "loss": 1.5435, "step": 20580 }, { "epoch": 1.62, "learning_rate": 0.00013129296652751013, "loss": 1.5375, "step": 20581 }, { "epoch": 1.62, "learning_rate": 0.0001312807033697917, "loss": 1.508, "step": 20582 }, { "epoch": 1.62, "learning_rate": 0.00013126844033916696, "loss": 1.488, "step": 20583 }, { "epoch": 1.62, "learning_rate": 0.0001312561774357192, "loss": 1.4972, "step": 20584 }, { "epoch": 1.62, "learning_rate": 0.00013124391465953162, "loss": 1.4778, "step": 20585 }, { "epoch": 1.62, "learning_rate": 0.0001312316520106875, "loss": 1.4964, "step": 20586 }, { "epoch": 1.62, "learning_rate": 0.00013121938948927015, "loss": 1.5318, "step": 20587 }, { "epoch": 1.62, "learning_rate": 0.00013120712709536276, "loss": 1.494, "step": 20588 }, { "epoch": 1.62, "learning_rate": 0.00013119486482904863, "loss": 1.5235, "step": 20589 }, { "epoch": 1.62, "learning_rate": 0.00013118260269041096, "loss": 1.4954, "step": 20590 }, { "epoch": 1.62, "learning_rate": 0.000131170340679533, "loss": 1.5289, "step": 20591 }, { "epoch": 1.62, "learning_rate": 0.00013115807879649811, "loss": 1.4978, "step": 20592 }, { "epoch": 1.62, "learning_rate": 0.00013114581704138943, "loss": 1.5085, "step": 20593 }, { "epoch": 1.62, "learning_rate": 0.00013113355541429026, "loss": 1.534, "step": 20594 }, { "epoch": 1.62, "learning_rate": 0.00013112129391528381, "loss": 1.5233, "step": 20595 }, { "epoch": 1.62, "learning_rate": 0.00013110903254445335, "loss": 1.4957, "step": 20596 }, { "epoch": 1.62, "learning_rate": 0.00013109677130188215, "loss": 1.48, "step": 20597 }, { "epoch": 1.62, "learning_rate": 0.00013108451018765347, "loss": 1.5104, "step": 20598 }, { "epoch": 1.62, "learning_rate": 0.0001310722492018505, "loss": 1.5172, "step": 20599 }, { "epoch": 1.62, "learning_rate": 0.0001310599883445565, "loss": 1.491, "step": 20600 }, { "epoch": 1.62, "learning_rate": 0.00013104772761585477, "loss": 1.4985, "step": 20601 }, { "epoch": 1.62, "learning_rate": 0.00013103546701582846, "loss": 1.4649, "step": 20602 }, { "epoch": 1.62, "learning_rate": 0.00013102320654456088, "loss": 1.5383, "step": 20603 }, { "epoch": 1.62, "learning_rate": 0.0001310109462021353, "loss": 1.5311, "step": 20604 }, { "epoch": 1.62, "learning_rate": 0.00013099868598863486, "loss": 1.4887, "step": 20605 }, { "epoch": 1.62, "learning_rate": 0.00013098642590414288, "loss": 1.5056, "step": 20606 }, { "epoch": 1.62, "learning_rate": 0.00013097416594874258, "loss": 1.5266, "step": 20607 }, { "epoch": 1.62, "learning_rate": 0.00013096190612251718, "loss": 1.4953, "step": 20608 }, { "epoch": 1.62, "learning_rate": 0.00013094964642554997, "loss": 1.465, "step": 20609 }, { "epoch": 1.62, "learning_rate": 0.0001309373868579241, "loss": 1.5383, "step": 20610 }, { "epoch": 1.62, "learning_rate": 0.00013092512741972288, "loss": 1.5185, "step": 20611 }, { "epoch": 1.62, "learning_rate": 0.00013091286811102944, "loss": 1.534, "step": 20612 }, { "epoch": 1.62, "learning_rate": 0.00013090060893192716, "loss": 1.5046, "step": 20613 }, { "epoch": 1.62, "learning_rate": 0.00013088834988249923, "loss": 1.5291, "step": 20614 }, { "epoch": 1.62, "learning_rate": 0.0001308760909628288, "loss": 1.5555, "step": 20615 }, { "epoch": 1.62, "learning_rate": 0.00013086383217299924, "loss": 1.5326, "step": 20616 }, { "epoch": 1.62, "learning_rate": 0.00013085157351309362, "loss": 1.5033, "step": 20617 }, { "epoch": 1.62, "learning_rate": 0.00013083931498319531, "loss": 1.5278, "step": 20618 }, { "epoch": 1.62, "learning_rate": 0.00013082705658338742, "loss": 1.4493, "step": 20619 }, { "epoch": 1.62, "learning_rate": 0.00013081479831375328, "loss": 1.5232, "step": 20620 }, { "epoch": 1.62, "learning_rate": 0.00013080254017437605, "loss": 1.513, "step": 20621 }, { "epoch": 1.62, "learning_rate": 0.00013079028216533899, "loss": 1.4921, "step": 20622 }, { "epoch": 1.62, "learning_rate": 0.00013077802428672531, "loss": 1.5088, "step": 20623 }, { "epoch": 1.62, "learning_rate": 0.00013076576653861825, "loss": 1.5161, "step": 20624 }, { "epoch": 1.62, "learning_rate": 0.00013075350892110098, "loss": 1.5149, "step": 20625 }, { "epoch": 1.62, "learning_rate": 0.00013074125143425682, "loss": 1.507, "step": 20626 }, { "epoch": 1.62, "learning_rate": 0.0001307289940781689, "loss": 1.4611, "step": 20627 }, { "epoch": 1.62, "learning_rate": 0.0001307167368529204, "loss": 1.5054, "step": 20628 }, { "epoch": 1.62, "learning_rate": 0.0001307044797585947, "loss": 1.5079, "step": 20629 }, { "epoch": 1.62, "learning_rate": 0.00013069222279527495, "loss": 1.5101, "step": 20630 }, { "epoch": 1.62, "learning_rate": 0.00013067996596304433, "loss": 1.5098, "step": 20631 }, { "epoch": 1.62, "learning_rate": 0.00013066770926198608, "loss": 1.4411, "step": 20632 }, { "epoch": 1.62, "learning_rate": 0.00013065545269218344, "loss": 1.4711, "step": 20633 }, { "epoch": 1.62, "learning_rate": 0.00013064319625371955, "loss": 1.5212, "step": 20634 }, { "epoch": 1.62, "learning_rate": 0.00013063093994667774, "loss": 1.5342, "step": 20635 }, { "epoch": 1.62, "learning_rate": 0.0001306186837711411, "loss": 1.5081, "step": 20636 }, { "epoch": 1.62, "learning_rate": 0.0001306064277271929, "loss": 1.5608, "step": 20637 }, { "epoch": 1.62, "learning_rate": 0.00013059417181491642, "loss": 1.5401, "step": 20638 }, { "epoch": 1.62, "learning_rate": 0.00013058191603439474, "loss": 1.5205, "step": 20639 }, { "epoch": 1.62, "learning_rate": 0.00013056966038571118, "loss": 1.5509, "step": 20640 }, { "epoch": 1.62, "learning_rate": 0.00013055740486894886, "loss": 1.4663, "step": 20641 }, { "epoch": 1.62, "learning_rate": 0.00013054514948419103, "loss": 1.5211, "step": 20642 }, { "epoch": 1.62, "learning_rate": 0.0001305328942315209, "loss": 1.5028, "step": 20643 }, { "epoch": 1.62, "learning_rate": 0.00013052063911102166, "loss": 1.4876, "step": 20644 }, { "epoch": 1.62, "learning_rate": 0.0001305083841227766, "loss": 1.4818, "step": 20645 }, { "epoch": 1.62, "learning_rate": 0.00013049612926686882, "loss": 1.5136, "step": 20646 }, { "epoch": 1.62, "learning_rate": 0.00013048387454338156, "loss": 1.5341, "step": 20647 }, { "epoch": 1.62, "learning_rate": 0.00013047161995239804, "loss": 1.4798, "step": 20648 }, { "epoch": 1.62, "learning_rate": 0.0001304593654940014, "loss": 1.4926, "step": 20649 }, { "epoch": 1.62, "learning_rate": 0.00013044711116827495, "loss": 1.4552, "step": 20650 }, { "epoch": 1.62, "learning_rate": 0.00013043485697530175, "loss": 1.5213, "step": 20651 }, { "epoch": 1.62, "learning_rate": 0.00013042260291516516, "loss": 1.5796, "step": 20652 }, { "epoch": 1.63, "learning_rate": 0.00013041034898794823, "loss": 1.4985, "step": 20653 }, { "epoch": 1.63, "learning_rate": 0.0001303980951937342, "loss": 1.5328, "step": 20654 }, { "epoch": 1.63, "learning_rate": 0.00013038584153260636, "loss": 1.4873, "step": 20655 }, { "epoch": 1.63, "learning_rate": 0.00013037358800464777, "loss": 1.5183, "step": 20656 }, { "epoch": 1.63, "learning_rate": 0.0001303613346099417, "loss": 1.5344, "step": 20657 }, { "epoch": 1.63, "learning_rate": 0.00013034908134857136, "loss": 1.4664, "step": 20658 }, { "epoch": 1.63, "learning_rate": 0.00013033682822061985, "loss": 1.5215, "step": 20659 }, { "epoch": 1.63, "learning_rate": 0.00013032457522617046, "loss": 1.5463, "step": 20660 }, { "epoch": 1.63, "learning_rate": 0.00013031232236530635, "loss": 1.4918, "step": 20661 }, { "epoch": 1.63, "learning_rate": 0.00013030006963811073, "loss": 1.4952, "step": 20662 }, { "epoch": 1.63, "learning_rate": 0.00013028781704466674, "loss": 1.4974, "step": 20663 }, { "epoch": 1.63, "learning_rate": 0.0001302755645850576, "loss": 1.5414, "step": 20664 }, { "epoch": 1.63, "learning_rate": 0.00013026331225936649, "loss": 1.4887, "step": 20665 }, { "epoch": 1.63, "learning_rate": 0.0001302510600676766, "loss": 1.4606, "step": 20666 }, { "epoch": 1.63, "learning_rate": 0.00013023880801007112, "loss": 1.5014, "step": 20667 }, { "epoch": 1.63, "learning_rate": 0.00013022655608663323, "loss": 1.4327, "step": 20668 }, { "epoch": 1.63, "learning_rate": 0.00013021430429744607, "loss": 1.5018, "step": 20669 }, { "epoch": 1.63, "learning_rate": 0.00013020205264259295, "loss": 1.5055, "step": 20670 }, { "epoch": 1.63, "learning_rate": 0.00013018980112215688, "loss": 1.4976, "step": 20671 }, { "epoch": 1.63, "learning_rate": 0.0001301775497362212, "loss": 1.5085, "step": 20672 }, { "epoch": 1.63, "learning_rate": 0.00013016529848486897, "loss": 1.5415, "step": 20673 }, { "epoch": 1.63, "learning_rate": 0.00013015304736818342, "loss": 1.4861, "step": 20674 }, { "epoch": 1.63, "learning_rate": 0.0001301407963862477, "loss": 1.488, "step": 20675 }, { "epoch": 1.63, "learning_rate": 0.00013012854553914505, "loss": 1.4764, "step": 20676 }, { "epoch": 1.63, "learning_rate": 0.0001301162948269586, "loss": 1.4652, "step": 20677 }, { "epoch": 1.63, "learning_rate": 0.00013010404424977154, "loss": 1.5194, "step": 20678 }, { "epoch": 1.63, "learning_rate": 0.00013009179380766707, "loss": 1.5331, "step": 20679 }, { "epoch": 1.63, "learning_rate": 0.0001300795435007283, "loss": 1.4951, "step": 20680 }, { "epoch": 1.63, "learning_rate": 0.00013006729332903848, "loss": 1.4968, "step": 20681 }, { "epoch": 1.63, "learning_rate": 0.0001300550432926807, "loss": 1.5319, "step": 20682 }, { "epoch": 1.63, "learning_rate": 0.00013004279339173813, "loss": 1.5031, "step": 20683 }, { "epoch": 1.63, "learning_rate": 0.00013003054362629407, "loss": 1.4896, "step": 20684 }, { "epoch": 1.63, "learning_rate": 0.00013001829399643156, "loss": 1.4971, "step": 20685 }, { "epoch": 1.63, "learning_rate": 0.00013000604450223377, "loss": 1.4836, "step": 20686 }, { "epoch": 1.63, "learning_rate": 0.00012999379514378395, "loss": 1.5281, "step": 20687 }, { "epoch": 1.63, "learning_rate": 0.0001299815459211652, "loss": 1.4955, "step": 20688 }, { "epoch": 1.63, "learning_rate": 0.00012996929683446073, "loss": 1.4967, "step": 20689 }, { "epoch": 1.63, "learning_rate": 0.00012995704788375365, "loss": 1.4715, "step": 20690 }, { "epoch": 1.63, "learning_rate": 0.00012994479906912714, "loss": 1.5087, "step": 20691 }, { "epoch": 1.63, "learning_rate": 0.00012993255039066436, "loss": 1.5116, "step": 20692 }, { "epoch": 1.63, "learning_rate": 0.00012992030184844856, "loss": 1.4714, "step": 20693 }, { "epoch": 1.63, "learning_rate": 0.0001299080534425628, "loss": 1.5424, "step": 20694 }, { "epoch": 1.63, "learning_rate": 0.00012989580517309025, "loss": 1.4629, "step": 20695 }, { "epoch": 1.63, "learning_rate": 0.00012988355704011414, "loss": 1.5302, "step": 20696 }, { "epoch": 1.63, "learning_rate": 0.00012987130904371753, "loss": 1.5332, "step": 20697 }, { "epoch": 1.63, "learning_rate": 0.00012985906118398362, "loss": 1.4795, "step": 20698 }, { "epoch": 1.63, "learning_rate": 0.00012984681346099562, "loss": 1.5352, "step": 20699 }, { "epoch": 1.63, "learning_rate": 0.00012983456587483658, "loss": 1.5348, "step": 20700 }, { "epoch": 1.63, "learning_rate": 0.00012982231842558975, "loss": 1.5275, "step": 20701 }, { "epoch": 1.63, "learning_rate": 0.00012981007111333823, "loss": 1.5284, "step": 20702 }, { "epoch": 1.63, "learning_rate": 0.00012979782393816516, "loss": 1.5408, "step": 20703 }, { "epoch": 1.63, "learning_rate": 0.00012978557690015375, "loss": 1.5251, "step": 20704 }, { "epoch": 1.63, "learning_rate": 0.0001297733299993871, "loss": 1.5436, "step": 20705 }, { "epoch": 1.63, "learning_rate": 0.00012976108323594835, "loss": 1.504, "step": 20706 }, { "epoch": 1.63, "learning_rate": 0.0001297488366099207, "loss": 1.4694, "step": 20707 }, { "epoch": 1.63, "learning_rate": 0.0001297365901213873, "loss": 1.5268, "step": 20708 }, { "epoch": 1.63, "learning_rate": 0.00012972434377043124, "loss": 1.5428, "step": 20709 }, { "epoch": 1.63, "learning_rate": 0.00012971209755713574, "loss": 1.5422, "step": 20710 }, { "epoch": 1.63, "learning_rate": 0.00012969985148158386, "loss": 1.4865, "step": 20711 }, { "epoch": 1.63, "learning_rate": 0.0001296876055438588, "loss": 1.5141, "step": 20712 }, { "epoch": 1.63, "learning_rate": 0.0001296753597440437, "loss": 1.5578, "step": 20713 }, { "epoch": 1.63, "learning_rate": 0.00012966311408222166, "loss": 1.5105, "step": 20714 }, { "epoch": 1.63, "learning_rate": 0.00012965086855847588, "loss": 1.5532, "step": 20715 }, { "epoch": 1.63, "learning_rate": 0.00012963862317288947, "loss": 1.4532, "step": 20716 }, { "epoch": 1.63, "learning_rate": 0.00012962637792554558, "loss": 1.5041, "step": 20717 }, { "epoch": 1.63, "learning_rate": 0.00012961413281652732, "loss": 1.5092, "step": 20718 }, { "epoch": 1.63, "learning_rate": 0.00012960188784591785, "loss": 1.4601, "step": 20719 }, { "epoch": 1.63, "learning_rate": 0.0001295896430138003, "loss": 1.4462, "step": 20720 }, { "epoch": 1.63, "learning_rate": 0.00012957739832025785, "loss": 1.493, "step": 20721 }, { "epoch": 1.63, "learning_rate": 0.0001295651537653735, "loss": 1.4912, "step": 20722 }, { "epoch": 1.63, "learning_rate": 0.00012955290934923055, "loss": 1.5047, "step": 20723 }, { "epoch": 1.63, "learning_rate": 0.00012954066507191205, "loss": 1.5145, "step": 20724 }, { "epoch": 1.63, "learning_rate": 0.00012952842093350117, "loss": 1.5067, "step": 20725 }, { "epoch": 1.63, "learning_rate": 0.00012951617693408098, "loss": 1.4938, "step": 20726 }, { "epoch": 1.63, "learning_rate": 0.00012950393307373467, "loss": 1.4898, "step": 20727 }, { "epoch": 1.63, "learning_rate": 0.00012949168935254534, "loss": 1.4933, "step": 20728 }, { "epoch": 1.63, "learning_rate": 0.0001294794457705961, "loss": 1.5177, "step": 20729 }, { "epoch": 1.63, "learning_rate": 0.00012946720232797013, "loss": 1.483, "step": 20730 }, { "epoch": 1.63, "learning_rate": 0.00012945495902475052, "loss": 1.5652, "step": 20731 }, { "epoch": 1.63, "learning_rate": 0.00012944271586102038, "loss": 1.5093, "step": 20732 }, { "epoch": 1.63, "learning_rate": 0.00012943047283686288, "loss": 1.5065, "step": 20733 }, { "epoch": 1.63, "learning_rate": 0.0001294182299523611, "loss": 1.5169, "step": 20734 }, { "epoch": 1.63, "learning_rate": 0.0001294059872075982, "loss": 1.5285, "step": 20735 }, { "epoch": 1.63, "learning_rate": 0.00012939374460265726, "loss": 1.5059, "step": 20736 }, { "epoch": 1.63, "learning_rate": 0.00012938150213762141, "loss": 1.5115, "step": 20737 }, { "epoch": 1.63, "learning_rate": 0.00012936925981257377, "loss": 1.5097, "step": 20738 }, { "epoch": 1.63, "learning_rate": 0.00012935701762759752, "loss": 1.5158, "step": 20739 }, { "epoch": 1.63, "learning_rate": 0.0001293447755827757, "loss": 1.4871, "step": 20740 }, { "epoch": 1.63, "learning_rate": 0.00012933253367819144, "loss": 1.4676, "step": 20741 }, { "epoch": 1.63, "learning_rate": 0.00012932029191392794, "loss": 1.4744, "step": 20742 }, { "epoch": 1.63, "learning_rate": 0.0001293080502900682, "loss": 1.5181, "step": 20743 }, { "epoch": 1.63, "learning_rate": 0.00012929580880669537, "loss": 1.507, "step": 20744 }, { "epoch": 1.63, "learning_rate": 0.0001292835674638926, "loss": 1.5308, "step": 20745 }, { "epoch": 1.63, "learning_rate": 0.00012927132626174294, "loss": 1.4774, "step": 20746 }, { "epoch": 1.63, "learning_rate": 0.0001292590852003296, "loss": 1.4707, "step": 20747 }, { "epoch": 1.63, "learning_rate": 0.00012924684427973555, "loss": 1.4994, "step": 20748 }, { "epoch": 1.63, "learning_rate": 0.000129234603500044, "loss": 1.5145, "step": 20749 }, { "epoch": 1.63, "learning_rate": 0.00012922236286133808, "loss": 1.4997, "step": 20750 }, { "epoch": 1.63, "learning_rate": 0.0001292101223637008, "loss": 1.5394, "step": 20751 }, { "epoch": 1.63, "learning_rate": 0.0001291978820072153, "loss": 1.5031, "step": 20752 }, { "epoch": 1.63, "learning_rate": 0.00012918564179196468, "loss": 1.5175, "step": 20753 }, { "epoch": 1.63, "learning_rate": 0.00012917340171803214, "loss": 1.4827, "step": 20754 }, { "epoch": 1.63, "learning_rate": 0.00012916116178550066, "loss": 1.4939, "step": 20755 }, { "epoch": 1.63, "learning_rate": 0.00012914892199445343, "loss": 1.489, "step": 20756 }, { "epoch": 1.63, "learning_rate": 0.0001291366823449735, "loss": 1.5129, "step": 20757 }, { "epoch": 1.63, "learning_rate": 0.00012912444283714398, "loss": 1.5101, "step": 20758 }, { "epoch": 1.63, "learning_rate": 0.000129112203471048, "loss": 1.5267, "step": 20759 }, { "epoch": 1.63, "learning_rate": 0.0001290999642467686, "loss": 1.5389, "step": 20760 }, { "epoch": 1.63, "learning_rate": 0.00012908772516438888, "loss": 1.5306, "step": 20761 }, { "epoch": 1.63, "learning_rate": 0.00012907548622399204, "loss": 1.5313, "step": 20762 }, { "epoch": 1.63, "learning_rate": 0.00012906324742566105, "loss": 1.5174, "step": 20763 }, { "epoch": 1.63, "learning_rate": 0.00012905100876947907, "loss": 1.5281, "step": 20764 }, { "epoch": 1.63, "learning_rate": 0.00012903877025552917, "loss": 1.5001, "step": 20765 }, { "epoch": 1.63, "learning_rate": 0.00012902653188389448, "loss": 1.5257, "step": 20766 }, { "epoch": 1.63, "learning_rate": 0.00012901429365465804, "loss": 1.4957, "step": 20767 }, { "epoch": 1.63, "learning_rate": 0.00012900205556790298, "loss": 1.52, "step": 20768 }, { "epoch": 1.63, "learning_rate": 0.00012898981762371231, "loss": 1.4731, "step": 20769 }, { "epoch": 1.63, "learning_rate": 0.00012897757982216924, "loss": 1.4455, "step": 20770 }, { "epoch": 1.63, "learning_rate": 0.00012896534216335682, "loss": 1.483, "step": 20771 }, { "epoch": 1.63, "learning_rate": 0.0001289531046473581, "loss": 1.5231, "step": 20772 }, { "epoch": 1.63, "learning_rate": 0.00012894086727425615, "loss": 1.5105, "step": 20773 }, { "epoch": 1.63, "learning_rate": 0.00012892863004413416, "loss": 1.5266, "step": 20774 }, { "epoch": 1.63, "learning_rate": 0.0001289163929570751, "loss": 1.4643, "step": 20775 }, { "epoch": 1.63, "learning_rate": 0.00012890415601316213, "loss": 1.5045, "step": 20776 }, { "epoch": 1.63, "learning_rate": 0.00012889191921247825, "loss": 1.5021, "step": 20777 }, { "epoch": 1.63, "learning_rate": 0.0001288796825551066, "loss": 1.4866, "step": 20778 }, { "epoch": 1.63, "learning_rate": 0.00012886744604113028, "loss": 1.5127, "step": 20779 }, { "epoch": 1.63, "learning_rate": 0.00012885520967063235, "loss": 1.5083, "step": 20780 }, { "epoch": 1.64, "learning_rate": 0.00012884297344369582, "loss": 1.4825, "step": 20781 }, { "epoch": 1.64, "learning_rate": 0.00012883073736040388, "loss": 1.5029, "step": 20782 }, { "epoch": 1.64, "learning_rate": 0.00012881850142083953, "loss": 1.5648, "step": 20783 }, { "epoch": 1.64, "learning_rate": 0.00012880626562508586, "loss": 1.5256, "step": 20784 }, { "epoch": 1.64, "learning_rate": 0.0001287940299732259, "loss": 1.4451, "step": 20785 }, { "epoch": 1.64, "learning_rate": 0.00012878179446534284, "loss": 1.5135, "step": 20786 }, { "epoch": 1.64, "learning_rate": 0.00012876955910151968, "loss": 1.5234, "step": 20787 }, { "epoch": 1.64, "learning_rate": 0.00012875732388183952, "loss": 1.5666, "step": 20788 }, { "epoch": 1.64, "learning_rate": 0.00012874508880638536, "loss": 1.5245, "step": 20789 }, { "epoch": 1.64, "learning_rate": 0.00012873285387524032, "loss": 1.4807, "step": 20790 }, { "epoch": 1.64, "learning_rate": 0.0001287206190884875, "loss": 1.4325, "step": 20791 }, { "epoch": 1.64, "learning_rate": 0.00012870838444620992, "loss": 1.5032, "step": 20792 }, { "epoch": 1.64, "learning_rate": 0.0001286961499484907, "loss": 1.4852, "step": 20793 }, { "epoch": 1.64, "learning_rate": 0.0001286839155954128, "loss": 1.4977, "step": 20794 }, { "epoch": 1.64, "learning_rate": 0.00012867168138705937, "loss": 1.5244, "step": 20795 }, { "epoch": 1.64, "learning_rate": 0.00012865944732351345, "loss": 1.4699, "step": 20796 }, { "epoch": 1.64, "learning_rate": 0.00012864721340485812, "loss": 1.5104, "step": 20797 }, { "epoch": 1.64, "learning_rate": 0.00012863497963117642, "loss": 1.4419, "step": 20798 }, { "epoch": 1.64, "learning_rate": 0.00012862274600255143, "loss": 1.4757, "step": 20799 }, { "epoch": 1.64, "learning_rate": 0.00012861051251906617, "loss": 1.4696, "step": 20800 }, { "epoch": 1.64, "learning_rate": 0.0001285982791808037, "loss": 1.554, "step": 20801 }, { "epoch": 1.64, "learning_rate": 0.00012858604598784716, "loss": 1.4995, "step": 20802 }, { "epoch": 1.64, "learning_rate": 0.00012857381294027954, "loss": 1.5174, "step": 20803 }, { "epoch": 1.64, "learning_rate": 0.0001285615800381839, "loss": 1.5112, "step": 20804 }, { "epoch": 1.64, "learning_rate": 0.00012854934728164332, "loss": 1.509, "step": 20805 }, { "epoch": 1.64, "learning_rate": 0.00012853711467074083, "loss": 1.4624, "step": 20806 }, { "epoch": 1.64, "learning_rate": 0.00012852488220555945, "loss": 1.4669, "step": 20807 }, { "epoch": 1.64, "learning_rate": 0.0001285126498861823, "loss": 1.4979, "step": 20808 }, { "epoch": 1.64, "learning_rate": 0.0001285004177126924, "loss": 1.498, "step": 20809 }, { "epoch": 1.64, "learning_rate": 0.00012848818568517278, "loss": 1.5029, "step": 20810 }, { "epoch": 1.64, "learning_rate": 0.00012847595380370655, "loss": 1.4775, "step": 20811 }, { "epoch": 1.64, "learning_rate": 0.00012846372206837668, "loss": 1.5562, "step": 20812 }, { "epoch": 1.64, "learning_rate": 0.00012845149047926627, "loss": 1.5562, "step": 20813 }, { "epoch": 1.64, "learning_rate": 0.00012843925903645835, "loss": 1.5158, "step": 20814 }, { "epoch": 1.64, "learning_rate": 0.00012842702774003593, "loss": 1.5408, "step": 20815 }, { "epoch": 1.64, "learning_rate": 0.00012841479659008207, "loss": 1.5016, "step": 20816 }, { "epoch": 1.64, "learning_rate": 0.0001284025655866799, "loss": 1.5309, "step": 20817 }, { "epoch": 1.64, "learning_rate": 0.00012839033472991234, "loss": 1.4763, "step": 20818 }, { "epoch": 1.64, "learning_rate": 0.00012837810401986248, "loss": 1.5805, "step": 20819 }, { "epoch": 1.64, "learning_rate": 0.0001283658734566134, "loss": 1.4691, "step": 20820 }, { "epoch": 1.64, "learning_rate": 0.00012835364304024808, "loss": 1.5365, "step": 20821 }, { "epoch": 1.64, "learning_rate": 0.0001283414127708496, "loss": 1.4738, "step": 20822 }, { "epoch": 1.64, "learning_rate": 0.00012832918264850095, "loss": 1.4607, "step": 20823 }, { "epoch": 1.64, "learning_rate": 0.00012831695267328519, "loss": 1.5221, "step": 20824 }, { "epoch": 1.64, "learning_rate": 0.00012830472284528537, "loss": 1.5522, "step": 20825 }, { "epoch": 1.64, "learning_rate": 0.00012829249316458448, "loss": 1.4964, "step": 20826 }, { "epoch": 1.64, "learning_rate": 0.00012828026363126562, "loss": 1.5472, "step": 20827 }, { "epoch": 1.64, "learning_rate": 0.00012826803424541178, "loss": 1.5125, "step": 20828 }, { "epoch": 1.64, "learning_rate": 0.00012825580500710598, "loss": 1.4823, "step": 20829 }, { "epoch": 1.64, "learning_rate": 0.0001282435759164313, "loss": 1.5149, "step": 20830 }, { "epoch": 1.64, "learning_rate": 0.00012823134697347068, "loss": 1.5352, "step": 20831 }, { "epoch": 1.64, "learning_rate": 0.00012821911817830717, "loss": 1.5088, "step": 20832 }, { "epoch": 1.64, "learning_rate": 0.00012820688953102386, "loss": 1.5393, "step": 20833 }, { "epoch": 1.64, "learning_rate": 0.0001281946610317038, "loss": 1.4605, "step": 20834 }, { "epoch": 1.64, "learning_rate": 0.00012818243268042994, "loss": 1.4584, "step": 20835 }, { "epoch": 1.64, "learning_rate": 0.00012817020447728527, "loss": 1.4698, "step": 20836 }, { "epoch": 1.64, "learning_rate": 0.0001281579764223529, "loss": 1.4848, "step": 20837 }, { "epoch": 1.64, "learning_rate": 0.00012814574851571583, "loss": 1.548, "step": 20838 }, { "epoch": 1.64, "learning_rate": 0.00012813352075745704, "loss": 1.4754, "step": 20839 }, { "epoch": 1.64, "learning_rate": 0.00012812129314765963, "loss": 1.4678, "step": 20840 }, { "epoch": 1.64, "learning_rate": 0.00012810906568640649, "loss": 1.523, "step": 20841 }, { "epoch": 1.64, "learning_rate": 0.0001280968383737808, "loss": 1.5651, "step": 20842 }, { "epoch": 1.64, "learning_rate": 0.00012808461120986542, "loss": 1.4595, "step": 20843 }, { "epoch": 1.64, "learning_rate": 0.00012807238419474345, "loss": 1.498, "step": 20844 }, { "epoch": 1.64, "learning_rate": 0.0001280601573284979, "loss": 1.4956, "step": 20845 }, { "epoch": 1.64, "learning_rate": 0.00012804793061121176, "loss": 1.4728, "step": 20846 }, { "epoch": 1.64, "learning_rate": 0.0001280357040429681, "loss": 1.5572, "step": 20847 }, { "epoch": 1.64, "learning_rate": 0.00012802347762384976, "loss": 1.513, "step": 20848 }, { "epoch": 1.64, "learning_rate": 0.00012801125135394003, "loss": 1.4717, "step": 20849 }, { "epoch": 1.64, "learning_rate": 0.00012799902523332168, "loss": 1.485, "step": 20850 }, { "epoch": 1.64, "learning_rate": 0.00012798679926207787, "loss": 1.5355, "step": 20851 }, { "epoch": 1.64, "learning_rate": 0.0001279745734402915, "loss": 1.5065, "step": 20852 }, { "epoch": 1.64, "learning_rate": 0.00012796234776804564, "loss": 1.52, "step": 20853 }, { "epoch": 1.64, "learning_rate": 0.0001279501222454233, "loss": 1.4959, "step": 20854 }, { "epoch": 1.64, "learning_rate": 0.00012793789687250742, "loss": 1.5114, "step": 20855 }, { "epoch": 1.64, "learning_rate": 0.00012792567164938106, "loss": 1.4999, "step": 20856 }, { "epoch": 1.64, "learning_rate": 0.00012791344657612724, "loss": 1.5285, "step": 20857 }, { "epoch": 1.64, "learning_rate": 0.00012790122165282888, "loss": 1.4956, "step": 20858 }, { "epoch": 1.64, "learning_rate": 0.00012788899687956907, "loss": 1.4686, "step": 20859 }, { "epoch": 1.64, "learning_rate": 0.00012787677225643075, "loss": 1.4936, "step": 20860 }, { "epoch": 1.64, "learning_rate": 0.00012786454778349691, "loss": 1.533, "step": 20861 }, { "epoch": 1.64, "learning_rate": 0.00012785232346085066, "loss": 1.5327, "step": 20862 }, { "epoch": 1.64, "learning_rate": 0.00012784009928857478, "loss": 1.4789, "step": 20863 }, { "epoch": 1.64, "learning_rate": 0.00012782787526675248, "loss": 1.4483, "step": 20864 }, { "epoch": 1.64, "learning_rate": 0.00012781565139546666, "loss": 1.5166, "step": 20865 }, { "epoch": 1.64, "learning_rate": 0.00012780342767480034, "loss": 1.5077, "step": 20866 }, { "epoch": 1.64, "learning_rate": 0.00012779120410483648, "loss": 1.5002, "step": 20867 }, { "epoch": 1.64, "learning_rate": 0.00012777898068565808, "loss": 1.4923, "step": 20868 }, { "epoch": 1.64, "learning_rate": 0.00012776675741734818, "loss": 1.4844, "step": 20869 }, { "epoch": 1.64, "learning_rate": 0.0001277545342999897, "loss": 1.471, "step": 20870 }, { "epoch": 1.64, "learning_rate": 0.00012774231133366566, "loss": 1.4512, "step": 20871 }, { "epoch": 1.64, "learning_rate": 0.00012773008851845903, "loss": 1.5544, "step": 20872 }, { "epoch": 1.64, "learning_rate": 0.0001277178658544528, "loss": 1.4919, "step": 20873 }, { "epoch": 1.64, "learning_rate": 0.00012770564334173, "loss": 1.4717, "step": 20874 }, { "epoch": 1.64, "learning_rate": 0.00012769342098037357, "loss": 1.4861, "step": 20875 }, { "epoch": 1.64, "learning_rate": 0.00012768119877046652, "loss": 1.5204, "step": 20876 }, { "epoch": 1.64, "learning_rate": 0.00012766897671209176, "loss": 1.4706, "step": 20877 }, { "epoch": 1.64, "learning_rate": 0.00012765675480533236, "loss": 1.4976, "step": 20878 }, { "epoch": 1.64, "learning_rate": 0.0001276445330502712, "loss": 1.4685, "step": 20879 }, { "epoch": 1.64, "learning_rate": 0.00012763231144699135, "loss": 1.5148, "step": 20880 }, { "epoch": 1.64, "learning_rate": 0.00012762008999557583, "loss": 1.4752, "step": 20881 }, { "epoch": 1.64, "learning_rate": 0.0001276078686961075, "loss": 1.5431, "step": 20882 }, { "epoch": 1.64, "learning_rate": 0.0001275956475486694, "loss": 1.4746, "step": 20883 }, { "epoch": 1.64, "learning_rate": 0.0001275834265533445, "loss": 1.4926, "step": 20884 }, { "epoch": 1.64, "learning_rate": 0.00012757120571021572, "loss": 1.5127, "step": 20885 }, { "epoch": 1.64, "learning_rate": 0.00012755898501936615, "loss": 1.5083, "step": 20886 }, { "epoch": 1.64, "learning_rate": 0.00012754676448087861, "loss": 1.526, "step": 20887 }, { "epoch": 1.64, "learning_rate": 0.00012753454409483622, "loss": 1.5098, "step": 20888 }, { "epoch": 1.64, "learning_rate": 0.0001275223238613218, "loss": 1.5012, "step": 20889 }, { "epoch": 1.64, "learning_rate": 0.00012751010378041845, "loss": 1.5306, "step": 20890 }, { "epoch": 1.64, "learning_rate": 0.00012749788385220908, "loss": 1.4723, "step": 20891 }, { "epoch": 1.64, "learning_rate": 0.00012748566407677663, "loss": 1.4697, "step": 20892 }, { "epoch": 1.64, "learning_rate": 0.00012747344445420412, "loss": 1.5116, "step": 20893 }, { "epoch": 1.64, "learning_rate": 0.00012746122498457453, "loss": 1.5331, "step": 20894 }, { "epoch": 1.64, "learning_rate": 0.00012744900566797067, "loss": 1.4669, "step": 20895 }, { "epoch": 1.64, "learning_rate": 0.0001274367865044757, "loss": 1.5169, "step": 20896 }, { "epoch": 1.64, "learning_rate": 0.00012742456749417245, "loss": 1.4559, "step": 20897 }, { "epoch": 1.64, "learning_rate": 0.000127412348637144, "loss": 1.5006, "step": 20898 }, { "epoch": 1.64, "learning_rate": 0.0001274001299334732, "loss": 1.5156, "step": 20899 }, { "epoch": 1.64, "learning_rate": 0.00012738791138324306, "loss": 1.5239, "step": 20900 }, { "epoch": 1.64, "learning_rate": 0.0001273756929865365, "loss": 1.4817, "step": 20901 }, { "epoch": 1.64, "learning_rate": 0.0001273634747434365, "loss": 1.504, "step": 20902 }, { "epoch": 1.64, "learning_rate": 0.00012735125665402607, "loss": 1.4993, "step": 20903 }, { "epoch": 1.64, "learning_rate": 0.00012733903871838806, "loss": 1.4607, "step": 20904 }, { "epoch": 1.64, "learning_rate": 0.00012732682093660549, "loss": 1.4735, "step": 20905 }, { "epoch": 1.64, "learning_rate": 0.00012731460330876127, "loss": 1.5404, "step": 20906 }, { "epoch": 1.64, "learning_rate": 0.00012730238583493836, "loss": 1.4958, "step": 20907 }, { "epoch": 1.65, "learning_rate": 0.0001272901685152198, "loss": 1.4793, "step": 20908 }, { "epoch": 1.65, "learning_rate": 0.0001272779513496884, "loss": 1.4855, "step": 20909 }, { "epoch": 1.65, "learning_rate": 0.00012726573433842717, "loss": 1.507, "step": 20910 }, { "epoch": 1.65, "learning_rate": 0.00012725351748151903, "loss": 1.5089, "step": 20911 }, { "epoch": 1.65, "learning_rate": 0.000127241300779047, "loss": 1.4599, "step": 20912 }, { "epoch": 1.65, "learning_rate": 0.000127229084231094, "loss": 1.5008, "step": 20913 }, { "epoch": 1.65, "learning_rate": 0.00012721686783774292, "loss": 1.5215, "step": 20914 }, { "epoch": 1.65, "learning_rate": 0.00012720465159907676, "loss": 1.5376, "step": 20915 }, { "epoch": 1.65, "learning_rate": 0.0001271924355151784, "loss": 1.4698, "step": 20916 }, { "epoch": 1.65, "learning_rate": 0.00012718021958613084, "loss": 1.4571, "step": 20917 }, { "epoch": 1.65, "learning_rate": 0.00012716800381201699, "loss": 1.4598, "step": 20918 }, { "epoch": 1.65, "learning_rate": 0.00012715578819291978, "loss": 1.4809, "step": 20919 }, { "epoch": 1.65, "learning_rate": 0.00012714357272892223, "loss": 1.4651, "step": 20920 }, { "epoch": 1.65, "learning_rate": 0.00012713135742010713, "loss": 1.4974, "step": 20921 }, { "epoch": 1.65, "learning_rate": 0.0001271191422665575, "loss": 1.5993, "step": 20922 }, { "epoch": 1.65, "learning_rate": 0.00012710692726835632, "loss": 1.4723, "step": 20923 }, { "epoch": 1.65, "learning_rate": 0.00012709471242558642, "loss": 1.4857, "step": 20924 }, { "epoch": 1.65, "learning_rate": 0.00012708249773833082, "loss": 1.485, "step": 20925 }, { "epoch": 1.65, "learning_rate": 0.00012707028320667232, "loss": 1.4863, "step": 20926 }, { "epoch": 1.65, "learning_rate": 0.00012705806883069404, "loss": 1.5109, "step": 20927 }, { "epoch": 1.65, "learning_rate": 0.00012704585461047877, "loss": 1.5089, "step": 20928 }, { "epoch": 1.65, "learning_rate": 0.00012703364054610954, "loss": 1.4593, "step": 20929 }, { "epoch": 1.65, "learning_rate": 0.00012702142663766912, "loss": 1.5038, "step": 20930 }, { "epoch": 1.65, "learning_rate": 0.0001270092128852406, "loss": 1.5246, "step": 20931 }, { "epoch": 1.65, "learning_rate": 0.00012699699928890685, "loss": 1.4648, "step": 20932 }, { "epoch": 1.65, "learning_rate": 0.00012698478584875075, "loss": 1.5092, "step": 20933 }, { "epoch": 1.65, "learning_rate": 0.00012697257256485527, "loss": 1.5581, "step": 20934 }, { "epoch": 1.65, "learning_rate": 0.0001269603594373033, "loss": 1.5009, "step": 20935 }, { "epoch": 1.65, "learning_rate": 0.00012694814646617777, "loss": 1.5396, "step": 20936 }, { "epoch": 1.65, "learning_rate": 0.00012693593365156164, "loss": 1.4617, "step": 20937 }, { "epoch": 1.65, "learning_rate": 0.00012692372099353774, "loss": 1.4657, "step": 20938 }, { "epoch": 1.65, "learning_rate": 0.00012691150849218906, "loss": 1.5398, "step": 20939 }, { "epoch": 1.65, "learning_rate": 0.00012689929614759853, "loss": 1.5286, "step": 20940 }, { "epoch": 1.65, "learning_rate": 0.00012688708395984898, "loss": 1.4717, "step": 20941 }, { "epoch": 1.65, "learning_rate": 0.00012687487192902336, "loss": 1.569, "step": 20942 }, { "epoch": 1.65, "learning_rate": 0.0001268626600552046, "loss": 1.4607, "step": 20943 }, { "epoch": 1.65, "learning_rate": 0.00012685044833847569, "loss": 1.4758, "step": 20944 }, { "epoch": 1.65, "learning_rate": 0.0001268382367789194, "loss": 1.4871, "step": 20945 }, { "epoch": 1.65, "learning_rate": 0.00012682602537661874, "loss": 1.5197, "step": 20946 }, { "epoch": 1.65, "learning_rate": 0.00012681381413165655, "loss": 1.525, "step": 20947 }, { "epoch": 1.65, "learning_rate": 0.00012680160304411576, "loss": 1.5285, "step": 20948 }, { "epoch": 1.65, "learning_rate": 0.0001267893921140793, "loss": 1.4999, "step": 20949 }, { "epoch": 1.65, "learning_rate": 0.00012677718134163006, "loss": 1.5175, "step": 20950 }, { "epoch": 1.65, "learning_rate": 0.00012676497072685092, "loss": 1.5282, "step": 20951 }, { "epoch": 1.65, "learning_rate": 0.00012675276026982485, "loss": 1.5823, "step": 20952 }, { "epoch": 1.65, "learning_rate": 0.00012674054997063468, "loss": 1.4857, "step": 20953 }, { "epoch": 1.65, "learning_rate": 0.00012672833982936338, "loss": 1.5312, "step": 20954 }, { "epoch": 1.65, "learning_rate": 0.00012671612984609375, "loss": 1.5071, "step": 20955 }, { "epoch": 1.65, "learning_rate": 0.00012670392002090878, "loss": 1.5092, "step": 20956 }, { "epoch": 1.65, "learning_rate": 0.00012669171035389133, "loss": 1.5242, "step": 20957 }, { "epoch": 1.65, "learning_rate": 0.00012667950084512426, "loss": 1.5192, "step": 20958 }, { "epoch": 1.65, "learning_rate": 0.00012666729149469057, "loss": 1.4879, "step": 20959 }, { "epoch": 1.65, "learning_rate": 0.00012665508230267304, "loss": 1.4664, "step": 20960 }, { "epoch": 1.65, "learning_rate": 0.00012664287326915469, "loss": 1.5279, "step": 20961 }, { "epoch": 1.65, "learning_rate": 0.0001266306643942183, "loss": 1.4933, "step": 20962 }, { "epoch": 1.65, "learning_rate": 0.0001266184556779468, "loss": 1.4764, "step": 20963 }, { "epoch": 1.65, "learning_rate": 0.0001266062471204231, "loss": 1.4892, "step": 20964 }, { "epoch": 1.65, "learning_rate": 0.00012659403872173006, "loss": 1.5174, "step": 20965 }, { "epoch": 1.65, "learning_rate": 0.0001265818304819506, "loss": 1.4916, "step": 20966 }, { "epoch": 1.65, "learning_rate": 0.0001265696224011676, "loss": 1.4705, "step": 20967 }, { "epoch": 1.65, "learning_rate": 0.0001265574144794639, "loss": 1.5029, "step": 20968 }, { "epoch": 1.65, "learning_rate": 0.00012654520671692243, "loss": 1.5284, "step": 20969 }, { "epoch": 1.65, "learning_rate": 0.00012653299911362606, "loss": 1.4567, "step": 20970 }, { "epoch": 1.65, "learning_rate": 0.0001265207916696577, "loss": 1.4113, "step": 20971 }, { "epoch": 1.65, "learning_rate": 0.00012650858438510018, "loss": 1.4897, "step": 20972 }, { "epoch": 1.65, "learning_rate": 0.00012649637726003636, "loss": 1.4945, "step": 20973 }, { "epoch": 1.65, "learning_rate": 0.0001264841702945492, "loss": 1.4871, "step": 20974 }, { "epoch": 1.65, "learning_rate": 0.0001264719634887216, "loss": 1.4831, "step": 20975 }, { "epoch": 1.65, "learning_rate": 0.00012645975684263635, "loss": 1.5264, "step": 20976 }, { "epoch": 1.65, "learning_rate": 0.00012644755035637635, "loss": 1.4634, "step": 20977 }, { "epoch": 1.65, "learning_rate": 0.0001264353440300245, "loss": 1.5412, "step": 20978 }, { "epoch": 1.65, "learning_rate": 0.00012642313786366365, "loss": 1.5076, "step": 20979 }, { "epoch": 1.65, "learning_rate": 0.0001264109318573767, "loss": 1.5195, "step": 20980 }, { "epoch": 1.65, "learning_rate": 0.0001263987260112465, "loss": 1.4804, "step": 20981 }, { "epoch": 1.65, "learning_rate": 0.00012638652032535591, "loss": 1.4616, "step": 20982 }, { "epoch": 1.65, "learning_rate": 0.00012637431479978786, "loss": 1.4947, "step": 20983 }, { "epoch": 1.65, "learning_rate": 0.00012636210943462513, "loss": 1.5162, "step": 20984 }, { "epoch": 1.65, "learning_rate": 0.00012634990422995065, "loss": 1.5263, "step": 20985 }, { "epoch": 1.65, "learning_rate": 0.00012633769918584726, "loss": 1.5463, "step": 20986 }, { "epoch": 1.65, "learning_rate": 0.00012632549430239784, "loss": 1.5203, "step": 20987 }, { "epoch": 1.65, "learning_rate": 0.00012631328957968526, "loss": 1.5239, "step": 20988 }, { "epoch": 1.65, "learning_rate": 0.0001263010850177923, "loss": 1.4696, "step": 20989 }, { "epoch": 1.65, "learning_rate": 0.00012628888061680198, "loss": 1.4645, "step": 20990 }, { "epoch": 1.65, "learning_rate": 0.00012627667637679703, "loss": 1.5438, "step": 20991 }, { "epoch": 1.65, "learning_rate": 0.00012626447229786036, "loss": 1.4907, "step": 20992 }, { "epoch": 1.65, "learning_rate": 0.00012625226838007487, "loss": 1.4812, "step": 20993 }, { "epoch": 1.65, "learning_rate": 0.00012624006462352334, "loss": 1.429, "step": 20994 }, { "epoch": 1.65, "learning_rate": 0.0001262278610282887, "loss": 1.5502, "step": 20995 }, { "epoch": 1.65, "learning_rate": 0.0001262156575944537, "loss": 1.5093, "step": 20996 }, { "epoch": 1.65, "learning_rate": 0.00012620345432210126, "loss": 1.4856, "step": 20997 }, { "epoch": 1.65, "learning_rate": 0.0001261912512113143, "loss": 1.5389, "step": 20998 }, { "epoch": 1.65, "learning_rate": 0.00012617904826217556, "loss": 1.5046, "step": 20999 }, { "epoch": 1.65, "learning_rate": 0.00012616684547476795, "loss": 1.5003, "step": 21000 }, { "epoch": 1.65, "learning_rate": 0.0001261546428491743, "loss": 1.4645, "step": 21001 }, { "epoch": 1.65, "learning_rate": 0.00012614244038547745, "loss": 1.508, "step": 21002 }, { "epoch": 1.65, "learning_rate": 0.00012613023808376032, "loss": 1.5294, "step": 21003 }, { "epoch": 1.65, "learning_rate": 0.00012611803594410564, "loss": 1.4645, "step": 21004 }, { "epoch": 1.65, "learning_rate": 0.0001261058339665963, "loss": 1.5298, "step": 21005 }, { "epoch": 1.65, "learning_rate": 0.00012609363215131518, "loss": 1.546, "step": 21006 }, { "epoch": 1.65, "learning_rate": 0.00012608143049834514, "loss": 1.4668, "step": 21007 }, { "epoch": 1.65, "learning_rate": 0.00012606922900776897, "loss": 1.487, "step": 21008 }, { "epoch": 1.65, "learning_rate": 0.00012605702767966954, "loss": 1.4842, "step": 21009 }, { "epoch": 1.65, "learning_rate": 0.00012604482651412967, "loss": 1.5204, "step": 21010 }, { "epoch": 1.65, "learning_rate": 0.0001260326255112322, "loss": 1.5238, "step": 21011 }, { "epoch": 1.65, "learning_rate": 0.00012602042467106003, "loss": 1.4815, "step": 21012 }, { "epoch": 1.65, "learning_rate": 0.00012600822399369587, "loss": 1.5448, "step": 21013 }, { "epoch": 1.65, "learning_rate": 0.00012599602347922265, "loss": 1.5228, "step": 21014 }, { "epoch": 1.65, "learning_rate": 0.0001259838231277232, "loss": 1.516, "step": 21015 }, { "epoch": 1.65, "learning_rate": 0.00012597162293928035, "loss": 1.4558, "step": 21016 }, { "epoch": 1.65, "learning_rate": 0.0001259594229139769, "loss": 1.4939, "step": 21017 }, { "epoch": 1.65, "learning_rate": 0.0001259472230518957, "loss": 1.4971, "step": 21018 }, { "epoch": 1.65, "learning_rate": 0.00012593502335311957, "loss": 1.512, "step": 21019 }, { "epoch": 1.65, "learning_rate": 0.0001259228238177314, "loss": 1.503, "step": 21020 }, { "epoch": 1.65, "learning_rate": 0.00012591062444581384, "loss": 1.4863, "step": 21021 }, { "epoch": 1.65, "learning_rate": 0.00012589842523744998, "loss": 1.4528, "step": 21022 }, { "epoch": 1.65, "learning_rate": 0.00012588622619272245, "loss": 1.4875, "step": 21023 }, { "epoch": 1.65, "learning_rate": 0.0001258740273117142, "loss": 1.4603, "step": 21024 }, { "epoch": 1.65, "learning_rate": 0.00012586182859450793, "loss": 1.4804, "step": 21025 }, { "epoch": 1.65, "learning_rate": 0.00012584963004118652, "loss": 1.5493, "step": 21026 }, { "epoch": 1.65, "learning_rate": 0.00012583743165183286, "loss": 1.4975, "step": 21027 }, { "epoch": 1.65, "learning_rate": 0.00012582523342652966, "loss": 1.5556, "step": 21028 }, { "epoch": 1.65, "learning_rate": 0.0001258130353653598, "loss": 1.5211, "step": 21029 }, { "epoch": 1.65, "learning_rate": 0.00012580083746840606, "loss": 1.5239, "step": 21030 }, { "epoch": 1.65, "learning_rate": 0.0001257886397357513, "loss": 1.4871, "step": 21031 }, { "epoch": 1.65, "learning_rate": 0.0001257764421674783, "loss": 1.4641, "step": 21032 }, { "epoch": 1.65, "learning_rate": 0.00012576424476366991, "loss": 1.5491, "step": 21033 }, { "epoch": 1.65, "learning_rate": 0.00012575204752440889, "loss": 1.4725, "step": 21034 }, { "epoch": 1.66, "learning_rate": 0.00012573985044977813, "loss": 1.5207, "step": 21035 }, { "epoch": 1.66, "learning_rate": 0.00012572765353986032, "loss": 1.5062, "step": 21036 }, { "epoch": 1.66, "learning_rate": 0.0001257154567947384, "loss": 1.5421, "step": 21037 }, { "epoch": 1.66, "learning_rate": 0.0001257032602144951, "loss": 1.4578, "step": 21038 }, { "epoch": 1.66, "learning_rate": 0.00012569106379921332, "loss": 1.5071, "step": 21039 }, { "epoch": 1.66, "learning_rate": 0.00012567886754897574, "loss": 1.4432, "step": 21040 }, { "epoch": 1.66, "learning_rate": 0.00012566667146386528, "loss": 1.5124, "step": 21041 }, { "epoch": 1.66, "learning_rate": 0.00012565447554396467, "loss": 1.5155, "step": 21042 }, { "epoch": 1.66, "learning_rate": 0.00012564227978935672, "loss": 1.5076, "step": 21043 }, { "epoch": 1.66, "learning_rate": 0.00012563008420012428, "loss": 1.5524, "step": 21044 }, { "epoch": 1.66, "learning_rate": 0.00012561788877635008, "loss": 1.4636, "step": 21045 }, { "epoch": 1.66, "learning_rate": 0.00012560569351811697, "loss": 1.4983, "step": 21046 }, { "epoch": 1.66, "learning_rate": 0.00012559349842550778, "loss": 1.5195, "step": 21047 }, { "epoch": 1.66, "learning_rate": 0.00012558130349860522, "loss": 1.461, "step": 21048 }, { "epoch": 1.66, "learning_rate": 0.0001255691087374922, "loss": 1.5016, "step": 21049 }, { "epoch": 1.66, "learning_rate": 0.00012555691414225137, "loss": 1.5344, "step": 21050 }, { "epoch": 1.66, "learning_rate": 0.00012554471971296563, "loss": 1.459, "step": 21051 }, { "epoch": 1.66, "learning_rate": 0.0001255325254497177, "loss": 1.4809, "step": 21052 }, { "epoch": 1.66, "learning_rate": 0.0001255203313525905, "loss": 1.4765, "step": 21053 }, { "epoch": 1.66, "learning_rate": 0.0001255081374216667, "loss": 1.5284, "step": 21054 }, { "epoch": 1.66, "learning_rate": 0.00012549594365702914, "loss": 1.4683, "step": 21055 }, { "epoch": 1.66, "learning_rate": 0.00012548375005876062, "loss": 1.5303, "step": 21056 }, { "epoch": 1.66, "learning_rate": 0.00012547155662694388, "loss": 1.5085, "step": 21057 }, { "epoch": 1.66, "learning_rate": 0.00012545936336166177, "loss": 1.4855, "step": 21058 }, { "epoch": 1.66, "learning_rate": 0.000125447170262997, "loss": 1.5345, "step": 21059 }, { "epoch": 1.66, "learning_rate": 0.0001254349773310324, "loss": 1.5119, "step": 21060 }, { "epoch": 1.66, "learning_rate": 0.00012542278456585077, "loss": 1.5322, "step": 21061 }, { "epoch": 1.66, "learning_rate": 0.00012541059196753487, "loss": 1.52, "step": 21062 }, { "epoch": 1.66, "learning_rate": 0.00012539839953616745, "loss": 1.4737, "step": 21063 }, { "epoch": 1.66, "learning_rate": 0.00012538620727183135, "loss": 1.5536, "step": 21064 }, { "epoch": 1.66, "learning_rate": 0.00012537401517460933, "loss": 1.497, "step": 21065 }, { "epoch": 1.66, "learning_rate": 0.00012536182324458415, "loss": 1.4993, "step": 21066 }, { "epoch": 1.66, "learning_rate": 0.00012534963148183858, "loss": 1.5199, "step": 21067 }, { "epoch": 1.66, "learning_rate": 0.00012533743988645536, "loss": 1.5112, "step": 21068 }, { "epoch": 1.66, "learning_rate": 0.00012532524845851735, "loss": 1.4488, "step": 21069 }, { "epoch": 1.66, "learning_rate": 0.0001253130571981073, "loss": 1.4815, "step": 21070 }, { "epoch": 1.66, "learning_rate": 0.00012530086610530798, "loss": 1.4565, "step": 21071 }, { "epoch": 1.66, "learning_rate": 0.00012528867518020212, "loss": 1.5093, "step": 21072 }, { "epoch": 1.66, "learning_rate": 0.00012527648442287254, "loss": 1.4984, "step": 21073 }, { "epoch": 1.66, "learning_rate": 0.00012526429383340199, "loss": 1.4905, "step": 21074 }, { "epoch": 1.66, "learning_rate": 0.00012525210341187323, "loss": 1.5741, "step": 21075 }, { "epoch": 1.66, "learning_rate": 0.00012523991315836904, "loss": 1.4425, "step": 21076 }, { "epoch": 1.66, "learning_rate": 0.00012522772307297216, "loss": 1.5116, "step": 21077 }, { "epoch": 1.66, "learning_rate": 0.00012521553315576539, "loss": 1.5003, "step": 21078 }, { "epoch": 1.66, "learning_rate": 0.00012520334340683145, "loss": 1.5115, "step": 21079 }, { "epoch": 1.66, "learning_rate": 0.00012519115382625311, "loss": 1.4693, "step": 21080 }, { "epoch": 1.66, "learning_rate": 0.0001251789644141132, "loss": 1.4645, "step": 21081 }, { "epoch": 1.66, "learning_rate": 0.00012516677517049438, "loss": 1.4905, "step": 21082 }, { "epoch": 1.66, "learning_rate": 0.00012515458609547948, "loss": 1.4778, "step": 21083 }, { "epoch": 1.66, "learning_rate": 0.00012514239718915113, "loss": 1.5438, "step": 21084 }, { "epoch": 1.66, "learning_rate": 0.0001251302084515923, "loss": 1.5387, "step": 21085 }, { "epoch": 1.66, "learning_rate": 0.00012511801988288558, "loss": 1.5163, "step": 21086 }, { "epoch": 1.66, "learning_rate": 0.00012510583148311384, "loss": 1.5232, "step": 21087 }, { "epoch": 1.66, "learning_rate": 0.0001250936432523597, "loss": 1.5432, "step": 21088 }, { "epoch": 1.66, "learning_rate": 0.00012508145519070596, "loss": 1.4641, "step": 21089 }, { "epoch": 1.66, "learning_rate": 0.00012506926729823547, "loss": 1.4768, "step": 21090 }, { "epoch": 1.66, "learning_rate": 0.00012505707957503084, "loss": 1.4961, "step": 21091 }, { "epoch": 1.66, "learning_rate": 0.00012504489202117485, "loss": 1.511, "step": 21092 }, { "epoch": 1.66, "learning_rate": 0.00012503270463675036, "loss": 1.5203, "step": 21093 }, { "epoch": 1.66, "learning_rate": 0.00012502051742183996, "loss": 1.5386, "step": 21094 }, { "epoch": 1.66, "learning_rate": 0.0001250083303765265, "loss": 1.4964, "step": 21095 }, { "epoch": 1.66, "learning_rate": 0.00012499614350089264, "loss": 1.429, "step": 21096 }, { "epoch": 1.66, "learning_rate": 0.00012498395679502117, "loss": 1.4949, "step": 21097 }, { "epoch": 1.66, "learning_rate": 0.00012497177025899489, "loss": 1.5083, "step": 21098 }, { "epoch": 1.66, "learning_rate": 0.0001249595838928964, "loss": 1.5346, "step": 21099 }, { "epoch": 1.66, "learning_rate": 0.00012494739769680854, "loss": 1.4961, "step": 21100 }, { "epoch": 1.66, "learning_rate": 0.00012493521167081402, "loss": 1.496, "step": 21101 }, { "epoch": 1.66, "learning_rate": 0.00012492302581499563, "loss": 1.4744, "step": 21102 }, { "epoch": 1.66, "learning_rate": 0.000124910840129436, "loss": 1.489, "step": 21103 }, { "epoch": 1.66, "learning_rate": 0.00012489865461421794, "loss": 1.4956, "step": 21104 }, { "epoch": 1.66, "learning_rate": 0.0001248864692694242, "loss": 1.5077, "step": 21105 }, { "epoch": 1.66, "learning_rate": 0.00012487428409513744, "loss": 1.5525, "step": 21106 }, { "epoch": 1.66, "learning_rate": 0.00012486209909144045, "loss": 1.5155, "step": 21107 }, { "epoch": 1.66, "learning_rate": 0.0001248499142584159, "loss": 1.4572, "step": 21108 }, { "epoch": 1.66, "learning_rate": 0.00012483772959614656, "loss": 1.5525, "step": 21109 }, { "epoch": 1.66, "learning_rate": 0.00012482554510471518, "loss": 1.5293, "step": 21110 }, { "epoch": 1.66, "learning_rate": 0.00012481336078420442, "loss": 1.4867, "step": 21111 }, { "epoch": 1.66, "learning_rate": 0.00012480117663469706, "loss": 1.4974, "step": 21112 }, { "epoch": 1.66, "learning_rate": 0.0001247889926562758, "loss": 1.5133, "step": 21113 }, { "epoch": 1.66, "learning_rate": 0.00012477680884902338, "loss": 1.4684, "step": 21114 }, { "epoch": 1.66, "learning_rate": 0.00012476462521302244, "loss": 1.483, "step": 21115 }, { "epoch": 1.66, "learning_rate": 0.00012475244174835586, "loss": 1.4557, "step": 21116 }, { "epoch": 1.66, "learning_rate": 0.0001247402584551062, "loss": 1.4987, "step": 21117 }, { "epoch": 1.66, "learning_rate": 0.00012472807533335625, "loss": 1.5232, "step": 21118 }, { "epoch": 1.66, "learning_rate": 0.0001247158923831888, "loss": 1.5314, "step": 21119 }, { "epoch": 1.66, "learning_rate": 0.00012470370960468641, "loss": 1.5236, "step": 21120 }, { "epoch": 1.66, "learning_rate": 0.00012469152699793188, "loss": 1.4819, "step": 21121 }, { "epoch": 1.66, "learning_rate": 0.00012467934456300797, "loss": 1.5152, "step": 21122 }, { "epoch": 1.66, "learning_rate": 0.0001246671622999973, "loss": 1.5385, "step": 21123 }, { "epoch": 1.66, "learning_rate": 0.00012465498020898264, "loss": 1.491, "step": 21124 }, { "epoch": 1.66, "learning_rate": 0.00012464279829004665, "loss": 1.4984, "step": 21125 }, { "epoch": 1.66, "learning_rate": 0.00012463061654327206, "loss": 1.4662, "step": 21126 }, { "epoch": 1.66, "learning_rate": 0.00012461843496874164, "loss": 1.4901, "step": 21127 }, { "epoch": 1.66, "learning_rate": 0.00012460625356653797, "loss": 1.4673, "step": 21128 }, { "epoch": 1.66, "learning_rate": 0.00012459407233674383, "loss": 1.5409, "step": 21129 }, { "epoch": 1.66, "learning_rate": 0.00012458189127944198, "loss": 1.5017, "step": 21130 }, { "epoch": 1.66, "learning_rate": 0.00012456971039471497, "loss": 1.4836, "step": 21131 }, { "epoch": 1.66, "learning_rate": 0.00012455752968264564, "loss": 1.4845, "step": 21132 }, { "epoch": 1.66, "learning_rate": 0.00012454534914331666, "loss": 1.4616, "step": 21133 }, { "epoch": 1.66, "learning_rate": 0.00012453316877681072, "loss": 1.5253, "step": 21134 }, { "epoch": 1.66, "learning_rate": 0.00012452098858321047, "loss": 1.4878, "step": 21135 }, { "epoch": 1.66, "learning_rate": 0.0001245088085625987, "loss": 1.4801, "step": 21136 }, { "epoch": 1.66, "learning_rate": 0.000124496628715058, "loss": 1.5179, "step": 21137 }, { "epoch": 1.66, "learning_rate": 0.00012448444904067114, "loss": 1.5277, "step": 21138 }, { "epoch": 1.66, "learning_rate": 0.0001244722695395208, "loss": 1.5076, "step": 21139 }, { "epoch": 1.66, "learning_rate": 0.00012446009021168964, "loss": 1.4864, "step": 21140 }, { "epoch": 1.66, "learning_rate": 0.00012444791105726042, "loss": 1.491, "step": 21141 }, { "epoch": 1.66, "learning_rate": 0.00012443573207631572, "loss": 1.4988, "step": 21142 }, { "epoch": 1.66, "learning_rate": 0.00012442355326893834, "loss": 1.486, "step": 21143 }, { "epoch": 1.66, "learning_rate": 0.0001244113746352109, "loss": 1.5021, "step": 21144 }, { "epoch": 1.66, "learning_rate": 0.0001243991961752161, "loss": 1.477, "step": 21145 }, { "epoch": 1.66, "learning_rate": 0.00012438701788903658, "loss": 1.4851, "step": 21146 }, { "epoch": 1.66, "learning_rate": 0.00012437483977675512, "loss": 1.5169, "step": 21147 }, { "epoch": 1.66, "learning_rate": 0.0001243626618384544, "loss": 1.5148, "step": 21148 }, { "epoch": 1.66, "learning_rate": 0.000124350484074217, "loss": 1.4509, "step": 21149 }, { "epoch": 1.66, "learning_rate": 0.0001243383064841257, "loss": 1.524, "step": 21150 }, { "epoch": 1.66, "learning_rate": 0.00012432612906826312, "loss": 1.4861, "step": 21151 }, { "epoch": 1.66, "learning_rate": 0.00012431395182671193, "loss": 1.5201, "step": 21152 }, { "epoch": 1.66, "learning_rate": 0.00012430177475955488, "loss": 1.5597, "step": 21153 }, { "epoch": 1.66, "learning_rate": 0.00012428959786687458, "loss": 1.4812, "step": 21154 }, { "epoch": 1.66, "learning_rate": 0.0001242774211487537, "loss": 1.488, "step": 21155 }, { "epoch": 1.66, "learning_rate": 0.00012426524460527498, "loss": 1.4975, "step": 21156 }, { "epoch": 1.66, "learning_rate": 0.000124253068236521, "loss": 1.5283, "step": 21157 }, { "epoch": 1.66, "learning_rate": 0.0001242408920425745, "loss": 1.4898, "step": 21158 }, { "epoch": 1.66, "learning_rate": 0.00012422871602351816, "loss": 1.483, "step": 21159 }, { "epoch": 1.66, "learning_rate": 0.00012421654017943457, "loss": 1.5013, "step": 21160 }, { "epoch": 1.66, "learning_rate": 0.00012420436451040647, "loss": 1.4935, "step": 21161 }, { "epoch": 1.67, "learning_rate": 0.0001241921890165164, "loss": 1.5478, "step": 21162 }, { "epoch": 1.67, "learning_rate": 0.00012418001369784727, "loss": 1.5513, "step": 21163 }, { "epoch": 1.67, "learning_rate": 0.0001241678385544815, "loss": 1.5083, "step": 21164 }, { "epoch": 1.67, "learning_rate": 0.00012415566358650192, "loss": 1.524, "step": 21165 }, { "epoch": 1.67, "learning_rate": 0.0001241434887939911, "loss": 1.5242, "step": 21166 }, { "epoch": 1.67, "learning_rate": 0.00012413131417703168, "loss": 1.5072, "step": 21167 }, { "epoch": 1.67, "learning_rate": 0.0001241191397357064, "loss": 1.5017, "step": 21168 }, { "epoch": 1.67, "learning_rate": 0.00012410696547009788, "loss": 1.5253, "step": 21169 }, { "epoch": 1.67, "learning_rate": 0.0001240947913802888, "loss": 1.5816, "step": 21170 }, { "epoch": 1.67, "learning_rate": 0.00012408261746636175, "loss": 1.5197, "step": 21171 }, { "epoch": 1.67, "learning_rate": 0.00012407044372839943, "loss": 1.5041, "step": 21172 }, { "epoch": 1.67, "learning_rate": 0.00012405827016648453, "loss": 1.5085, "step": 21173 }, { "epoch": 1.67, "learning_rate": 0.0001240460967806996, "loss": 1.4762, "step": 21174 }, { "epoch": 1.67, "learning_rate": 0.00012403392357112738, "loss": 1.5228, "step": 21175 }, { "epoch": 1.67, "learning_rate": 0.0001240217505378505, "loss": 1.4792, "step": 21176 }, { "epoch": 1.67, "learning_rate": 0.00012400957768095156, "loss": 1.5102, "step": 21177 }, { "epoch": 1.67, "learning_rate": 0.00012399740500051323, "loss": 1.4882, "step": 21178 }, { "epoch": 1.67, "learning_rate": 0.00012398523249661822, "loss": 1.5305, "step": 21179 }, { "epoch": 1.67, "learning_rate": 0.00012397306016934912, "loss": 1.4876, "step": 21180 }, { "epoch": 1.67, "learning_rate": 0.00012396088801878857, "loss": 1.4954, "step": 21181 }, { "epoch": 1.67, "learning_rate": 0.00012394871604501923, "loss": 1.5377, "step": 21182 }, { "epoch": 1.67, "learning_rate": 0.00012393654424812373, "loss": 1.5149, "step": 21183 }, { "epoch": 1.67, "learning_rate": 0.00012392437262818468, "loss": 1.5258, "step": 21184 }, { "epoch": 1.67, "learning_rate": 0.0001239122011852848, "loss": 1.4927, "step": 21185 }, { "epoch": 1.67, "learning_rate": 0.00012390002991950663, "loss": 1.5319, "step": 21186 }, { "epoch": 1.67, "learning_rate": 0.00012388785883093287, "loss": 1.505, "step": 21187 }, { "epoch": 1.67, "learning_rate": 0.00012387568791964618, "loss": 1.4866, "step": 21188 }, { "epoch": 1.67, "learning_rate": 0.00012386351718572913, "loss": 1.5032, "step": 21189 }, { "epoch": 1.67, "learning_rate": 0.00012385134662926437, "loss": 1.5263, "step": 21190 }, { "epoch": 1.67, "learning_rate": 0.00012383917625033452, "loss": 1.4591, "step": 21191 }, { "epoch": 1.67, "learning_rate": 0.00012382700604902222, "loss": 1.498, "step": 21192 }, { "epoch": 1.67, "learning_rate": 0.00012381483602541015, "loss": 1.4554, "step": 21193 }, { "epoch": 1.67, "learning_rate": 0.00012380266617958082, "loss": 1.4753, "step": 21194 }, { "epoch": 1.67, "learning_rate": 0.00012379049651161696, "loss": 1.5304, "step": 21195 }, { "epoch": 1.67, "learning_rate": 0.00012377832702160116, "loss": 1.5089, "step": 21196 }, { "epoch": 1.67, "learning_rate": 0.0001237661577096161, "loss": 1.4948, "step": 21197 }, { "epoch": 1.67, "learning_rate": 0.00012375398857574432, "loss": 1.5611, "step": 21198 }, { "epoch": 1.67, "learning_rate": 0.00012374181962006848, "loss": 1.5484, "step": 21199 }, { "epoch": 1.67, "learning_rate": 0.00012372965084267117, "loss": 1.5428, "step": 21200 }, { "epoch": 1.67, "learning_rate": 0.00012371748224363505, "loss": 1.4486, "step": 21201 }, { "epoch": 1.67, "learning_rate": 0.00012370531382304274, "loss": 1.4573, "step": 21202 }, { "epoch": 1.67, "learning_rate": 0.00012369314558097682, "loss": 1.4977, "step": 21203 }, { "epoch": 1.67, "learning_rate": 0.00012368097751751993, "loss": 1.4808, "step": 21204 }, { "epoch": 1.67, "learning_rate": 0.0001236688096327547, "loss": 1.5489, "step": 21205 }, { "epoch": 1.67, "learning_rate": 0.00012365664192676368, "loss": 1.5064, "step": 21206 }, { "epoch": 1.67, "learning_rate": 0.00012364447439962956, "loss": 1.476, "step": 21207 }, { "epoch": 1.67, "learning_rate": 0.00012363230705143488, "loss": 1.4458, "step": 21208 }, { "epoch": 1.67, "learning_rate": 0.00012362013988226228, "loss": 1.5033, "step": 21209 }, { "epoch": 1.67, "learning_rate": 0.00012360797289219438, "loss": 1.4532, "step": 21210 }, { "epoch": 1.67, "learning_rate": 0.0001235958060813138, "loss": 1.5649, "step": 21211 }, { "epoch": 1.67, "learning_rate": 0.00012358363944970312, "loss": 1.5217, "step": 21212 }, { "epoch": 1.67, "learning_rate": 0.00012357147299744495, "loss": 1.4957, "step": 21213 }, { "epoch": 1.67, "learning_rate": 0.00012355930672462188, "loss": 1.4544, "step": 21214 }, { "epoch": 1.67, "learning_rate": 0.00012354714063131654, "loss": 1.5302, "step": 21215 }, { "epoch": 1.67, "learning_rate": 0.00012353497471761151, "loss": 1.4729, "step": 21216 }, { "epoch": 1.67, "learning_rate": 0.00012352280898358944, "loss": 1.5031, "step": 21217 }, { "epoch": 1.67, "learning_rate": 0.00012351064342933283, "loss": 1.4977, "step": 21218 }, { "epoch": 1.67, "learning_rate": 0.00012349847805492438, "loss": 1.4941, "step": 21219 }, { "epoch": 1.67, "learning_rate": 0.0001234863128604466, "loss": 1.481, "step": 21220 }, { "epoch": 1.67, "learning_rate": 0.00012347414784598214, "loss": 1.4848, "step": 21221 }, { "epoch": 1.67, "learning_rate": 0.00012346198301161357, "loss": 1.4578, "step": 21222 }, { "epoch": 1.67, "learning_rate": 0.0001234498183574235, "loss": 1.487, "step": 21223 }, { "epoch": 1.67, "learning_rate": 0.0001234376538834945, "loss": 1.4395, "step": 21224 }, { "epoch": 1.67, "learning_rate": 0.00012342548958990912, "loss": 1.4484, "step": 21225 }, { "epoch": 1.67, "learning_rate": 0.00012341332547675008, "loss": 1.544, "step": 21226 }, { "epoch": 1.67, "learning_rate": 0.00012340116154409985, "loss": 1.5079, "step": 21227 }, { "epoch": 1.67, "learning_rate": 0.00012338899779204107, "loss": 1.5057, "step": 21228 }, { "epoch": 1.67, "learning_rate": 0.00012337683422065633, "loss": 1.5528, "step": 21229 }, { "epoch": 1.67, "learning_rate": 0.00012336467083002816, "loss": 1.4466, "step": 21230 }, { "epoch": 1.67, "learning_rate": 0.0001233525076202392, "loss": 1.536, "step": 21231 }, { "epoch": 1.67, "learning_rate": 0.000123340344591372, "loss": 1.54, "step": 21232 }, { "epoch": 1.67, "learning_rate": 0.00012332818174350915, "loss": 1.4931, "step": 21233 }, { "epoch": 1.67, "learning_rate": 0.00012331601907673322, "loss": 1.4745, "step": 21234 }, { "epoch": 1.67, "learning_rate": 0.00012330385659112681, "loss": 1.5217, "step": 21235 }, { "epoch": 1.67, "learning_rate": 0.0001232916942867725, "loss": 1.5158, "step": 21236 }, { "epoch": 1.67, "learning_rate": 0.0001232795321637528, "loss": 1.5001, "step": 21237 }, { "epoch": 1.67, "learning_rate": 0.00012326737022215034, "loss": 1.4981, "step": 21238 }, { "epoch": 1.67, "learning_rate": 0.0001232552084620477, "loss": 1.469, "step": 21239 }, { "epoch": 1.67, "learning_rate": 0.00012324304688352743, "loss": 1.4726, "step": 21240 }, { "epoch": 1.67, "learning_rate": 0.00012323088548667205, "loss": 1.5154, "step": 21241 }, { "epoch": 1.67, "learning_rate": 0.00012321872427156424, "loss": 1.4398, "step": 21242 }, { "epoch": 1.67, "learning_rate": 0.00012320656323828652, "loss": 1.542, "step": 21243 }, { "epoch": 1.67, "learning_rate": 0.00012319440238692144, "loss": 1.4823, "step": 21244 }, { "epoch": 1.67, "learning_rate": 0.00012318224171755157, "loss": 1.5124, "step": 21245 }, { "epoch": 1.67, "learning_rate": 0.00012317008123025953, "loss": 1.5221, "step": 21246 }, { "epoch": 1.67, "learning_rate": 0.00012315792092512776, "loss": 1.4478, "step": 21247 }, { "epoch": 1.67, "learning_rate": 0.00012314576080223896, "loss": 1.51, "step": 21248 }, { "epoch": 1.67, "learning_rate": 0.00012313360086167556, "loss": 1.5527, "step": 21249 }, { "epoch": 1.67, "learning_rate": 0.0001231214411035202, "loss": 1.492, "step": 21250 }, { "epoch": 1.67, "learning_rate": 0.00012310928152785546, "loss": 1.5022, "step": 21251 }, { "epoch": 1.67, "learning_rate": 0.00012309712213476383, "loss": 1.4677, "step": 21252 }, { "epoch": 1.67, "learning_rate": 0.00012308496292432792, "loss": 1.531, "step": 21253 }, { "epoch": 1.67, "learning_rate": 0.00012307280389663023, "loss": 1.5035, "step": 21254 }, { "epoch": 1.67, "learning_rate": 0.00012306064505175334, "loss": 1.4816, "step": 21255 }, { "epoch": 1.67, "learning_rate": 0.00012304848638977978, "loss": 1.5128, "step": 21256 }, { "epoch": 1.67, "learning_rate": 0.00012303632791079214, "loss": 1.5558, "step": 21257 }, { "epoch": 1.67, "learning_rate": 0.000123024169614873, "loss": 1.4896, "step": 21258 }, { "epoch": 1.67, "learning_rate": 0.0001230120115021048, "loss": 1.5013, "step": 21259 }, { "epoch": 1.67, "learning_rate": 0.00012299985357257023, "loss": 1.4947, "step": 21260 }, { "epoch": 1.67, "learning_rate": 0.0001229876958263517, "loss": 1.4987, "step": 21261 }, { "epoch": 1.67, "learning_rate": 0.00012297553826353178, "loss": 1.5189, "step": 21262 }, { "epoch": 1.67, "learning_rate": 0.0001229633808841931, "loss": 1.5124, "step": 21263 }, { "epoch": 1.67, "learning_rate": 0.0001229512236884181, "loss": 1.5027, "step": 21264 }, { "epoch": 1.67, "learning_rate": 0.00012293906667628943, "loss": 1.501, "step": 21265 }, { "epoch": 1.67, "learning_rate": 0.0001229269098478895, "loss": 1.4797, "step": 21266 }, { "epoch": 1.67, "learning_rate": 0.00012291475320330093, "loss": 1.4768, "step": 21267 }, { "epoch": 1.67, "learning_rate": 0.00012290259674260624, "loss": 1.4859, "step": 21268 }, { "epoch": 1.67, "learning_rate": 0.00012289044046588795, "loss": 1.4962, "step": 21269 }, { "epoch": 1.67, "learning_rate": 0.00012287828437322862, "loss": 1.4716, "step": 21270 }, { "epoch": 1.67, "learning_rate": 0.00012286612846471078, "loss": 1.4764, "step": 21271 }, { "epoch": 1.67, "learning_rate": 0.0001228539727404169, "loss": 1.5017, "step": 21272 }, { "epoch": 1.67, "learning_rate": 0.0001228418172004296, "loss": 1.5362, "step": 21273 }, { "epoch": 1.67, "learning_rate": 0.0001228296618448314, "loss": 1.4851, "step": 21274 }, { "epoch": 1.67, "learning_rate": 0.0001228175066737048, "loss": 1.5003, "step": 21275 }, { "epoch": 1.67, "learning_rate": 0.00012280535168713232, "loss": 1.5637, "step": 21276 }, { "epoch": 1.67, "learning_rate": 0.00012279319688519652, "loss": 1.5072, "step": 21277 }, { "epoch": 1.67, "learning_rate": 0.00012278104226797986, "loss": 1.4891, "step": 21278 }, { "epoch": 1.67, "learning_rate": 0.0001227688878355649, "loss": 1.5303, "step": 21279 }, { "epoch": 1.67, "learning_rate": 0.0001227567335880342, "loss": 1.5231, "step": 21280 }, { "epoch": 1.67, "learning_rate": 0.00012274457952547022, "loss": 1.4983, "step": 21281 }, { "epoch": 1.67, "learning_rate": 0.0001227324256479555, "loss": 1.4658, "step": 21282 }, { "epoch": 1.67, "learning_rate": 0.00012272027195557258, "loss": 1.4953, "step": 21283 }, { "epoch": 1.67, "learning_rate": 0.00012270811844840394, "loss": 1.4629, "step": 21284 }, { "epoch": 1.67, "learning_rate": 0.00012269596512653216, "loss": 1.4505, "step": 21285 }, { "epoch": 1.67, "learning_rate": 0.00012268381199003966, "loss": 1.5504, "step": 21286 }, { "epoch": 1.67, "learning_rate": 0.000122671659039009, "loss": 1.484, "step": 21287 }, { "epoch": 1.67, "learning_rate": 0.00012265950627352268, "loss": 1.5077, "step": 21288 }, { "epoch": 1.68, "learning_rate": 0.00012264735369366329, "loss": 1.4747, "step": 21289 }, { "epoch": 1.68, "learning_rate": 0.0001226352012995132, "loss": 1.5046, "step": 21290 }, { "epoch": 1.68, "learning_rate": 0.00012262304909115503, "loss": 1.5168, "step": 21291 }, { "epoch": 1.68, "learning_rate": 0.00012261089706867127, "loss": 1.5027, "step": 21292 }, { "epoch": 1.68, "learning_rate": 0.00012259874523214438, "loss": 1.5706, "step": 21293 }, { "epoch": 1.68, "learning_rate": 0.0001225865935816569, "loss": 1.5313, "step": 21294 }, { "epoch": 1.68, "learning_rate": 0.0001225744421172913, "loss": 1.4795, "step": 21295 }, { "epoch": 1.68, "learning_rate": 0.00012256229083913012, "loss": 1.5459, "step": 21296 }, { "epoch": 1.68, "learning_rate": 0.00012255013974725587, "loss": 1.4756, "step": 21297 }, { "epoch": 1.68, "learning_rate": 0.00012253798884175098, "loss": 1.5189, "step": 21298 }, { "epoch": 1.68, "learning_rate": 0.000122525838122698, "loss": 1.5421, "step": 21299 }, { "epoch": 1.68, "learning_rate": 0.00012251368759017944, "loss": 1.5024, "step": 21300 }, { "epoch": 1.68, "learning_rate": 0.00012250153724427775, "loss": 1.533, "step": 21301 }, { "epoch": 1.68, "learning_rate": 0.00012248938708507549, "loss": 1.5192, "step": 21302 }, { "epoch": 1.68, "learning_rate": 0.00012247723711265504, "loss": 1.4132, "step": 21303 }, { "epoch": 1.68, "learning_rate": 0.00012246508732709894, "loss": 1.4636, "step": 21304 }, { "epoch": 1.68, "learning_rate": 0.00012245293772848977, "loss": 1.4879, "step": 21305 }, { "epoch": 1.68, "learning_rate": 0.00012244078831690993, "loss": 1.5046, "step": 21306 }, { "epoch": 1.68, "learning_rate": 0.00012242863909244195, "loss": 1.5333, "step": 21307 }, { "epoch": 1.68, "learning_rate": 0.00012241649005516827, "loss": 1.5256, "step": 21308 }, { "epoch": 1.68, "learning_rate": 0.00012240434120517143, "loss": 1.5138, "step": 21309 }, { "epoch": 1.68, "learning_rate": 0.00012239219254253387, "loss": 1.545, "step": 21310 }, { "epoch": 1.68, "learning_rate": 0.0001223800440673381, "loss": 1.5385, "step": 21311 }, { "epoch": 1.68, "learning_rate": 0.00012236789577966655, "loss": 1.5394, "step": 21312 }, { "epoch": 1.68, "learning_rate": 0.00012235574767960176, "loss": 1.5179, "step": 21313 }, { "epoch": 1.68, "learning_rate": 0.00012234359976722622, "loss": 1.4832, "step": 21314 }, { "epoch": 1.68, "learning_rate": 0.00012233145204262232, "loss": 1.5222, "step": 21315 }, { "epoch": 1.68, "learning_rate": 0.00012231930450587263, "loss": 1.5096, "step": 21316 }, { "epoch": 1.68, "learning_rate": 0.00012230715715705958, "loss": 1.5033, "step": 21317 }, { "epoch": 1.68, "learning_rate": 0.00012229500999626564, "loss": 1.5265, "step": 21318 }, { "epoch": 1.68, "learning_rate": 0.00012228286302357327, "loss": 1.5077, "step": 21319 }, { "epoch": 1.68, "learning_rate": 0.00012227071623906497, "loss": 1.4834, "step": 21320 }, { "epoch": 1.68, "learning_rate": 0.00012225856964282326, "loss": 1.5262, "step": 21321 }, { "epoch": 1.68, "learning_rate": 0.0001222464232349305, "loss": 1.4501, "step": 21322 }, { "epoch": 1.68, "learning_rate": 0.00012223427701546925, "loss": 1.4505, "step": 21323 }, { "epoch": 1.68, "learning_rate": 0.00012222213098452193, "loss": 1.4941, "step": 21324 }, { "epoch": 1.68, "learning_rate": 0.000122209985142171, "loss": 1.4711, "step": 21325 }, { "epoch": 1.68, "learning_rate": 0.00012219783948849892, "loss": 1.5277, "step": 21326 }, { "epoch": 1.68, "learning_rate": 0.0001221856940235882, "loss": 1.4374, "step": 21327 }, { "epoch": 1.68, "learning_rate": 0.00012217354874752124, "loss": 1.5413, "step": 21328 }, { "epoch": 1.68, "learning_rate": 0.00012216140366038056, "loss": 1.4866, "step": 21329 }, { "epoch": 1.68, "learning_rate": 0.00012214925876224855, "loss": 1.5087, "step": 21330 }, { "epoch": 1.68, "learning_rate": 0.00012213711405320774, "loss": 1.5399, "step": 21331 }, { "epoch": 1.68, "learning_rate": 0.0001221249695333405, "loss": 1.4789, "step": 21332 }, { "epoch": 1.68, "learning_rate": 0.00012211282520272938, "loss": 1.5415, "step": 21333 }, { "epoch": 1.68, "learning_rate": 0.00012210068106145678, "loss": 1.4927, "step": 21334 }, { "epoch": 1.68, "learning_rate": 0.00012208853710960512, "loss": 1.5164, "step": 21335 }, { "epoch": 1.68, "learning_rate": 0.0001220763933472569, "loss": 1.506, "step": 21336 }, { "epoch": 1.68, "learning_rate": 0.00012206424977449456, "loss": 1.4867, "step": 21337 }, { "epoch": 1.68, "learning_rate": 0.0001220521063914006, "loss": 1.4949, "step": 21338 }, { "epoch": 1.68, "learning_rate": 0.00012203996319805738, "loss": 1.497, "step": 21339 }, { "epoch": 1.68, "learning_rate": 0.00012202782019454736, "loss": 1.4618, "step": 21340 }, { "epoch": 1.68, "learning_rate": 0.00012201567738095305, "loss": 1.5089, "step": 21341 }, { "epoch": 1.68, "learning_rate": 0.00012200353475735682, "loss": 1.5078, "step": 21342 }, { "epoch": 1.68, "learning_rate": 0.00012199139232384117, "loss": 1.4883, "step": 21343 }, { "epoch": 1.68, "learning_rate": 0.00012197925008048845, "loss": 1.4582, "step": 21344 }, { "epoch": 1.68, "learning_rate": 0.0001219671080273812, "loss": 1.4372, "step": 21345 }, { "epoch": 1.68, "learning_rate": 0.00012195496616460183, "loss": 1.4758, "step": 21346 }, { "epoch": 1.68, "learning_rate": 0.00012194282449223273, "loss": 1.4814, "step": 21347 }, { "epoch": 1.68, "learning_rate": 0.00012193068301035641, "loss": 1.5142, "step": 21348 }, { "epoch": 1.68, "learning_rate": 0.00012191854171905521, "loss": 1.4612, "step": 21349 }, { "epoch": 1.68, "learning_rate": 0.00012190640061841164, "loss": 1.5153, "step": 21350 }, { "epoch": 1.68, "learning_rate": 0.00012189425970850804, "loss": 1.5071, "step": 21351 }, { "epoch": 1.68, "learning_rate": 0.00012188211898942702, "loss": 1.5361, "step": 21352 }, { "epoch": 1.68, "learning_rate": 0.00012186997846125082, "loss": 1.5182, "step": 21353 }, { "epoch": 1.68, "learning_rate": 0.00012185783812406196, "loss": 1.51, "step": 21354 }, { "epoch": 1.68, "learning_rate": 0.00012184569797794288, "loss": 1.5089, "step": 21355 }, { "epoch": 1.68, "learning_rate": 0.00012183355802297594, "loss": 1.5039, "step": 21356 }, { "epoch": 1.68, "learning_rate": 0.0001218214182592436, "loss": 1.4943, "step": 21357 }, { "epoch": 1.68, "learning_rate": 0.00012180927868682832, "loss": 1.5506, "step": 21358 }, { "epoch": 1.68, "learning_rate": 0.00012179713930581244, "loss": 1.4934, "step": 21359 }, { "epoch": 1.68, "learning_rate": 0.00012178500011627845, "loss": 1.4646, "step": 21360 }, { "epoch": 1.68, "learning_rate": 0.00012177286111830871, "loss": 1.5339, "step": 21361 }, { "epoch": 1.68, "learning_rate": 0.00012176072231198565, "loss": 1.4714, "step": 21362 }, { "epoch": 1.68, "learning_rate": 0.00012174858369739177, "loss": 1.4789, "step": 21363 }, { "epoch": 1.68, "learning_rate": 0.00012173644527460937, "loss": 1.5097, "step": 21364 }, { "epoch": 1.68, "learning_rate": 0.00012172430704372094, "loss": 1.4862, "step": 21365 }, { "epoch": 1.68, "learning_rate": 0.00012171216900480875, "loss": 1.4829, "step": 21366 }, { "epoch": 1.68, "learning_rate": 0.00012170003115795542, "loss": 1.4968, "step": 21367 }, { "epoch": 1.68, "learning_rate": 0.00012168789350324325, "loss": 1.4659, "step": 21368 }, { "epoch": 1.68, "learning_rate": 0.00012167575604075465, "loss": 1.5311, "step": 21369 }, { "epoch": 1.68, "learning_rate": 0.00012166361877057204, "loss": 1.5308, "step": 21370 }, { "epoch": 1.68, "learning_rate": 0.00012165148169277782, "loss": 1.5202, "step": 21371 }, { "epoch": 1.68, "learning_rate": 0.00012163934480745443, "loss": 1.5175, "step": 21372 }, { "epoch": 1.68, "learning_rate": 0.0001216272081146842, "loss": 1.4841, "step": 21373 }, { "epoch": 1.68, "learning_rate": 0.00012161507161454957, "loss": 1.5086, "step": 21374 }, { "epoch": 1.68, "learning_rate": 0.00012160293530713296, "loss": 1.5395, "step": 21375 }, { "epoch": 1.68, "learning_rate": 0.00012159079919251672, "loss": 1.5394, "step": 21376 }, { "epoch": 1.68, "learning_rate": 0.00012157866327078332, "loss": 1.4747, "step": 21377 }, { "epoch": 1.68, "learning_rate": 0.00012156652754201507, "loss": 1.4848, "step": 21378 }, { "epoch": 1.68, "learning_rate": 0.0001215543920062944, "loss": 1.5322, "step": 21379 }, { "epoch": 1.68, "learning_rate": 0.00012154225666370377, "loss": 1.511, "step": 21380 }, { "epoch": 1.68, "learning_rate": 0.00012153012151432547, "loss": 1.4616, "step": 21381 }, { "epoch": 1.68, "learning_rate": 0.00012151798655824189, "loss": 1.4839, "step": 21382 }, { "epoch": 1.68, "learning_rate": 0.0001215058517955355, "loss": 1.5016, "step": 21383 }, { "epoch": 1.68, "learning_rate": 0.00012149371722628868, "loss": 1.4918, "step": 21384 }, { "epoch": 1.68, "learning_rate": 0.00012148158285058377, "loss": 1.4628, "step": 21385 }, { "epoch": 1.68, "learning_rate": 0.00012146944866850316, "loss": 1.5204, "step": 21386 }, { "epoch": 1.68, "learning_rate": 0.00012145731468012928, "loss": 1.5076, "step": 21387 }, { "epoch": 1.68, "learning_rate": 0.00012144518088554449, "loss": 1.5035, "step": 21388 }, { "epoch": 1.68, "learning_rate": 0.00012143304728483115, "loss": 1.4865, "step": 21389 }, { "epoch": 1.68, "learning_rate": 0.00012142091387807162, "loss": 1.5287, "step": 21390 }, { "epoch": 1.68, "learning_rate": 0.00012140878066534834, "loss": 1.5179, "step": 21391 }, { "epoch": 1.68, "learning_rate": 0.00012139664764674368, "loss": 1.5151, "step": 21392 }, { "epoch": 1.68, "learning_rate": 0.00012138451482233998, "loss": 1.4709, "step": 21393 }, { "epoch": 1.68, "learning_rate": 0.00012137238219221965, "loss": 1.4805, "step": 21394 }, { "epoch": 1.68, "learning_rate": 0.00012136024975646502, "loss": 1.5596, "step": 21395 }, { "epoch": 1.68, "learning_rate": 0.00012134811751515848, "loss": 1.516, "step": 21396 }, { "epoch": 1.68, "learning_rate": 0.00012133598546838246, "loss": 1.4998, "step": 21397 }, { "epoch": 1.68, "learning_rate": 0.00012132385361621918, "loss": 1.5257, "step": 21398 }, { "epoch": 1.68, "learning_rate": 0.0001213117219587512, "loss": 1.4848, "step": 21399 }, { "epoch": 1.68, "learning_rate": 0.00012129959049606076, "loss": 1.434, "step": 21400 }, { "epoch": 1.68, "learning_rate": 0.0001212874592282303, "loss": 1.4971, "step": 21401 }, { "epoch": 1.68, "learning_rate": 0.00012127532815534213, "loss": 1.4906, "step": 21402 }, { "epoch": 1.68, "learning_rate": 0.0001212631972774786, "loss": 1.54, "step": 21403 }, { "epoch": 1.68, "learning_rate": 0.00012125106659472215, "loss": 1.5003, "step": 21404 }, { "epoch": 1.68, "learning_rate": 0.00012123893610715506, "loss": 1.5156, "step": 21405 }, { "epoch": 1.68, "learning_rate": 0.00012122680581485975, "loss": 1.4549, "step": 21406 }, { "epoch": 1.68, "learning_rate": 0.00012121467571791853, "loss": 1.4978, "step": 21407 }, { "epoch": 1.68, "learning_rate": 0.00012120254581641376, "loss": 1.5288, "step": 21408 }, { "epoch": 1.68, "learning_rate": 0.00012119041611042786, "loss": 1.4661, "step": 21409 }, { "epoch": 1.68, "learning_rate": 0.0001211782866000431, "loss": 1.4735, "step": 21410 }, { "epoch": 1.68, "learning_rate": 0.00012116615728534185, "loss": 1.5271, "step": 21411 }, { "epoch": 1.68, "learning_rate": 0.00012115402816640653, "loss": 1.5412, "step": 21412 }, { "epoch": 1.68, "learning_rate": 0.00012114189924331941, "loss": 1.4692, "step": 21413 }, { "epoch": 1.68, "learning_rate": 0.00012112977051616283, "loss": 1.4908, "step": 21414 }, { "epoch": 1.68, "learning_rate": 0.00012111764198501924, "loss": 1.4882, "step": 21415 }, { "epoch": 1.69, "learning_rate": 0.00012110551364997092, "loss": 1.5197, "step": 21416 }, { "epoch": 1.69, "learning_rate": 0.00012109338551110018, "loss": 1.4353, "step": 21417 }, { "epoch": 1.69, "learning_rate": 0.00012108125756848945, "loss": 1.4465, "step": 21418 }, { "epoch": 1.69, "learning_rate": 0.00012106912982222098, "loss": 1.4529, "step": 21419 }, { "epoch": 1.69, "learning_rate": 0.00012105700227237714, "loss": 1.4944, "step": 21420 }, { "epoch": 1.69, "learning_rate": 0.00012104487491904036, "loss": 1.5283, "step": 21421 }, { "epoch": 1.69, "learning_rate": 0.00012103274776229283, "loss": 1.4882, "step": 21422 }, { "epoch": 1.69, "learning_rate": 0.00012102062080221697, "loss": 1.5121, "step": 21423 }, { "epoch": 1.69, "learning_rate": 0.00012100849403889514, "loss": 1.4706, "step": 21424 }, { "epoch": 1.69, "learning_rate": 0.00012099636747240959, "loss": 1.5332, "step": 21425 }, { "epoch": 1.69, "learning_rate": 0.00012098424110284273, "loss": 1.4404, "step": 21426 }, { "epoch": 1.69, "learning_rate": 0.00012097211493027684, "loss": 1.4935, "step": 21427 }, { "epoch": 1.69, "learning_rate": 0.00012095998895479427, "loss": 1.4642, "step": 21428 }, { "epoch": 1.69, "learning_rate": 0.00012094786317647732, "loss": 1.5152, "step": 21429 }, { "epoch": 1.69, "learning_rate": 0.0001209357375954084, "loss": 1.5185, "step": 21430 }, { "epoch": 1.69, "learning_rate": 0.00012092361221166975, "loss": 1.5258, "step": 21431 }, { "epoch": 1.69, "learning_rate": 0.00012091148702534374, "loss": 1.4761, "step": 21432 }, { "epoch": 1.69, "learning_rate": 0.0001208993620365127, "loss": 1.5359, "step": 21433 }, { "epoch": 1.69, "learning_rate": 0.00012088723724525892, "loss": 1.4912, "step": 21434 }, { "epoch": 1.69, "learning_rate": 0.00012087511265166474, "loss": 1.4994, "step": 21435 }, { "epoch": 1.69, "learning_rate": 0.00012086298825581247, "loss": 1.479, "step": 21436 }, { "epoch": 1.69, "learning_rate": 0.00012085086405778438, "loss": 1.5248, "step": 21437 }, { "epoch": 1.69, "learning_rate": 0.00012083874005766292, "loss": 1.4972, "step": 21438 }, { "epoch": 1.69, "learning_rate": 0.00012082661625553029, "loss": 1.4632, "step": 21439 }, { "epoch": 1.69, "learning_rate": 0.0001208144926514688, "loss": 1.4907, "step": 21440 }, { "epoch": 1.69, "learning_rate": 0.00012080236924556087, "loss": 1.4942, "step": 21441 }, { "epoch": 1.69, "learning_rate": 0.00012079024603788867, "loss": 1.5233, "step": 21442 }, { "epoch": 1.69, "learning_rate": 0.00012077812302853464, "loss": 1.5156, "step": 21443 }, { "epoch": 1.69, "learning_rate": 0.00012076600021758099, "loss": 1.4618, "step": 21444 }, { "epoch": 1.69, "learning_rate": 0.00012075387760511003, "loss": 1.6035, "step": 21445 }, { "epoch": 1.69, "learning_rate": 0.00012074175519120413, "loss": 1.5227, "step": 21446 }, { "epoch": 1.69, "learning_rate": 0.0001207296329759456, "loss": 1.5141, "step": 21447 }, { "epoch": 1.69, "learning_rate": 0.0001207175109594167, "loss": 1.5028, "step": 21448 }, { "epoch": 1.69, "learning_rate": 0.00012070538914169972, "loss": 1.4444, "step": 21449 }, { "epoch": 1.69, "learning_rate": 0.00012069326752287701, "loss": 1.5117, "step": 21450 }, { "epoch": 1.69, "learning_rate": 0.00012068114610303082, "loss": 1.4904, "step": 21451 }, { "epoch": 1.69, "learning_rate": 0.00012066902488224345, "loss": 1.5067, "step": 21452 }, { "epoch": 1.69, "learning_rate": 0.00012065690386059727, "loss": 1.4943, "step": 21453 }, { "epoch": 1.69, "learning_rate": 0.00012064478303817447, "loss": 1.4842, "step": 21454 }, { "epoch": 1.69, "learning_rate": 0.00012063266241505745, "loss": 1.5138, "step": 21455 }, { "epoch": 1.69, "learning_rate": 0.00012062054199132838, "loss": 1.5191, "step": 21456 }, { "epoch": 1.69, "learning_rate": 0.00012060842176706964, "loss": 1.5853, "step": 21457 }, { "epoch": 1.69, "learning_rate": 0.00012059630174236353, "loss": 1.5062, "step": 21458 }, { "epoch": 1.69, "learning_rate": 0.00012058418191729226, "loss": 1.5212, "step": 21459 }, { "epoch": 1.69, "learning_rate": 0.0001205720622919382, "loss": 1.4473, "step": 21460 }, { "epoch": 1.69, "learning_rate": 0.0001205599428663835, "loss": 1.4756, "step": 21461 }, { "epoch": 1.69, "learning_rate": 0.00012054782364071063, "loss": 1.5317, "step": 21462 }, { "epoch": 1.69, "learning_rate": 0.00012053570461500176, "loss": 1.4749, "step": 21463 }, { "epoch": 1.69, "learning_rate": 0.00012052358578933925, "loss": 1.4983, "step": 21464 }, { "epoch": 1.69, "learning_rate": 0.00012051146716380525, "loss": 1.4793, "step": 21465 }, { "epoch": 1.69, "learning_rate": 0.00012049934873848216, "loss": 1.4981, "step": 21466 }, { "epoch": 1.69, "learning_rate": 0.00012048723051345221, "loss": 1.5273, "step": 21467 }, { "epoch": 1.69, "learning_rate": 0.00012047511248879766, "loss": 1.4867, "step": 21468 }, { "epoch": 1.69, "learning_rate": 0.0001204629946646008, "loss": 1.5411, "step": 21469 }, { "epoch": 1.69, "learning_rate": 0.00012045087704094395, "loss": 1.4866, "step": 21470 }, { "epoch": 1.69, "learning_rate": 0.00012043875961790929, "loss": 1.4881, "step": 21471 }, { "epoch": 1.69, "learning_rate": 0.00012042664239557918, "loss": 1.4875, "step": 21472 }, { "epoch": 1.69, "learning_rate": 0.00012041452537403582, "loss": 1.4711, "step": 21473 }, { "epoch": 1.69, "learning_rate": 0.00012040240855336149, "loss": 1.5042, "step": 21474 }, { "epoch": 1.69, "learning_rate": 0.00012039029193363852, "loss": 1.486, "step": 21475 }, { "epoch": 1.69, "learning_rate": 0.00012037817551494904, "loss": 1.4848, "step": 21476 }, { "epoch": 1.69, "learning_rate": 0.00012036605929737547, "loss": 1.532, "step": 21477 }, { "epoch": 1.69, "learning_rate": 0.00012035394328099999, "loss": 1.5167, "step": 21478 }, { "epoch": 1.69, "learning_rate": 0.0001203418274659049, "loss": 1.4347, "step": 21479 }, { "epoch": 1.69, "learning_rate": 0.00012032971185217239, "loss": 1.4821, "step": 21480 }, { "epoch": 1.69, "learning_rate": 0.00012031759643988479, "loss": 1.4759, "step": 21481 }, { "epoch": 1.69, "learning_rate": 0.00012030548122912435, "loss": 1.4815, "step": 21482 }, { "epoch": 1.69, "learning_rate": 0.00012029336621997326, "loss": 1.496, "step": 21483 }, { "epoch": 1.69, "learning_rate": 0.00012028125141251388, "loss": 1.5163, "step": 21484 }, { "epoch": 1.69, "learning_rate": 0.00012026913680682835, "loss": 1.5377, "step": 21485 }, { "epoch": 1.69, "learning_rate": 0.00012025702240299898, "loss": 1.4521, "step": 21486 }, { "epoch": 1.69, "learning_rate": 0.00012024490820110805, "loss": 1.502, "step": 21487 }, { "epoch": 1.69, "learning_rate": 0.00012023279420123774, "loss": 1.4525, "step": 21488 }, { "epoch": 1.69, "learning_rate": 0.00012022068040347037, "loss": 1.4957, "step": 21489 }, { "epoch": 1.69, "learning_rate": 0.0001202085668078881, "loss": 1.4864, "step": 21490 }, { "epoch": 1.69, "learning_rate": 0.00012019645341457322, "loss": 1.5423, "step": 21491 }, { "epoch": 1.69, "learning_rate": 0.00012018434022360795, "loss": 1.5031, "step": 21492 }, { "epoch": 1.69, "learning_rate": 0.00012017222723507462, "loss": 1.5593, "step": 21493 }, { "epoch": 1.69, "learning_rate": 0.00012016011444905538, "loss": 1.5042, "step": 21494 }, { "epoch": 1.69, "learning_rate": 0.00012014800186563249, "loss": 1.4622, "step": 21495 }, { "epoch": 1.69, "learning_rate": 0.00012013588948488822, "loss": 1.4643, "step": 21496 }, { "epoch": 1.69, "learning_rate": 0.00012012377730690474, "loss": 1.461, "step": 21497 }, { "epoch": 1.69, "learning_rate": 0.00012011166533176436, "loss": 1.5146, "step": 21498 }, { "epoch": 1.69, "learning_rate": 0.00012009955355954928, "loss": 1.4803, "step": 21499 }, { "epoch": 1.69, "learning_rate": 0.00012008744199034171, "loss": 1.5241, "step": 21500 }, { "epoch": 1.69, "learning_rate": 0.00012007533062422394, "loss": 1.4451, "step": 21501 }, { "epoch": 1.69, "learning_rate": 0.00012006321946127811, "loss": 1.5289, "step": 21502 }, { "epoch": 1.69, "learning_rate": 0.0001200511085015865, "loss": 1.4795, "step": 21503 }, { "epoch": 1.69, "learning_rate": 0.0001200389977452314, "loss": 1.5238, "step": 21504 }, { "epoch": 1.69, "learning_rate": 0.00012002688719229491, "loss": 1.5007, "step": 21505 }, { "epoch": 1.69, "learning_rate": 0.00012001477684285933, "loss": 1.5033, "step": 21506 }, { "epoch": 1.69, "learning_rate": 0.00012000266669700688, "loss": 1.4943, "step": 21507 }, { "epoch": 1.69, "learning_rate": 0.00011999055675481973, "loss": 1.5524, "step": 21508 }, { "epoch": 1.69, "learning_rate": 0.00011997844701638017, "loss": 1.5184, "step": 21509 }, { "epoch": 1.69, "learning_rate": 0.00011996633748177036, "loss": 1.4731, "step": 21510 }, { "epoch": 1.69, "learning_rate": 0.00011995422815107259, "loss": 1.5365, "step": 21511 }, { "epoch": 1.69, "learning_rate": 0.00011994211902436901, "loss": 1.5178, "step": 21512 }, { "epoch": 1.69, "learning_rate": 0.00011993001010174188, "loss": 1.4859, "step": 21513 }, { "epoch": 1.69, "learning_rate": 0.00011991790138327336, "loss": 1.5308, "step": 21514 }, { "epoch": 1.69, "learning_rate": 0.00011990579286904567, "loss": 1.4976, "step": 21515 }, { "epoch": 1.69, "learning_rate": 0.00011989368455914109, "loss": 1.4693, "step": 21516 }, { "epoch": 1.69, "learning_rate": 0.00011988157645364174, "loss": 1.4888, "step": 21517 }, { "epoch": 1.69, "learning_rate": 0.0001198694685526299, "loss": 1.5032, "step": 21518 }, { "epoch": 1.69, "learning_rate": 0.0001198573608561877, "loss": 1.5124, "step": 21519 }, { "epoch": 1.69, "learning_rate": 0.00011984525336439739, "loss": 1.467, "step": 21520 }, { "epoch": 1.69, "learning_rate": 0.00011983314607734121, "loss": 1.4977, "step": 21521 }, { "epoch": 1.69, "learning_rate": 0.00011982103899510127, "loss": 1.5004, "step": 21522 }, { "epoch": 1.69, "learning_rate": 0.00011980893211775985, "loss": 1.4684, "step": 21523 }, { "epoch": 1.69, "learning_rate": 0.00011979682544539906, "loss": 1.4886, "step": 21524 }, { "epoch": 1.69, "learning_rate": 0.00011978471897810123, "loss": 1.4103, "step": 21525 }, { "epoch": 1.69, "learning_rate": 0.00011977261271594844, "loss": 1.4514, "step": 21526 }, { "epoch": 1.69, "learning_rate": 0.00011976050665902296, "loss": 1.4737, "step": 21527 }, { "epoch": 1.69, "learning_rate": 0.00011974840080740698, "loss": 1.4997, "step": 21528 }, { "epoch": 1.69, "learning_rate": 0.00011973629516118261, "loss": 1.4975, "step": 21529 }, { "epoch": 1.69, "learning_rate": 0.00011972418972043213, "loss": 1.4788, "step": 21530 }, { "epoch": 1.69, "learning_rate": 0.00011971208448523768, "loss": 1.5255, "step": 21531 }, { "epoch": 1.69, "learning_rate": 0.00011969997945568144, "loss": 1.519, "step": 21532 }, { "epoch": 1.69, "learning_rate": 0.00011968787463184566, "loss": 1.5204, "step": 21533 }, { "epoch": 1.69, "learning_rate": 0.00011967577001381246, "loss": 1.4941, "step": 21534 }, { "epoch": 1.69, "learning_rate": 0.00011966366560166403, "loss": 1.4406, "step": 21535 }, { "epoch": 1.69, "learning_rate": 0.00011965156139548263, "loss": 1.5003, "step": 21536 }, { "epoch": 1.69, "learning_rate": 0.00011963945739535033, "loss": 1.4469, "step": 21537 }, { "epoch": 1.69, "learning_rate": 0.00011962735360134938, "loss": 1.5315, "step": 21538 }, { "epoch": 1.69, "learning_rate": 0.00011961525001356185, "loss": 1.4969, "step": 21539 }, { "epoch": 1.69, "learning_rate": 0.0001196031466320701, "loss": 1.6015, "step": 21540 }, { "epoch": 1.69, "learning_rate": 0.0001195910434569562, "loss": 1.4983, "step": 21541 }, { "epoch": 1.69, "learning_rate": 0.00011957894048830235, "loss": 1.5032, "step": 21542 }, { "epoch": 1.7, "learning_rate": 0.00011956683772619066, "loss": 1.5289, "step": 21543 }, { "epoch": 1.7, "learning_rate": 0.00011955473517070337, "loss": 1.5344, "step": 21544 }, { "epoch": 1.7, "learning_rate": 0.00011954263282192266, "loss": 1.5459, "step": 21545 }, { "epoch": 1.7, "learning_rate": 0.00011953053067993061, "loss": 1.4862, "step": 21546 }, { "epoch": 1.7, "learning_rate": 0.00011951842874480949, "loss": 1.4886, "step": 21547 }, { "epoch": 1.7, "learning_rate": 0.00011950632701664139, "loss": 1.5196, "step": 21548 }, { "epoch": 1.7, "learning_rate": 0.00011949422549550847, "loss": 1.4527, "step": 21549 }, { "epoch": 1.7, "learning_rate": 0.000119482124181493, "loss": 1.5406, "step": 21550 }, { "epoch": 1.7, "learning_rate": 0.00011947002307467702, "loss": 1.4829, "step": 21551 }, { "epoch": 1.7, "learning_rate": 0.00011945792217514272, "loss": 1.4831, "step": 21552 }, { "epoch": 1.7, "learning_rate": 0.00011944582148297232, "loss": 1.5323, "step": 21553 }, { "epoch": 1.7, "learning_rate": 0.0001194337209982479, "loss": 1.4736, "step": 21554 }, { "epoch": 1.7, "learning_rate": 0.0001194216207210516, "loss": 1.5183, "step": 21555 }, { "epoch": 1.7, "learning_rate": 0.00011940952065146566, "loss": 1.4709, "step": 21556 }, { "epoch": 1.7, "learning_rate": 0.00011939742078957224, "loss": 1.5245, "step": 21557 }, { "epoch": 1.7, "learning_rate": 0.00011938532113545339, "loss": 1.4484, "step": 21558 }, { "epoch": 1.7, "learning_rate": 0.00011937322168919137, "loss": 1.4169, "step": 21559 }, { "epoch": 1.7, "learning_rate": 0.00011936112245086822, "loss": 1.5267, "step": 21560 }, { "epoch": 1.7, "learning_rate": 0.00011934902342056614, "loss": 1.4161, "step": 21561 }, { "epoch": 1.7, "learning_rate": 0.00011933692459836735, "loss": 1.5142, "step": 21562 }, { "epoch": 1.7, "learning_rate": 0.00011932482598435384, "loss": 1.5096, "step": 21563 }, { "epoch": 1.7, "learning_rate": 0.00011931272757860785, "loss": 1.5489, "step": 21564 }, { "epoch": 1.7, "learning_rate": 0.00011930062938121154, "loss": 1.4874, "step": 21565 }, { "epoch": 1.7, "learning_rate": 0.00011928853139224698, "loss": 1.4895, "step": 21566 }, { "epoch": 1.7, "learning_rate": 0.00011927643361179639, "loss": 1.5226, "step": 21567 }, { "epoch": 1.7, "learning_rate": 0.0001192643360399418, "loss": 1.5422, "step": 21568 }, { "epoch": 1.7, "learning_rate": 0.00011925223867676542, "loss": 1.5371, "step": 21569 }, { "epoch": 1.7, "learning_rate": 0.00011924014152234943, "loss": 1.5061, "step": 21570 }, { "epoch": 1.7, "learning_rate": 0.0001192280445767758, "loss": 1.5074, "step": 21571 }, { "epoch": 1.7, "learning_rate": 0.00011921594784012682, "loss": 1.4699, "step": 21572 }, { "epoch": 1.7, "learning_rate": 0.00011920385131248457, "loss": 1.4558, "step": 21573 }, { "epoch": 1.7, "learning_rate": 0.00011919175499393119, "loss": 1.5069, "step": 21574 }, { "epoch": 1.7, "learning_rate": 0.00011917965888454877, "loss": 1.4485, "step": 21575 }, { "epoch": 1.7, "learning_rate": 0.00011916756298441948, "loss": 1.5545, "step": 21576 }, { "epoch": 1.7, "learning_rate": 0.0001191554672936254, "loss": 1.5062, "step": 21577 }, { "epoch": 1.7, "learning_rate": 0.00011914337181224867, "loss": 1.5244, "step": 21578 }, { "epoch": 1.7, "learning_rate": 0.00011913127654037146, "loss": 1.5448, "step": 21579 }, { "epoch": 1.7, "learning_rate": 0.00011911918147807581, "loss": 1.5402, "step": 21580 }, { "epoch": 1.7, "learning_rate": 0.00011910708662544388, "loss": 1.5194, "step": 21581 }, { "epoch": 1.7, "learning_rate": 0.0001190949919825578, "loss": 1.4934, "step": 21582 }, { "epoch": 1.7, "learning_rate": 0.00011908289754949964, "loss": 1.4823, "step": 21583 }, { "epoch": 1.7, "learning_rate": 0.0001190708033263516, "loss": 1.5152, "step": 21584 }, { "epoch": 1.7, "learning_rate": 0.0001190587093131957, "loss": 1.5233, "step": 21585 }, { "epoch": 1.7, "learning_rate": 0.00011904661551011404, "loss": 1.5369, "step": 21586 }, { "epoch": 1.7, "learning_rate": 0.00011903452191718881, "loss": 1.5572, "step": 21587 }, { "epoch": 1.7, "learning_rate": 0.00011902242853450214, "loss": 1.4551, "step": 21588 }, { "epoch": 1.7, "learning_rate": 0.00011901033536213604, "loss": 1.484, "step": 21589 }, { "epoch": 1.7, "learning_rate": 0.00011899824240017266, "loss": 1.5057, "step": 21590 }, { "epoch": 1.7, "learning_rate": 0.00011898614964869413, "loss": 1.4681, "step": 21591 }, { "epoch": 1.7, "learning_rate": 0.00011897405710778252, "loss": 1.5077, "step": 21592 }, { "epoch": 1.7, "learning_rate": 0.00011896196477751992, "loss": 1.4724, "step": 21593 }, { "epoch": 1.7, "learning_rate": 0.00011894987265798849, "loss": 1.4572, "step": 21594 }, { "epoch": 1.7, "learning_rate": 0.00011893778074927026, "loss": 1.4778, "step": 21595 }, { "epoch": 1.7, "learning_rate": 0.0001189256890514474, "loss": 1.5069, "step": 21596 }, { "epoch": 1.7, "learning_rate": 0.00011891359756460192, "loss": 1.4426, "step": 21597 }, { "epoch": 1.7, "learning_rate": 0.00011890150628881596, "loss": 1.4473, "step": 21598 }, { "epoch": 1.7, "learning_rate": 0.00011888941522417162, "loss": 1.5082, "step": 21599 }, { "epoch": 1.7, "learning_rate": 0.000118877324370751, "loss": 1.4897, "step": 21600 }, { "epoch": 1.7, "learning_rate": 0.00011886523372863617, "loss": 1.4622, "step": 21601 }, { "epoch": 1.7, "learning_rate": 0.00011885314329790911, "loss": 1.5669, "step": 21602 }, { "epoch": 1.7, "learning_rate": 0.00011884105307865213, "loss": 1.5222, "step": 21603 }, { "epoch": 1.7, "learning_rate": 0.0001188289630709472, "loss": 1.4794, "step": 21604 }, { "epoch": 1.7, "learning_rate": 0.00011881687327487638, "loss": 1.5106, "step": 21605 }, { "epoch": 1.7, "learning_rate": 0.00011880478369052183, "loss": 1.4657, "step": 21606 }, { "epoch": 1.7, "learning_rate": 0.00011879269431796553, "loss": 1.5357, "step": 21607 }, { "epoch": 1.7, "learning_rate": 0.00011878060515728966, "loss": 1.4815, "step": 21608 }, { "epoch": 1.7, "learning_rate": 0.00011876851620857622, "loss": 1.537, "step": 21609 }, { "epoch": 1.7, "learning_rate": 0.00011875642747190733, "loss": 1.471, "step": 21610 }, { "epoch": 1.7, "learning_rate": 0.00011874433894736508, "loss": 1.4808, "step": 21611 }, { "epoch": 1.7, "learning_rate": 0.00011873225063503147, "loss": 1.4701, "step": 21612 }, { "epoch": 1.7, "learning_rate": 0.00011872016253498867, "loss": 1.459, "step": 21613 }, { "epoch": 1.7, "learning_rate": 0.00011870807464731868, "loss": 1.5109, "step": 21614 }, { "epoch": 1.7, "learning_rate": 0.00011869598697210359, "loss": 1.469, "step": 21615 }, { "epoch": 1.7, "learning_rate": 0.00011868389950942551, "loss": 1.5093, "step": 21616 }, { "epoch": 1.7, "learning_rate": 0.00011867181225936643, "loss": 1.4654, "step": 21617 }, { "epoch": 1.7, "learning_rate": 0.00011865972522200841, "loss": 1.5158, "step": 21618 }, { "epoch": 1.7, "learning_rate": 0.00011864763839743362, "loss": 1.5314, "step": 21619 }, { "epoch": 1.7, "learning_rate": 0.00011863555178572409, "loss": 1.4894, "step": 21620 }, { "epoch": 1.7, "learning_rate": 0.00011862346538696182, "loss": 1.5045, "step": 21621 }, { "epoch": 1.7, "learning_rate": 0.00011861137920122891, "loss": 1.4674, "step": 21622 }, { "epoch": 1.7, "learning_rate": 0.00011859929322860745, "loss": 1.4562, "step": 21623 }, { "epoch": 1.7, "learning_rate": 0.0001185872074691794, "loss": 1.5016, "step": 21624 }, { "epoch": 1.7, "learning_rate": 0.00011857512192302693, "loss": 1.5228, "step": 21625 }, { "epoch": 1.7, "learning_rate": 0.00011856303659023201, "loss": 1.4864, "step": 21626 }, { "epoch": 1.7, "learning_rate": 0.0001185509514708767, "loss": 1.4566, "step": 21627 }, { "epoch": 1.7, "learning_rate": 0.00011853886656504313, "loss": 1.4574, "step": 21628 }, { "epoch": 1.7, "learning_rate": 0.00011852678187281326, "loss": 1.4946, "step": 21629 }, { "epoch": 1.7, "learning_rate": 0.0001185146973942692, "loss": 1.5484, "step": 21630 }, { "epoch": 1.7, "learning_rate": 0.00011850261312949295, "loss": 1.5019, "step": 21631 }, { "epoch": 1.7, "learning_rate": 0.00011849052907856656, "loss": 1.5157, "step": 21632 }, { "epoch": 1.7, "learning_rate": 0.00011847844524157213, "loss": 1.5345, "step": 21633 }, { "epoch": 1.7, "learning_rate": 0.00011846636161859154, "loss": 1.5075, "step": 21634 }, { "epoch": 1.7, "learning_rate": 0.00011845427820970708, "loss": 1.5105, "step": 21635 }, { "epoch": 1.7, "learning_rate": 0.00011844219501500062, "loss": 1.4903, "step": 21636 }, { "epoch": 1.7, "learning_rate": 0.00011843011203455427, "loss": 1.47, "step": 21637 }, { "epoch": 1.7, "learning_rate": 0.00011841802926845003, "loss": 1.4797, "step": 21638 }, { "epoch": 1.7, "learning_rate": 0.00011840594671676992, "loss": 1.487, "step": 21639 }, { "epoch": 1.7, "learning_rate": 0.00011839386437959603, "loss": 1.513, "step": 21640 }, { "epoch": 1.7, "learning_rate": 0.00011838178225701031, "loss": 1.5482, "step": 21641 }, { "epoch": 1.7, "learning_rate": 0.0001183697003490949, "loss": 1.5106, "step": 21642 }, { "epoch": 1.7, "learning_rate": 0.00011835761865593172, "loss": 1.5402, "step": 21643 }, { "epoch": 1.7, "learning_rate": 0.00011834553717760286, "loss": 1.5133, "step": 21644 }, { "epoch": 1.7, "learning_rate": 0.00011833345591419037, "loss": 1.4774, "step": 21645 }, { "epoch": 1.7, "learning_rate": 0.00011832137486577619, "loss": 1.5177, "step": 21646 }, { "epoch": 1.7, "learning_rate": 0.0001183092940324424, "loss": 1.4412, "step": 21647 }, { "epoch": 1.7, "learning_rate": 0.00011829721341427105, "loss": 1.5121, "step": 21648 }, { "epoch": 1.7, "learning_rate": 0.00011828513301134406, "loss": 1.5466, "step": 21649 }, { "epoch": 1.7, "learning_rate": 0.00011827305282374356, "loss": 1.5031, "step": 21650 }, { "epoch": 1.7, "learning_rate": 0.00011826097285155151, "loss": 1.5064, "step": 21651 }, { "epoch": 1.7, "learning_rate": 0.00011824889309484997, "loss": 1.5155, "step": 21652 }, { "epoch": 1.7, "learning_rate": 0.00011823681355372089, "loss": 1.4834, "step": 21653 }, { "epoch": 1.7, "learning_rate": 0.00011822473422824636, "loss": 1.5416, "step": 21654 }, { "epoch": 1.7, "learning_rate": 0.0001182126551185083, "loss": 1.5001, "step": 21655 }, { "epoch": 1.7, "learning_rate": 0.00011820057622458878, "loss": 1.4959, "step": 21656 }, { "epoch": 1.7, "learning_rate": 0.00011818849754656982, "loss": 1.5275, "step": 21657 }, { "epoch": 1.7, "learning_rate": 0.0001181764190845334, "loss": 1.4808, "step": 21658 }, { "epoch": 1.7, "learning_rate": 0.00011816434083856155, "loss": 1.4909, "step": 21659 }, { "epoch": 1.7, "learning_rate": 0.00011815226280873624, "loss": 1.5266, "step": 21660 }, { "epoch": 1.7, "learning_rate": 0.00011814018499513948, "loss": 1.5244, "step": 21661 }, { "epoch": 1.7, "learning_rate": 0.0001181281073978533, "loss": 1.4977, "step": 21662 }, { "epoch": 1.7, "learning_rate": 0.00011811603001695967, "loss": 1.5004, "step": 21663 }, { "epoch": 1.7, "learning_rate": 0.0001181039528525406, "loss": 1.4648, "step": 21664 }, { "epoch": 1.7, "learning_rate": 0.00011809187590467803, "loss": 1.5262, "step": 21665 }, { "epoch": 1.7, "learning_rate": 0.0001180797991734541, "loss": 1.5244, "step": 21666 }, { "epoch": 1.7, "learning_rate": 0.00011806772265895069, "loss": 1.4891, "step": 21667 }, { "epoch": 1.7, "learning_rate": 0.00011805564636124982, "loss": 1.4786, "step": 21668 }, { "epoch": 1.7, "learning_rate": 0.00011804357028043351, "loss": 1.5007, "step": 21669 }, { "epoch": 1.71, "learning_rate": 0.00011803149441658369, "loss": 1.4543, "step": 21670 }, { "epoch": 1.71, "learning_rate": 0.00011801941876978241, "loss": 1.4938, "step": 21671 }, { "epoch": 1.71, "learning_rate": 0.0001180073433401116, "loss": 1.56, "step": 21672 }, { "epoch": 1.71, "learning_rate": 0.00011799526812765328, "loss": 1.528, "step": 21673 }, { "epoch": 1.71, "learning_rate": 0.00011798319313248945, "loss": 1.4719, "step": 21674 }, { "epoch": 1.71, "learning_rate": 0.00011797111835470206, "loss": 1.507, "step": 21675 }, { "epoch": 1.71, "learning_rate": 0.00011795904379437308, "loss": 1.5946, "step": 21676 }, { "epoch": 1.71, "learning_rate": 0.00011794696945158453, "loss": 1.5284, "step": 21677 }, { "epoch": 1.71, "learning_rate": 0.00011793489532641835, "loss": 1.5054, "step": 21678 }, { "epoch": 1.71, "learning_rate": 0.00011792282141895659, "loss": 1.4852, "step": 21679 }, { "epoch": 1.71, "learning_rate": 0.00011791074772928112, "loss": 1.5357, "step": 21680 }, { "epoch": 1.71, "learning_rate": 0.00011789867425747394, "loss": 1.5356, "step": 21681 }, { "epoch": 1.71, "learning_rate": 0.00011788660100361706, "loss": 1.4826, "step": 21682 }, { "epoch": 1.71, "learning_rate": 0.00011787452796779248, "loss": 1.5301, "step": 21683 }, { "epoch": 1.71, "learning_rate": 0.0001178624551500821, "loss": 1.5182, "step": 21684 }, { "epoch": 1.71, "learning_rate": 0.0001178503825505679, "loss": 1.4864, "step": 21685 }, { "epoch": 1.71, "learning_rate": 0.0001178383101693319, "loss": 1.4372, "step": 21686 }, { "epoch": 1.71, "learning_rate": 0.00011782623800645602, "loss": 1.5054, "step": 21687 }, { "epoch": 1.71, "learning_rate": 0.00011781416606202223, "loss": 1.5361, "step": 21688 }, { "epoch": 1.71, "learning_rate": 0.00011780209433611247, "loss": 1.4908, "step": 21689 }, { "epoch": 1.71, "learning_rate": 0.00011779002282880872, "loss": 1.5077, "step": 21690 }, { "epoch": 1.71, "learning_rate": 0.00011777795154019296, "loss": 1.4826, "step": 21691 }, { "epoch": 1.71, "learning_rate": 0.00011776588047034711, "loss": 1.4563, "step": 21692 }, { "epoch": 1.71, "learning_rate": 0.00011775380961935316, "loss": 1.5122, "step": 21693 }, { "epoch": 1.71, "learning_rate": 0.00011774173898729304, "loss": 1.5389, "step": 21694 }, { "epoch": 1.71, "learning_rate": 0.00011772966857424871, "loss": 1.4913, "step": 21695 }, { "epoch": 1.71, "learning_rate": 0.00011771759838030207, "loss": 1.5403, "step": 21696 }, { "epoch": 1.71, "learning_rate": 0.00011770552840553516, "loss": 1.5086, "step": 21697 }, { "epoch": 1.71, "learning_rate": 0.00011769345865002993, "loss": 1.4935, "step": 21698 }, { "epoch": 1.71, "learning_rate": 0.00011768138911386826, "loss": 1.473, "step": 21699 }, { "epoch": 1.71, "learning_rate": 0.00011766931979713214, "loss": 1.4336, "step": 21700 }, { "epoch": 1.71, "learning_rate": 0.00011765725069990347, "loss": 1.4842, "step": 21701 }, { "epoch": 1.71, "learning_rate": 0.00011764518182226421, "loss": 1.531, "step": 21702 }, { "epoch": 1.71, "learning_rate": 0.00011763311316429636, "loss": 1.5034, "step": 21703 }, { "epoch": 1.71, "learning_rate": 0.00011762104472608177, "loss": 1.5245, "step": 21704 }, { "epoch": 1.71, "learning_rate": 0.0001176089765077024, "loss": 1.5292, "step": 21705 }, { "epoch": 1.71, "learning_rate": 0.00011759690850924027, "loss": 1.5075, "step": 21706 }, { "epoch": 1.71, "learning_rate": 0.0001175848407307772, "loss": 1.4793, "step": 21707 }, { "epoch": 1.71, "learning_rate": 0.00011757277317239521, "loss": 1.5059, "step": 21708 }, { "epoch": 1.71, "learning_rate": 0.00011756070583417617, "loss": 1.544, "step": 21709 }, { "epoch": 1.71, "learning_rate": 0.00011754863871620203, "loss": 1.4878, "step": 21710 }, { "epoch": 1.71, "learning_rate": 0.00011753657181855475, "loss": 1.4575, "step": 21711 }, { "epoch": 1.71, "learning_rate": 0.00011752450514131617, "loss": 1.5104, "step": 21712 }, { "epoch": 1.71, "learning_rate": 0.00011751243868456832, "loss": 1.4892, "step": 21713 }, { "epoch": 1.71, "learning_rate": 0.00011750037244839306, "loss": 1.5046, "step": 21714 }, { "epoch": 1.71, "learning_rate": 0.0001174883064328724, "loss": 1.4801, "step": 21715 }, { "epoch": 1.71, "learning_rate": 0.00011747624063808815, "loss": 1.4941, "step": 21716 }, { "epoch": 1.71, "learning_rate": 0.00011746417506412228, "loss": 1.5244, "step": 21717 }, { "epoch": 1.71, "learning_rate": 0.00011745210971105673, "loss": 1.5306, "step": 21718 }, { "epoch": 1.71, "learning_rate": 0.00011744004457897338, "loss": 1.444, "step": 21719 }, { "epoch": 1.71, "learning_rate": 0.00011742797966795418, "loss": 1.4778, "step": 21720 }, { "epoch": 1.71, "learning_rate": 0.00011741591497808099, "loss": 1.5031, "step": 21721 }, { "epoch": 1.71, "learning_rate": 0.00011740385050943576, "loss": 1.4679, "step": 21722 }, { "epoch": 1.71, "learning_rate": 0.00011739178626210042, "loss": 1.495, "step": 21723 }, { "epoch": 1.71, "learning_rate": 0.00011737972223615684, "loss": 1.4789, "step": 21724 }, { "epoch": 1.71, "learning_rate": 0.00011736765843168697, "loss": 1.5634, "step": 21725 }, { "epoch": 1.71, "learning_rate": 0.00011735559484877266, "loss": 1.4928, "step": 21726 }, { "epoch": 1.71, "learning_rate": 0.00011734353148749584, "loss": 1.5092, "step": 21727 }, { "epoch": 1.71, "learning_rate": 0.0001173314683479384, "loss": 1.5391, "step": 21728 }, { "epoch": 1.71, "learning_rate": 0.00011731940543018231, "loss": 1.5576, "step": 21729 }, { "epoch": 1.71, "learning_rate": 0.0001173073427343094, "loss": 1.4675, "step": 21730 }, { "epoch": 1.71, "learning_rate": 0.00011729528026040158, "loss": 1.4554, "step": 21731 }, { "epoch": 1.71, "learning_rate": 0.00011728321800854081, "loss": 1.5468, "step": 21732 }, { "epoch": 1.71, "learning_rate": 0.00011727115597880888, "loss": 1.4949, "step": 21733 }, { "epoch": 1.71, "learning_rate": 0.00011725909417128776, "loss": 1.4844, "step": 21734 }, { "epoch": 1.71, "learning_rate": 0.00011724703258605935, "loss": 1.4894, "step": 21735 }, { "epoch": 1.71, "learning_rate": 0.00011723497122320549, "loss": 1.5277, "step": 21736 }, { "epoch": 1.71, "learning_rate": 0.00011722291008280812, "loss": 1.4879, "step": 21737 }, { "epoch": 1.71, "learning_rate": 0.00011721084916494906, "loss": 1.4581, "step": 21738 }, { "epoch": 1.71, "learning_rate": 0.00011719878846971024, "loss": 1.4552, "step": 21739 }, { "epoch": 1.71, "learning_rate": 0.0001171867279971736, "loss": 1.5276, "step": 21740 }, { "epoch": 1.71, "learning_rate": 0.00011717466774742092, "loss": 1.4879, "step": 21741 }, { "epoch": 1.71, "learning_rate": 0.00011716260772053415, "loss": 1.5284, "step": 21742 }, { "epoch": 1.71, "learning_rate": 0.00011715054791659514, "loss": 1.4829, "step": 21743 }, { "epoch": 1.71, "learning_rate": 0.00011713848833568573, "loss": 1.5225, "step": 21744 }, { "epoch": 1.71, "learning_rate": 0.0001171264289778879, "loss": 1.4853, "step": 21745 }, { "epoch": 1.71, "learning_rate": 0.00011711436984328347, "loss": 1.4977, "step": 21746 }, { "epoch": 1.71, "learning_rate": 0.00011710231093195437, "loss": 1.4956, "step": 21747 }, { "epoch": 1.71, "learning_rate": 0.00011709025224398237, "loss": 1.4475, "step": 21748 }, { "epoch": 1.71, "learning_rate": 0.00011707819377944944, "loss": 1.557, "step": 21749 }, { "epoch": 1.71, "learning_rate": 0.00011706613553843736, "loss": 1.4646, "step": 21750 }, { "epoch": 1.71, "learning_rate": 0.00011705407752102806, "loss": 1.4843, "step": 21751 }, { "epoch": 1.71, "learning_rate": 0.00011704201972730343, "loss": 1.4955, "step": 21752 }, { "epoch": 1.71, "learning_rate": 0.00011702996215734525, "loss": 1.4307, "step": 21753 }, { "epoch": 1.71, "learning_rate": 0.00011701790481123548, "loss": 1.4937, "step": 21754 }, { "epoch": 1.71, "learning_rate": 0.00011700584768905588, "loss": 1.4803, "step": 21755 }, { "epoch": 1.71, "learning_rate": 0.00011699379079088839, "loss": 1.5109, "step": 21756 }, { "epoch": 1.71, "learning_rate": 0.00011698173411681487, "loss": 1.5359, "step": 21757 }, { "epoch": 1.71, "learning_rate": 0.00011696967766691713, "loss": 1.4953, "step": 21758 }, { "epoch": 1.71, "learning_rate": 0.000116957621441277, "loss": 1.4488, "step": 21759 }, { "epoch": 1.71, "learning_rate": 0.00011694556543997643, "loss": 1.5283, "step": 21760 }, { "epoch": 1.71, "learning_rate": 0.00011693350966309725, "loss": 1.4602, "step": 21761 }, { "epoch": 1.71, "learning_rate": 0.00011692145411072126, "loss": 1.5352, "step": 21762 }, { "epoch": 1.71, "learning_rate": 0.00011690939878293037, "loss": 1.5044, "step": 21763 }, { "epoch": 1.71, "learning_rate": 0.00011689734367980642, "loss": 1.5356, "step": 21764 }, { "epoch": 1.71, "learning_rate": 0.00011688528880143119, "loss": 1.494, "step": 21765 }, { "epoch": 1.71, "learning_rate": 0.00011687323414788663, "loss": 1.5042, "step": 21766 }, { "epoch": 1.71, "learning_rate": 0.00011686117971925447, "loss": 1.4992, "step": 21767 }, { "epoch": 1.71, "learning_rate": 0.00011684912551561664, "loss": 1.4584, "step": 21768 }, { "epoch": 1.71, "learning_rate": 0.00011683707153705497, "loss": 1.4876, "step": 21769 }, { "epoch": 1.71, "learning_rate": 0.00011682501778365127, "loss": 1.4736, "step": 21770 }, { "epoch": 1.71, "learning_rate": 0.0001168129642554874, "loss": 1.4856, "step": 21771 }, { "epoch": 1.71, "learning_rate": 0.00011680091095264516, "loss": 1.4931, "step": 21772 }, { "epoch": 1.71, "learning_rate": 0.00011678885787520643, "loss": 1.5092, "step": 21773 }, { "epoch": 1.71, "learning_rate": 0.00011677680502325305, "loss": 1.4945, "step": 21774 }, { "epoch": 1.71, "learning_rate": 0.00011676475239686673, "loss": 1.4686, "step": 21775 }, { "epoch": 1.71, "learning_rate": 0.0001167526999961295, "loss": 1.502, "step": 21776 }, { "epoch": 1.71, "learning_rate": 0.00011674064782112306, "loss": 1.4837, "step": 21777 }, { "epoch": 1.71, "learning_rate": 0.0001167285958719293, "loss": 1.4697, "step": 21778 }, { "epoch": 1.71, "learning_rate": 0.00011671654414862998, "loss": 1.4899, "step": 21779 }, { "epoch": 1.71, "learning_rate": 0.00011670449265130696, "loss": 1.5091, "step": 21780 }, { "epoch": 1.71, "learning_rate": 0.0001166924413800421, "loss": 1.4932, "step": 21781 }, { "epoch": 1.71, "learning_rate": 0.00011668039033491711, "loss": 1.5346, "step": 21782 }, { "epoch": 1.71, "learning_rate": 0.00011666833951601395, "loss": 1.5021, "step": 21783 }, { "epoch": 1.71, "learning_rate": 0.00011665628892341433, "loss": 1.489, "step": 21784 }, { "epoch": 1.71, "learning_rate": 0.00011664423855720012, "loss": 1.4885, "step": 21785 }, { "epoch": 1.71, "learning_rate": 0.00011663218841745314, "loss": 1.4825, "step": 21786 }, { "epoch": 1.71, "learning_rate": 0.00011662013850425516, "loss": 1.4402, "step": 21787 }, { "epoch": 1.71, "learning_rate": 0.00011660808881768803, "loss": 1.5133, "step": 21788 }, { "epoch": 1.71, "learning_rate": 0.00011659603935783357, "loss": 1.4744, "step": 21789 }, { "epoch": 1.71, "learning_rate": 0.00011658399012477353, "loss": 1.5261, "step": 21790 }, { "epoch": 1.71, "learning_rate": 0.00011657194111858974, "loss": 1.501, "step": 21791 }, { "epoch": 1.71, "learning_rate": 0.00011655989233936404, "loss": 1.5039, "step": 21792 }, { "epoch": 1.71, "learning_rate": 0.00011654784378717825, "loss": 1.499, "step": 21793 }, { "epoch": 1.71, "learning_rate": 0.00011653579546211413, "loss": 1.4708, "step": 21794 }, { "epoch": 1.71, "learning_rate": 0.0001165237473642535, "loss": 1.4568, "step": 21795 }, { "epoch": 1.71, "learning_rate": 0.00011651169949367813, "loss": 1.5327, "step": 21796 }, { "epoch": 1.72, "learning_rate": 0.00011649965185046984, "loss": 1.4441, "step": 21797 }, { "epoch": 1.72, "learning_rate": 0.00011648760443471045, "loss": 1.4718, "step": 21798 }, { "epoch": 1.72, "learning_rate": 0.0001164755572464817, "loss": 1.5542, "step": 21799 }, { "epoch": 1.72, "learning_rate": 0.00011646351028586544, "loss": 1.5415, "step": 21800 }, { "epoch": 1.72, "learning_rate": 0.00011645146355294344, "loss": 1.4788, "step": 21801 }, { "epoch": 1.72, "learning_rate": 0.00011643941704779747, "loss": 1.5376, "step": 21802 }, { "epoch": 1.72, "learning_rate": 0.00011642737077050936, "loss": 1.4918, "step": 21803 }, { "epoch": 1.72, "learning_rate": 0.00011641532472116087, "loss": 1.5142, "step": 21804 }, { "epoch": 1.72, "learning_rate": 0.00011640327889983377, "loss": 1.474, "step": 21805 }, { "epoch": 1.72, "learning_rate": 0.00011639123330660983, "loss": 1.4919, "step": 21806 }, { "epoch": 1.72, "learning_rate": 0.00011637918794157096, "loss": 1.5138, "step": 21807 }, { "epoch": 1.72, "learning_rate": 0.0001163671428047988, "loss": 1.4818, "step": 21808 }, { "epoch": 1.72, "learning_rate": 0.00011635509789637518, "loss": 1.4592, "step": 21809 }, { "epoch": 1.72, "learning_rate": 0.00011634305321638191, "loss": 1.5153, "step": 21810 }, { "epoch": 1.72, "learning_rate": 0.00011633100876490072, "loss": 1.5415, "step": 21811 }, { "epoch": 1.72, "learning_rate": 0.0001163189645420134, "loss": 1.5633, "step": 21812 }, { "epoch": 1.72, "learning_rate": 0.00011630692054780172, "loss": 1.4835, "step": 21813 }, { "epoch": 1.72, "learning_rate": 0.00011629487678234742, "loss": 1.5361, "step": 21814 }, { "epoch": 1.72, "learning_rate": 0.00011628283324573238, "loss": 1.5168, "step": 21815 }, { "epoch": 1.72, "learning_rate": 0.00011627078993803824, "loss": 1.5538, "step": 21816 }, { "epoch": 1.72, "learning_rate": 0.00011625874685934683, "loss": 1.5534, "step": 21817 }, { "epoch": 1.72, "learning_rate": 0.00011624670400973996, "loss": 1.5094, "step": 21818 }, { "epoch": 1.72, "learning_rate": 0.00011623466138929928, "loss": 1.5114, "step": 21819 }, { "epoch": 1.72, "learning_rate": 0.00011622261899810666, "loss": 1.462, "step": 21820 }, { "epoch": 1.72, "learning_rate": 0.00011621057683624378, "loss": 1.4697, "step": 21821 }, { "epoch": 1.72, "learning_rate": 0.00011619853490379242, "loss": 1.5199, "step": 21822 }, { "epoch": 1.72, "learning_rate": 0.00011618649320083437, "loss": 1.5217, "step": 21823 }, { "epoch": 1.72, "learning_rate": 0.0001161744517274514, "loss": 1.5031, "step": 21824 }, { "epoch": 1.72, "learning_rate": 0.00011616241048372522, "loss": 1.4758, "step": 21825 }, { "epoch": 1.72, "learning_rate": 0.00011615036946973759, "loss": 1.4821, "step": 21826 }, { "epoch": 1.72, "learning_rate": 0.00011613832868557032, "loss": 1.5424, "step": 21827 }, { "epoch": 1.72, "learning_rate": 0.00011612628813130506, "loss": 1.432, "step": 21828 }, { "epoch": 1.72, "learning_rate": 0.00011611424780702362, "loss": 1.5258, "step": 21829 }, { "epoch": 1.72, "learning_rate": 0.00011610220771280778, "loss": 1.5107, "step": 21830 }, { "epoch": 1.72, "learning_rate": 0.0001160901678487392, "loss": 1.5418, "step": 21831 }, { "epoch": 1.72, "learning_rate": 0.0001160781282148997, "loss": 1.5465, "step": 21832 }, { "epoch": 1.72, "learning_rate": 0.00011606608881137095, "loss": 1.5296, "step": 21833 }, { "epoch": 1.72, "learning_rate": 0.00011605404963823474, "loss": 1.4953, "step": 21834 }, { "epoch": 1.72, "learning_rate": 0.00011604201069557283, "loss": 1.5021, "step": 21835 }, { "epoch": 1.72, "learning_rate": 0.0001160299719834669, "loss": 1.5264, "step": 21836 }, { "epoch": 1.72, "learning_rate": 0.00011601793350199873, "loss": 1.5237, "step": 21837 }, { "epoch": 1.72, "learning_rate": 0.00011600589525124995, "loss": 1.4743, "step": 21838 }, { "epoch": 1.72, "learning_rate": 0.00011599385723130249, "loss": 1.4846, "step": 21839 }, { "epoch": 1.72, "learning_rate": 0.00011598181944223793, "loss": 1.5016, "step": 21840 }, { "epoch": 1.72, "learning_rate": 0.00011596978188413807, "loss": 1.4983, "step": 21841 }, { "epoch": 1.72, "learning_rate": 0.0001159577445570846, "loss": 1.5422, "step": 21842 }, { "epoch": 1.72, "learning_rate": 0.00011594570746115924, "loss": 1.4817, "step": 21843 }, { "epoch": 1.72, "learning_rate": 0.00011593367059644377, "loss": 1.4687, "step": 21844 }, { "epoch": 1.72, "learning_rate": 0.00011592163396301983, "loss": 1.5071, "step": 21845 }, { "epoch": 1.72, "learning_rate": 0.00011590959756096922, "loss": 1.4531, "step": 21846 }, { "epoch": 1.72, "learning_rate": 0.00011589756139037365, "loss": 1.5099, "step": 21847 }, { "epoch": 1.72, "learning_rate": 0.00011588552545131478, "loss": 1.5048, "step": 21848 }, { "epoch": 1.72, "learning_rate": 0.00011587348974387441, "loss": 1.4703, "step": 21849 }, { "epoch": 1.72, "learning_rate": 0.00011586145426813417, "loss": 1.4876, "step": 21850 }, { "epoch": 1.72, "learning_rate": 0.00011584941902417583, "loss": 1.5792, "step": 21851 }, { "epoch": 1.72, "learning_rate": 0.00011583738401208111, "loss": 1.5129, "step": 21852 }, { "epoch": 1.72, "learning_rate": 0.00011582534923193166, "loss": 1.4772, "step": 21853 }, { "epoch": 1.72, "learning_rate": 0.0001158133146838092, "loss": 1.5065, "step": 21854 }, { "epoch": 1.72, "learning_rate": 0.0001158012803677955, "loss": 1.5115, "step": 21855 }, { "epoch": 1.72, "learning_rate": 0.00011578924628397227, "loss": 1.5596, "step": 21856 }, { "epoch": 1.72, "learning_rate": 0.00011577721243242117, "loss": 1.5103, "step": 21857 }, { "epoch": 1.72, "learning_rate": 0.00011576517881322387, "loss": 1.4645, "step": 21858 }, { "epoch": 1.72, "learning_rate": 0.00011575314542646217, "loss": 1.497, "step": 21859 }, { "epoch": 1.72, "learning_rate": 0.00011574111227221767, "loss": 1.5305, "step": 21860 }, { "epoch": 1.72, "learning_rate": 0.00011572907935057216, "loss": 1.5523, "step": 21861 }, { "epoch": 1.72, "learning_rate": 0.00011571704666160724, "loss": 1.4699, "step": 21862 }, { "epoch": 1.72, "learning_rate": 0.00011570501420540468, "loss": 1.4998, "step": 21863 }, { "epoch": 1.72, "learning_rate": 0.00011569298198204616, "loss": 1.5148, "step": 21864 }, { "epoch": 1.72, "learning_rate": 0.00011568094999161332, "loss": 1.4403, "step": 21865 }, { "epoch": 1.72, "learning_rate": 0.00011566891823418795, "loss": 1.537, "step": 21866 }, { "epoch": 1.72, "learning_rate": 0.00011565688670985163, "loss": 1.5663, "step": 21867 }, { "epoch": 1.72, "learning_rate": 0.00011564485541868609, "loss": 1.52, "step": 21868 }, { "epoch": 1.72, "learning_rate": 0.000115632824360773, "loss": 1.4904, "step": 21869 }, { "epoch": 1.72, "learning_rate": 0.00011562079353619413, "loss": 1.5177, "step": 21870 }, { "epoch": 1.72, "learning_rate": 0.00011560876294503105, "loss": 1.5503, "step": 21871 }, { "epoch": 1.72, "learning_rate": 0.00011559673258736552, "loss": 1.5356, "step": 21872 }, { "epoch": 1.72, "learning_rate": 0.00011558470246327922, "loss": 1.4913, "step": 21873 }, { "epoch": 1.72, "learning_rate": 0.00011557267257285374, "loss": 1.5184, "step": 21874 }, { "epoch": 1.72, "learning_rate": 0.00011556064291617085, "loss": 1.4641, "step": 21875 }, { "epoch": 1.72, "learning_rate": 0.0001155486134933122, "loss": 1.5139, "step": 21876 }, { "epoch": 1.72, "learning_rate": 0.00011553658430435943, "loss": 1.4969, "step": 21877 }, { "epoch": 1.72, "learning_rate": 0.00011552455534939425, "loss": 1.5087, "step": 21878 }, { "epoch": 1.72, "learning_rate": 0.0001155125266284983, "loss": 1.5017, "step": 21879 }, { "epoch": 1.72, "learning_rate": 0.00011550049814175326, "loss": 1.4887, "step": 21880 }, { "epoch": 1.72, "learning_rate": 0.00011548846988924081, "loss": 1.4585, "step": 21881 }, { "epoch": 1.72, "learning_rate": 0.0001154764418710426, "loss": 1.4869, "step": 21882 }, { "epoch": 1.72, "learning_rate": 0.00011546441408724029, "loss": 1.4536, "step": 21883 }, { "epoch": 1.72, "learning_rate": 0.00011545238653791557, "loss": 1.5074, "step": 21884 }, { "epoch": 1.72, "learning_rate": 0.00011544035922315002, "loss": 1.4954, "step": 21885 }, { "epoch": 1.72, "learning_rate": 0.0001154283321430254, "loss": 1.5201, "step": 21886 }, { "epoch": 1.72, "learning_rate": 0.00011541630529762333, "loss": 1.4452, "step": 21887 }, { "epoch": 1.72, "learning_rate": 0.00011540427868702549, "loss": 1.4284, "step": 21888 }, { "epoch": 1.72, "learning_rate": 0.00011539225231131347, "loss": 1.6, "step": 21889 }, { "epoch": 1.72, "learning_rate": 0.00011538022617056898, "loss": 1.4925, "step": 21890 }, { "epoch": 1.72, "learning_rate": 0.00011536820026487365, "loss": 1.5019, "step": 21891 }, { "epoch": 1.72, "learning_rate": 0.00011535617459430909, "loss": 1.4889, "step": 21892 }, { "epoch": 1.72, "learning_rate": 0.00011534414915895704, "loss": 1.4703, "step": 21893 }, { "epoch": 1.72, "learning_rate": 0.00011533212395889905, "loss": 1.4774, "step": 21894 }, { "epoch": 1.72, "learning_rate": 0.00011532009899421685, "loss": 1.4353, "step": 21895 }, { "epoch": 1.72, "learning_rate": 0.00011530807426499201, "loss": 1.466, "step": 21896 }, { "epoch": 1.72, "learning_rate": 0.00011529604977130619, "loss": 1.4694, "step": 21897 }, { "epoch": 1.72, "learning_rate": 0.00011528402551324109, "loss": 1.4774, "step": 21898 }, { "epoch": 1.72, "learning_rate": 0.00011527200149087825, "loss": 1.5012, "step": 21899 }, { "epoch": 1.72, "learning_rate": 0.00011525997770429937, "loss": 1.5184, "step": 21900 }, { "epoch": 1.72, "learning_rate": 0.000115247954153586, "loss": 1.5062, "step": 21901 }, { "epoch": 1.72, "learning_rate": 0.00011523593083881994, "loss": 1.5275, "step": 21902 }, { "epoch": 1.72, "learning_rate": 0.00011522390776008271, "loss": 1.4936, "step": 21903 }, { "epoch": 1.72, "learning_rate": 0.00011521188491745593, "loss": 1.4416, "step": 21904 }, { "epoch": 1.72, "learning_rate": 0.00011519986231102129, "loss": 1.5371, "step": 21905 }, { "epoch": 1.72, "learning_rate": 0.00011518783994086033, "loss": 1.4748, "step": 21906 }, { "epoch": 1.72, "learning_rate": 0.0001151758178070548, "loss": 1.522, "step": 21907 }, { "epoch": 1.72, "learning_rate": 0.00011516379590968619, "loss": 1.4949, "step": 21908 }, { "epoch": 1.72, "learning_rate": 0.00011515177424883618, "loss": 1.5433, "step": 21909 }, { "epoch": 1.72, "learning_rate": 0.00011513975282458643, "loss": 1.5048, "step": 21910 }, { "epoch": 1.72, "learning_rate": 0.0001151277316370185, "loss": 1.5097, "step": 21911 }, { "epoch": 1.72, "learning_rate": 0.00011511571068621402, "loss": 1.4218, "step": 21912 }, { "epoch": 1.72, "learning_rate": 0.00011510368997225464, "loss": 1.4586, "step": 21913 }, { "epoch": 1.72, "learning_rate": 0.0001150916694952219, "loss": 1.4927, "step": 21914 }, { "epoch": 1.72, "learning_rate": 0.00011507964925519752, "loss": 1.468, "step": 21915 }, { "epoch": 1.72, "learning_rate": 0.00011506762925226295, "loss": 1.4981, "step": 21916 }, { "epoch": 1.72, "learning_rate": 0.0001150556094865, "loss": 1.532, "step": 21917 }, { "epoch": 1.72, "learning_rate": 0.00011504358995799012, "loss": 1.4571, "step": 21918 }, { "epoch": 1.72, "learning_rate": 0.00011503157066681504, "loss": 1.4705, "step": 21919 }, { "epoch": 1.72, "learning_rate": 0.00011501955161305623, "loss": 1.488, "step": 21920 }, { "epoch": 1.72, "learning_rate": 0.00011500753279679539, "loss": 1.4521, "step": 21921 }, { "epoch": 1.72, "learning_rate": 0.0001149955142181141, "loss": 1.5566, "step": 21922 }, { "epoch": 1.72, "learning_rate": 0.00011498349587709395, "loss": 1.4782, "step": 21923 }, { "epoch": 1.73, "learning_rate": 0.00011497147777381656, "loss": 1.4882, "step": 21924 }, { "epoch": 1.73, "learning_rate": 0.00011495945990836345, "loss": 1.5078, "step": 21925 }, { "epoch": 1.73, "learning_rate": 0.00011494744228081631, "loss": 1.4632, "step": 21926 }, { "epoch": 1.73, "learning_rate": 0.0001149354248912567, "loss": 1.5036, "step": 21927 }, { "epoch": 1.73, "learning_rate": 0.00011492340773976616, "loss": 1.496, "step": 21928 }, { "epoch": 1.73, "learning_rate": 0.00011491139082642636, "loss": 1.4721, "step": 21929 }, { "epoch": 1.73, "learning_rate": 0.00011489937415131884, "loss": 1.4573, "step": 21930 }, { "epoch": 1.73, "learning_rate": 0.00011488735771452521, "loss": 1.452, "step": 21931 }, { "epoch": 1.73, "learning_rate": 0.00011487534151612698, "loss": 1.501, "step": 21932 }, { "epoch": 1.73, "learning_rate": 0.00011486332555620586, "loss": 1.4838, "step": 21933 }, { "epoch": 1.73, "learning_rate": 0.00011485130983484338, "loss": 1.51, "step": 21934 }, { "epoch": 1.73, "learning_rate": 0.00011483929435212109, "loss": 1.5409, "step": 21935 }, { "epoch": 1.73, "learning_rate": 0.00011482727910812061, "loss": 1.5138, "step": 21936 }, { "epoch": 1.73, "learning_rate": 0.00011481526410292347, "loss": 1.4601, "step": 21937 }, { "epoch": 1.73, "learning_rate": 0.00011480324933661126, "loss": 1.4668, "step": 21938 }, { "epoch": 1.73, "learning_rate": 0.00011479123480926561, "loss": 1.5292, "step": 21939 }, { "epoch": 1.73, "learning_rate": 0.000114779220520968, "loss": 1.5164, "step": 21940 }, { "epoch": 1.73, "learning_rate": 0.00011476720647180006, "loss": 1.4796, "step": 21941 }, { "epoch": 1.73, "learning_rate": 0.00011475519266184337, "loss": 1.5116, "step": 21942 }, { "epoch": 1.73, "learning_rate": 0.00011474317909117944, "loss": 1.4171, "step": 21943 }, { "epoch": 1.73, "learning_rate": 0.0001147311657598899, "loss": 1.4449, "step": 21944 }, { "epoch": 1.73, "learning_rate": 0.00011471915266805624, "loss": 1.5341, "step": 21945 }, { "epoch": 1.73, "learning_rate": 0.00011470713981576008, "loss": 1.4861, "step": 21946 }, { "epoch": 1.73, "learning_rate": 0.00011469512720308299, "loss": 1.4571, "step": 21947 }, { "epoch": 1.73, "learning_rate": 0.00011468311483010644, "loss": 1.5567, "step": 21948 }, { "epoch": 1.73, "learning_rate": 0.00011467110269691208, "loss": 1.5348, "step": 21949 }, { "epoch": 1.73, "learning_rate": 0.00011465909080358144, "loss": 1.5227, "step": 21950 }, { "epoch": 1.73, "learning_rate": 0.0001146470791501961, "loss": 1.5149, "step": 21951 }, { "epoch": 1.73, "learning_rate": 0.00011463506773683756, "loss": 1.5066, "step": 21952 }, { "epoch": 1.73, "learning_rate": 0.00011462305656358741, "loss": 1.5197, "step": 21953 }, { "epoch": 1.73, "learning_rate": 0.00011461104563052715, "loss": 1.5093, "step": 21954 }, { "epoch": 1.73, "learning_rate": 0.00011459903493773839, "loss": 1.49, "step": 21955 }, { "epoch": 1.73, "learning_rate": 0.00011458702448530265, "loss": 1.4679, "step": 21956 }, { "epoch": 1.73, "learning_rate": 0.00011457501427330145, "loss": 1.5195, "step": 21957 }, { "epoch": 1.73, "learning_rate": 0.00011456300430181636, "loss": 1.4719, "step": 21958 }, { "epoch": 1.73, "learning_rate": 0.00011455099457092893, "loss": 1.473, "step": 21959 }, { "epoch": 1.73, "learning_rate": 0.00011453898508072067, "loss": 1.4846, "step": 21960 }, { "epoch": 1.73, "learning_rate": 0.00011452697583127316, "loss": 1.5012, "step": 21961 }, { "epoch": 1.73, "learning_rate": 0.00011451496682266787, "loss": 1.4668, "step": 21962 }, { "epoch": 1.73, "learning_rate": 0.00011450295805498637, "loss": 1.4933, "step": 21963 }, { "epoch": 1.73, "learning_rate": 0.00011449094952831017, "loss": 1.5032, "step": 21964 }, { "epoch": 1.73, "learning_rate": 0.00011447894124272089, "loss": 1.4718, "step": 21965 }, { "epoch": 1.73, "learning_rate": 0.00011446693319829996, "loss": 1.4638, "step": 21966 }, { "epoch": 1.73, "learning_rate": 0.00011445492539512896, "loss": 1.4554, "step": 21967 }, { "epoch": 1.73, "learning_rate": 0.00011444291783328943, "loss": 1.4749, "step": 21968 }, { "epoch": 1.73, "learning_rate": 0.00011443091051286282, "loss": 1.4621, "step": 21969 }, { "epoch": 1.73, "learning_rate": 0.00011441890343393071, "loss": 1.524, "step": 21970 }, { "epoch": 1.73, "learning_rate": 0.00011440689659657464, "loss": 1.5302, "step": 21971 }, { "epoch": 1.73, "learning_rate": 0.00011439489000087607, "loss": 1.49, "step": 21972 }, { "epoch": 1.73, "learning_rate": 0.00011438288364691657, "loss": 1.4521, "step": 21973 }, { "epoch": 1.73, "learning_rate": 0.00011437087753477761, "loss": 1.4869, "step": 21974 }, { "epoch": 1.73, "learning_rate": 0.00011435887166454074, "loss": 1.4977, "step": 21975 }, { "epoch": 1.73, "learning_rate": 0.00011434686603628748, "loss": 1.4957, "step": 21976 }, { "epoch": 1.73, "learning_rate": 0.0001143348606500993, "loss": 1.4507, "step": 21977 }, { "epoch": 1.73, "learning_rate": 0.00011432285550605777, "loss": 1.4978, "step": 21978 }, { "epoch": 1.73, "learning_rate": 0.00011431085060424426, "loss": 1.4572, "step": 21979 }, { "epoch": 1.73, "learning_rate": 0.00011429884594474047, "loss": 1.4642, "step": 21980 }, { "epoch": 1.73, "learning_rate": 0.00011428684152762778, "loss": 1.5046, "step": 21981 }, { "epoch": 1.73, "learning_rate": 0.00011427483735298775, "loss": 1.4848, "step": 21982 }, { "epoch": 1.73, "learning_rate": 0.00011426283342090188, "loss": 1.5113, "step": 21983 }, { "epoch": 1.73, "learning_rate": 0.00011425082973145161, "loss": 1.4739, "step": 21984 }, { "epoch": 1.73, "learning_rate": 0.00011423882628471852, "loss": 1.5461, "step": 21985 }, { "epoch": 1.73, "learning_rate": 0.00011422682308078403, "loss": 1.5106, "step": 21986 }, { "epoch": 1.73, "learning_rate": 0.00011421482011972967, "loss": 1.4884, "step": 21987 }, { "epoch": 1.73, "learning_rate": 0.00011420281740163697, "loss": 1.5756, "step": 21988 }, { "epoch": 1.73, "learning_rate": 0.00011419081492658736, "loss": 1.465, "step": 21989 }, { "epoch": 1.73, "learning_rate": 0.00011417881269466236, "loss": 1.5383, "step": 21990 }, { "epoch": 1.73, "learning_rate": 0.00011416681070594343, "loss": 1.5478, "step": 21991 }, { "epoch": 1.73, "learning_rate": 0.0001141548089605121, "loss": 1.5555, "step": 21992 }, { "epoch": 1.73, "learning_rate": 0.00011414280745844985, "loss": 1.4659, "step": 21993 }, { "epoch": 1.73, "learning_rate": 0.00011413080619983814, "loss": 1.5253, "step": 21994 }, { "epoch": 1.73, "learning_rate": 0.0001141188051847584, "loss": 1.4709, "step": 21995 }, { "epoch": 1.73, "learning_rate": 0.00011410680441329222, "loss": 1.4962, "step": 21996 }, { "epoch": 1.73, "learning_rate": 0.00011409480388552105, "loss": 1.4983, "step": 21997 }, { "epoch": 1.73, "learning_rate": 0.00011408280360152633, "loss": 1.5203, "step": 21998 }, { "epoch": 1.73, "learning_rate": 0.00011407080356138956, "loss": 1.4904, "step": 21999 }, { "epoch": 1.73, "learning_rate": 0.00011405880376519222, "loss": 1.5718, "step": 22000 }, { "epoch": 1.73, "learning_rate": 0.00011404680421301575, "loss": 1.5214, "step": 22001 }, { "epoch": 1.73, "learning_rate": 0.00011403480490494166, "loss": 1.5165, "step": 22002 }, { "epoch": 1.73, "learning_rate": 0.00011402280584105137, "loss": 1.4844, "step": 22003 }, { "epoch": 1.73, "learning_rate": 0.00011401080702142637, "loss": 1.4727, "step": 22004 }, { "epoch": 1.73, "learning_rate": 0.00011399880844614818, "loss": 1.5617, "step": 22005 }, { "epoch": 1.73, "learning_rate": 0.00011398681011529816, "loss": 1.4765, "step": 22006 }, { "epoch": 1.73, "learning_rate": 0.00011397481202895786, "loss": 1.4933, "step": 22007 }, { "epoch": 1.73, "learning_rate": 0.00011396281418720869, "loss": 1.52, "step": 22008 }, { "epoch": 1.73, "learning_rate": 0.00011395081659013211, "loss": 1.4937, "step": 22009 }, { "epoch": 1.73, "learning_rate": 0.00011393881923780964, "loss": 1.5215, "step": 22010 }, { "epoch": 1.73, "learning_rate": 0.00011392682213032258, "loss": 1.4979, "step": 22011 }, { "epoch": 1.73, "learning_rate": 0.00011391482526775258, "loss": 1.4988, "step": 22012 }, { "epoch": 1.73, "learning_rate": 0.00011390282865018097, "loss": 1.4822, "step": 22013 }, { "epoch": 1.73, "learning_rate": 0.00011389083227768928, "loss": 1.4733, "step": 22014 }, { "epoch": 1.73, "learning_rate": 0.00011387883615035888, "loss": 1.521, "step": 22015 }, { "epoch": 1.73, "learning_rate": 0.00011386684026827125, "loss": 1.437, "step": 22016 }, { "epoch": 1.73, "learning_rate": 0.00011385484463150784, "loss": 1.5031, "step": 22017 }, { "epoch": 1.73, "learning_rate": 0.00011384284924015007, "loss": 1.5062, "step": 22018 }, { "epoch": 1.73, "learning_rate": 0.00011383085409427944, "loss": 1.5117, "step": 22019 }, { "epoch": 1.73, "learning_rate": 0.00011381885919397733, "loss": 1.5086, "step": 22020 }, { "epoch": 1.73, "learning_rate": 0.00011380686453932518, "loss": 1.5233, "step": 22021 }, { "epoch": 1.73, "learning_rate": 0.00011379487013040448, "loss": 1.5505, "step": 22022 }, { "epoch": 1.73, "learning_rate": 0.00011378287596729661, "loss": 1.4835, "step": 22023 }, { "epoch": 1.73, "learning_rate": 0.00011377088205008303, "loss": 1.4274, "step": 22024 }, { "epoch": 1.73, "learning_rate": 0.0001137588883788452, "loss": 1.4837, "step": 22025 }, { "epoch": 1.73, "learning_rate": 0.00011374689495366443, "loss": 1.4864, "step": 22026 }, { "epoch": 1.73, "learning_rate": 0.00011373490177462229, "loss": 1.4719, "step": 22027 }, { "epoch": 1.73, "learning_rate": 0.00011372290884180014, "loss": 1.4943, "step": 22028 }, { "epoch": 1.73, "learning_rate": 0.00011371091615527947, "loss": 1.4556, "step": 22029 }, { "epoch": 1.73, "learning_rate": 0.0001136989237151416, "loss": 1.5462, "step": 22030 }, { "epoch": 1.73, "learning_rate": 0.00011368693152146806, "loss": 1.4792, "step": 22031 }, { "epoch": 1.73, "learning_rate": 0.00011367493957434017, "loss": 1.4675, "step": 22032 }, { "epoch": 1.73, "learning_rate": 0.00011366294787383939, "loss": 1.5415, "step": 22033 }, { "epoch": 1.73, "learning_rate": 0.00011365095642004719, "loss": 1.5002, "step": 22034 }, { "epoch": 1.73, "learning_rate": 0.00011363896521304489, "loss": 1.4228, "step": 22035 }, { "epoch": 1.73, "learning_rate": 0.00011362697425291398, "loss": 1.5013, "step": 22036 }, { "epoch": 1.73, "learning_rate": 0.00011361498353973583, "loss": 1.4515, "step": 22037 }, { "epoch": 1.73, "learning_rate": 0.00011360299307359184, "loss": 1.4855, "step": 22038 }, { "epoch": 1.73, "learning_rate": 0.0001135910028545635, "loss": 1.5149, "step": 22039 }, { "epoch": 1.73, "learning_rate": 0.00011357901288273212, "loss": 1.5121, "step": 22040 }, { "epoch": 1.73, "learning_rate": 0.00011356702315817913, "loss": 1.4721, "step": 22041 }, { "epoch": 1.73, "learning_rate": 0.0001135550336809859, "loss": 1.4097, "step": 22042 }, { "epoch": 1.73, "learning_rate": 0.00011354304445123397, "loss": 1.5125, "step": 22043 }, { "epoch": 1.73, "learning_rate": 0.00011353105546900463, "loss": 1.486, "step": 22044 }, { "epoch": 1.73, "learning_rate": 0.00011351906673437926, "loss": 1.4732, "step": 22045 }, { "epoch": 1.73, "learning_rate": 0.00011350707824743935, "loss": 1.5026, "step": 22046 }, { "epoch": 1.73, "learning_rate": 0.0001134950900082662, "loss": 1.4605, "step": 22047 }, { "epoch": 1.73, "learning_rate": 0.00011348310201694129, "loss": 1.4983, "step": 22048 }, { "epoch": 1.73, "learning_rate": 0.00011347111427354592, "loss": 1.531, "step": 22049 }, { "epoch": 1.73, "learning_rate": 0.00011345912677816154, "loss": 1.4764, "step": 22050 }, { "epoch": 1.74, "learning_rate": 0.00011344713953086954, "loss": 1.5228, "step": 22051 }, { "epoch": 1.74, "learning_rate": 0.00011343515253175127, "loss": 1.4626, "step": 22052 }, { "epoch": 1.74, "learning_rate": 0.00011342316578088812, "loss": 1.5128, "step": 22053 }, { "epoch": 1.74, "learning_rate": 0.00011341117927836155, "loss": 1.512, "step": 22054 }, { "epoch": 1.74, "learning_rate": 0.00011339919302425283, "loss": 1.5125, "step": 22055 }, { "epoch": 1.74, "learning_rate": 0.00011338720701864342, "loss": 1.5102, "step": 22056 }, { "epoch": 1.74, "learning_rate": 0.00011337522126161464, "loss": 1.4214, "step": 22057 }, { "epoch": 1.74, "learning_rate": 0.00011336323575324788, "loss": 1.4589, "step": 22058 }, { "epoch": 1.74, "learning_rate": 0.00011335125049362455, "loss": 1.503, "step": 22059 }, { "epoch": 1.74, "learning_rate": 0.00011333926548282602, "loss": 1.4847, "step": 22060 }, { "epoch": 1.74, "learning_rate": 0.00011332728072093365, "loss": 1.4716, "step": 22061 }, { "epoch": 1.74, "learning_rate": 0.00011331529620802879, "loss": 1.5293, "step": 22062 }, { "epoch": 1.74, "learning_rate": 0.00011330331194419284, "loss": 1.5373, "step": 22063 }, { "epoch": 1.74, "learning_rate": 0.00011329132792950714, "loss": 1.5418, "step": 22064 }, { "epoch": 1.74, "learning_rate": 0.00011327934416405309, "loss": 1.4043, "step": 22065 }, { "epoch": 1.74, "learning_rate": 0.000113267360647912, "loss": 1.4734, "step": 22066 }, { "epoch": 1.74, "learning_rate": 0.00011325537738116526, "loss": 1.4359, "step": 22067 }, { "epoch": 1.74, "learning_rate": 0.00011324339436389427, "loss": 1.538, "step": 22068 }, { "epoch": 1.74, "learning_rate": 0.0001132314115961803, "loss": 1.4314, "step": 22069 }, { "epoch": 1.74, "learning_rate": 0.00011321942907810477, "loss": 1.4777, "step": 22070 }, { "epoch": 1.74, "learning_rate": 0.00011320744680974905, "loss": 1.4658, "step": 22071 }, { "epoch": 1.74, "learning_rate": 0.00011319546479119441, "loss": 1.4965, "step": 22072 }, { "epoch": 1.74, "learning_rate": 0.00011318348302252232, "loss": 1.5015, "step": 22073 }, { "epoch": 1.74, "learning_rate": 0.00011317150150381393, "loss": 1.497, "step": 22074 }, { "epoch": 1.74, "learning_rate": 0.00011315952023515083, "loss": 1.4711, "step": 22075 }, { "epoch": 1.74, "learning_rate": 0.00011314753921661424, "loss": 1.5293, "step": 22076 }, { "epoch": 1.74, "learning_rate": 0.00011313555844828553, "loss": 1.5261, "step": 22077 }, { "epoch": 1.74, "learning_rate": 0.00011312357793024604, "loss": 1.4559, "step": 22078 }, { "epoch": 1.74, "learning_rate": 0.00011311159766257706, "loss": 1.4679, "step": 22079 }, { "epoch": 1.74, "learning_rate": 0.00011309961764536004, "loss": 1.5415, "step": 22080 }, { "epoch": 1.74, "learning_rate": 0.0001130876378786762, "loss": 1.4063, "step": 22081 }, { "epoch": 1.74, "learning_rate": 0.00011307565836260694, "loss": 1.4841, "step": 22082 }, { "epoch": 1.74, "learning_rate": 0.00011306367909723363, "loss": 1.5321, "step": 22083 }, { "epoch": 1.74, "learning_rate": 0.0001130517000826375, "loss": 1.5106, "step": 22084 }, { "epoch": 1.74, "learning_rate": 0.00011303972131889997, "loss": 1.5351, "step": 22085 }, { "epoch": 1.74, "learning_rate": 0.0001130277428061023, "loss": 1.5237, "step": 22086 }, { "epoch": 1.74, "learning_rate": 0.00011301576454432588, "loss": 1.5138, "step": 22087 }, { "epoch": 1.74, "learning_rate": 0.00011300378653365203, "loss": 1.4375, "step": 22088 }, { "epoch": 1.74, "learning_rate": 0.00011299180877416198, "loss": 1.4774, "step": 22089 }, { "epoch": 1.74, "learning_rate": 0.00011297983126593716, "loss": 1.4497, "step": 22090 }, { "epoch": 1.74, "learning_rate": 0.00011296785400905886, "loss": 1.4189, "step": 22091 }, { "epoch": 1.74, "learning_rate": 0.00011295587700360843, "loss": 1.5062, "step": 22092 }, { "epoch": 1.74, "learning_rate": 0.00011294390024966711, "loss": 1.4501, "step": 22093 }, { "epoch": 1.74, "learning_rate": 0.00011293192374731625, "loss": 1.5694, "step": 22094 }, { "epoch": 1.74, "learning_rate": 0.00011291994749663724, "loss": 1.5273, "step": 22095 }, { "epoch": 1.74, "learning_rate": 0.00011290797149771127, "loss": 1.5321, "step": 22096 }, { "epoch": 1.74, "learning_rate": 0.00011289599575061972, "loss": 1.515, "step": 22097 }, { "epoch": 1.74, "learning_rate": 0.00011288402025544389, "loss": 1.5293, "step": 22098 }, { "epoch": 1.74, "learning_rate": 0.00011287204501226505, "loss": 1.5375, "step": 22099 }, { "epoch": 1.74, "learning_rate": 0.00011286007002116457, "loss": 1.5174, "step": 22100 }, { "epoch": 1.74, "learning_rate": 0.00011284809528222368, "loss": 1.5306, "step": 22101 }, { "epoch": 1.74, "learning_rate": 0.00011283612079552377, "loss": 1.4794, "step": 22102 }, { "epoch": 1.74, "learning_rate": 0.00011282414656114606, "loss": 1.4456, "step": 22103 }, { "epoch": 1.74, "learning_rate": 0.00011281217257917188, "loss": 1.4921, "step": 22104 }, { "epoch": 1.74, "learning_rate": 0.00011280019884968248, "loss": 1.4898, "step": 22105 }, { "epoch": 1.74, "learning_rate": 0.00011278822537275926, "loss": 1.5146, "step": 22106 }, { "epoch": 1.74, "learning_rate": 0.00011277625214848345, "loss": 1.499, "step": 22107 }, { "epoch": 1.74, "learning_rate": 0.00011276427917693632, "loss": 1.452, "step": 22108 }, { "epoch": 1.74, "learning_rate": 0.00011275230645819924, "loss": 1.4796, "step": 22109 }, { "epoch": 1.74, "learning_rate": 0.00011274033399235341, "loss": 1.5113, "step": 22110 }, { "epoch": 1.74, "learning_rate": 0.00011272836177948015, "loss": 1.5105, "step": 22111 }, { "epoch": 1.74, "learning_rate": 0.00011271638981966076, "loss": 1.5193, "step": 22112 }, { "epoch": 1.74, "learning_rate": 0.00011270441811297649, "loss": 1.4914, "step": 22113 }, { "epoch": 1.74, "learning_rate": 0.00011269244665950867, "loss": 1.4938, "step": 22114 }, { "epoch": 1.74, "learning_rate": 0.0001126804754593385, "loss": 1.4603, "step": 22115 }, { "epoch": 1.74, "learning_rate": 0.00011266850451254733, "loss": 1.4681, "step": 22116 }, { "epoch": 1.74, "learning_rate": 0.00011265653381921644, "loss": 1.5172, "step": 22117 }, { "epoch": 1.74, "learning_rate": 0.00011264456337942704, "loss": 1.5043, "step": 22118 }, { "epoch": 1.74, "learning_rate": 0.00011263259319326046, "loss": 1.5021, "step": 22119 }, { "epoch": 1.74, "learning_rate": 0.00011262062326079795, "loss": 1.4801, "step": 22120 }, { "epoch": 1.74, "learning_rate": 0.00011260865358212072, "loss": 1.5219, "step": 22121 }, { "epoch": 1.74, "learning_rate": 0.00011259668415731015, "loss": 1.4715, "step": 22122 }, { "epoch": 1.74, "learning_rate": 0.00011258471498644745, "loss": 1.4628, "step": 22123 }, { "epoch": 1.74, "learning_rate": 0.00011257274606961392, "loss": 1.5561, "step": 22124 }, { "epoch": 1.74, "learning_rate": 0.00011256077740689074, "loss": 1.4529, "step": 22125 }, { "epoch": 1.74, "learning_rate": 0.00011254880899835928, "loss": 1.4963, "step": 22126 }, { "epoch": 1.74, "learning_rate": 0.0001125368408441007, "loss": 1.531, "step": 22127 }, { "epoch": 1.74, "learning_rate": 0.00011252487294419628, "loss": 1.4919, "step": 22128 }, { "epoch": 1.74, "learning_rate": 0.00011251290529872734, "loss": 1.4949, "step": 22129 }, { "epoch": 1.74, "learning_rate": 0.00011250093790777506, "loss": 1.5161, "step": 22130 }, { "epoch": 1.74, "learning_rate": 0.00011248897077142073, "loss": 1.5005, "step": 22131 }, { "epoch": 1.74, "learning_rate": 0.00011247700388974557, "loss": 1.4761, "step": 22132 }, { "epoch": 1.74, "learning_rate": 0.00011246503726283083, "loss": 1.4723, "step": 22133 }, { "epoch": 1.74, "learning_rate": 0.00011245307089075781, "loss": 1.5189, "step": 22134 }, { "epoch": 1.74, "learning_rate": 0.00011244110477360771, "loss": 1.4977, "step": 22135 }, { "epoch": 1.74, "learning_rate": 0.00011242913891146172, "loss": 1.5253, "step": 22136 }, { "epoch": 1.74, "learning_rate": 0.0001124171733044012, "loss": 1.5039, "step": 22137 }, { "epoch": 1.74, "learning_rate": 0.00011240520795250735, "loss": 1.5078, "step": 22138 }, { "epoch": 1.74, "learning_rate": 0.00011239324285586138, "loss": 1.4823, "step": 22139 }, { "epoch": 1.74, "learning_rate": 0.00011238127801454451, "loss": 1.5498, "step": 22140 }, { "epoch": 1.74, "learning_rate": 0.00011236931342863805, "loss": 1.4971, "step": 22141 }, { "epoch": 1.74, "learning_rate": 0.00011235734909822314, "loss": 1.4966, "step": 22142 }, { "epoch": 1.74, "learning_rate": 0.00011234538502338112, "loss": 1.5257, "step": 22143 }, { "epoch": 1.74, "learning_rate": 0.00011233342120419309, "loss": 1.516, "step": 22144 }, { "epoch": 1.74, "learning_rate": 0.00011232145764074035, "loss": 1.459, "step": 22145 }, { "epoch": 1.74, "learning_rate": 0.00011230949433310417, "loss": 1.5085, "step": 22146 }, { "epoch": 1.74, "learning_rate": 0.00011229753128136567, "loss": 1.4783, "step": 22147 }, { "epoch": 1.74, "learning_rate": 0.00011228556848560616, "loss": 1.471, "step": 22148 }, { "epoch": 1.74, "learning_rate": 0.00011227360594590681, "loss": 1.5175, "step": 22149 }, { "epoch": 1.74, "learning_rate": 0.00011226164366234887, "loss": 1.4708, "step": 22150 }, { "epoch": 1.74, "learning_rate": 0.00011224968163501354, "loss": 1.4838, "step": 22151 }, { "epoch": 1.74, "learning_rate": 0.00011223771986398197, "loss": 1.5274, "step": 22152 }, { "epoch": 1.74, "learning_rate": 0.00011222575834933553, "loss": 1.4748, "step": 22153 }, { "epoch": 1.74, "learning_rate": 0.00011221379709115532, "loss": 1.4734, "step": 22154 }, { "epoch": 1.74, "learning_rate": 0.0001122018360895226, "loss": 1.5461, "step": 22155 }, { "epoch": 1.74, "learning_rate": 0.00011218987534451851, "loss": 1.5037, "step": 22156 }, { "epoch": 1.74, "learning_rate": 0.00011217791485622431, "loss": 1.4722, "step": 22157 }, { "epoch": 1.74, "learning_rate": 0.00011216595462472125, "loss": 1.4863, "step": 22158 }, { "epoch": 1.74, "learning_rate": 0.00011215399465009044, "loss": 1.5193, "step": 22159 }, { "epoch": 1.74, "learning_rate": 0.00011214203493241313, "loss": 1.4726, "step": 22160 }, { "epoch": 1.74, "learning_rate": 0.0001121300754717705, "loss": 1.5501, "step": 22161 }, { "epoch": 1.74, "learning_rate": 0.00011211811626824376, "loss": 1.501, "step": 22162 }, { "epoch": 1.74, "learning_rate": 0.00011210615732191411, "loss": 1.4904, "step": 22163 }, { "epoch": 1.74, "learning_rate": 0.00011209419863286272, "loss": 1.5401, "step": 22164 }, { "epoch": 1.74, "learning_rate": 0.00011208224020117082, "loss": 1.4915, "step": 22165 }, { "epoch": 1.74, "learning_rate": 0.0001120702820269196, "loss": 1.5085, "step": 22166 }, { "epoch": 1.74, "learning_rate": 0.00011205832411019021, "loss": 1.4283, "step": 22167 }, { "epoch": 1.74, "learning_rate": 0.00011204636645106383, "loss": 1.5081, "step": 22168 }, { "epoch": 1.74, "learning_rate": 0.00011203440904962171, "loss": 1.4884, "step": 22169 }, { "epoch": 1.74, "learning_rate": 0.00011202245190594502, "loss": 1.5082, "step": 22170 }, { "epoch": 1.74, "learning_rate": 0.00011201049502011491, "loss": 1.5, "step": 22171 }, { "epoch": 1.74, "learning_rate": 0.00011199853839221262, "loss": 1.4355, "step": 22172 }, { "epoch": 1.74, "learning_rate": 0.00011198658202231921, "loss": 1.4994, "step": 22173 }, { "epoch": 1.74, "learning_rate": 0.00011197462591051596, "loss": 1.4153, "step": 22174 }, { "epoch": 1.74, "learning_rate": 0.00011196267005688404, "loss": 1.4387, "step": 22175 }, { "epoch": 1.74, "learning_rate": 0.00011195071446150456, "loss": 1.4575, "step": 22176 }, { "epoch": 1.74, "learning_rate": 0.00011193875912445873, "loss": 1.5414, "step": 22177 }, { "epoch": 1.74, "learning_rate": 0.00011192680404582776, "loss": 1.4559, "step": 22178 }, { "epoch": 1.75, "learning_rate": 0.00011191484922569275, "loss": 1.4674, "step": 22179 }, { "epoch": 1.75, "learning_rate": 0.00011190289466413493, "loss": 1.5104, "step": 22180 }, { "epoch": 1.75, "learning_rate": 0.0001118909403612354, "loss": 1.4944, "step": 22181 }, { "epoch": 1.75, "learning_rate": 0.00011187898631707536, "loss": 1.5167, "step": 22182 }, { "epoch": 1.75, "learning_rate": 0.00011186703253173598, "loss": 1.5368, "step": 22183 }, { "epoch": 1.75, "learning_rate": 0.00011185507900529835, "loss": 1.493, "step": 22184 }, { "epoch": 1.75, "learning_rate": 0.00011184312573784371, "loss": 1.5532, "step": 22185 }, { "epoch": 1.75, "learning_rate": 0.00011183117272945321, "loss": 1.5172, "step": 22186 }, { "epoch": 1.75, "learning_rate": 0.00011181921998020801, "loss": 1.4727, "step": 22187 }, { "epoch": 1.75, "learning_rate": 0.00011180726749018917, "loss": 1.4873, "step": 22188 }, { "epoch": 1.75, "learning_rate": 0.000111795315259478, "loss": 1.5176, "step": 22189 }, { "epoch": 1.75, "learning_rate": 0.00011178336328815548, "loss": 1.4858, "step": 22190 }, { "epoch": 1.75, "learning_rate": 0.00011177141157630284, "loss": 1.5321, "step": 22191 }, { "epoch": 1.75, "learning_rate": 0.00011175946012400125, "loss": 1.4761, "step": 22192 }, { "epoch": 1.75, "learning_rate": 0.0001117475089313318, "loss": 1.4917, "step": 22193 }, { "epoch": 1.75, "learning_rate": 0.00011173555799837564, "loss": 1.499, "step": 22194 }, { "epoch": 1.75, "learning_rate": 0.00011172360732521398, "loss": 1.5193, "step": 22195 }, { "epoch": 1.75, "learning_rate": 0.00011171165691192785, "loss": 1.5205, "step": 22196 }, { "epoch": 1.75, "learning_rate": 0.00011169970675859848, "loss": 1.4806, "step": 22197 }, { "epoch": 1.75, "learning_rate": 0.00011168775686530694, "loss": 1.5406, "step": 22198 }, { "epoch": 1.75, "learning_rate": 0.00011167580723213436, "loss": 1.4453, "step": 22199 }, { "epoch": 1.75, "learning_rate": 0.00011166385785916191, "loss": 1.5255, "step": 22200 }, { "epoch": 1.75, "learning_rate": 0.00011165190874647077, "loss": 1.5439, "step": 22201 }, { "epoch": 1.75, "learning_rate": 0.00011163995989414195, "loss": 1.4272, "step": 22202 }, { "epoch": 1.75, "learning_rate": 0.00011162801130225664, "loss": 1.489, "step": 22203 }, { "epoch": 1.75, "learning_rate": 0.00011161606297089599, "loss": 1.481, "step": 22204 }, { "epoch": 1.75, "learning_rate": 0.00011160411490014106, "loss": 1.541, "step": 22205 }, { "epoch": 1.75, "learning_rate": 0.00011159216709007302, "loss": 1.4939, "step": 22206 }, { "epoch": 1.75, "learning_rate": 0.00011158021954077298, "loss": 1.4661, "step": 22207 }, { "epoch": 1.75, "learning_rate": 0.00011156827225232202, "loss": 1.4798, "step": 22208 }, { "epoch": 1.75, "learning_rate": 0.00011155632522480133, "loss": 1.5505, "step": 22209 }, { "epoch": 1.75, "learning_rate": 0.00011154437845829191, "loss": 1.5458, "step": 22210 }, { "epoch": 1.75, "learning_rate": 0.00011153243195287496, "loss": 1.5215, "step": 22211 }, { "epoch": 1.75, "learning_rate": 0.00011152048570863162, "loss": 1.5153, "step": 22212 }, { "epoch": 1.75, "learning_rate": 0.00011150853972564289, "loss": 1.4705, "step": 22213 }, { "epoch": 1.75, "learning_rate": 0.00011149659400398998, "loss": 1.4618, "step": 22214 }, { "epoch": 1.75, "learning_rate": 0.00011148464854375384, "loss": 1.4674, "step": 22215 }, { "epoch": 1.75, "learning_rate": 0.00011147270334501578, "loss": 1.492, "step": 22216 }, { "epoch": 1.75, "learning_rate": 0.00011146075840785676, "loss": 1.5024, "step": 22217 }, { "epoch": 1.75, "learning_rate": 0.00011144881373235797, "loss": 1.5261, "step": 22218 }, { "epoch": 1.75, "learning_rate": 0.00011143686931860042, "loss": 1.428, "step": 22219 }, { "epoch": 1.75, "learning_rate": 0.00011142492516666525, "loss": 1.4806, "step": 22220 }, { "epoch": 1.75, "learning_rate": 0.00011141298127663361, "loss": 1.4767, "step": 22221 }, { "epoch": 1.75, "learning_rate": 0.00011140103764858646, "loss": 1.4633, "step": 22222 }, { "epoch": 1.75, "learning_rate": 0.00011138909428260498, "loss": 1.4788, "step": 22223 }, { "epoch": 1.75, "learning_rate": 0.00011137715117877028, "loss": 1.5492, "step": 22224 }, { "epoch": 1.75, "learning_rate": 0.00011136520833716337, "loss": 1.5026, "step": 22225 }, { "epoch": 1.75, "learning_rate": 0.00011135326575786542, "loss": 1.5523, "step": 22226 }, { "epoch": 1.75, "learning_rate": 0.00011134132344095741, "loss": 1.5013, "step": 22227 }, { "epoch": 1.75, "learning_rate": 0.00011132938138652051, "loss": 1.5252, "step": 22228 }, { "epoch": 1.75, "learning_rate": 0.00011131743959463578, "loss": 1.4747, "step": 22229 }, { "epoch": 1.75, "learning_rate": 0.00011130549806538426, "loss": 1.501, "step": 22230 }, { "epoch": 1.75, "learning_rate": 0.00011129355679884704, "loss": 1.4947, "step": 22231 }, { "epoch": 1.75, "learning_rate": 0.00011128161579510522, "loss": 1.4905, "step": 22232 }, { "epoch": 1.75, "learning_rate": 0.00011126967505423989, "loss": 1.5202, "step": 22233 }, { "epoch": 1.75, "learning_rate": 0.00011125773457633209, "loss": 1.5299, "step": 22234 }, { "epoch": 1.75, "learning_rate": 0.00011124579436146288, "loss": 1.5049, "step": 22235 }, { "epoch": 1.75, "learning_rate": 0.00011123385440971336, "loss": 1.4932, "step": 22236 }, { "epoch": 1.75, "learning_rate": 0.00011122191472116455, "loss": 1.4861, "step": 22237 }, { "epoch": 1.75, "learning_rate": 0.00011120997529589756, "loss": 1.6041, "step": 22238 }, { "epoch": 1.75, "learning_rate": 0.00011119803613399344, "loss": 1.4824, "step": 22239 }, { "epoch": 1.75, "learning_rate": 0.0001111860972355332, "loss": 1.5449, "step": 22240 }, { "epoch": 1.75, "learning_rate": 0.00011117415860059799, "loss": 1.5004, "step": 22241 }, { "epoch": 1.75, "learning_rate": 0.00011116222022926879, "loss": 1.4683, "step": 22242 }, { "epoch": 1.75, "learning_rate": 0.0001111502821216267, "loss": 1.5271, "step": 22243 }, { "epoch": 1.75, "learning_rate": 0.00011113834427775273, "loss": 1.491, "step": 22244 }, { "epoch": 1.75, "learning_rate": 0.00011112640669772796, "loss": 1.5192, "step": 22245 }, { "epoch": 1.75, "learning_rate": 0.0001111144693816334, "loss": 1.4832, "step": 22246 }, { "epoch": 1.75, "learning_rate": 0.0001111025323295502, "loss": 1.4747, "step": 22247 }, { "epoch": 1.75, "learning_rate": 0.00011109059554155931, "loss": 1.4918, "step": 22248 }, { "epoch": 1.75, "learning_rate": 0.00011107865901774181, "loss": 1.4671, "step": 22249 }, { "epoch": 1.75, "learning_rate": 0.00011106672275817876, "loss": 1.5032, "step": 22250 }, { "epoch": 1.75, "learning_rate": 0.00011105478676295113, "loss": 1.4992, "step": 22251 }, { "epoch": 1.75, "learning_rate": 0.00011104285103214002, "loss": 1.4906, "step": 22252 }, { "epoch": 1.75, "learning_rate": 0.00011103091556582651, "loss": 1.4976, "step": 22253 }, { "epoch": 1.75, "learning_rate": 0.00011101898036409152, "loss": 1.5076, "step": 22254 }, { "epoch": 1.75, "learning_rate": 0.00011100704542701617, "loss": 1.4712, "step": 22255 }, { "epoch": 1.75, "learning_rate": 0.00011099511075468144, "loss": 1.5207, "step": 22256 }, { "epoch": 1.75, "learning_rate": 0.00011098317634716837, "loss": 1.4867, "step": 22257 }, { "epoch": 1.75, "learning_rate": 0.00011097124220455806, "loss": 1.4517, "step": 22258 }, { "epoch": 1.75, "learning_rate": 0.00011095930832693144, "loss": 1.5027, "step": 22259 }, { "epoch": 1.75, "learning_rate": 0.00011094737471436954, "loss": 1.5226, "step": 22260 }, { "epoch": 1.75, "learning_rate": 0.00011093544136695348, "loss": 1.4952, "step": 22261 }, { "epoch": 1.75, "learning_rate": 0.00011092350828476414, "loss": 1.5291, "step": 22262 }, { "epoch": 1.75, "learning_rate": 0.00011091157546788265, "loss": 1.5101, "step": 22263 }, { "epoch": 1.75, "learning_rate": 0.00011089964291638999, "loss": 1.5111, "step": 22264 }, { "epoch": 1.75, "learning_rate": 0.0001108877106303672, "loss": 1.4397, "step": 22265 }, { "epoch": 1.75, "learning_rate": 0.00011087577860989527, "loss": 1.4682, "step": 22266 }, { "epoch": 1.75, "learning_rate": 0.00011086384685505521, "loss": 1.4917, "step": 22267 }, { "epoch": 1.75, "learning_rate": 0.00011085191536592802, "loss": 1.4723, "step": 22268 }, { "epoch": 1.75, "learning_rate": 0.00011083998414259472, "loss": 1.4565, "step": 22269 }, { "epoch": 1.75, "learning_rate": 0.00011082805318513633, "loss": 1.5246, "step": 22270 }, { "epoch": 1.75, "learning_rate": 0.00011081612249363382, "loss": 1.4989, "step": 22271 }, { "epoch": 1.75, "learning_rate": 0.00011080419206816826, "loss": 1.458, "step": 22272 }, { "epoch": 1.75, "learning_rate": 0.00011079226190882055, "loss": 1.4989, "step": 22273 }, { "epoch": 1.75, "learning_rate": 0.00011078033201567177, "loss": 1.4782, "step": 22274 }, { "epoch": 1.75, "learning_rate": 0.00011076840238880291, "loss": 1.5185, "step": 22275 }, { "epoch": 1.75, "learning_rate": 0.00011075647302829493, "loss": 1.4855, "step": 22276 }, { "epoch": 1.75, "learning_rate": 0.00011074454393422883, "loss": 1.4611, "step": 22277 }, { "epoch": 1.75, "learning_rate": 0.00011073261510668558, "loss": 1.5054, "step": 22278 }, { "epoch": 1.75, "learning_rate": 0.00011072068654574628, "loss": 1.5035, "step": 22279 }, { "epoch": 1.75, "learning_rate": 0.0001107087582514918, "loss": 1.5051, "step": 22280 }, { "epoch": 1.75, "learning_rate": 0.00011069683022400316, "loss": 1.495, "step": 22281 }, { "epoch": 1.75, "learning_rate": 0.00011068490246336139, "loss": 1.4847, "step": 22282 }, { "epoch": 1.75, "learning_rate": 0.00011067297496964742, "loss": 1.532, "step": 22283 }, { "epoch": 1.75, "learning_rate": 0.00011066104774294227, "loss": 1.5232, "step": 22284 }, { "epoch": 1.75, "learning_rate": 0.00011064912078332687, "loss": 1.4724, "step": 22285 }, { "epoch": 1.75, "learning_rate": 0.0001106371940908822, "loss": 1.5398, "step": 22286 }, { "epoch": 1.75, "learning_rate": 0.00011062526766568931, "loss": 1.4782, "step": 22287 }, { "epoch": 1.75, "learning_rate": 0.0001106133415078291, "loss": 1.504, "step": 22288 }, { "epoch": 1.75, "learning_rate": 0.00011060141561738254, "loss": 1.5223, "step": 22289 }, { "epoch": 1.75, "learning_rate": 0.00011058948999443069, "loss": 1.5212, "step": 22290 }, { "epoch": 1.75, "learning_rate": 0.00011057756463905443, "loss": 1.4785, "step": 22291 }, { "epoch": 1.75, "learning_rate": 0.00011056563955133474, "loss": 1.4861, "step": 22292 }, { "epoch": 1.75, "learning_rate": 0.00011055371473135259, "loss": 1.4508, "step": 22293 }, { "epoch": 1.75, "learning_rate": 0.00011054179017918892, "loss": 1.479, "step": 22294 }, { "epoch": 1.75, "learning_rate": 0.00011052986589492473, "loss": 1.5162, "step": 22295 }, { "epoch": 1.75, "learning_rate": 0.00011051794187864104, "loss": 1.538, "step": 22296 }, { "epoch": 1.75, "learning_rate": 0.00011050601813041866, "loss": 1.4756, "step": 22297 }, { "epoch": 1.75, "learning_rate": 0.00011049409465033864, "loss": 1.5446, "step": 22298 }, { "epoch": 1.75, "learning_rate": 0.00011048217143848196, "loss": 1.4862, "step": 22299 }, { "epoch": 1.75, "learning_rate": 0.00011047024849492949, "loss": 1.5338, "step": 22300 }, { "epoch": 1.75, "learning_rate": 0.00011045832581976223, "loss": 1.4681, "step": 22301 }, { "epoch": 1.75, "learning_rate": 0.00011044640341306111, "loss": 1.5111, "step": 22302 }, { "epoch": 1.75, "learning_rate": 0.00011043448127490707, "loss": 1.4947, "step": 22303 }, { "epoch": 1.75, "learning_rate": 0.00011042255940538112, "loss": 1.5316, "step": 22304 }, { "epoch": 1.75, "learning_rate": 0.00011041063780456408, "loss": 1.4901, "step": 22305 }, { "epoch": 1.76, "learning_rate": 0.000110398716472537, "loss": 1.5236, "step": 22306 }, { "epoch": 1.76, "learning_rate": 0.00011038679540938079, "loss": 1.4831, "step": 22307 }, { "epoch": 1.76, "learning_rate": 0.00011037487461517637, "loss": 1.5462, "step": 22308 }, { "epoch": 1.76, "learning_rate": 0.00011036295409000464, "loss": 1.5154, "step": 22309 }, { "epoch": 1.76, "learning_rate": 0.00011035103383394662, "loss": 1.5286, "step": 22310 }, { "epoch": 1.76, "learning_rate": 0.00011033911384708321, "loss": 1.4627, "step": 22311 }, { "epoch": 1.76, "learning_rate": 0.0001103271941294953, "loss": 1.4518, "step": 22312 }, { "epoch": 1.76, "learning_rate": 0.0001103152746812639, "loss": 1.5009, "step": 22313 }, { "epoch": 1.76, "learning_rate": 0.00011030335550246985, "loss": 1.4868, "step": 22314 }, { "epoch": 1.76, "learning_rate": 0.00011029143659319408, "loss": 1.4571, "step": 22315 }, { "epoch": 1.76, "learning_rate": 0.0001102795179535176, "loss": 1.5134, "step": 22316 }, { "epoch": 1.76, "learning_rate": 0.00011026759958352125, "loss": 1.5193, "step": 22317 }, { "epoch": 1.76, "learning_rate": 0.00011025568148328596, "loss": 1.5022, "step": 22318 }, { "epoch": 1.76, "learning_rate": 0.00011024376365289268, "loss": 1.4813, "step": 22319 }, { "epoch": 1.76, "learning_rate": 0.0001102318460924223, "loss": 1.5038, "step": 22320 }, { "epoch": 1.76, "learning_rate": 0.00011021992880195575, "loss": 1.4511, "step": 22321 }, { "epoch": 1.76, "learning_rate": 0.00011020801178157391, "loss": 1.473, "step": 22322 }, { "epoch": 1.76, "learning_rate": 0.0001101960950313577, "loss": 1.5346, "step": 22323 }, { "epoch": 1.76, "learning_rate": 0.00011018417855138809, "loss": 1.4534, "step": 22324 }, { "epoch": 1.76, "learning_rate": 0.00011017226234174585, "loss": 1.4577, "step": 22325 }, { "epoch": 1.76, "learning_rate": 0.00011016034640251202, "loss": 1.4306, "step": 22326 }, { "epoch": 1.76, "learning_rate": 0.00011014843073376745, "loss": 1.53, "step": 22327 }, { "epoch": 1.76, "learning_rate": 0.00011013651533559308, "loss": 1.4874, "step": 22328 }, { "epoch": 1.76, "learning_rate": 0.00011012460020806972, "loss": 1.482, "step": 22329 }, { "epoch": 1.76, "learning_rate": 0.00011011268535127837, "loss": 1.4827, "step": 22330 }, { "epoch": 1.76, "learning_rate": 0.00011010077076529984, "loss": 1.4756, "step": 22331 }, { "epoch": 1.76, "learning_rate": 0.00011008885645021504, "loss": 1.5332, "step": 22332 }, { "epoch": 1.76, "learning_rate": 0.00011007694240610492, "loss": 1.5333, "step": 22333 }, { "epoch": 1.76, "learning_rate": 0.00011006502863305033, "loss": 1.5014, "step": 22334 }, { "epoch": 1.76, "learning_rate": 0.00011005311513113211, "loss": 1.4914, "step": 22335 }, { "epoch": 1.76, "learning_rate": 0.00011004120190043124, "loss": 1.4641, "step": 22336 }, { "epoch": 1.76, "learning_rate": 0.00011002928894102855, "loss": 1.483, "step": 22337 }, { "epoch": 1.76, "learning_rate": 0.00011001737625300494, "loss": 1.4994, "step": 22338 }, { "epoch": 1.76, "learning_rate": 0.00011000546383644125, "loss": 1.4944, "step": 22339 }, { "epoch": 1.76, "learning_rate": 0.00010999355169141841, "loss": 1.5314, "step": 22340 }, { "epoch": 1.76, "learning_rate": 0.00010998163981801721, "loss": 1.5216, "step": 22341 }, { "epoch": 1.76, "learning_rate": 0.00010996972821631867, "loss": 1.4536, "step": 22342 }, { "epoch": 1.76, "learning_rate": 0.00010995781688640358, "loss": 1.4331, "step": 22343 }, { "epoch": 1.76, "learning_rate": 0.00010994590582835276, "loss": 1.4396, "step": 22344 }, { "epoch": 1.76, "learning_rate": 0.00010993399504224723, "loss": 1.5322, "step": 22345 }, { "epoch": 1.76, "learning_rate": 0.00010992208452816769, "loss": 1.4916, "step": 22346 }, { "epoch": 1.76, "learning_rate": 0.00010991017428619509, "loss": 1.5532, "step": 22347 }, { "epoch": 1.76, "learning_rate": 0.00010989826431641032, "loss": 1.5208, "step": 22348 }, { "epoch": 1.76, "learning_rate": 0.00010988635461889417, "loss": 1.4384, "step": 22349 }, { "epoch": 1.76, "learning_rate": 0.00010987444519372756, "loss": 1.5096, "step": 22350 }, { "epoch": 1.76, "learning_rate": 0.00010986253604099131, "loss": 1.5011, "step": 22351 }, { "epoch": 1.76, "learning_rate": 0.00010985062716076627, "loss": 1.5186, "step": 22352 }, { "epoch": 1.76, "learning_rate": 0.00010983871855313336, "loss": 1.4804, "step": 22353 }, { "epoch": 1.76, "learning_rate": 0.00010982681021817336, "loss": 1.5077, "step": 22354 }, { "epoch": 1.76, "learning_rate": 0.00010981490215596718, "loss": 1.4601, "step": 22355 }, { "epoch": 1.76, "learning_rate": 0.0001098029943665956, "loss": 1.4919, "step": 22356 }, { "epoch": 1.76, "learning_rate": 0.00010979108685013947, "loss": 1.4943, "step": 22357 }, { "epoch": 1.76, "learning_rate": 0.00010977917960667972, "loss": 1.5274, "step": 22358 }, { "epoch": 1.76, "learning_rate": 0.0001097672726362971, "loss": 1.5344, "step": 22359 }, { "epoch": 1.76, "learning_rate": 0.00010975536593907256, "loss": 1.5375, "step": 22360 }, { "epoch": 1.76, "learning_rate": 0.00010974345951508687, "loss": 1.4987, "step": 22361 }, { "epoch": 1.76, "learning_rate": 0.00010973155336442089, "loss": 1.5552, "step": 22362 }, { "epoch": 1.76, "learning_rate": 0.00010971964748715539, "loss": 1.5421, "step": 22363 }, { "epoch": 1.76, "learning_rate": 0.00010970774188337128, "loss": 1.4894, "step": 22364 }, { "epoch": 1.76, "learning_rate": 0.00010969583655314938, "loss": 1.5147, "step": 22365 }, { "epoch": 1.76, "learning_rate": 0.00010968393149657047, "loss": 1.4657, "step": 22366 }, { "epoch": 1.76, "learning_rate": 0.00010967202671371546, "loss": 1.5131, "step": 22367 }, { "epoch": 1.76, "learning_rate": 0.0001096601222046651, "loss": 1.5263, "step": 22368 }, { "epoch": 1.76, "learning_rate": 0.00010964821796950027, "loss": 1.5198, "step": 22369 }, { "epoch": 1.76, "learning_rate": 0.00010963631400830177, "loss": 1.504, "step": 22370 }, { "epoch": 1.76, "learning_rate": 0.00010962441032115042, "loss": 1.504, "step": 22371 }, { "epoch": 1.76, "learning_rate": 0.000109612506908127, "loss": 1.4983, "step": 22372 }, { "epoch": 1.76, "learning_rate": 0.00010960060376931239, "loss": 1.4627, "step": 22373 }, { "epoch": 1.76, "learning_rate": 0.00010958870090478744, "loss": 1.4973, "step": 22374 }, { "epoch": 1.76, "learning_rate": 0.00010957679831463285, "loss": 1.4917, "step": 22375 }, { "epoch": 1.76, "learning_rate": 0.00010956489599892952, "loss": 1.4273, "step": 22376 }, { "epoch": 1.76, "learning_rate": 0.00010955299395775825, "loss": 1.4616, "step": 22377 }, { "epoch": 1.76, "learning_rate": 0.0001095410921911998, "loss": 1.4451, "step": 22378 }, { "epoch": 1.76, "learning_rate": 0.00010952919069933504, "loss": 1.5194, "step": 22379 }, { "epoch": 1.76, "learning_rate": 0.00010951728948224471, "loss": 1.531, "step": 22380 }, { "epoch": 1.76, "learning_rate": 0.00010950538854000966, "loss": 1.428, "step": 22381 }, { "epoch": 1.76, "learning_rate": 0.00010949348787271067, "loss": 1.4964, "step": 22382 }, { "epoch": 1.76, "learning_rate": 0.00010948158748042854, "loss": 1.4974, "step": 22383 }, { "epoch": 1.76, "learning_rate": 0.00010946968736324409, "loss": 1.544, "step": 22384 }, { "epoch": 1.76, "learning_rate": 0.00010945778752123806, "loss": 1.4822, "step": 22385 }, { "epoch": 1.76, "learning_rate": 0.0001094458879544913, "loss": 1.5334, "step": 22386 }, { "epoch": 1.76, "learning_rate": 0.00010943398866308462, "loss": 1.4283, "step": 22387 }, { "epoch": 1.76, "learning_rate": 0.00010942208964709866, "loss": 1.5194, "step": 22388 }, { "epoch": 1.76, "learning_rate": 0.0001094101909066144, "loss": 1.494, "step": 22389 }, { "epoch": 1.76, "learning_rate": 0.00010939829244171253, "loss": 1.5064, "step": 22390 }, { "epoch": 1.76, "learning_rate": 0.00010938639425247387, "loss": 1.5267, "step": 22391 }, { "epoch": 1.76, "learning_rate": 0.00010937449633897914, "loss": 1.5105, "step": 22392 }, { "epoch": 1.76, "learning_rate": 0.00010936259870130918, "loss": 1.5159, "step": 22393 }, { "epoch": 1.76, "learning_rate": 0.00010935070133954478, "loss": 1.5247, "step": 22394 }, { "epoch": 1.76, "learning_rate": 0.00010933880425376664, "loss": 1.4715, "step": 22395 }, { "epoch": 1.76, "learning_rate": 0.00010932690744405565, "loss": 1.5097, "step": 22396 }, { "epoch": 1.76, "learning_rate": 0.00010931501091049243, "loss": 1.4488, "step": 22397 }, { "epoch": 1.76, "learning_rate": 0.00010930311465315787, "loss": 1.5317, "step": 22398 }, { "epoch": 1.76, "learning_rate": 0.00010929121867213272, "loss": 1.4989, "step": 22399 }, { "epoch": 1.76, "learning_rate": 0.0001092793229674977, "loss": 1.5307, "step": 22400 }, { "epoch": 1.76, "learning_rate": 0.00010926742753933359, "loss": 1.5297, "step": 22401 }, { "epoch": 1.76, "learning_rate": 0.00010925553238772123, "loss": 1.4549, "step": 22402 }, { "epoch": 1.76, "learning_rate": 0.00010924363751274127, "loss": 1.5012, "step": 22403 }, { "epoch": 1.76, "learning_rate": 0.0001092317429144745, "loss": 1.469, "step": 22404 }, { "epoch": 1.76, "learning_rate": 0.00010921984859300173, "loss": 1.4796, "step": 22405 }, { "epoch": 1.76, "learning_rate": 0.0001092079545484037, "loss": 1.5004, "step": 22406 }, { "epoch": 1.76, "learning_rate": 0.00010919606078076112, "loss": 1.5037, "step": 22407 }, { "epoch": 1.76, "learning_rate": 0.00010918416729015481, "loss": 1.4786, "step": 22408 }, { "epoch": 1.76, "learning_rate": 0.00010917227407666545, "loss": 1.4631, "step": 22409 }, { "epoch": 1.76, "learning_rate": 0.00010916038114037382, "loss": 1.5497, "step": 22410 }, { "epoch": 1.76, "learning_rate": 0.00010914848848136067, "loss": 1.5403, "step": 22411 }, { "epoch": 1.76, "learning_rate": 0.00010913659609970675, "loss": 1.5205, "step": 22412 }, { "epoch": 1.76, "learning_rate": 0.0001091247039954928, "loss": 1.5166, "step": 22413 }, { "epoch": 1.76, "learning_rate": 0.00010911281216879952, "loss": 1.5074, "step": 22414 }, { "epoch": 1.76, "learning_rate": 0.00010910092061970769, "loss": 1.4752, "step": 22415 }, { "epoch": 1.76, "learning_rate": 0.00010908902934829806, "loss": 1.4567, "step": 22416 }, { "epoch": 1.76, "learning_rate": 0.00010907713835465132, "loss": 1.4509, "step": 22417 }, { "epoch": 1.76, "learning_rate": 0.00010906524763884823, "loss": 1.479, "step": 22418 }, { "epoch": 1.76, "learning_rate": 0.00010905335720096947, "loss": 1.4656, "step": 22419 }, { "epoch": 1.76, "learning_rate": 0.0001090414670410959, "loss": 1.4906, "step": 22420 }, { "epoch": 1.76, "learning_rate": 0.00010902957715930813, "loss": 1.5144, "step": 22421 }, { "epoch": 1.76, "learning_rate": 0.00010901768755568692, "loss": 1.504, "step": 22422 }, { "epoch": 1.76, "learning_rate": 0.00010900579823031303, "loss": 1.5101, "step": 22423 }, { "epoch": 1.76, "learning_rate": 0.0001089939091832671, "loss": 1.498, "step": 22424 }, { "epoch": 1.76, "learning_rate": 0.00010898202041462994, "loss": 1.5007, "step": 22425 }, { "epoch": 1.76, "learning_rate": 0.00010897013192448221, "loss": 1.4982, "step": 22426 }, { "epoch": 1.76, "learning_rate": 0.00010895824371290463, "loss": 1.4582, "step": 22427 }, { "epoch": 1.76, "learning_rate": 0.00010894635577997797, "loss": 1.4976, "step": 22428 }, { "epoch": 1.76, "learning_rate": 0.00010893446812578285, "loss": 1.481, "step": 22429 }, { "epoch": 1.76, "learning_rate": 0.00010892258075040004, "loss": 1.4704, "step": 22430 }, { "epoch": 1.76, "learning_rate": 0.00010891069365391027, "loss": 1.4746, "step": 22431 }, { "epoch": 1.76, "learning_rate": 0.00010889880683639416, "loss": 1.4661, "step": 22432 }, { "epoch": 1.77, "learning_rate": 0.00010888692029793252, "loss": 1.4654, "step": 22433 }, { "epoch": 1.77, "learning_rate": 0.00010887503403860598, "loss": 1.4912, "step": 22434 }, { "epoch": 1.77, "learning_rate": 0.00010886314805849521, "loss": 1.4258, "step": 22435 }, { "epoch": 1.77, "learning_rate": 0.00010885126235768101, "loss": 1.515, "step": 22436 }, { "epoch": 1.77, "learning_rate": 0.00010883937693624408, "loss": 1.4786, "step": 22437 }, { "epoch": 1.77, "learning_rate": 0.000108827491794265, "loss": 1.473, "step": 22438 }, { "epoch": 1.77, "learning_rate": 0.00010881560693182455, "loss": 1.4791, "step": 22439 }, { "epoch": 1.77, "learning_rate": 0.00010880372234900343, "loss": 1.5673, "step": 22440 }, { "epoch": 1.77, "learning_rate": 0.00010879183804588227, "loss": 1.4753, "step": 22441 }, { "epoch": 1.77, "learning_rate": 0.00010877995402254182, "loss": 1.4289, "step": 22442 }, { "epoch": 1.77, "learning_rate": 0.00010876807027906269, "loss": 1.5229, "step": 22443 }, { "epoch": 1.77, "learning_rate": 0.00010875618681552563, "loss": 1.4608, "step": 22444 }, { "epoch": 1.77, "learning_rate": 0.00010874430363201133, "loss": 1.4905, "step": 22445 }, { "epoch": 1.77, "learning_rate": 0.0001087324207286004, "loss": 1.5226, "step": 22446 }, { "epoch": 1.77, "learning_rate": 0.00010872053810537356, "loss": 1.5354, "step": 22447 }, { "epoch": 1.77, "learning_rate": 0.00010870865576241154, "loss": 1.4736, "step": 22448 }, { "epoch": 1.77, "learning_rate": 0.0001086967736997949, "loss": 1.4953, "step": 22449 }, { "epoch": 1.77, "learning_rate": 0.00010868489191760441, "loss": 1.4688, "step": 22450 }, { "epoch": 1.77, "learning_rate": 0.00010867301041592063, "loss": 1.4704, "step": 22451 }, { "epoch": 1.77, "learning_rate": 0.00010866112919482438, "loss": 1.5704, "step": 22452 }, { "epoch": 1.77, "learning_rate": 0.00010864924825439622, "loss": 1.4646, "step": 22453 }, { "epoch": 1.77, "learning_rate": 0.00010863736759471688, "loss": 1.4738, "step": 22454 }, { "epoch": 1.77, "learning_rate": 0.00010862548721586695, "loss": 1.5035, "step": 22455 }, { "epoch": 1.77, "learning_rate": 0.00010861360711792714, "loss": 1.4775, "step": 22456 }, { "epoch": 1.77, "learning_rate": 0.00010860172730097814, "loss": 1.5012, "step": 22457 }, { "epoch": 1.77, "learning_rate": 0.0001085898477651005, "loss": 1.448, "step": 22458 }, { "epoch": 1.77, "learning_rate": 0.00010857796851037497, "loss": 1.578, "step": 22459 }, { "epoch": 1.77, "learning_rate": 0.00010856608953688221, "loss": 1.5021, "step": 22460 }, { "epoch": 1.77, "learning_rate": 0.00010855421084470279, "loss": 1.5365, "step": 22461 }, { "epoch": 1.77, "learning_rate": 0.00010854233243391744, "loss": 1.4428, "step": 22462 }, { "epoch": 1.77, "learning_rate": 0.00010853045430460674, "loss": 1.4533, "step": 22463 }, { "epoch": 1.77, "learning_rate": 0.00010851857645685136, "loss": 1.5313, "step": 22464 }, { "epoch": 1.77, "learning_rate": 0.00010850669889073202, "loss": 1.493, "step": 22465 }, { "epoch": 1.77, "learning_rate": 0.00010849482160632924, "loss": 1.4714, "step": 22466 }, { "epoch": 1.77, "learning_rate": 0.0001084829446037237, "loss": 1.4713, "step": 22467 }, { "epoch": 1.77, "learning_rate": 0.00010847106788299608, "loss": 1.4399, "step": 22468 }, { "epoch": 1.77, "learning_rate": 0.00010845919144422703, "loss": 1.4523, "step": 22469 }, { "epoch": 1.77, "learning_rate": 0.00010844731528749709, "loss": 1.5294, "step": 22470 }, { "epoch": 1.77, "learning_rate": 0.00010843543941288698, "loss": 1.5254, "step": 22471 }, { "epoch": 1.77, "learning_rate": 0.00010842356382047731, "loss": 1.5011, "step": 22472 }, { "epoch": 1.77, "learning_rate": 0.00010841168851034869, "loss": 1.4864, "step": 22473 }, { "epoch": 1.77, "learning_rate": 0.00010839981348258177, "loss": 1.4627, "step": 22474 }, { "epoch": 1.77, "learning_rate": 0.00010838793873725712, "loss": 1.4814, "step": 22475 }, { "epoch": 1.77, "learning_rate": 0.00010837606427445541, "loss": 1.5466, "step": 22476 }, { "epoch": 1.77, "learning_rate": 0.00010836419009425728, "loss": 1.5257, "step": 22477 }, { "epoch": 1.77, "learning_rate": 0.00010835231619674328, "loss": 1.5206, "step": 22478 }, { "epoch": 1.77, "learning_rate": 0.00010834044258199413, "loss": 1.4478, "step": 22479 }, { "epoch": 1.77, "learning_rate": 0.00010832856925009034, "loss": 1.4991, "step": 22480 }, { "epoch": 1.77, "learning_rate": 0.00010831669620111257, "loss": 1.4905, "step": 22481 }, { "epoch": 1.77, "learning_rate": 0.00010830482343514139, "loss": 1.4902, "step": 22482 }, { "epoch": 1.77, "learning_rate": 0.00010829295095225752, "loss": 1.5115, "step": 22483 }, { "epoch": 1.77, "learning_rate": 0.00010828107875254148, "loss": 1.4628, "step": 22484 }, { "epoch": 1.77, "learning_rate": 0.00010826920683607387, "loss": 1.4631, "step": 22485 }, { "epoch": 1.77, "learning_rate": 0.00010825733520293536, "loss": 1.5167, "step": 22486 }, { "epoch": 1.77, "learning_rate": 0.00010824546385320647, "loss": 1.5267, "step": 22487 }, { "epoch": 1.77, "learning_rate": 0.00010823359278696785, "loss": 1.4825, "step": 22488 }, { "epoch": 1.77, "learning_rate": 0.00010822172200430012, "loss": 1.4904, "step": 22489 }, { "epoch": 1.77, "learning_rate": 0.00010820985150528378, "loss": 1.5027, "step": 22490 }, { "epoch": 1.77, "learning_rate": 0.00010819798128999954, "loss": 1.5103, "step": 22491 }, { "epoch": 1.77, "learning_rate": 0.0001081861113585279, "loss": 1.4874, "step": 22492 }, { "epoch": 1.77, "learning_rate": 0.00010817424171094951, "loss": 1.4735, "step": 22493 }, { "epoch": 1.77, "learning_rate": 0.00010816237234734496, "loss": 1.5577, "step": 22494 }, { "epoch": 1.77, "learning_rate": 0.00010815050326779477, "loss": 1.54, "step": 22495 }, { "epoch": 1.77, "learning_rate": 0.00010813863447237961, "loss": 1.5361, "step": 22496 }, { "epoch": 1.77, "learning_rate": 0.00010812676596118, "loss": 1.5017, "step": 22497 }, { "epoch": 1.77, "learning_rate": 0.00010811489773427649, "loss": 1.4795, "step": 22498 }, { "epoch": 1.77, "learning_rate": 0.00010810302979174973, "loss": 1.5457, "step": 22499 }, { "epoch": 1.77, "learning_rate": 0.0001080911621336803, "loss": 1.4952, "step": 22500 }, { "epoch": 1.77, "learning_rate": 0.00010807929476014879, "loss": 1.4751, "step": 22501 }, { "epoch": 1.77, "learning_rate": 0.00010806742767123569, "loss": 1.4867, "step": 22502 }, { "epoch": 1.77, "learning_rate": 0.00010805556086702164, "loss": 1.4954, "step": 22503 }, { "epoch": 1.77, "learning_rate": 0.00010804369434758717, "loss": 1.4967, "step": 22504 }, { "epoch": 1.77, "learning_rate": 0.00010803182811301285, "loss": 1.5063, "step": 22505 }, { "epoch": 1.77, "learning_rate": 0.0001080199621633793, "loss": 1.4559, "step": 22506 }, { "epoch": 1.77, "learning_rate": 0.000108008096498767, "loss": 1.5029, "step": 22507 }, { "epoch": 1.77, "learning_rate": 0.00010799623111925659, "loss": 1.4774, "step": 22508 }, { "epoch": 1.77, "learning_rate": 0.00010798436602492855, "loss": 1.4985, "step": 22509 }, { "epoch": 1.77, "learning_rate": 0.00010797250121586348, "loss": 1.4558, "step": 22510 }, { "epoch": 1.77, "learning_rate": 0.00010796063669214196, "loss": 1.5066, "step": 22511 }, { "epoch": 1.77, "learning_rate": 0.0001079487724538445, "loss": 1.4567, "step": 22512 }, { "epoch": 1.77, "learning_rate": 0.00010793690850105167, "loss": 1.474, "step": 22513 }, { "epoch": 1.77, "learning_rate": 0.00010792504483384399, "loss": 1.4869, "step": 22514 }, { "epoch": 1.77, "learning_rate": 0.00010791318145230209, "loss": 1.5176, "step": 22515 }, { "epoch": 1.77, "learning_rate": 0.00010790131835650642, "loss": 1.4988, "step": 22516 }, { "epoch": 1.77, "learning_rate": 0.00010788945554653758, "loss": 1.525, "step": 22517 }, { "epoch": 1.77, "learning_rate": 0.00010787759302247613, "loss": 1.4302, "step": 22518 }, { "epoch": 1.77, "learning_rate": 0.00010786573078440255, "loss": 1.4917, "step": 22519 }, { "epoch": 1.77, "learning_rate": 0.00010785386883239744, "loss": 1.4803, "step": 22520 }, { "epoch": 1.77, "learning_rate": 0.00010784200716654126, "loss": 1.4866, "step": 22521 }, { "epoch": 1.77, "learning_rate": 0.00010783014578691458, "loss": 1.5103, "step": 22522 }, { "epoch": 1.77, "learning_rate": 0.00010781828469359799, "loss": 1.4509, "step": 22523 }, { "epoch": 1.77, "learning_rate": 0.00010780642388667193, "loss": 1.5375, "step": 22524 }, { "epoch": 1.77, "learning_rate": 0.00010779456336621699, "loss": 1.4623, "step": 22525 }, { "epoch": 1.77, "learning_rate": 0.00010778270313231366, "loss": 1.4987, "step": 22526 }, { "epoch": 1.77, "learning_rate": 0.00010777084318504246, "loss": 1.429, "step": 22527 }, { "epoch": 1.77, "learning_rate": 0.00010775898352448399, "loss": 1.5332, "step": 22528 }, { "epoch": 1.77, "learning_rate": 0.00010774712415071858, "loss": 1.5299, "step": 22529 }, { "epoch": 1.77, "learning_rate": 0.000107735265063827, "loss": 1.491, "step": 22530 }, { "epoch": 1.77, "learning_rate": 0.0001077234062638896, "loss": 1.5448, "step": 22531 }, { "epoch": 1.77, "learning_rate": 0.000107711547750987, "loss": 1.4953, "step": 22532 }, { "epoch": 1.77, "learning_rate": 0.00010769968952519958, "loss": 1.4868, "step": 22533 }, { "epoch": 1.77, "learning_rate": 0.00010768783158660797, "loss": 1.5291, "step": 22534 }, { "epoch": 1.77, "learning_rate": 0.00010767597393529263, "loss": 1.49, "step": 22535 }, { "epoch": 1.77, "learning_rate": 0.00010766411657133405, "loss": 1.5584, "step": 22536 }, { "epoch": 1.77, "learning_rate": 0.0001076522594948128, "loss": 1.4957, "step": 22537 }, { "epoch": 1.77, "learning_rate": 0.0001076404027058093, "loss": 1.5531, "step": 22538 }, { "epoch": 1.77, "learning_rate": 0.00010762854620440407, "loss": 1.5091, "step": 22539 }, { "epoch": 1.77, "learning_rate": 0.00010761668999067768, "loss": 1.5344, "step": 22540 }, { "epoch": 1.77, "learning_rate": 0.00010760483406471054, "loss": 1.4824, "step": 22541 }, { "epoch": 1.77, "learning_rate": 0.00010759297842658318, "loss": 1.5409, "step": 22542 }, { "epoch": 1.77, "learning_rate": 0.00010758112307637613, "loss": 1.4496, "step": 22543 }, { "epoch": 1.77, "learning_rate": 0.00010756926801416982, "loss": 1.5418, "step": 22544 }, { "epoch": 1.77, "learning_rate": 0.00010755741324004471, "loss": 1.4553, "step": 22545 }, { "epoch": 1.77, "learning_rate": 0.0001075455587540814, "loss": 1.497, "step": 22546 }, { "epoch": 1.77, "learning_rate": 0.00010753370455636034, "loss": 1.4693, "step": 22547 }, { "epoch": 1.77, "learning_rate": 0.00010752185064696194, "loss": 1.4922, "step": 22548 }, { "epoch": 1.77, "learning_rate": 0.00010750999702596678, "loss": 1.4742, "step": 22549 }, { "epoch": 1.77, "learning_rate": 0.00010749814369345528, "loss": 1.4543, "step": 22550 }, { "epoch": 1.77, "learning_rate": 0.00010748629064950791, "loss": 1.5142, "step": 22551 }, { "epoch": 1.77, "learning_rate": 0.0001074744378942052, "loss": 1.5065, "step": 22552 }, { "epoch": 1.77, "learning_rate": 0.00010746258542762757, "loss": 1.4988, "step": 22553 }, { "epoch": 1.77, "learning_rate": 0.00010745073324985548, "loss": 1.4793, "step": 22554 }, { "epoch": 1.77, "learning_rate": 0.00010743888136096949, "loss": 1.4903, "step": 22555 }, { "epoch": 1.77, "learning_rate": 0.00010742702976104995, "loss": 1.4896, "step": 22556 }, { "epoch": 1.77, "learning_rate": 0.00010741517845017745, "loss": 1.5044, "step": 22557 }, { "epoch": 1.77, "learning_rate": 0.00010740332742843234, "loss": 1.4454, "step": 22558 }, { "epoch": 1.77, "learning_rate": 0.00010739147669589512, "loss": 1.4959, "step": 22559 }, { "epoch": 1.78, "learning_rate": 0.0001073796262526463, "loss": 1.482, "step": 22560 }, { "epoch": 1.78, "learning_rate": 0.00010736777609876626, "loss": 1.4417, "step": 22561 }, { "epoch": 1.78, "learning_rate": 0.00010735592623433549, "loss": 1.4732, "step": 22562 }, { "epoch": 1.78, "learning_rate": 0.00010734407665943445, "loss": 1.5112, "step": 22563 }, { "epoch": 1.78, "learning_rate": 0.00010733222737414364, "loss": 1.5287, "step": 22564 }, { "epoch": 1.78, "learning_rate": 0.00010732037837854343, "loss": 1.4786, "step": 22565 }, { "epoch": 1.78, "learning_rate": 0.00010730852967271431, "loss": 1.4928, "step": 22566 }, { "epoch": 1.78, "learning_rate": 0.00010729668125673669, "loss": 1.4728, "step": 22567 }, { "epoch": 1.78, "learning_rate": 0.00010728483313069103, "loss": 1.4968, "step": 22568 }, { "epoch": 1.78, "learning_rate": 0.00010727298529465785, "loss": 1.5454, "step": 22569 }, { "epoch": 1.78, "learning_rate": 0.00010726113774871744, "loss": 1.5241, "step": 22570 }, { "epoch": 1.78, "learning_rate": 0.00010724929049295036, "loss": 1.5023, "step": 22571 }, { "epoch": 1.78, "learning_rate": 0.00010723744352743699, "loss": 1.4663, "step": 22572 }, { "epoch": 1.78, "learning_rate": 0.0001072255968522578, "loss": 1.4948, "step": 22573 }, { "epoch": 1.78, "learning_rate": 0.00010721375046749321, "loss": 1.4967, "step": 22574 }, { "epoch": 1.78, "learning_rate": 0.00010720190437322361, "loss": 1.4847, "step": 22575 }, { "epoch": 1.78, "learning_rate": 0.00010719005856952947, "loss": 1.4802, "step": 22576 }, { "epoch": 1.78, "learning_rate": 0.00010717821305649116, "loss": 1.4902, "step": 22577 }, { "epoch": 1.78, "learning_rate": 0.00010716636783418922, "loss": 1.5366, "step": 22578 }, { "epoch": 1.78, "learning_rate": 0.00010715452290270399, "loss": 1.5164, "step": 22579 }, { "epoch": 1.78, "learning_rate": 0.0001071426782621159, "loss": 1.4549, "step": 22580 }, { "epoch": 1.78, "learning_rate": 0.0001071308339125054, "loss": 1.5186, "step": 22581 }, { "epoch": 1.78, "learning_rate": 0.00010711898985395285, "loss": 1.5346, "step": 22582 }, { "epoch": 1.78, "learning_rate": 0.0001071071460865387, "loss": 1.4753, "step": 22583 }, { "epoch": 1.78, "learning_rate": 0.00010709530261034338, "loss": 1.4763, "step": 22584 }, { "epoch": 1.78, "learning_rate": 0.00010708345942544725, "loss": 1.4687, "step": 22585 }, { "epoch": 1.78, "learning_rate": 0.00010707161653193077, "loss": 1.5035, "step": 22586 }, { "epoch": 1.78, "learning_rate": 0.00010705977392987431, "loss": 1.5378, "step": 22587 }, { "epoch": 1.78, "learning_rate": 0.00010704793161935828, "loss": 1.5034, "step": 22588 }, { "epoch": 1.78, "learning_rate": 0.00010703608960046311, "loss": 1.4832, "step": 22589 }, { "epoch": 1.78, "learning_rate": 0.00010702424787326918, "loss": 1.4567, "step": 22590 }, { "epoch": 1.78, "learning_rate": 0.0001070124064378569, "loss": 1.4593, "step": 22591 }, { "epoch": 1.78, "learning_rate": 0.00010700056529430658, "loss": 1.4776, "step": 22592 }, { "epoch": 1.78, "learning_rate": 0.00010698872444269878, "loss": 1.4831, "step": 22593 }, { "epoch": 1.78, "learning_rate": 0.00010697688388311377, "loss": 1.5085, "step": 22594 }, { "epoch": 1.78, "learning_rate": 0.00010696504361563201, "loss": 1.4711, "step": 22595 }, { "epoch": 1.78, "learning_rate": 0.00010695320364033382, "loss": 1.4342, "step": 22596 }, { "epoch": 1.78, "learning_rate": 0.00010694136395729962, "loss": 1.4482, "step": 22597 }, { "epoch": 1.78, "learning_rate": 0.00010692952456660984, "loss": 1.4474, "step": 22598 }, { "epoch": 1.78, "learning_rate": 0.00010691768546834477, "loss": 1.521, "step": 22599 }, { "epoch": 1.78, "learning_rate": 0.00010690584666258484, "loss": 1.4989, "step": 22600 }, { "epoch": 1.78, "learning_rate": 0.00010689400814941049, "loss": 1.4859, "step": 22601 }, { "epoch": 1.78, "learning_rate": 0.000106882169928902, "loss": 1.5119, "step": 22602 }, { "epoch": 1.78, "learning_rate": 0.0001068703320011398, "loss": 1.548, "step": 22603 }, { "epoch": 1.78, "learning_rate": 0.00010685849436620421, "loss": 1.4926, "step": 22604 }, { "epoch": 1.78, "learning_rate": 0.00010684665702417565, "loss": 1.5866, "step": 22605 }, { "epoch": 1.78, "learning_rate": 0.0001068348199751345, "loss": 1.5834, "step": 22606 }, { "epoch": 1.78, "learning_rate": 0.00010682298321916105, "loss": 1.4642, "step": 22607 }, { "epoch": 1.78, "learning_rate": 0.00010681114675633571, "loss": 1.5222, "step": 22608 }, { "epoch": 1.78, "learning_rate": 0.00010679931058673887, "loss": 1.4938, "step": 22609 }, { "epoch": 1.78, "learning_rate": 0.00010678747471045091, "loss": 1.5062, "step": 22610 }, { "epoch": 1.78, "learning_rate": 0.00010677563912755213, "loss": 1.4864, "step": 22611 }, { "epoch": 1.78, "learning_rate": 0.00010676380383812289, "loss": 1.4801, "step": 22612 }, { "epoch": 1.78, "learning_rate": 0.0001067519688422436, "loss": 1.5258, "step": 22613 }, { "epoch": 1.78, "learning_rate": 0.00010674013413999453, "loss": 1.5016, "step": 22614 }, { "epoch": 1.78, "learning_rate": 0.00010672829973145614, "loss": 1.4776, "step": 22615 }, { "epoch": 1.78, "learning_rate": 0.00010671646561670865, "loss": 1.4929, "step": 22616 }, { "epoch": 1.78, "learning_rate": 0.00010670463179583248, "loss": 1.5025, "step": 22617 }, { "epoch": 1.78, "learning_rate": 0.00010669279826890802, "loss": 1.5004, "step": 22618 }, { "epoch": 1.78, "learning_rate": 0.0001066809650360155, "loss": 1.4967, "step": 22619 }, { "epoch": 1.78, "learning_rate": 0.00010666913209723538, "loss": 1.4433, "step": 22620 }, { "epoch": 1.78, "learning_rate": 0.00010665729945264789, "loss": 1.5558, "step": 22621 }, { "epoch": 1.78, "learning_rate": 0.00010664546710233341, "loss": 1.4951, "step": 22622 }, { "epoch": 1.78, "learning_rate": 0.00010663363504637235, "loss": 1.5076, "step": 22623 }, { "epoch": 1.78, "learning_rate": 0.00010662180328484489, "loss": 1.4819, "step": 22624 }, { "epoch": 1.78, "learning_rate": 0.00010660997181783147, "loss": 1.4556, "step": 22625 }, { "epoch": 1.78, "learning_rate": 0.00010659814064541243, "loss": 1.4857, "step": 22626 }, { "epoch": 1.78, "learning_rate": 0.00010658630976766807, "loss": 1.5088, "step": 22627 }, { "epoch": 1.78, "learning_rate": 0.00010657447918467867, "loss": 1.4529, "step": 22628 }, { "epoch": 1.78, "learning_rate": 0.00010656264889652461, "loss": 1.4939, "step": 22629 }, { "epoch": 1.78, "learning_rate": 0.00010655081890328623, "loss": 1.5387, "step": 22630 }, { "epoch": 1.78, "learning_rate": 0.00010653898920504378, "loss": 1.5149, "step": 22631 }, { "epoch": 1.78, "learning_rate": 0.00010652715980187763, "loss": 1.4823, "step": 22632 }, { "epoch": 1.78, "learning_rate": 0.00010651533069386803, "loss": 1.5193, "step": 22633 }, { "epoch": 1.78, "learning_rate": 0.00010650350188109535, "loss": 1.4964, "step": 22634 }, { "epoch": 1.78, "learning_rate": 0.00010649167336363995, "loss": 1.4818, "step": 22635 }, { "epoch": 1.78, "learning_rate": 0.000106479845141582, "loss": 1.5112, "step": 22636 }, { "epoch": 1.78, "learning_rate": 0.0001064680172150019, "loss": 1.5171, "step": 22637 }, { "epoch": 1.78, "learning_rate": 0.00010645618958397998, "loss": 1.4833, "step": 22638 }, { "epoch": 1.78, "learning_rate": 0.00010644436224859643, "loss": 1.4768, "step": 22639 }, { "epoch": 1.78, "learning_rate": 0.00010643253520893168, "loss": 1.5342, "step": 22640 }, { "epoch": 1.78, "learning_rate": 0.00010642070846506594, "loss": 1.539, "step": 22641 }, { "epoch": 1.78, "learning_rate": 0.00010640888201707959, "loss": 1.4766, "step": 22642 }, { "epoch": 1.78, "learning_rate": 0.00010639705586505285, "loss": 1.5173, "step": 22643 }, { "epoch": 1.78, "learning_rate": 0.00010638523000906605, "loss": 1.5257, "step": 22644 }, { "epoch": 1.78, "learning_rate": 0.00010637340444919945, "loss": 1.4916, "step": 22645 }, { "epoch": 1.78, "learning_rate": 0.00010636157918553338, "loss": 1.5133, "step": 22646 }, { "epoch": 1.78, "learning_rate": 0.0001063497542181481, "loss": 1.5254, "step": 22647 }, { "epoch": 1.78, "learning_rate": 0.00010633792954712389, "loss": 1.4927, "step": 22648 }, { "epoch": 1.78, "learning_rate": 0.00010632610517254106, "loss": 1.5256, "step": 22649 }, { "epoch": 1.78, "learning_rate": 0.00010631428109447986, "loss": 1.4586, "step": 22650 }, { "epoch": 1.78, "learning_rate": 0.00010630245731302057, "loss": 1.5632, "step": 22651 }, { "epoch": 1.78, "learning_rate": 0.00010629063382824353, "loss": 1.5457, "step": 22652 }, { "epoch": 1.78, "learning_rate": 0.00010627881064022891, "loss": 1.4549, "step": 22653 }, { "epoch": 1.78, "learning_rate": 0.00010626698774905707, "loss": 1.4875, "step": 22654 }, { "epoch": 1.78, "learning_rate": 0.0001062551651548082, "loss": 1.5048, "step": 22655 }, { "epoch": 1.78, "learning_rate": 0.00010624334285756267, "loss": 1.5346, "step": 22656 }, { "epoch": 1.78, "learning_rate": 0.00010623152085740066, "loss": 1.4566, "step": 22657 }, { "epoch": 1.78, "learning_rate": 0.0001062196991544025, "loss": 1.5029, "step": 22658 }, { "epoch": 1.78, "learning_rate": 0.00010620787774864843, "loss": 1.5195, "step": 22659 }, { "epoch": 1.78, "learning_rate": 0.00010619605664021868, "loss": 1.5459, "step": 22660 }, { "epoch": 1.78, "learning_rate": 0.00010618423582919357, "loss": 1.5148, "step": 22661 }, { "epoch": 1.78, "learning_rate": 0.00010617241531565327, "loss": 1.425, "step": 22662 }, { "epoch": 1.78, "learning_rate": 0.00010616059509967811, "loss": 1.4984, "step": 22663 }, { "epoch": 1.78, "learning_rate": 0.00010614877518134833, "loss": 1.5439, "step": 22664 }, { "epoch": 1.78, "learning_rate": 0.00010613695556074413, "loss": 1.4581, "step": 22665 }, { "epoch": 1.78, "learning_rate": 0.00010612513623794582, "loss": 1.5079, "step": 22666 }, { "epoch": 1.78, "learning_rate": 0.00010611331721303364, "loss": 1.5066, "step": 22667 }, { "epoch": 1.78, "learning_rate": 0.00010610149848608778, "loss": 1.4937, "step": 22668 }, { "epoch": 1.78, "learning_rate": 0.00010608968005718855, "loss": 1.5368, "step": 22669 }, { "epoch": 1.78, "learning_rate": 0.00010607786192641615, "loss": 1.4859, "step": 22670 }, { "epoch": 1.78, "learning_rate": 0.00010606604409385077, "loss": 1.4986, "step": 22671 }, { "epoch": 1.78, "learning_rate": 0.00010605422655957276, "loss": 1.4943, "step": 22672 }, { "epoch": 1.78, "learning_rate": 0.00010604240932366233, "loss": 1.4813, "step": 22673 }, { "epoch": 1.78, "learning_rate": 0.00010603059238619964, "loss": 1.5121, "step": 22674 }, { "epoch": 1.78, "learning_rate": 0.00010601877574726497, "loss": 1.4797, "step": 22675 }, { "epoch": 1.78, "learning_rate": 0.00010600695940693858, "loss": 1.5324, "step": 22676 }, { "epoch": 1.78, "learning_rate": 0.0001059951433653006, "loss": 1.4732, "step": 22677 }, { "epoch": 1.78, "learning_rate": 0.00010598332762243139, "loss": 1.4849, "step": 22678 }, { "epoch": 1.78, "learning_rate": 0.00010597151217841103, "loss": 1.4856, "step": 22679 }, { "epoch": 1.78, "learning_rate": 0.0001059596970333198, "loss": 1.4329, "step": 22680 }, { "epoch": 1.78, "learning_rate": 0.00010594788218723797, "loss": 1.5016, "step": 22681 }, { "epoch": 1.78, "learning_rate": 0.00010593606764024567, "loss": 1.479, "step": 22682 }, { "epoch": 1.78, "learning_rate": 0.00010592425339242316, "loss": 1.4275, "step": 22683 }, { "epoch": 1.78, "learning_rate": 0.00010591243944385068, "loss": 1.5041, "step": 22684 }, { "epoch": 1.78, "learning_rate": 0.00010590062579460838, "loss": 1.5302, "step": 22685 }, { "epoch": 1.78, "learning_rate": 0.00010588881244477652, "loss": 1.4901, "step": 22686 }, { "epoch": 1.79, "learning_rate": 0.00010587699939443517, "loss": 1.4926, "step": 22687 }, { "epoch": 1.79, "learning_rate": 0.00010586518664366476, "loss": 1.5216, "step": 22688 }, { "epoch": 1.79, "learning_rate": 0.00010585337419254535, "loss": 1.4605, "step": 22689 }, { "epoch": 1.79, "learning_rate": 0.00010584156204115718, "loss": 1.5521, "step": 22690 }, { "epoch": 1.79, "learning_rate": 0.00010582975018958041, "loss": 1.5468, "step": 22691 }, { "epoch": 1.79, "learning_rate": 0.00010581793863789528, "loss": 1.5286, "step": 22692 }, { "epoch": 1.79, "learning_rate": 0.00010580612738618198, "loss": 1.4871, "step": 22693 }, { "epoch": 1.79, "learning_rate": 0.00010579431643452065, "loss": 1.5462, "step": 22694 }, { "epoch": 1.79, "learning_rate": 0.00010578250578299154, "loss": 1.5106, "step": 22695 }, { "epoch": 1.79, "learning_rate": 0.00010577069543167481, "loss": 1.4886, "step": 22696 }, { "epoch": 1.79, "learning_rate": 0.00010575888538065064, "loss": 1.501, "step": 22697 }, { "epoch": 1.79, "learning_rate": 0.00010574707562999924, "loss": 1.5218, "step": 22698 }, { "epoch": 1.79, "learning_rate": 0.00010573526617980077, "loss": 1.5093, "step": 22699 }, { "epoch": 1.79, "learning_rate": 0.0001057234570301354, "loss": 1.4758, "step": 22700 }, { "epoch": 1.79, "learning_rate": 0.00010571164818108336, "loss": 1.5314, "step": 22701 }, { "epoch": 1.79, "learning_rate": 0.00010569983963272471, "loss": 1.4941, "step": 22702 }, { "epoch": 1.79, "learning_rate": 0.00010568803138513975, "loss": 1.5097, "step": 22703 }, { "epoch": 1.79, "learning_rate": 0.00010567622343840859, "loss": 1.4647, "step": 22704 }, { "epoch": 1.79, "learning_rate": 0.00010566441579261148, "loss": 1.4662, "step": 22705 }, { "epoch": 1.79, "learning_rate": 0.00010565260844782844, "loss": 1.482, "step": 22706 }, { "epoch": 1.79, "learning_rate": 0.00010564080140413978, "loss": 1.4603, "step": 22707 }, { "epoch": 1.79, "learning_rate": 0.00010562899466162556, "loss": 1.4483, "step": 22708 }, { "epoch": 1.79, "learning_rate": 0.00010561718822036597, "loss": 1.5144, "step": 22709 }, { "epoch": 1.79, "learning_rate": 0.00010560538208044122, "loss": 1.4334, "step": 22710 }, { "epoch": 1.79, "learning_rate": 0.0001055935762419314, "loss": 1.564, "step": 22711 }, { "epoch": 1.79, "learning_rate": 0.00010558177070491668, "loss": 1.448, "step": 22712 }, { "epoch": 1.79, "learning_rate": 0.00010556996546947727, "loss": 1.4851, "step": 22713 }, { "epoch": 1.79, "learning_rate": 0.00010555816053569323, "loss": 1.462, "step": 22714 }, { "epoch": 1.79, "learning_rate": 0.00010554635590364478, "loss": 1.451, "step": 22715 }, { "epoch": 1.79, "learning_rate": 0.00010553455157341204, "loss": 1.4989, "step": 22716 }, { "epoch": 1.79, "learning_rate": 0.00010552274754507514, "loss": 1.5183, "step": 22717 }, { "epoch": 1.79, "learning_rate": 0.00010551094381871421, "loss": 1.4964, "step": 22718 }, { "epoch": 1.79, "learning_rate": 0.00010549914039440949, "loss": 1.4584, "step": 22719 }, { "epoch": 1.79, "learning_rate": 0.000105487337272241, "loss": 1.4742, "step": 22720 }, { "epoch": 1.79, "learning_rate": 0.00010547553445228892, "loss": 1.511, "step": 22721 }, { "epoch": 1.79, "learning_rate": 0.00010546373193463346, "loss": 1.5218, "step": 22722 }, { "epoch": 1.79, "learning_rate": 0.00010545192971935461, "loss": 1.4669, "step": 22723 }, { "epoch": 1.79, "learning_rate": 0.00010544012780653259, "loss": 1.5405, "step": 22724 }, { "epoch": 1.79, "learning_rate": 0.00010542832619624755, "loss": 1.4752, "step": 22725 }, { "epoch": 1.79, "learning_rate": 0.00010541652488857955, "loss": 1.5509, "step": 22726 }, { "epoch": 1.79, "learning_rate": 0.00010540472388360876, "loss": 1.4941, "step": 22727 }, { "epoch": 1.79, "learning_rate": 0.00010539292318141526, "loss": 1.4664, "step": 22728 }, { "epoch": 1.79, "learning_rate": 0.00010538112278207921, "loss": 1.4677, "step": 22729 }, { "epoch": 1.79, "learning_rate": 0.00010536932268568071, "loss": 1.5383, "step": 22730 }, { "epoch": 1.79, "learning_rate": 0.00010535752289229988, "loss": 1.47, "step": 22731 }, { "epoch": 1.79, "learning_rate": 0.00010534572340201687, "loss": 1.4819, "step": 22732 }, { "epoch": 1.79, "learning_rate": 0.0001053339242149117, "loss": 1.4962, "step": 22733 }, { "epoch": 1.79, "learning_rate": 0.0001053221253310645, "loss": 1.5743, "step": 22734 }, { "epoch": 1.79, "learning_rate": 0.00010531032675055547, "loss": 1.4377, "step": 22735 }, { "epoch": 1.79, "learning_rate": 0.00010529852847346465, "loss": 1.4685, "step": 22736 }, { "epoch": 1.79, "learning_rate": 0.00010528673049987219, "loss": 1.5273, "step": 22737 }, { "epoch": 1.79, "learning_rate": 0.0001052749328298581, "loss": 1.4849, "step": 22738 }, { "epoch": 1.79, "learning_rate": 0.0001052631354635026, "loss": 1.5341, "step": 22739 }, { "epoch": 1.79, "learning_rate": 0.00010525133840088565, "loss": 1.4533, "step": 22740 }, { "epoch": 1.79, "learning_rate": 0.00010523954164208745, "loss": 1.4679, "step": 22741 }, { "epoch": 1.79, "learning_rate": 0.00010522774518718809, "loss": 1.5031, "step": 22742 }, { "epoch": 1.79, "learning_rate": 0.0001052159490362676, "loss": 1.4862, "step": 22743 }, { "epoch": 1.79, "learning_rate": 0.00010520415318940611, "loss": 1.478, "step": 22744 }, { "epoch": 1.79, "learning_rate": 0.00010519235764668369, "loss": 1.4957, "step": 22745 }, { "epoch": 1.79, "learning_rate": 0.00010518056240818044, "loss": 1.487, "step": 22746 }, { "epoch": 1.79, "learning_rate": 0.00010516876747397645, "loss": 1.4871, "step": 22747 }, { "epoch": 1.79, "learning_rate": 0.00010515697284415177, "loss": 1.5029, "step": 22748 }, { "epoch": 1.79, "learning_rate": 0.00010514517851878647, "loss": 1.4669, "step": 22749 }, { "epoch": 1.79, "learning_rate": 0.00010513338449796069, "loss": 1.4967, "step": 22750 }, { "epoch": 1.79, "learning_rate": 0.00010512159078175449, "loss": 1.5234, "step": 22751 }, { "epoch": 1.79, "learning_rate": 0.0001051097973702479, "loss": 1.4715, "step": 22752 }, { "epoch": 1.79, "learning_rate": 0.000105098004263521, "loss": 1.4645, "step": 22753 }, { "epoch": 1.79, "learning_rate": 0.0001050862114616539, "loss": 1.5045, "step": 22754 }, { "epoch": 1.79, "learning_rate": 0.00010507441896472663, "loss": 1.4925, "step": 22755 }, { "epoch": 1.79, "learning_rate": 0.00010506262677281926, "loss": 1.5146, "step": 22756 }, { "epoch": 1.79, "learning_rate": 0.00010505083488601187, "loss": 1.5286, "step": 22757 }, { "epoch": 1.79, "learning_rate": 0.00010503904330438449, "loss": 1.4822, "step": 22758 }, { "epoch": 1.79, "learning_rate": 0.00010502725202801721, "loss": 1.4133, "step": 22759 }, { "epoch": 1.79, "learning_rate": 0.00010501546105699005, "loss": 1.5108, "step": 22760 }, { "epoch": 1.79, "learning_rate": 0.00010500367039138311, "loss": 1.4719, "step": 22761 }, { "epoch": 1.79, "learning_rate": 0.00010499188003127639, "loss": 1.4998, "step": 22762 }, { "epoch": 1.79, "learning_rate": 0.00010498008997674997, "loss": 1.4765, "step": 22763 }, { "epoch": 1.79, "learning_rate": 0.00010496830022788392, "loss": 1.5333, "step": 22764 }, { "epoch": 1.79, "learning_rate": 0.00010495651078475819, "loss": 1.5041, "step": 22765 }, { "epoch": 1.79, "learning_rate": 0.00010494472164745294, "loss": 1.4651, "step": 22766 }, { "epoch": 1.79, "learning_rate": 0.00010493293281604818, "loss": 1.4308, "step": 22767 }, { "epoch": 1.79, "learning_rate": 0.00010492114429062394, "loss": 1.5181, "step": 22768 }, { "epoch": 1.79, "learning_rate": 0.00010490935607126025, "loss": 1.4879, "step": 22769 }, { "epoch": 1.79, "learning_rate": 0.00010489756815803713, "loss": 1.4838, "step": 22770 }, { "epoch": 1.79, "learning_rate": 0.00010488578055103466, "loss": 1.5253, "step": 22771 }, { "epoch": 1.79, "learning_rate": 0.00010487399325033284, "loss": 1.4948, "step": 22772 }, { "epoch": 1.79, "learning_rate": 0.0001048622062560117, "loss": 1.5264, "step": 22773 }, { "epoch": 1.79, "learning_rate": 0.00010485041956815126, "loss": 1.4837, "step": 22774 }, { "epoch": 1.79, "learning_rate": 0.00010483863318683155, "loss": 1.4739, "step": 22775 }, { "epoch": 1.79, "learning_rate": 0.00010482684711213261, "loss": 1.5389, "step": 22776 }, { "epoch": 1.79, "learning_rate": 0.00010481506134413445, "loss": 1.4962, "step": 22777 }, { "epoch": 1.79, "learning_rate": 0.00010480327588291708, "loss": 1.4658, "step": 22778 }, { "epoch": 1.79, "learning_rate": 0.00010479149072856055, "loss": 1.469, "step": 22779 }, { "epoch": 1.79, "learning_rate": 0.00010477970588114482, "loss": 1.4517, "step": 22780 }, { "epoch": 1.79, "learning_rate": 0.0001047679213407499, "loss": 1.5454, "step": 22781 }, { "epoch": 1.79, "learning_rate": 0.00010475613710745588, "loss": 1.4624, "step": 22782 }, { "epoch": 1.79, "learning_rate": 0.00010474435318134273, "loss": 1.4844, "step": 22783 }, { "epoch": 1.79, "learning_rate": 0.00010473256956249043, "loss": 1.5321, "step": 22784 }, { "epoch": 1.79, "learning_rate": 0.00010472078625097902, "loss": 1.454, "step": 22785 }, { "epoch": 1.79, "learning_rate": 0.00010470900324688847, "loss": 1.5223, "step": 22786 }, { "epoch": 1.79, "learning_rate": 0.00010469722055029879, "loss": 1.512, "step": 22787 }, { "epoch": 1.79, "learning_rate": 0.00010468543816129, "loss": 1.4963, "step": 22788 }, { "epoch": 1.79, "learning_rate": 0.00010467365607994205, "loss": 1.428, "step": 22789 }, { "epoch": 1.79, "learning_rate": 0.00010466187430633499, "loss": 1.5333, "step": 22790 }, { "epoch": 1.79, "learning_rate": 0.00010465009284054878, "loss": 1.4658, "step": 22791 }, { "epoch": 1.79, "learning_rate": 0.00010463831168266339, "loss": 1.5547, "step": 22792 }, { "epoch": 1.79, "learning_rate": 0.00010462653083275886, "loss": 1.4573, "step": 22793 }, { "epoch": 1.79, "learning_rate": 0.00010461475029091513, "loss": 1.5352, "step": 22794 }, { "epoch": 1.79, "learning_rate": 0.0001046029700572122, "loss": 1.479, "step": 22795 }, { "epoch": 1.79, "learning_rate": 0.00010459119013173006, "loss": 1.4623, "step": 22796 }, { "epoch": 1.79, "learning_rate": 0.00010457941051454864, "loss": 1.5222, "step": 22797 }, { "epoch": 1.79, "learning_rate": 0.00010456763120574798, "loss": 1.4991, "step": 22798 }, { "epoch": 1.79, "learning_rate": 0.00010455585220540804, "loss": 1.4826, "step": 22799 }, { "epoch": 1.79, "learning_rate": 0.00010454407351360881, "loss": 1.5275, "step": 22800 }, { "epoch": 1.79, "learning_rate": 0.00010453229513043021, "loss": 1.5, "step": 22801 }, { "epoch": 1.79, "learning_rate": 0.00010452051705595226, "loss": 1.5034, "step": 22802 }, { "epoch": 1.79, "learning_rate": 0.00010450873929025488, "loss": 1.4893, "step": 22803 }, { "epoch": 1.79, "learning_rate": 0.00010449696183341804, "loss": 1.4802, "step": 22804 }, { "epoch": 1.79, "learning_rate": 0.00010448518468552174, "loss": 1.4957, "step": 22805 }, { "epoch": 1.79, "learning_rate": 0.00010447340784664591, "loss": 1.468, "step": 22806 }, { "epoch": 1.79, "learning_rate": 0.00010446163131687053, "loss": 1.4638, "step": 22807 }, { "epoch": 1.79, "learning_rate": 0.00010444985509627555, "loss": 1.5348, "step": 22808 }, { "epoch": 1.79, "learning_rate": 0.0001044380791849409, "loss": 1.458, "step": 22809 }, { "epoch": 1.79, "learning_rate": 0.00010442630358294658, "loss": 1.5023, "step": 22810 }, { "epoch": 1.79, "learning_rate": 0.00010441452829037246, "loss": 1.4982, "step": 22811 }, { "epoch": 1.79, "learning_rate": 0.00010440275330729852, "loss": 1.4688, "step": 22812 }, { "epoch": 1.79, "learning_rate": 0.00010439097863380474, "loss": 1.4668, "step": 22813 }, { "epoch": 1.8, "learning_rate": 0.00010437920426997111, "loss": 1.4996, "step": 22814 }, { "epoch": 1.8, "learning_rate": 0.00010436743021587746, "loss": 1.4867, "step": 22815 }, { "epoch": 1.8, "learning_rate": 0.00010435565647160376, "loss": 1.4677, "step": 22816 }, { "epoch": 1.8, "learning_rate": 0.00010434388303723001, "loss": 1.4844, "step": 22817 }, { "epoch": 1.8, "learning_rate": 0.00010433210991283605, "loss": 1.5006, "step": 22818 }, { "epoch": 1.8, "learning_rate": 0.00010432033709850191, "loss": 1.511, "step": 22819 }, { "epoch": 1.8, "learning_rate": 0.00010430856459430745, "loss": 1.4673, "step": 22820 }, { "epoch": 1.8, "learning_rate": 0.0001042967924003326, "loss": 1.5142, "step": 22821 }, { "epoch": 1.8, "learning_rate": 0.00010428502051665735, "loss": 1.4542, "step": 22822 }, { "epoch": 1.8, "learning_rate": 0.00010427324894336155, "loss": 1.5123, "step": 22823 }, { "epoch": 1.8, "learning_rate": 0.00010426147768052518, "loss": 1.4775, "step": 22824 }, { "epoch": 1.8, "learning_rate": 0.00010424970672822813, "loss": 1.46, "step": 22825 }, { "epoch": 1.8, "learning_rate": 0.0001042379360865503, "loss": 1.4957, "step": 22826 }, { "epoch": 1.8, "learning_rate": 0.00010422616575557168, "loss": 1.5132, "step": 22827 }, { "epoch": 1.8, "learning_rate": 0.00010421439573537203, "loss": 1.4731, "step": 22828 }, { "epoch": 1.8, "learning_rate": 0.00010420262602603147, "loss": 1.4955, "step": 22829 }, { "epoch": 1.8, "learning_rate": 0.00010419085662762976, "loss": 1.5059, "step": 22830 }, { "epoch": 1.8, "learning_rate": 0.00010417908754024688, "loss": 1.4794, "step": 22831 }, { "epoch": 1.8, "learning_rate": 0.00010416731876396267, "loss": 1.5094, "step": 22832 }, { "epoch": 1.8, "learning_rate": 0.00010415555029885711, "loss": 1.5002, "step": 22833 }, { "epoch": 1.8, "learning_rate": 0.00010414378214501009, "loss": 1.4772, "step": 22834 }, { "epoch": 1.8, "learning_rate": 0.00010413201430250144, "loss": 1.452, "step": 22835 }, { "epoch": 1.8, "learning_rate": 0.00010412024677141108, "loss": 1.4774, "step": 22836 }, { "epoch": 1.8, "learning_rate": 0.00010410847955181899, "loss": 1.4811, "step": 22837 }, { "epoch": 1.8, "learning_rate": 0.00010409671264380496, "loss": 1.4968, "step": 22838 }, { "epoch": 1.8, "learning_rate": 0.00010408494604744895, "loss": 1.5102, "step": 22839 }, { "epoch": 1.8, "learning_rate": 0.00010407317976283078, "loss": 1.4899, "step": 22840 }, { "epoch": 1.8, "learning_rate": 0.00010406141379003036, "loss": 1.4421, "step": 22841 }, { "epoch": 1.8, "learning_rate": 0.00010404964812912764, "loss": 1.4693, "step": 22842 }, { "epoch": 1.8, "learning_rate": 0.00010403788278020245, "loss": 1.5323, "step": 22843 }, { "epoch": 1.8, "learning_rate": 0.00010402611774333458, "loss": 1.5194, "step": 22844 }, { "epoch": 1.8, "learning_rate": 0.00010401435301860407, "loss": 1.5545, "step": 22845 }, { "epoch": 1.8, "learning_rate": 0.00010400258860609075, "loss": 1.4692, "step": 22846 }, { "epoch": 1.8, "learning_rate": 0.00010399082450587444, "loss": 1.4663, "step": 22847 }, { "epoch": 1.8, "learning_rate": 0.00010397906071803504, "loss": 1.4776, "step": 22848 }, { "epoch": 1.8, "learning_rate": 0.00010396729724265245, "loss": 1.4952, "step": 22849 }, { "epoch": 1.8, "learning_rate": 0.00010395553407980648, "loss": 1.4432, "step": 22850 }, { "epoch": 1.8, "learning_rate": 0.00010394377122957706, "loss": 1.4555, "step": 22851 }, { "epoch": 1.8, "learning_rate": 0.00010393200869204397, "loss": 1.4416, "step": 22852 }, { "epoch": 1.8, "learning_rate": 0.00010392024646728714, "loss": 1.483, "step": 22853 }, { "epoch": 1.8, "learning_rate": 0.00010390848455538642, "loss": 1.5144, "step": 22854 }, { "epoch": 1.8, "learning_rate": 0.00010389672295642164, "loss": 1.4468, "step": 22855 }, { "epoch": 1.8, "learning_rate": 0.00010388496167047269, "loss": 1.5179, "step": 22856 }, { "epoch": 1.8, "learning_rate": 0.00010387320069761937, "loss": 1.452, "step": 22857 }, { "epoch": 1.8, "learning_rate": 0.00010386144003794156, "loss": 1.4674, "step": 22858 }, { "epoch": 1.8, "learning_rate": 0.00010384967969151907, "loss": 1.4886, "step": 22859 }, { "epoch": 1.8, "learning_rate": 0.00010383791965843186, "loss": 1.5132, "step": 22860 }, { "epoch": 1.8, "learning_rate": 0.00010382615993875968, "loss": 1.5014, "step": 22861 }, { "epoch": 1.8, "learning_rate": 0.00010381440053258241, "loss": 1.5393, "step": 22862 }, { "epoch": 1.8, "learning_rate": 0.00010380264143997986, "loss": 1.526, "step": 22863 }, { "epoch": 1.8, "learning_rate": 0.00010379088266103188, "loss": 1.4809, "step": 22864 }, { "epoch": 1.8, "learning_rate": 0.00010377912419581831, "loss": 1.4711, "step": 22865 }, { "epoch": 1.8, "learning_rate": 0.00010376736604441898, "loss": 1.5532, "step": 22866 }, { "epoch": 1.8, "learning_rate": 0.00010375560820691372, "loss": 1.4814, "step": 22867 }, { "epoch": 1.8, "learning_rate": 0.00010374385068338238, "loss": 1.4672, "step": 22868 }, { "epoch": 1.8, "learning_rate": 0.00010373209347390473, "loss": 1.4777, "step": 22869 }, { "epoch": 1.8, "learning_rate": 0.00010372033657856065, "loss": 1.5357, "step": 22870 }, { "epoch": 1.8, "learning_rate": 0.00010370857999742997, "loss": 1.4779, "step": 22871 }, { "epoch": 1.8, "learning_rate": 0.00010369682373059244, "loss": 1.4525, "step": 22872 }, { "epoch": 1.8, "learning_rate": 0.00010368506777812797, "loss": 1.4993, "step": 22873 }, { "epoch": 1.8, "learning_rate": 0.0001036733121401163, "loss": 1.4899, "step": 22874 }, { "epoch": 1.8, "learning_rate": 0.00010366155681663724, "loss": 1.534, "step": 22875 }, { "epoch": 1.8, "learning_rate": 0.00010364980180777066, "loss": 1.5109, "step": 22876 }, { "epoch": 1.8, "learning_rate": 0.00010363804711359635, "loss": 1.4721, "step": 22877 }, { "epoch": 1.8, "learning_rate": 0.00010362629273419416, "loss": 1.5575, "step": 22878 }, { "epoch": 1.8, "learning_rate": 0.00010361453866964382, "loss": 1.5054, "step": 22879 }, { "epoch": 1.8, "learning_rate": 0.00010360278492002518, "loss": 1.5069, "step": 22880 }, { "epoch": 1.8, "learning_rate": 0.000103591031485418, "loss": 1.4965, "step": 22881 }, { "epoch": 1.8, "learning_rate": 0.00010357927836590211, "loss": 1.5167, "step": 22882 }, { "epoch": 1.8, "learning_rate": 0.00010356752556155733, "loss": 1.4705, "step": 22883 }, { "epoch": 1.8, "learning_rate": 0.00010355577307246342, "loss": 1.5329, "step": 22884 }, { "epoch": 1.8, "learning_rate": 0.00010354402089870018, "loss": 1.4555, "step": 22885 }, { "epoch": 1.8, "learning_rate": 0.0001035322690403474, "loss": 1.4729, "step": 22886 }, { "epoch": 1.8, "learning_rate": 0.00010352051749748484, "loss": 1.4726, "step": 22887 }, { "epoch": 1.8, "learning_rate": 0.00010350876627019237, "loss": 1.5012, "step": 22888 }, { "epoch": 1.8, "learning_rate": 0.00010349701535854967, "loss": 1.4709, "step": 22889 }, { "epoch": 1.8, "learning_rate": 0.0001034852647626366, "loss": 1.5106, "step": 22890 }, { "epoch": 1.8, "learning_rate": 0.00010347351448253285, "loss": 1.4691, "step": 22891 }, { "epoch": 1.8, "learning_rate": 0.00010346176451831834, "loss": 1.5302, "step": 22892 }, { "epoch": 1.8, "learning_rate": 0.00010345001487007275, "loss": 1.466, "step": 22893 }, { "epoch": 1.8, "learning_rate": 0.00010343826553787585, "loss": 1.5027, "step": 22894 }, { "epoch": 1.8, "learning_rate": 0.00010342651652180746, "loss": 1.4952, "step": 22895 }, { "epoch": 1.8, "learning_rate": 0.00010341476782194731, "loss": 1.4946, "step": 22896 }, { "epoch": 1.8, "learning_rate": 0.00010340301943837518, "loss": 1.4654, "step": 22897 }, { "epoch": 1.8, "learning_rate": 0.00010339127137117084, "loss": 1.5068, "step": 22898 }, { "epoch": 1.8, "learning_rate": 0.00010337952362041402, "loss": 1.508, "step": 22899 }, { "epoch": 1.8, "learning_rate": 0.00010336777618618455, "loss": 1.4684, "step": 22900 }, { "epoch": 1.8, "learning_rate": 0.00010335602906856212, "loss": 1.4587, "step": 22901 }, { "epoch": 1.8, "learning_rate": 0.00010334428226762653, "loss": 1.4956, "step": 22902 }, { "epoch": 1.8, "learning_rate": 0.0001033325357834575, "loss": 1.5032, "step": 22903 }, { "epoch": 1.8, "learning_rate": 0.00010332078961613479, "loss": 1.5001, "step": 22904 }, { "epoch": 1.8, "learning_rate": 0.0001033090437657382, "loss": 1.4814, "step": 22905 }, { "epoch": 1.8, "learning_rate": 0.00010329729823234738, "loss": 1.5568, "step": 22906 }, { "epoch": 1.8, "learning_rate": 0.00010328555301604211, "loss": 1.5091, "step": 22907 }, { "epoch": 1.8, "learning_rate": 0.00010327380811690218, "loss": 1.5406, "step": 22908 }, { "epoch": 1.8, "learning_rate": 0.00010326206353500738, "loss": 1.4809, "step": 22909 }, { "epoch": 1.8, "learning_rate": 0.00010325031927043732, "loss": 1.4833, "step": 22910 }, { "epoch": 1.8, "learning_rate": 0.00010323857532327179, "loss": 1.4426, "step": 22911 }, { "epoch": 1.8, "learning_rate": 0.00010322683169359055, "loss": 1.4682, "step": 22912 }, { "epoch": 1.8, "learning_rate": 0.00010321508838147329, "loss": 1.5285, "step": 22913 }, { "epoch": 1.8, "learning_rate": 0.0001032033453869998, "loss": 1.5218, "step": 22914 }, { "epoch": 1.8, "learning_rate": 0.00010319160271024973, "loss": 1.4553, "step": 22915 }, { "epoch": 1.8, "learning_rate": 0.00010317986035130285, "loss": 1.5579, "step": 22916 }, { "epoch": 1.8, "learning_rate": 0.00010316811831023891, "loss": 1.5168, "step": 22917 }, { "epoch": 1.8, "learning_rate": 0.00010315637658713757, "loss": 1.4908, "step": 22918 }, { "epoch": 1.8, "learning_rate": 0.00010314463518207858, "loss": 1.4826, "step": 22919 }, { "epoch": 1.8, "learning_rate": 0.00010313289409514169, "loss": 1.4761, "step": 22920 }, { "epoch": 1.8, "learning_rate": 0.00010312115332640657, "loss": 1.4753, "step": 22921 }, { "epoch": 1.8, "learning_rate": 0.00010310941287595291, "loss": 1.4427, "step": 22922 }, { "epoch": 1.8, "learning_rate": 0.00010309767274386049, "loss": 1.481, "step": 22923 }, { "epoch": 1.8, "learning_rate": 0.00010308593293020902, "loss": 1.4827, "step": 22924 }, { "epoch": 1.8, "learning_rate": 0.00010307419343507815, "loss": 1.4635, "step": 22925 }, { "epoch": 1.8, "learning_rate": 0.00010306245425854764, "loss": 1.4784, "step": 22926 }, { "epoch": 1.8, "learning_rate": 0.00010305071540069714, "loss": 1.4865, "step": 22927 }, { "epoch": 1.8, "learning_rate": 0.00010303897686160636, "loss": 1.5222, "step": 22928 }, { "epoch": 1.8, "learning_rate": 0.00010302723864135504, "loss": 1.4921, "step": 22929 }, { "epoch": 1.8, "learning_rate": 0.00010301550074002281, "loss": 1.5343, "step": 22930 }, { "epoch": 1.8, "learning_rate": 0.00010300376315768943, "loss": 1.4455, "step": 22931 }, { "epoch": 1.8, "learning_rate": 0.00010299202589443458, "loss": 1.4808, "step": 22932 }, { "epoch": 1.8, "learning_rate": 0.00010298028895033789, "loss": 1.4955, "step": 22933 }, { "epoch": 1.8, "learning_rate": 0.00010296855232547914, "loss": 1.5006, "step": 22934 }, { "epoch": 1.8, "learning_rate": 0.00010295681601993794, "loss": 1.5178, "step": 22935 }, { "epoch": 1.8, "learning_rate": 0.00010294508003379398, "loss": 1.4912, "step": 22936 }, { "epoch": 1.8, "learning_rate": 0.000102933344367127, "loss": 1.525, "step": 22937 }, { "epoch": 1.8, "learning_rate": 0.00010292160902001657, "loss": 1.5018, "step": 22938 }, { "epoch": 1.8, "learning_rate": 0.00010290987399254247, "loss": 1.5116, "step": 22939 }, { "epoch": 1.8, "learning_rate": 0.00010289813928478434, "loss": 1.4678, "step": 22940 }, { "epoch": 1.81, "learning_rate": 0.00010288640489682186, "loss": 1.4764, "step": 22941 }, { "epoch": 1.81, "learning_rate": 0.00010287467082873469, "loss": 1.4457, "step": 22942 }, { "epoch": 1.81, "learning_rate": 0.00010286293708060252, "loss": 1.4873, "step": 22943 }, { "epoch": 1.81, "learning_rate": 0.00010285120365250497, "loss": 1.5063, "step": 22944 }, { "epoch": 1.81, "learning_rate": 0.00010283947054452173, "loss": 1.5344, "step": 22945 }, { "epoch": 1.81, "learning_rate": 0.00010282773775673248, "loss": 1.4949, "step": 22946 }, { "epoch": 1.81, "learning_rate": 0.00010281600528921683, "loss": 1.4459, "step": 22947 }, { "epoch": 1.81, "learning_rate": 0.00010280427314205447, "loss": 1.4492, "step": 22948 }, { "epoch": 1.81, "learning_rate": 0.00010279254131532507, "loss": 1.4217, "step": 22949 }, { "epoch": 1.81, "learning_rate": 0.00010278080980910823, "loss": 1.5072, "step": 22950 }, { "epoch": 1.81, "learning_rate": 0.00010276907862348368, "loss": 1.5213, "step": 22951 }, { "epoch": 1.81, "learning_rate": 0.00010275734775853099, "loss": 1.4951, "step": 22952 }, { "epoch": 1.81, "learning_rate": 0.00010274561721432985, "loss": 1.5847, "step": 22953 }, { "epoch": 1.81, "learning_rate": 0.00010273388699095984, "loss": 1.5048, "step": 22954 }, { "epoch": 1.81, "learning_rate": 0.00010272215708850072, "loss": 1.5439, "step": 22955 }, { "epoch": 1.81, "learning_rate": 0.00010271042750703202, "loss": 1.477, "step": 22956 }, { "epoch": 1.81, "learning_rate": 0.00010269869824663344, "loss": 1.4352, "step": 22957 }, { "epoch": 1.81, "learning_rate": 0.00010268696930738464, "loss": 1.487, "step": 22958 }, { "epoch": 1.81, "learning_rate": 0.00010267524068936514, "loss": 1.4756, "step": 22959 }, { "epoch": 1.81, "learning_rate": 0.00010266351239265466, "loss": 1.4454, "step": 22960 }, { "epoch": 1.81, "learning_rate": 0.00010265178441733284, "loss": 1.4651, "step": 22961 }, { "epoch": 1.81, "learning_rate": 0.00010264005676347925, "loss": 1.4831, "step": 22962 }, { "epoch": 1.81, "learning_rate": 0.00010262832943117355, "loss": 1.4699, "step": 22963 }, { "epoch": 1.81, "learning_rate": 0.00010261660242049535, "loss": 1.508, "step": 22964 }, { "epoch": 1.81, "learning_rate": 0.00010260487573152424, "loss": 1.4717, "step": 22965 }, { "epoch": 1.81, "learning_rate": 0.00010259314936433992, "loss": 1.4451, "step": 22966 }, { "epoch": 1.81, "learning_rate": 0.00010258142331902193, "loss": 1.4724, "step": 22967 }, { "epoch": 1.81, "learning_rate": 0.00010256969759564992, "loss": 1.5254, "step": 22968 }, { "epoch": 1.81, "learning_rate": 0.0001025579721943034, "loss": 1.5293, "step": 22969 }, { "epoch": 1.81, "learning_rate": 0.00010254624711506215, "loss": 1.4848, "step": 22970 }, { "epoch": 1.81, "learning_rate": 0.00010253452235800568, "loss": 1.4734, "step": 22971 }, { "epoch": 1.81, "learning_rate": 0.00010252279792321365, "loss": 1.4733, "step": 22972 }, { "epoch": 1.81, "learning_rate": 0.00010251107381076556, "loss": 1.5553, "step": 22973 }, { "epoch": 1.81, "learning_rate": 0.0001024993500207411, "loss": 1.529, "step": 22974 }, { "epoch": 1.81, "learning_rate": 0.00010248762655321987, "loss": 1.4404, "step": 22975 }, { "epoch": 1.81, "learning_rate": 0.0001024759034082814, "loss": 1.5427, "step": 22976 }, { "epoch": 1.81, "learning_rate": 0.00010246418058600531, "loss": 1.4662, "step": 22977 }, { "epoch": 1.81, "learning_rate": 0.00010245245808647124, "loss": 1.4702, "step": 22978 }, { "epoch": 1.81, "learning_rate": 0.00010244073590975871, "loss": 1.4922, "step": 22979 }, { "epoch": 1.81, "learning_rate": 0.00010242901405594737, "loss": 1.4821, "step": 22980 }, { "epoch": 1.81, "learning_rate": 0.00010241729252511675, "loss": 1.4992, "step": 22981 }, { "epoch": 1.81, "learning_rate": 0.00010240557131734644, "loss": 1.4419, "step": 22982 }, { "epoch": 1.81, "learning_rate": 0.00010239385043271608, "loss": 1.5223, "step": 22983 }, { "epoch": 1.81, "learning_rate": 0.00010238212987130517, "loss": 1.4876, "step": 22984 }, { "epoch": 1.81, "learning_rate": 0.00010237040963319328, "loss": 1.4961, "step": 22985 }, { "epoch": 1.81, "learning_rate": 0.00010235868971846006, "loss": 1.5028, "step": 22986 }, { "epoch": 1.81, "learning_rate": 0.00010234697012718507, "loss": 1.442, "step": 22987 }, { "epoch": 1.81, "learning_rate": 0.00010233525085944783, "loss": 1.4895, "step": 22988 }, { "epoch": 1.81, "learning_rate": 0.00010232353191532795, "loss": 1.4778, "step": 22989 }, { "epoch": 1.81, "learning_rate": 0.00010231181329490499, "loss": 1.4689, "step": 22990 }, { "epoch": 1.81, "learning_rate": 0.00010230009499825848, "loss": 1.5079, "step": 22991 }, { "epoch": 1.81, "learning_rate": 0.00010228837702546801, "loss": 1.4551, "step": 22992 }, { "epoch": 1.81, "learning_rate": 0.00010227665937661313, "loss": 1.496, "step": 22993 }, { "epoch": 1.81, "learning_rate": 0.00010226494205177339, "loss": 1.4893, "step": 22994 }, { "epoch": 1.81, "learning_rate": 0.00010225322505102839, "loss": 1.5217, "step": 22995 }, { "epoch": 1.81, "learning_rate": 0.00010224150837445759, "loss": 1.4603, "step": 22996 }, { "epoch": 1.81, "learning_rate": 0.00010222979202214062, "loss": 1.5026, "step": 22997 }, { "epoch": 1.81, "learning_rate": 0.00010221807599415697, "loss": 1.5203, "step": 22998 }, { "epoch": 1.81, "learning_rate": 0.00010220636029058624, "loss": 1.5108, "step": 22999 }, { "epoch": 1.81, "learning_rate": 0.00010219464491150799, "loss": 1.4758, "step": 23000 }, { "epoch": 1.81, "learning_rate": 0.00010218292985700162, "loss": 1.5473, "step": 23001 }, { "epoch": 1.81, "learning_rate": 0.00010217121512714682, "loss": 1.4933, "step": 23002 }, { "epoch": 1.81, "learning_rate": 0.00010215950072202307, "loss": 1.5054, "step": 23003 }, { "epoch": 1.81, "learning_rate": 0.00010214778664170995, "loss": 1.448, "step": 23004 }, { "epoch": 1.81, "learning_rate": 0.00010213607288628692, "loss": 1.4779, "step": 23005 }, { "epoch": 1.81, "learning_rate": 0.00010212435945583352, "loss": 1.4982, "step": 23006 }, { "epoch": 1.81, "learning_rate": 0.00010211264635042933, "loss": 1.5869, "step": 23007 }, { "epoch": 1.81, "learning_rate": 0.00010210093357015384, "loss": 1.5239, "step": 23008 }, { "epoch": 1.81, "learning_rate": 0.0001020892211150866, "loss": 1.4848, "step": 23009 }, { "epoch": 1.81, "learning_rate": 0.00010207750898530707, "loss": 1.5005, "step": 23010 }, { "epoch": 1.81, "learning_rate": 0.0001020657971808948, "loss": 1.5111, "step": 23011 }, { "epoch": 1.81, "learning_rate": 0.00010205408570192937, "loss": 1.4591, "step": 23012 }, { "epoch": 1.81, "learning_rate": 0.0001020423745484902, "loss": 1.5381, "step": 23013 }, { "epoch": 1.81, "learning_rate": 0.00010203066372065684, "loss": 1.5171, "step": 23014 }, { "epoch": 1.81, "learning_rate": 0.00010201895321850883, "loss": 1.5242, "step": 23015 }, { "epoch": 1.81, "learning_rate": 0.00010200724304212562, "loss": 1.4484, "step": 23016 }, { "epoch": 1.81, "learning_rate": 0.00010199553319158671, "loss": 1.5298, "step": 23017 }, { "epoch": 1.81, "learning_rate": 0.00010198382366697168, "loss": 1.4984, "step": 23018 }, { "epoch": 1.81, "learning_rate": 0.00010197211446836002, "loss": 1.4855, "step": 23019 }, { "epoch": 1.81, "learning_rate": 0.00010196040559583115, "loss": 1.5343, "step": 23020 }, { "epoch": 1.81, "learning_rate": 0.00010194869704946465, "loss": 1.5338, "step": 23021 }, { "epoch": 1.81, "learning_rate": 0.00010193698882933998, "loss": 1.5077, "step": 23022 }, { "epoch": 1.81, "learning_rate": 0.0001019252809355366, "loss": 1.496, "step": 23023 }, { "epoch": 1.81, "learning_rate": 0.00010191357336813408, "loss": 1.4513, "step": 23024 }, { "epoch": 1.81, "learning_rate": 0.00010190186612721182, "loss": 1.4927, "step": 23025 }, { "epoch": 1.81, "learning_rate": 0.00010189015921284938, "loss": 1.5307, "step": 23026 }, { "epoch": 1.81, "learning_rate": 0.0001018784526251262, "loss": 1.4922, "step": 23027 }, { "epoch": 1.81, "learning_rate": 0.00010186674636412174, "loss": 1.5316, "step": 23028 }, { "epoch": 1.81, "learning_rate": 0.00010185504042991555, "loss": 1.4437, "step": 23029 }, { "epoch": 1.81, "learning_rate": 0.00010184333482258704, "loss": 1.5198, "step": 23030 }, { "epoch": 1.81, "learning_rate": 0.0001018316295422157, "loss": 1.5083, "step": 23031 }, { "epoch": 1.81, "learning_rate": 0.00010181992458888098, "loss": 1.4806, "step": 23032 }, { "epoch": 1.81, "learning_rate": 0.00010180821996266248, "loss": 1.5073, "step": 23033 }, { "epoch": 1.81, "learning_rate": 0.00010179651566363951, "loss": 1.467, "step": 23034 }, { "epoch": 1.81, "learning_rate": 0.00010178481169189161, "loss": 1.467, "step": 23035 }, { "epoch": 1.81, "learning_rate": 0.00010177310804749827, "loss": 1.4938, "step": 23036 }, { "epoch": 1.81, "learning_rate": 0.00010176140473053887, "loss": 1.4996, "step": 23037 }, { "epoch": 1.81, "learning_rate": 0.00010174970174109293, "loss": 1.4971, "step": 23038 }, { "epoch": 1.81, "learning_rate": 0.00010173799907923988, "loss": 1.448, "step": 23039 }, { "epoch": 1.81, "learning_rate": 0.00010172629674505917, "loss": 1.5061, "step": 23040 }, { "epoch": 1.81, "learning_rate": 0.0001017145947386303, "loss": 1.4966, "step": 23041 }, { "epoch": 1.81, "learning_rate": 0.00010170289306003266, "loss": 1.4931, "step": 23042 }, { "epoch": 1.81, "learning_rate": 0.00010169119170934572, "loss": 1.5274, "step": 23043 }, { "epoch": 1.81, "learning_rate": 0.00010167949068664896, "loss": 1.4545, "step": 23044 }, { "epoch": 1.81, "learning_rate": 0.00010166778999202176, "loss": 1.4611, "step": 23045 }, { "epoch": 1.81, "learning_rate": 0.00010165608962554362, "loss": 1.4817, "step": 23046 }, { "epoch": 1.81, "learning_rate": 0.00010164438958729393, "loss": 1.4668, "step": 23047 }, { "epoch": 1.81, "learning_rate": 0.00010163268987735211, "loss": 1.5251, "step": 23048 }, { "epoch": 1.81, "learning_rate": 0.00010162099049579767, "loss": 1.4751, "step": 23049 }, { "epoch": 1.81, "learning_rate": 0.00010160929144271005, "loss": 1.5318, "step": 23050 }, { "epoch": 1.81, "learning_rate": 0.00010159759271816858, "loss": 1.4913, "step": 23051 }, { "epoch": 1.81, "learning_rate": 0.00010158589432225278, "loss": 1.5081, "step": 23052 }, { "epoch": 1.81, "learning_rate": 0.00010157419625504204, "loss": 1.4747, "step": 23053 }, { "epoch": 1.81, "learning_rate": 0.00010156249851661577, "loss": 1.494, "step": 23054 }, { "epoch": 1.81, "learning_rate": 0.00010155080110705343, "loss": 1.4563, "step": 23055 }, { "epoch": 1.81, "learning_rate": 0.00010153910402643439, "loss": 1.5073, "step": 23056 }, { "epoch": 1.81, "learning_rate": 0.00010152740727483809, "loss": 1.4669, "step": 23057 }, { "epoch": 1.81, "learning_rate": 0.00010151571085234395, "loss": 1.5015, "step": 23058 }, { "epoch": 1.81, "learning_rate": 0.0001015040147590314, "loss": 1.4809, "step": 23059 }, { "epoch": 1.81, "learning_rate": 0.00010149231899497979, "loss": 1.4894, "step": 23060 }, { "epoch": 1.81, "learning_rate": 0.00010148062356026859, "loss": 1.4793, "step": 23061 }, { "epoch": 1.81, "learning_rate": 0.00010146892845497716, "loss": 1.4813, "step": 23062 }, { "epoch": 1.81, "learning_rate": 0.00010145723367918496, "loss": 1.4445, "step": 23063 }, { "epoch": 1.81, "learning_rate": 0.00010144553923297125, "loss": 1.4913, "step": 23064 }, { "epoch": 1.81, "learning_rate": 0.00010143384511641564, "loss": 1.4849, "step": 23065 }, { "epoch": 1.81, "learning_rate": 0.00010142215132959738, "loss": 1.5091, "step": 23066 }, { "epoch": 1.81, "learning_rate": 0.00010141045787259595, "loss": 1.5116, "step": 23067 }, { "epoch": 1.82, "learning_rate": 0.00010139876474549067, "loss": 1.4573, "step": 23068 }, { "epoch": 1.82, "learning_rate": 0.00010138707194836093, "loss": 1.4778, "step": 23069 }, { "epoch": 1.82, "learning_rate": 0.00010137537948128618, "loss": 1.491, "step": 23070 }, { "epoch": 1.82, "learning_rate": 0.00010136368734434576, "loss": 1.4263, "step": 23071 }, { "epoch": 1.82, "learning_rate": 0.00010135199553761906, "loss": 1.4591, "step": 23072 }, { "epoch": 1.82, "learning_rate": 0.00010134030406118548, "loss": 1.5257, "step": 23073 }, { "epoch": 1.82, "learning_rate": 0.00010132861291512436, "loss": 1.4615, "step": 23074 }, { "epoch": 1.82, "learning_rate": 0.00010131692209951513, "loss": 1.4619, "step": 23075 }, { "epoch": 1.82, "learning_rate": 0.00010130523161443708, "loss": 1.5101, "step": 23076 }, { "epoch": 1.82, "learning_rate": 0.00010129354145996967, "loss": 1.5424, "step": 23077 }, { "epoch": 1.82, "learning_rate": 0.00010128185163619227, "loss": 1.497, "step": 23078 }, { "epoch": 1.82, "learning_rate": 0.00010127016214318413, "loss": 1.548, "step": 23079 }, { "epoch": 1.82, "learning_rate": 0.00010125847298102473, "loss": 1.4805, "step": 23080 }, { "epoch": 1.82, "learning_rate": 0.0001012467841497934, "loss": 1.5035, "step": 23081 }, { "epoch": 1.82, "learning_rate": 0.00010123509564956953, "loss": 1.4556, "step": 23082 }, { "epoch": 1.82, "learning_rate": 0.00010122340748043242, "loss": 1.5092, "step": 23083 }, { "epoch": 1.82, "learning_rate": 0.0001012117196424615, "loss": 1.5532, "step": 23084 }, { "epoch": 1.82, "learning_rate": 0.00010120003213573604, "loss": 1.476, "step": 23085 }, { "epoch": 1.82, "learning_rate": 0.00010118834496033542, "loss": 1.5387, "step": 23086 }, { "epoch": 1.82, "learning_rate": 0.00010117665811633905, "loss": 1.4975, "step": 23087 }, { "epoch": 1.82, "learning_rate": 0.0001011649716038262, "loss": 1.4863, "step": 23088 }, { "epoch": 1.82, "learning_rate": 0.00010115328542287622, "loss": 1.5355, "step": 23089 }, { "epoch": 1.82, "learning_rate": 0.00010114159957356854, "loss": 1.4692, "step": 23090 }, { "epoch": 1.82, "learning_rate": 0.00010112991405598238, "loss": 1.4596, "step": 23091 }, { "epoch": 1.82, "learning_rate": 0.00010111822887019717, "loss": 1.498, "step": 23092 }, { "epoch": 1.82, "learning_rate": 0.0001011065440162922, "loss": 1.4717, "step": 23093 }, { "epoch": 1.82, "learning_rate": 0.00010109485949434678, "loss": 1.519, "step": 23094 }, { "epoch": 1.82, "learning_rate": 0.00010108317530444027, "loss": 1.5225, "step": 23095 }, { "epoch": 1.82, "learning_rate": 0.00010107149144665206, "loss": 1.5158, "step": 23096 }, { "epoch": 1.82, "learning_rate": 0.0001010598079210614, "loss": 1.4734, "step": 23097 }, { "epoch": 1.82, "learning_rate": 0.00010104812472774762, "loss": 1.471, "step": 23098 }, { "epoch": 1.82, "learning_rate": 0.00010103644186679009, "loss": 1.4027, "step": 23099 }, { "epoch": 1.82, "learning_rate": 0.00010102475933826809, "loss": 1.4616, "step": 23100 }, { "epoch": 1.82, "learning_rate": 0.00010101307714226093, "loss": 1.44, "step": 23101 }, { "epoch": 1.82, "learning_rate": 0.00010100139527884799, "loss": 1.4507, "step": 23102 }, { "epoch": 1.82, "learning_rate": 0.00010098971374810847, "loss": 1.5042, "step": 23103 }, { "epoch": 1.82, "learning_rate": 0.00010097803255012181, "loss": 1.4895, "step": 23104 }, { "epoch": 1.82, "learning_rate": 0.00010096635168496722, "loss": 1.5046, "step": 23105 }, { "epoch": 1.82, "learning_rate": 0.00010095467115272404, "loss": 1.4742, "step": 23106 }, { "epoch": 1.82, "learning_rate": 0.00010094299095347161, "loss": 1.5331, "step": 23107 }, { "epoch": 1.82, "learning_rate": 0.00010093131108728918, "loss": 1.4922, "step": 23108 }, { "epoch": 1.82, "learning_rate": 0.00010091963155425606, "loss": 1.4882, "step": 23109 }, { "epoch": 1.82, "learning_rate": 0.00010090795235445157, "loss": 1.5499, "step": 23110 }, { "epoch": 1.82, "learning_rate": 0.00010089627348795494, "loss": 1.4763, "step": 23111 }, { "epoch": 1.82, "learning_rate": 0.00010088459495484555, "loss": 1.5037, "step": 23112 }, { "epoch": 1.82, "learning_rate": 0.00010087291675520265, "loss": 1.4663, "step": 23113 }, { "epoch": 1.82, "learning_rate": 0.00010086123888910558, "loss": 1.5126, "step": 23114 }, { "epoch": 1.82, "learning_rate": 0.00010084956135663355, "loss": 1.492, "step": 23115 }, { "epoch": 1.82, "learning_rate": 0.0001008378841578659, "loss": 1.5243, "step": 23116 }, { "epoch": 1.82, "learning_rate": 0.00010082620729288185, "loss": 1.4971, "step": 23117 }, { "epoch": 1.82, "learning_rate": 0.00010081453076176071, "loss": 1.4985, "step": 23118 }, { "epoch": 1.82, "learning_rate": 0.0001008028545645818, "loss": 1.5018, "step": 23119 }, { "epoch": 1.82, "learning_rate": 0.00010079117870142435, "loss": 1.4952, "step": 23120 }, { "epoch": 1.82, "learning_rate": 0.00010077950317236764, "loss": 1.5402, "step": 23121 }, { "epoch": 1.82, "learning_rate": 0.00010076782797749094, "loss": 1.5079, "step": 23122 }, { "epoch": 1.82, "learning_rate": 0.0001007561531168735, "loss": 1.4781, "step": 23123 }, { "epoch": 1.82, "learning_rate": 0.00010074447859059464, "loss": 1.4385, "step": 23124 }, { "epoch": 1.82, "learning_rate": 0.00010073280439873356, "loss": 1.4781, "step": 23125 }, { "epoch": 1.82, "learning_rate": 0.00010072113054136954, "loss": 1.4826, "step": 23126 }, { "epoch": 1.82, "learning_rate": 0.00010070945701858183, "loss": 1.4774, "step": 23127 }, { "epoch": 1.82, "learning_rate": 0.00010069778383044977, "loss": 1.4778, "step": 23128 }, { "epoch": 1.82, "learning_rate": 0.00010068611097705252, "loss": 1.4795, "step": 23129 }, { "epoch": 1.82, "learning_rate": 0.00010067443845846935, "loss": 1.5305, "step": 23130 }, { "epoch": 1.82, "learning_rate": 0.00010066276627477956, "loss": 1.508, "step": 23131 }, { "epoch": 1.82, "learning_rate": 0.00010065109442606234, "loss": 1.5115, "step": 23132 }, { "epoch": 1.82, "learning_rate": 0.00010063942291239697, "loss": 1.5617, "step": 23133 }, { "epoch": 1.82, "learning_rate": 0.00010062775173386266, "loss": 1.5114, "step": 23134 }, { "epoch": 1.82, "learning_rate": 0.00010061608089053865, "loss": 1.4871, "step": 23135 }, { "epoch": 1.82, "learning_rate": 0.00010060441038250424, "loss": 1.4669, "step": 23136 }, { "epoch": 1.82, "learning_rate": 0.0001005927402098386, "loss": 1.4519, "step": 23137 }, { "epoch": 1.82, "learning_rate": 0.00010058107037262102, "loss": 1.4105, "step": 23138 }, { "epoch": 1.82, "learning_rate": 0.00010056940087093068, "loss": 1.5392, "step": 23139 }, { "epoch": 1.82, "learning_rate": 0.00010055773170484681, "loss": 1.4741, "step": 23140 }, { "epoch": 1.82, "learning_rate": 0.0001005460628744487, "loss": 1.4988, "step": 23141 }, { "epoch": 1.82, "learning_rate": 0.00010053439437981544, "loss": 1.4855, "step": 23142 }, { "epoch": 1.82, "learning_rate": 0.00010052272622102644, "loss": 1.4614, "step": 23143 }, { "epoch": 1.82, "learning_rate": 0.00010051105839816078, "loss": 1.4421, "step": 23144 }, { "epoch": 1.82, "learning_rate": 0.00010049939091129776, "loss": 1.482, "step": 23145 }, { "epoch": 1.82, "learning_rate": 0.00010048772376051651, "loss": 1.4988, "step": 23146 }, { "epoch": 1.82, "learning_rate": 0.00010047605694589633, "loss": 1.4412, "step": 23147 }, { "epoch": 1.82, "learning_rate": 0.0001004643904675164, "loss": 1.4968, "step": 23148 }, { "epoch": 1.82, "learning_rate": 0.00010045272432545592, "loss": 1.5058, "step": 23149 }, { "epoch": 1.82, "learning_rate": 0.00010044105851979408, "loss": 1.512, "step": 23150 }, { "epoch": 1.82, "learning_rate": 0.00010042939305061011, "loss": 1.4854, "step": 23151 }, { "epoch": 1.82, "learning_rate": 0.0001004177279179832, "loss": 1.5431, "step": 23152 }, { "epoch": 1.82, "learning_rate": 0.00010040606312199258, "loss": 1.4484, "step": 23153 }, { "epoch": 1.82, "learning_rate": 0.0001003943986627174, "loss": 1.4796, "step": 23154 }, { "epoch": 1.82, "learning_rate": 0.00010038273454023688, "loss": 1.4992, "step": 23155 }, { "epoch": 1.82, "learning_rate": 0.00010037107075463023, "loss": 1.4708, "step": 23156 }, { "epoch": 1.82, "learning_rate": 0.0001003594073059766, "loss": 1.5394, "step": 23157 }, { "epoch": 1.82, "learning_rate": 0.00010034774419435517, "loss": 1.5295, "step": 23158 }, { "epoch": 1.82, "learning_rate": 0.00010033608141984517, "loss": 1.423, "step": 23159 }, { "epoch": 1.82, "learning_rate": 0.00010032441898252584, "loss": 1.4703, "step": 23160 }, { "epoch": 1.82, "learning_rate": 0.00010031275688247622, "loss": 1.543, "step": 23161 }, { "epoch": 1.82, "learning_rate": 0.00010030109511977561, "loss": 1.4311, "step": 23162 }, { "epoch": 1.82, "learning_rate": 0.00010028943369450311, "loss": 1.5006, "step": 23163 }, { "epoch": 1.82, "learning_rate": 0.00010027777260673792, "loss": 1.4791, "step": 23164 }, { "epoch": 1.82, "learning_rate": 0.00010026611185655924, "loss": 1.5414, "step": 23165 }, { "epoch": 1.82, "learning_rate": 0.0001002544514440462, "loss": 1.4892, "step": 23166 }, { "epoch": 1.82, "learning_rate": 0.000100242791369278, "loss": 1.4704, "step": 23167 }, { "epoch": 1.82, "learning_rate": 0.00010023113163233375, "loss": 1.5016, "step": 23168 }, { "epoch": 1.82, "learning_rate": 0.00010021947223329267, "loss": 1.4912, "step": 23169 }, { "epoch": 1.82, "learning_rate": 0.00010020781317223392, "loss": 1.4829, "step": 23170 }, { "epoch": 1.82, "learning_rate": 0.00010019615444923662, "loss": 1.4721, "step": 23171 }, { "epoch": 1.82, "learning_rate": 0.00010018449606437995, "loss": 1.5134, "step": 23172 }, { "epoch": 1.82, "learning_rate": 0.00010017283801774308, "loss": 1.5038, "step": 23173 }, { "epoch": 1.82, "learning_rate": 0.00010016118030940508, "loss": 1.5026, "step": 23174 }, { "epoch": 1.82, "learning_rate": 0.0001001495229394452, "loss": 1.4628, "step": 23175 }, { "epoch": 1.82, "learning_rate": 0.00010013786590794255, "loss": 1.4898, "step": 23176 }, { "epoch": 1.82, "learning_rate": 0.0001001262092149763, "loss": 1.5195, "step": 23177 }, { "epoch": 1.82, "learning_rate": 0.00010011455286062555, "loss": 1.5194, "step": 23178 }, { "epoch": 1.82, "learning_rate": 0.00010010289684496946, "loss": 1.4768, "step": 23179 }, { "epoch": 1.82, "learning_rate": 0.00010009124116808717, "loss": 1.4865, "step": 23180 }, { "epoch": 1.82, "learning_rate": 0.00010007958583005778, "loss": 1.4597, "step": 23181 }, { "epoch": 1.82, "learning_rate": 0.0001000679308309605, "loss": 1.4952, "step": 23182 }, { "epoch": 1.82, "learning_rate": 0.00010005627617087437, "loss": 1.4849, "step": 23183 }, { "epoch": 1.82, "learning_rate": 0.00010004462184987858, "loss": 1.4883, "step": 23184 }, { "epoch": 1.82, "learning_rate": 0.00010003296786805229, "loss": 1.5479, "step": 23185 }, { "epoch": 1.82, "learning_rate": 0.0001000213142254745, "loss": 1.4993, "step": 23186 }, { "epoch": 1.82, "learning_rate": 0.00010000966092222444, "loss": 1.4793, "step": 23187 }, { "epoch": 1.82, "learning_rate": 9.999800795838119e-05, "loss": 1.4786, "step": 23188 }, { "epoch": 1.82, "learning_rate": 9.998635533402383e-05, "loss": 1.4791, "step": 23189 }, { "epoch": 1.82, "learning_rate": 9.997470304923156e-05, "loss": 1.5096, "step": 23190 }, { "epoch": 1.82, "learning_rate": 9.996305110408345e-05, "loss": 1.4732, "step": 23191 }, { "epoch": 1.82, "learning_rate": 9.995139949865862e-05, "loss": 1.4746, "step": 23192 }, { "epoch": 1.82, "learning_rate": 9.993974823303615e-05, "loss": 1.5067, "step": 23193 }, { "epoch": 1.82, "learning_rate": 9.992809730729518e-05, "loss": 1.4806, "step": 23194 }, { "epoch": 1.83, "learning_rate": 9.99164467215148e-05, "loss": 1.4541, "step": 23195 }, { "epoch": 1.83, "learning_rate": 9.990479647577411e-05, "loss": 1.4791, "step": 23196 }, { "epoch": 1.83, "learning_rate": 9.989314657015219e-05, "loss": 1.528, "step": 23197 }, { "epoch": 1.83, "learning_rate": 9.988149700472813e-05, "loss": 1.5084, "step": 23198 }, { "epoch": 1.83, "learning_rate": 9.986984777958112e-05, "loss": 1.5612, "step": 23199 }, { "epoch": 1.83, "learning_rate": 9.985819889479011e-05, "loss": 1.5408, "step": 23200 }, { "epoch": 1.83, "learning_rate": 9.984655035043428e-05, "loss": 1.5164, "step": 23201 }, { "epoch": 1.83, "learning_rate": 9.98349021465927e-05, "loss": 1.4374, "step": 23202 }, { "epoch": 1.83, "learning_rate": 9.982325428334446e-05, "loss": 1.4252, "step": 23203 }, { "epoch": 1.83, "learning_rate": 9.981160676076866e-05, "loss": 1.4942, "step": 23204 }, { "epoch": 1.83, "learning_rate": 9.979995957894424e-05, "loss": 1.4809, "step": 23205 }, { "epoch": 1.83, "learning_rate": 9.978831273795049e-05, "loss": 1.483, "step": 23206 }, { "epoch": 1.83, "learning_rate": 9.977666623786636e-05, "loss": 1.5499, "step": 23207 }, { "epoch": 1.83, "learning_rate": 9.976502007877098e-05, "loss": 1.4879, "step": 23208 }, { "epoch": 1.83, "learning_rate": 9.975337426074335e-05, "loss": 1.5193, "step": 23209 }, { "epoch": 1.83, "learning_rate": 9.97417287838626e-05, "loss": 1.4998, "step": 23210 }, { "epoch": 1.83, "learning_rate": 9.97300836482078e-05, "loss": 1.5015, "step": 23211 }, { "epoch": 1.83, "learning_rate": 9.971843885385795e-05, "loss": 1.52, "step": 23212 }, { "epoch": 1.83, "learning_rate": 9.970679440089218e-05, "loss": 1.51, "step": 23213 }, { "epoch": 1.83, "learning_rate": 9.969515028938954e-05, "loss": 1.5337, "step": 23214 }, { "epoch": 1.83, "learning_rate": 9.968350651942902e-05, "loss": 1.4732, "step": 23215 }, { "epoch": 1.83, "learning_rate": 9.967186309108976e-05, "loss": 1.5094, "step": 23216 }, { "epoch": 1.83, "learning_rate": 9.966022000445076e-05, "loss": 1.5066, "step": 23217 }, { "epoch": 1.83, "learning_rate": 9.964857725959107e-05, "loss": 1.4778, "step": 23218 }, { "epoch": 1.83, "learning_rate": 9.963693485658978e-05, "loss": 1.4559, "step": 23219 }, { "epoch": 1.83, "learning_rate": 9.96252927955259e-05, "loss": 1.5343, "step": 23220 }, { "epoch": 1.83, "learning_rate": 9.961365107647847e-05, "loss": 1.5254, "step": 23221 }, { "epoch": 1.83, "learning_rate": 9.960200969952654e-05, "loss": 1.4689, "step": 23222 }, { "epoch": 1.83, "learning_rate": 9.959036866474917e-05, "loss": 1.4973, "step": 23223 }, { "epoch": 1.83, "learning_rate": 9.957872797222539e-05, "loss": 1.4738, "step": 23224 }, { "epoch": 1.83, "learning_rate": 9.95670876220342e-05, "loss": 1.5202, "step": 23225 }, { "epoch": 1.83, "learning_rate": 9.955544761425468e-05, "loss": 1.4793, "step": 23226 }, { "epoch": 1.83, "learning_rate": 9.954380794896582e-05, "loss": 1.5485, "step": 23227 }, { "epoch": 1.83, "learning_rate": 9.953216862624667e-05, "loss": 1.4828, "step": 23228 }, { "epoch": 1.83, "learning_rate": 9.952052964617624e-05, "loss": 1.5201, "step": 23229 }, { "epoch": 1.83, "learning_rate": 9.950889100883352e-05, "loss": 1.4719, "step": 23230 }, { "epoch": 1.83, "learning_rate": 9.949725271429762e-05, "loss": 1.4592, "step": 23231 }, { "epoch": 1.83, "learning_rate": 9.948561476264749e-05, "loss": 1.5255, "step": 23232 }, { "epoch": 1.83, "learning_rate": 9.947397715396216e-05, "loss": 1.4423, "step": 23233 }, { "epoch": 1.83, "learning_rate": 9.946233988832063e-05, "loss": 1.4989, "step": 23234 }, { "epoch": 1.83, "learning_rate": 9.945070296580192e-05, "loss": 1.5015, "step": 23235 }, { "epoch": 1.83, "learning_rate": 9.943906638648506e-05, "loss": 1.4783, "step": 23236 }, { "epoch": 1.83, "learning_rate": 9.942743015044899e-05, "loss": 1.5405, "step": 23237 }, { "epoch": 1.83, "learning_rate": 9.941579425777279e-05, "loss": 1.476, "step": 23238 }, { "epoch": 1.83, "learning_rate": 9.940415870853542e-05, "loss": 1.4923, "step": 23239 }, { "epoch": 1.83, "learning_rate": 9.939252350281595e-05, "loss": 1.5342, "step": 23240 }, { "epoch": 1.83, "learning_rate": 9.938088864069326e-05, "loss": 1.4878, "step": 23241 }, { "epoch": 1.83, "learning_rate": 9.936925412224642e-05, "loss": 1.4526, "step": 23242 }, { "epoch": 1.83, "learning_rate": 9.935761994755441e-05, "loss": 1.5063, "step": 23243 }, { "epoch": 1.83, "learning_rate": 9.934598611669621e-05, "loss": 1.4893, "step": 23244 }, { "epoch": 1.83, "learning_rate": 9.933435262975082e-05, "loss": 1.4756, "step": 23245 }, { "epoch": 1.83, "learning_rate": 9.93227194867972e-05, "loss": 1.5063, "step": 23246 }, { "epoch": 1.83, "learning_rate": 9.931108668791433e-05, "loss": 1.4604, "step": 23247 }, { "epoch": 1.83, "learning_rate": 9.929945423318127e-05, "loss": 1.5556, "step": 23248 }, { "epoch": 1.83, "learning_rate": 9.92878221226769e-05, "loss": 1.4782, "step": 23249 }, { "epoch": 1.83, "learning_rate": 9.927619035648023e-05, "loss": 1.4677, "step": 23250 }, { "epoch": 1.83, "learning_rate": 9.926455893467024e-05, "loss": 1.4752, "step": 23251 }, { "epoch": 1.83, "learning_rate": 9.925292785732585e-05, "loss": 1.5321, "step": 23252 }, { "epoch": 1.83, "learning_rate": 9.924129712452611e-05, "loss": 1.4372, "step": 23253 }, { "epoch": 1.83, "learning_rate": 9.922966673634995e-05, "loss": 1.4731, "step": 23254 }, { "epoch": 1.83, "learning_rate": 9.921803669287638e-05, "loss": 1.5141, "step": 23255 }, { "epoch": 1.83, "learning_rate": 9.920640699418427e-05, "loss": 1.5115, "step": 23256 }, { "epoch": 1.83, "learning_rate": 9.919477764035266e-05, "loss": 1.5025, "step": 23257 }, { "epoch": 1.83, "learning_rate": 9.918314863146045e-05, "loss": 1.5393, "step": 23258 }, { "epoch": 1.83, "learning_rate": 9.917151996758661e-05, "loss": 1.4938, "step": 23259 }, { "epoch": 1.83, "learning_rate": 9.915989164881013e-05, "loss": 1.5019, "step": 23260 }, { "epoch": 1.83, "learning_rate": 9.91482636752099e-05, "loss": 1.4829, "step": 23261 }, { "epoch": 1.83, "learning_rate": 9.913663604686494e-05, "loss": 1.5005, "step": 23262 }, { "epoch": 1.83, "learning_rate": 9.912500876385411e-05, "loss": 1.4897, "step": 23263 }, { "epoch": 1.83, "learning_rate": 9.911338182625639e-05, "loss": 1.5313, "step": 23264 }, { "epoch": 1.83, "learning_rate": 9.910175523415076e-05, "loss": 1.4891, "step": 23265 }, { "epoch": 1.83, "learning_rate": 9.90901289876161e-05, "loss": 1.4781, "step": 23266 }, { "epoch": 1.83, "learning_rate": 9.907850308673136e-05, "loss": 1.4773, "step": 23267 }, { "epoch": 1.83, "learning_rate": 9.906687753157544e-05, "loss": 1.447, "step": 23268 }, { "epoch": 1.83, "learning_rate": 9.905525232222742e-05, "loss": 1.5631, "step": 23269 }, { "epoch": 1.83, "learning_rate": 9.904362745876608e-05, "loss": 1.4349, "step": 23270 }, { "epoch": 1.83, "learning_rate": 9.903200294127035e-05, "loss": 1.5655, "step": 23271 }, { "epoch": 1.83, "learning_rate": 9.902037876981926e-05, "loss": 1.4839, "step": 23272 }, { "epoch": 1.83, "learning_rate": 9.900875494449162e-05, "loss": 1.4854, "step": 23273 }, { "epoch": 1.83, "learning_rate": 9.899713146536644e-05, "loss": 1.5485, "step": 23274 }, { "epoch": 1.83, "learning_rate": 9.898550833252256e-05, "loss": 1.5119, "step": 23275 }, { "epoch": 1.83, "learning_rate": 9.89738855460389e-05, "loss": 1.4561, "step": 23276 }, { "epoch": 1.83, "learning_rate": 9.896226310599445e-05, "loss": 1.5289, "step": 23277 }, { "epoch": 1.83, "learning_rate": 9.895064101246805e-05, "loss": 1.4963, "step": 23278 }, { "epoch": 1.83, "learning_rate": 9.893901926553862e-05, "loss": 1.463, "step": 23279 }, { "epoch": 1.83, "learning_rate": 9.892739786528508e-05, "loss": 1.4729, "step": 23280 }, { "epoch": 1.83, "learning_rate": 9.891577681178631e-05, "loss": 1.4852, "step": 23281 }, { "epoch": 1.83, "learning_rate": 9.890415610512125e-05, "loss": 1.4672, "step": 23282 }, { "epoch": 1.83, "learning_rate": 9.889253574536874e-05, "loss": 1.4813, "step": 23283 }, { "epoch": 1.83, "learning_rate": 9.888091573260766e-05, "loss": 1.5023, "step": 23284 }, { "epoch": 1.83, "learning_rate": 9.886929606691704e-05, "loss": 1.4814, "step": 23285 }, { "epoch": 1.83, "learning_rate": 9.885767674837566e-05, "loss": 1.5318, "step": 23286 }, { "epoch": 1.83, "learning_rate": 9.884605777706244e-05, "loss": 1.4603, "step": 23287 }, { "epoch": 1.83, "learning_rate": 9.883443915305623e-05, "loss": 1.4687, "step": 23288 }, { "epoch": 1.83, "learning_rate": 9.882282087643597e-05, "loss": 1.4829, "step": 23289 }, { "epoch": 1.83, "learning_rate": 9.881120294728052e-05, "loss": 1.4893, "step": 23290 }, { "epoch": 1.83, "learning_rate": 9.879958536566875e-05, "loss": 1.5107, "step": 23291 }, { "epoch": 1.83, "learning_rate": 9.878796813167952e-05, "loss": 1.4976, "step": 23292 }, { "epoch": 1.83, "learning_rate": 9.877635124539173e-05, "loss": 1.5122, "step": 23293 }, { "epoch": 1.83, "learning_rate": 9.876473470688426e-05, "loss": 1.4882, "step": 23294 }, { "epoch": 1.83, "learning_rate": 9.875311851623596e-05, "loss": 1.4889, "step": 23295 }, { "epoch": 1.83, "learning_rate": 9.87415026735257e-05, "loss": 1.4956, "step": 23296 }, { "epoch": 1.83, "learning_rate": 9.872988717883239e-05, "loss": 1.4513, "step": 23297 }, { "epoch": 1.83, "learning_rate": 9.87182720322348e-05, "loss": 1.5278, "step": 23298 }, { "epoch": 1.83, "learning_rate": 9.870665723381182e-05, "loss": 1.5456, "step": 23299 }, { "epoch": 1.83, "learning_rate": 9.869504278364238e-05, "loss": 1.5336, "step": 23300 }, { "epoch": 1.83, "learning_rate": 9.86834286818053e-05, "loss": 1.4963, "step": 23301 }, { "epoch": 1.83, "learning_rate": 9.867181492837938e-05, "loss": 1.5211, "step": 23302 }, { "epoch": 1.83, "learning_rate": 9.866020152344354e-05, "loss": 1.5356, "step": 23303 }, { "epoch": 1.83, "learning_rate": 9.86485884670766e-05, "loss": 1.505, "step": 23304 }, { "epoch": 1.83, "learning_rate": 9.863697575935738e-05, "loss": 1.4933, "step": 23305 }, { "epoch": 1.83, "learning_rate": 9.862536340036478e-05, "loss": 1.5003, "step": 23306 }, { "epoch": 1.83, "learning_rate": 9.861375139017762e-05, "loss": 1.524, "step": 23307 }, { "epoch": 1.83, "learning_rate": 9.860213972887469e-05, "loss": 1.4502, "step": 23308 }, { "epoch": 1.83, "learning_rate": 9.859052841653492e-05, "loss": 1.5013, "step": 23309 }, { "epoch": 1.83, "learning_rate": 9.857891745323704e-05, "loss": 1.489, "step": 23310 }, { "epoch": 1.83, "learning_rate": 9.856730683905997e-05, "loss": 1.4755, "step": 23311 }, { "epoch": 1.83, "learning_rate": 9.855569657408248e-05, "loss": 1.4971, "step": 23312 }, { "epoch": 1.83, "learning_rate": 9.854408665838343e-05, "loss": 1.5056, "step": 23313 }, { "epoch": 1.83, "learning_rate": 9.853247709204165e-05, "loss": 1.5129, "step": 23314 }, { "epoch": 1.83, "learning_rate": 9.852086787513589e-05, "loss": 1.4901, "step": 23315 }, { "epoch": 1.83, "learning_rate": 9.850925900774508e-05, "loss": 1.4541, "step": 23316 }, { "epoch": 1.83, "learning_rate": 9.849765048994796e-05, "loss": 1.4747, "step": 23317 }, { "epoch": 1.83, "learning_rate": 9.848604232182342e-05, "loss": 1.4944, "step": 23318 }, { "epoch": 1.83, "learning_rate": 9.847443450345018e-05, "loss": 1.482, "step": 23319 }, { "epoch": 1.83, "learning_rate": 9.846282703490715e-05, "loss": 1.4598, "step": 23320 }, { "epoch": 1.83, "learning_rate": 9.8451219916273e-05, "loss": 1.4648, "step": 23321 }, { "epoch": 1.84, "learning_rate": 9.843961314762668e-05, "loss": 1.5068, "step": 23322 }, { "epoch": 1.84, "learning_rate": 9.842800672904693e-05, "loss": 1.4899, "step": 23323 }, { "epoch": 1.84, "learning_rate": 9.841640066061254e-05, "loss": 1.4411, "step": 23324 }, { "epoch": 1.84, "learning_rate": 9.840479494240231e-05, "loss": 1.4817, "step": 23325 }, { "epoch": 1.84, "learning_rate": 9.839318957449509e-05, "loss": 1.5139, "step": 23326 }, { "epoch": 1.84, "learning_rate": 9.83815845569696e-05, "loss": 1.5073, "step": 23327 }, { "epoch": 1.84, "learning_rate": 9.83699798899047e-05, "loss": 1.5103, "step": 23328 }, { "epoch": 1.84, "learning_rate": 9.83583755733791e-05, "loss": 1.4886, "step": 23329 }, { "epoch": 1.84, "learning_rate": 9.834677160747164e-05, "loss": 1.5074, "step": 23330 }, { "epoch": 1.84, "learning_rate": 9.833516799226107e-05, "loss": 1.4846, "step": 23331 }, { "epoch": 1.84, "learning_rate": 9.832356472782626e-05, "loss": 1.5083, "step": 23332 }, { "epoch": 1.84, "learning_rate": 9.83119618142459e-05, "loss": 1.4695, "step": 23333 }, { "epoch": 1.84, "learning_rate": 9.83003592515988e-05, "loss": 1.4922, "step": 23334 }, { "epoch": 1.84, "learning_rate": 9.828875703996372e-05, "loss": 1.4509, "step": 23335 }, { "epoch": 1.84, "learning_rate": 9.827715517941945e-05, "loss": 1.4694, "step": 23336 }, { "epoch": 1.84, "learning_rate": 9.826555367004476e-05, "loss": 1.5196, "step": 23337 }, { "epoch": 1.84, "learning_rate": 9.825395251191842e-05, "loss": 1.4977, "step": 23338 }, { "epoch": 1.84, "learning_rate": 9.824235170511917e-05, "loss": 1.4824, "step": 23339 }, { "epoch": 1.84, "learning_rate": 9.823075124972583e-05, "loss": 1.4403, "step": 23340 }, { "epoch": 1.84, "learning_rate": 9.821915114581706e-05, "loss": 1.4389, "step": 23341 }, { "epoch": 1.84, "learning_rate": 9.82075513934717e-05, "loss": 1.5082, "step": 23342 }, { "epoch": 1.84, "learning_rate": 9.81959519927685e-05, "loss": 1.4626, "step": 23343 }, { "epoch": 1.84, "learning_rate": 9.818435294378617e-05, "loss": 1.4829, "step": 23344 }, { "epoch": 1.84, "learning_rate": 9.817275424660352e-05, "loss": 1.5267, "step": 23345 }, { "epoch": 1.84, "learning_rate": 9.816115590129925e-05, "loss": 1.4914, "step": 23346 }, { "epoch": 1.84, "learning_rate": 9.814955790795211e-05, "loss": 1.4862, "step": 23347 }, { "epoch": 1.84, "learning_rate": 9.813796026664086e-05, "loss": 1.5304, "step": 23348 }, { "epoch": 1.84, "learning_rate": 9.812636297744427e-05, "loss": 1.4628, "step": 23349 }, { "epoch": 1.84, "learning_rate": 9.811476604044102e-05, "loss": 1.4947, "step": 23350 }, { "epoch": 1.84, "learning_rate": 9.81031694557099e-05, "loss": 1.5369, "step": 23351 }, { "epoch": 1.84, "learning_rate": 9.809157322332962e-05, "loss": 1.4544, "step": 23352 }, { "epoch": 1.84, "learning_rate": 9.80799773433789e-05, "loss": 1.4716, "step": 23353 }, { "epoch": 1.84, "learning_rate": 9.806838181593648e-05, "loss": 1.5128, "step": 23354 }, { "epoch": 1.84, "learning_rate": 9.80567866410811e-05, "loss": 1.4711, "step": 23355 }, { "epoch": 1.84, "learning_rate": 9.804519181889146e-05, "loss": 1.5027, "step": 23356 }, { "epoch": 1.84, "learning_rate": 9.803359734944633e-05, "loss": 1.4414, "step": 23357 }, { "epoch": 1.84, "learning_rate": 9.802200323282436e-05, "loss": 1.4758, "step": 23358 }, { "epoch": 1.84, "learning_rate": 9.801040946910431e-05, "loss": 1.4998, "step": 23359 }, { "epoch": 1.84, "learning_rate": 9.799881605836493e-05, "loss": 1.5293, "step": 23360 }, { "epoch": 1.84, "learning_rate": 9.798722300068482e-05, "loss": 1.4766, "step": 23361 }, { "epoch": 1.84, "learning_rate": 9.797563029614278e-05, "loss": 1.4813, "step": 23362 }, { "epoch": 1.84, "learning_rate": 9.796403794481751e-05, "loss": 1.4586, "step": 23363 }, { "epoch": 1.84, "learning_rate": 9.795244594678774e-05, "loss": 1.4692, "step": 23364 }, { "epoch": 1.84, "learning_rate": 9.79408543021321e-05, "loss": 1.461, "step": 23365 }, { "epoch": 1.84, "learning_rate": 9.792926301092934e-05, "loss": 1.492, "step": 23366 }, { "epoch": 1.84, "learning_rate": 9.791767207325819e-05, "loss": 1.5019, "step": 23367 }, { "epoch": 1.84, "learning_rate": 9.790608148919726e-05, "loss": 1.4644, "step": 23368 }, { "epoch": 1.84, "learning_rate": 9.789449125882531e-05, "loss": 1.4834, "step": 23369 }, { "epoch": 1.84, "learning_rate": 9.7882901382221e-05, "loss": 1.4351, "step": 23370 }, { "epoch": 1.84, "learning_rate": 9.787131185946303e-05, "loss": 1.4679, "step": 23371 }, { "epoch": 1.84, "learning_rate": 9.78597226906301e-05, "loss": 1.4277, "step": 23372 }, { "epoch": 1.84, "learning_rate": 9.784813387580086e-05, "loss": 1.494, "step": 23373 }, { "epoch": 1.84, "learning_rate": 9.783654541505404e-05, "loss": 1.4189, "step": 23374 }, { "epoch": 1.84, "learning_rate": 9.782495730846825e-05, "loss": 1.4776, "step": 23375 }, { "epoch": 1.84, "learning_rate": 9.781336955612222e-05, "loss": 1.4519, "step": 23376 }, { "epoch": 1.84, "learning_rate": 9.780178215809465e-05, "loss": 1.4571, "step": 23377 }, { "epoch": 1.84, "learning_rate": 9.779019511446409e-05, "loss": 1.4977, "step": 23378 }, { "epoch": 1.84, "learning_rate": 9.777860842530933e-05, "loss": 1.4889, "step": 23379 }, { "epoch": 1.84, "learning_rate": 9.776702209070901e-05, "loss": 1.5173, "step": 23380 }, { "epoch": 1.84, "learning_rate": 9.77554361107418e-05, "loss": 1.4579, "step": 23381 }, { "epoch": 1.84, "learning_rate": 9.774385048548635e-05, "loss": 1.4513, "step": 23382 }, { "epoch": 1.84, "learning_rate": 9.773226521502128e-05, "loss": 1.4969, "step": 23383 }, { "epoch": 1.84, "learning_rate": 9.772068029942533e-05, "loss": 1.4716, "step": 23384 }, { "epoch": 1.84, "learning_rate": 9.770909573877709e-05, "loss": 1.5082, "step": 23385 }, { "epoch": 1.84, "learning_rate": 9.769751153315525e-05, "loss": 1.4596, "step": 23386 }, { "epoch": 1.84, "learning_rate": 9.768592768263843e-05, "loss": 1.4261, "step": 23387 }, { "epoch": 1.84, "learning_rate": 9.767434418730527e-05, "loss": 1.5104, "step": 23388 }, { "epoch": 1.84, "learning_rate": 9.766276104723447e-05, "loss": 1.4805, "step": 23389 }, { "epoch": 1.84, "learning_rate": 9.765117826250463e-05, "loss": 1.512, "step": 23390 }, { "epoch": 1.84, "learning_rate": 9.763959583319439e-05, "loss": 1.4795, "step": 23391 }, { "epoch": 1.84, "learning_rate": 9.762801375938244e-05, "loss": 1.5051, "step": 23392 }, { "epoch": 1.84, "learning_rate": 9.761643204114733e-05, "loss": 1.4243, "step": 23393 }, { "epoch": 1.84, "learning_rate": 9.760485067856772e-05, "loss": 1.5309, "step": 23394 }, { "epoch": 1.84, "learning_rate": 9.759326967172228e-05, "loss": 1.5165, "step": 23395 }, { "epoch": 1.84, "learning_rate": 9.758168902068965e-05, "loss": 1.465, "step": 23396 }, { "epoch": 1.84, "learning_rate": 9.75701087255484e-05, "loss": 1.5044, "step": 23397 }, { "epoch": 1.84, "learning_rate": 9.755852878637721e-05, "loss": 1.5182, "step": 23398 }, { "epoch": 1.84, "learning_rate": 9.754694920325463e-05, "loss": 1.4665, "step": 23399 }, { "epoch": 1.84, "learning_rate": 9.753536997625933e-05, "loss": 1.5361, "step": 23400 }, { "epoch": 1.84, "learning_rate": 9.752379110546993e-05, "loss": 1.4974, "step": 23401 }, { "epoch": 1.84, "learning_rate": 9.751221259096503e-05, "loss": 1.512, "step": 23402 }, { "epoch": 1.84, "learning_rate": 9.750063443282322e-05, "loss": 1.4664, "step": 23403 }, { "epoch": 1.84, "learning_rate": 9.748905663112313e-05, "loss": 1.5198, "step": 23404 }, { "epoch": 1.84, "learning_rate": 9.747747918594338e-05, "loss": 1.5047, "step": 23405 }, { "epoch": 1.84, "learning_rate": 9.746590209736259e-05, "loss": 1.4858, "step": 23406 }, { "epoch": 1.84, "learning_rate": 9.745432536545929e-05, "loss": 1.4792, "step": 23407 }, { "epoch": 1.84, "learning_rate": 9.744274899031213e-05, "loss": 1.4798, "step": 23408 }, { "epoch": 1.84, "learning_rate": 9.743117297199966e-05, "loss": 1.4948, "step": 23409 }, { "epoch": 1.84, "learning_rate": 9.74195973106006e-05, "loss": 1.4942, "step": 23410 }, { "epoch": 1.84, "learning_rate": 9.74080220061934e-05, "loss": 1.5059, "step": 23411 }, { "epoch": 1.84, "learning_rate": 9.739644705885673e-05, "loss": 1.5608, "step": 23412 }, { "epoch": 1.84, "learning_rate": 9.738487246866916e-05, "loss": 1.4676, "step": 23413 }, { "epoch": 1.84, "learning_rate": 9.737329823570927e-05, "loss": 1.499, "step": 23414 }, { "epoch": 1.84, "learning_rate": 9.736172436005567e-05, "loss": 1.4901, "step": 23415 }, { "epoch": 1.84, "learning_rate": 9.735015084178685e-05, "loss": 1.5026, "step": 23416 }, { "epoch": 1.84, "learning_rate": 9.73385776809815e-05, "loss": 1.5026, "step": 23417 }, { "epoch": 1.84, "learning_rate": 9.732700487771814e-05, "loss": 1.4818, "step": 23418 }, { "epoch": 1.84, "learning_rate": 9.731543243207534e-05, "loss": 1.4671, "step": 23419 }, { "epoch": 1.84, "learning_rate": 9.730386034413166e-05, "loss": 1.5509, "step": 23420 }, { "epoch": 1.84, "learning_rate": 9.729228861396574e-05, "loss": 1.5083, "step": 23421 }, { "epoch": 1.84, "learning_rate": 9.728071724165603e-05, "loss": 1.4984, "step": 23422 }, { "epoch": 1.84, "learning_rate": 9.726914622728121e-05, "loss": 1.5074, "step": 23423 }, { "epoch": 1.84, "learning_rate": 9.725757557091978e-05, "loss": 1.4909, "step": 23424 }, { "epoch": 1.84, "learning_rate": 9.724600527265025e-05, "loss": 1.5224, "step": 23425 }, { "epoch": 1.84, "learning_rate": 9.723443533255126e-05, "loss": 1.4898, "step": 23426 }, { "epoch": 1.84, "learning_rate": 9.722286575070138e-05, "loss": 1.4639, "step": 23427 }, { "epoch": 1.84, "learning_rate": 9.721129652717906e-05, "loss": 1.4479, "step": 23428 }, { "epoch": 1.84, "learning_rate": 9.719972766206294e-05, "loss": 1.4637, "step": 23429 }, { "epoch": 1.84, "learning_rate": 9.718815915543153e-05, "loss": 1.4653, "step": 23430 }, { "epoch": 1.84, "learning_rate": 9.717659100736338e-05, "loss": 1.4824, "step": 23431 }, { "epoch": 1.84, "learning_rate": 9.716502321793702e-05, "loss": 1.5005, "step": 23432 }, { "epoch": 1.84, "learning_rate": 9.715345578723099e-05, "loss": 1.5072, "step": 23433 }, { "epoch": 1.84, "learning_rate": 9.714188871532382e-05, "loss": 1.45, "step": 23434 }, { "epoch": 1.84, "learning_rate": 9.713032200229409e-05, "loss": 1.5104, "step": 23435 }, { "epoch": 1.84, "learning_rate": 9.711875564822027e-05, "loss": 1.569, "step": 23436 }, { "epoch": 1.84, "learning_rate": 9.710718965318093e-05, "loss": 1.5614, "step": 23437 }, { "epoch": 1.84, "learning_rate": 9.70956240172546e-05, "loss": 1.5018, "step": 23438 }, { "epoch": 1.84, "learning_rate": 9.708405874051977e-05, "loss": 1.4734, "step": 23439 }, { "epoch": 1.84, "learning_rate": 9.707249382305499e-05, "loss": 1.4676, "step": 23440 }, { "epoch": 1.84, "learning_rate": 9.706092926493868e-05, "loss": 1.4999, "step": 23441 }, { "epoch": 1.84, "learning_rate": 9.704936506624954e-05, "loss": 1.4864, "step": 23442 }, { "epoch": 1.84, "learning_rate": 9.703780122706598e-05, "loss": 1.4717, "step": 23443 }, { "epoch": 1.84, "learning_rate": 9.702623774746652e-05, "loss": 1.4734, "step": 23444 }, { "epoch": 1.84, "learning_rate": 9.701467462752967e-05, "loss": 1.4778, "step": 23445 }, { "epoch": 1.84, "learning_rate": 9.700311186733391e-05, "loss": 1.5141, "step": 23446 }, { "epoch": 1.84, "learning_rate": 9.699154946695782e-05, "loss": 1.4717, "step": 23447 }, { "epoch": 1.84, "learning_rate": 9.697998742647985e-05, "loss": 1.5033, "step": 23448 }, { "epoch": 1.84, "learning_rate": 9.696842574597847e-05, "loss": 1.4964, "step": 23449 }, { "epoch": 1.85, "learning_rate": 9.695686442553226e-05, "loss": 1.4609, "step": 23450 }, { "epoch": 1.85, "learning_rate": 9.694530346521963e-05, "loss": 1.4683, "step": 23451 }, { "epoch": 1.85, "learning_rate": 9.693374286511915e-05, "loss": 1.5289, "step": 23452 }, { "epoch": 1.85, "learning_rate": 9.692218262530925e-05, "loss": 1.494, "step": 23453 }, { "epoch": 1.85, "learning_rate": 9.691062274586841e-05, "loss": 1.5068, "step": 23454 }, { "epoch": 1.85, "learning_rate": 9.68990632268752e-05, "loss": 1.4706, "step": 23455 }, { "epoch": 1.85, "learning_rate": 9.688750406840802e-05, "loss": 1.5269, "step": 23456 }, { "epoch": 1.85, "learning_rate": 9.687594527054533e-05, "loss": 1.4539, "step": 23457 }, { "epoch": 1.85, "learning_rate": 9.686438683336571e-05, "loss": 1.5188, "step": 23458 }, { "epoch": 1.85, "learning_rate": 9.68528287569476e-05, "loss": 1.4609, "step": 23459 }, { "epoch": 1.85, "learning_rate": 9.68412710413694e-05, "loss": 1.4507, "step": 23460 }, { "epoch": 1.85, "learning_rate": 9.68297136867097e-05, "loss": 1.4885, "step": 23461 }, { "epoch": 1.85, "learning_rate": 9.681815669304685e-05, "loss": 1.5065, "step": 23462 }, { "epoch": 1.85, "learning_rate": 9.680660006045938e-05, "loss": 1.4876, "step": 23463 }, { "epoch": 1.85, "learning_rate": 9.679504378902576e-05, "loss": 1.5133, "step": 23464 }, { "epoch": 1.85, "learning_rate": 9.67834878788244e-05, "loss": 1.4907, "step": 23465 }, { "epoch": 1.85, "learning_rate": 9.677193232993378e-05, "loss": 1.5112, "step": 23466 }, { "epoch": 1.85, "learning_rate": 9.676037714243243e-05, "loss": 1.4446, "step": 23467 }, { "epoch": 1.85, "learning_rate": 9.674882231639869e-05, "loss": 1.5131, "step": 23468 }, { "epoch": 1.85, "learning_rate": 9.67372678519111e-05, "loss": 1.442, "step": 23469 }, { "epoch": 1.85, "learning_rate": 9.672571374904803e-05, "loss": 1.4759, "step": 23470 }, { "epoch": 1.85, "learning_rate": 9.671416000788796e-05, "loss": 1.4635, "step": 23471 }, { "epoch": 1.85, "learning_rate": 9.67026066285093e-05, "loss": 1.4882, "step": 23472 }, { "epoch": 1.85, "learning_rate": 9.669105361099062e-05, "loss": 1.478, "step": 23473 }, { "epoch": 1.85, "learning_rate": 9.667950095541021e-05, "loss": 1.4503, "step": 23474 }, { "epoch": 1.85, "learning_rate": 9.666794866184656e-05, "loss": 1.4998, "step": 23475 }, { "epoch": 1.85, "learning_rate": 9.665639673037815e-05, "loss": 1.4393, "step": 23476 }, { "epoch": 1.85, "learning_rate": 9.664484516108335e-05, "loss": 1.5105, "step": 23477 }, { "epoch": 1.85, "learning_rate": 9.66332939540406e-05, "loss": 1.4936, "step": 23478 }, { "epoch": 1.85, "learning_rate": 9.662174310932835e-05, "loss": 1.5446, "step": 23479 }, { "epoch": 1.85, "learning_rate": 9.661019262702499e-05, "loss": 1.5527, "step": 23480 }, { "epoch": 1.85, "learning_rate": 9.6598642507209e-05, "loss": 1.4658, "step": 23481 }, { "epoch": 1.85, "learning_rate": 9.65870927499587e-05, "loss": 1.5304, "step": 23482 }, { "epoch": 1.85, "learning_rate": 9.657554335535259e-05, "loss": 1.4681, "step": 23483 }, { "epoch": 1.85, "learning_rate": 9.656399432346908e-05, "loss": 1.4807, "step": 23484 }, { "epoch": 1.85, "learning_rate": 9.655244565438653e-05, "loss": 1.4582, "step": 23485 }, { "epoch": 1.85, "learning_rate": 9.654089734818341e-05, "loss": 1.5132, "step": 23486 }, { "epoch": 1.85, "learning_rate": 9.652934940493806e-05, "loss": 1.4245, "step": 23487 }, { "epoch": 1.85, "learning_rate": 9.651780182472888e-05, "loss": 1.5041, "step": 23488 }, { "epoch": 1.85, "learning_rate": 9.650625460763437e-05, "loss": 1.4644, "step": 23489 }, { "epoch": 1.85, "learning_rate": 9.649470775373283e-05, "loss": 1.4746, "step": 23490 }, { "epoch": 1.85, "learning_rate": 9.648316126310278e-05, "loss": 1.5013, "step": 23491 }, { "epoch": 1.85, "learning_rate": 9.647161513582248e-05, "loss": 1.502, "step": 23492 }, { "epoch": 1.85, "learning_rate": 9.646006937197039e-05, "loss": 1.513, "step": 23493 }, { "epoch": 1.85, "learning_rate": 9.644852397162487e-05, "loss": 1.4957, "step": 23494 }, { "epoch": 1.85, "learning_rate": 9.64369789348643e-05, "loss": 1.4874, "step": 23495 }, { "epoch": 1.85, "learning_rate": 9.642543426176714e-05, "loss": 1.4818, "step": 23496 }, { "epoch": 1.85, "learning_rate": 9.641388995241166e-05, "loss": 1.512, "step": 23497 }, { "epoch": 1.85, "learning_rate": 9.640234600687635e-05, "loss": 1.5519, "step": 23498 }, { "epoch": 1.85, "learning_rate": 9.639080242523949e-05, "loss": 1.4904, "step": 23499 }, { "epoch": 1.85, "learning_rate": 9.637925920757949e-05, "loss": 1.4725, "step": 23500 }, { "epoch": 1.85, "learning_rate": 9.636771635397479e-05, "loss": 1.4727, "step": 23501 }, { "epoch": 1.85, "learning_rate": 9.635617386450364e-05, "loss": 1.5369, "step": 23502 }, { "epoch": 1.85, "learning_rate": 9.634463173924448e-05, "loss": 1.5091, "step": 23503 }, { "epoch": 1.85, "learning_rate": 9.633308997827562e-05, "loss": 1.4908, "step": 23504 }, { "epoch": 1.85, "learning_rate": 9.632154858167553e-05, "loss": 1.5146, "step": 23505 }, { "epoch": 1.85, "learning_rate": 9.631000754952248e-05, "loss": 1.4644, "step": 23506 }, { "epoch": 1.85, "learning_rate": 9.629846688189484e-05, "loss": 1.4562, "step": 23507 }, { "epoch": 1.85, "learning_rate": 9.628692657887101e-05, "loss": 1.4431, "step": 23508 }, { "epoch": 1.85, "learning_rate": 9.627538664052927e-05, "loss": 1.5275, "step": 23509 }, { "epoch": 1.85, "learning_rate": 9.626384706694805e-05, "loss": 1.4235, "step": 23510 }, { "epoch": 1.85, "learning_rate": 9.62523078582056e-05, "loss": 1.5252, "step": 23511 }, { "epoch": 1.85, "learning_rate": 9.624076901438035e-05, "loss": 1.452, "step": 23512 }, { "epoch": 1.85, "learning_rate": 9.622923053555063e-05, "loss": 1.4467, "step": 23513 }, { "epoch": 1.85, "learning_rate": 9.621769242179472e-05, "loss": 1.4812, "step": 23514 }, { "epoch": 1.85, "learning_rate": 9.620615467319104e-05, "loss": 1.5035, "step": 23515 }, { "epoch": 1.85, "learning_rate": 9.619461728981785e-05, "loss": 1.4396, "step": 23516 }, { "epoch": 1.85, "learning_rate": 9.618308027175352e-05, "loss": 1.5053, "step": 23517 }, { "epoch": 1.85, "learning_rate": 9.61715436190764e-05, "loss": 1.4416, "step": 23518 }, { "epoch": 1.85, "learning_rate": 9.61600073318647e-05, "loss": 1.5473, "step": 23519 }, { "epoch": 1.85, "learning_rate": 9.614847141019694e-05, "loss": 1.4474, "step": 23520 }, { "epoch": 1.85, "learning_rate": 9.613693585415131e-05, "loss": 1.5306, "step": 23521 }, { "epoch": 1.85, "learning_rate": 9.61254006638062e-05, "loss": 1.4738, "step": 23522 }, { "epoch": 1.85, "learning_rate": 9.611386583923984e-05, "loss": 1.5181, "step": 23523 }, { "epoch": 1.85, "learning_rate": 9.61023313805306e-05, "loss": 1.4235, "step": 23524 }, { "epoch": 1.85, "learning_rate": 9.609079728775682e-05, "loss": 1.497, "step": 23525 }, { "epoch": 1.85, "learning_rate": 9.607926356099676e-05, "loss": 1.4572, "step": 23526 }, { "epoch": 1.85, "learning_rate": 9.606773020032875e-05, "loss": 1.5303, "step": 23527 }, { "epoch": 1.85, "learning_rate": 9.605619720583108e-05, "loss": 1.4556, "step": 23528 }, { "epoch": 1.85, "learning_rate": 9.604466457758203e-05, "loss": 1.4738, "step": 23529 }, { "epoch": 1.85, "learning_rate": 9.603313231565998e-05, "loss": 1.4825, "step": 23530 }, { "epoch": 1.85, "learning_rate": 9.602160042014319e-05, "loss": 1.4584, "step": 23531 }, { "epoch": 1.85, "learning_rate": 9.60100688911099e-05, "loss": 1.468, "step": 23532 }, { "epoch": 1.85, "learning_rate": 9.599853772863848e-05, "loss": 1.4435, "step": 23533 }, { "epoch": 1.85, "learning_rate": 9.598700693280717e-05, "loss": 1.4681, "step": 23534 }, { "epoch": 1.85, "learning_rate": 9.597547650369425e-05, "loss": 1.5119, "step": 23535 }, { "epoch": 1.85, "learning_rate": 9.596394644137803e-05, "loss": 1.4876, "step": 23536 }, { "epoch": 1.85, "learning_rate": 9.595241674593688e-05, "loss": 1.5052, "step": 23537 }, { "epoch": 1.85, "learning_rate": 9.594088741744893e-05, "loss": 1.5067, "step": 23538 }, { "epoch": 1.85, "learning_rate": 9.592935845599255e-05, "loss": 1.4693, "step": 23539 }, { "epoch": 1.85, "learning_rate": 9.591782986164596e-05, "loss": 1.4888, "step": 23540 }, { "epoch": 1.85, "learning_rate": 9.590630163448746e-05, "loss": 1.452, "step": 23541 }, { "epoch": 1.85, "learning_rate": 9.589477377459534e-05, "loss": 1.4813, "step": 23542 }, { "epoch": 1.85, "learning_rate": 9.588324628204785e-05, "loss": 1.5142, "step": 23543 }, { "epoch": 1.85, "learning_rate": 9.587171915692328e-05, "loss": 1.4436, "step": 23544 }, { "epoch": 1.85, "learning_rate": 9.586019239929981e-05, "loss": 1.4372, "step": 23545 }, { "epoch": 1.85, "learning_rate": 9.584866600925576e-05, "loss": 1.4905, "step": 23546 }, { "epoch": 1.85, "learning_rate": 9.583713998686944e-05, "loss": 1.478, "step": 23547 }, { "epoch": 1.85, "learning_rate": 9.582561433221899e-05, "loss": 1.4551, "step": 23548 }, { "epoch": 1.85, "learning_rate": 9.581408904538274e-05, "loss": 1.4336, "step": 23549 }, { "epoch": 1.85, "learning_rate": 9.580256412643894e-05, "loss": 1.4936, "step": 23550 }, { "epoch": 1.85, "learning_rate": 9.579103957546578e-05, "loss": 1.5043, "step": 23551 }, { "epoch": 1.85, "learning_rate": 9.577951539254157e-05, "loss": 1.4979, "step": 23552 }, { "epoch": 1.85, "learning_rate": 9.576799157774453e-05, "loss": 1.4802, "step": 23553 }, { "epoch": 1.85, "learning_rate": 9.575646813115292e-05, "loss": 1.495, "step": 23554 }, { "epoch": 1.85, "learning_rate": 9.574494505284492e-05, "loss": 1.4412, "step": 23555 }, { "epoch": 1.85, "learning_rate": 9.573342234289885e-05, "loss": 1.5015, "step": 23556 }, { "epoch": 1.85, "learning_rate": 9.572190000139286e-05, "loss": 1.4885, "step": 23557 }, { "epoch": 1.85, "learning_rate": 9.571037802840523e-05, "loss": 1.4574, "step": 23558 }, { "epoch": 1.85, "learning_rate": 9.569885642401419e-05, "loss": 1.471, "step": 23559 }, { "epoch": 1.85, "learning_rate": 9.568733518829791e-05, "loss": 1.4651, "step": 23560 }, { "epoch": 1.85, "learning_rate": 9.567581432133466e-05, "loss": 1.4582, "step": 23561 }, { "epoch": 1.85, "learning_rate": 9.566429382320268e-05, "loss": 1.493, "step": 23562 }, { "epoch": 1.85, "learning_rate": 9.565277369398015e-05, "loss": 1.5855, "step": 23563 }, { "epoch": 1.85, "learning_rate": 9.564125393374529e-05, "loss": 1.447, "step": 23564 }, { "epoch": 1.85, "learning_rate": 9.56297345425763e-05, "loss": 1.4764, "step": 23565 }, { "epoch": 1.85, "learning_rate": 9.561821552055143e-05, "loss": 1.5262, "step": 23566 }, { "epoch": 1.85, "learning_rate": 9.560669686774883e-05, "loss": 1.4928, "step": 23567 }, { "epoch": 1.85, "learning_rate": 9.559517858424678e-05, "loss": 1.5065, "step": 23568 }, { "epoch": 1.85, "learning_rate": 9.558366067012344e-05, "loss": 1.52, "step": 23569 }, { "epoch": 1.85, "learning_rate": 9.557214312545699e-05, "loss": 1.5201, "step": 23570 }, { "epoch": 1.85, "learning_rate": 9.55606259503257e-05, "loss": 1.5057, "step": 23571 }, { "epoch": 1.85, "learning_rate": 9.554910914480768e-05, "loss": 1.4658, "step": 23572 }, { "epoch": 1.85, "learning_rate": 9.553759270898117e-05, "loss": 1.4834, "step": 23573 }, { "epoch": 1.85, "learning_rate": 9.552607664292438e-05, "loss": 1.5121, "step": 23574 }, { "epoch": 1.85, "learning_rate": 9.551456094671542e-05, "loss": 1.4826, "step": 23575 }, { "epoch": 1.85, "learning_rate": 9.550304562043257e-05, "loss": 1.4776, "step": 23576 }, { "epoch": 1.86, "learning_rate": 9.549153066415392e-05, "loss": 1.5163, "step": 23577 }, { "epoch": 1.86, "learning_rate": 9.548001607795772e-05, "loss": 1.533, "step": 23578 }, { "epoch": 1.86, "learning_rate": 9.546850186192214e-05, "loss": 1.5099, "step": 23579 }, { "epoch": 1.86, "learning_rate": 9.545698801612531e-05, "loss": 1.4913, "step": 23580 }, { "epoch": 1.86, "learning_rate": 9.544547454064547e-05, "loss": 1.5181, "step": 23581 }, { "epoch": 1.86, "learning_rate": 9.543396143556066e-05, "loss": 1.4623, "step": 23582 }, { "epoch": 1.86, "learning_rate": 9.542244870094922e-05, "loss": 1.4998, "step": 23583 }, { "epoch": 1.86, "learning_rate": 9.54109363368892e-05, "loss": 1.4998, "step": 23584 }, { "epoch": 1.86, "learning_rate": 9.539942434345884e-05, "loss": 1.5091, "step": 23585 }, { "epoch": 1.86, "learning_rate": 9.538791272073623e-05, "loss": 1.5311, "step": 23586 }, { "epoch": 1.86, "learning_rate": 9.537640146879956e-05, "loss": 1.4796, "step": 23587 }, { "epoch": 1.86, "learning_rate": 9.536489058772701e-05, "loss": 1.4939, "step": 23588 }, { "epoch": 1.86, "learning_rate": 9.535338007759665e-05, "loss": 1.4796, "step": 23589 }, { "epoch": 1.86, "learning_rate": 9.53418699384867e-05, "loss": 1.4879, "step": 23590 }, { "epoch": 1.86, "learning_rate": 9.533036017047531e-05, "loss": 1.4894, "step": 23591 }, { "epoch": 1.86, "learning_rate": 9.531885077364058e-05, "loss": 1.4679, "step": 23592 }, { "epoch": 1.86, "learning_rate": 9.530734174806072e-05, "loss": 1.5209, "step": 23593 }, { "epoch": 1.86, "learning_rate": 9.529583309381378e-05, "loss": 1.5179, "step": 23594 }, { "epoch": 1.86, "learning_rate": 9.528432481097796e-05, "loss": 1.5434, "step": 23595 }, { "epoch": 1.86, "learning_rate": 9.527281689963141e-05, "loss": 1.4933, "step": 23596 }, { "epoch": 1.86, "learning_rate": 9.526130935985218e-05, "loss": 1.5067, "step": 23597 }, { "epoch": 1.86, "learning_rate": 9.524980219171844e-05, "loss": 1.4881, "step": 23598 }, { "epoch": 1.86, "learning_rate": 9.523829539530836e-05, "loss": 1.4715, "step": 23599 }, { "epoch": 1.86, "learning_rate": 9.522678897070006e-05, "loss": 1.4894, "step": 23600 }, { "epoch": 1.86, "learning_rate": 9.521528291797162e-05, "loss": 1.4632, "step": 23601 }, { "epoch": 1.86, "learning_rate": 9.520377723720116e-05, "loss": 1.4526, "step": 23602 }, { "epoch": 1.86, "learning_rate": 9.519227192846684e-05, "loss": 1.4627, "step": 23603 }, { "epoch": 1.86, "learning_rate": 9.518076699184674e-05, "loss": 1.5444, "step": 23604 }, { "epoch": 1.86, "learning_rate": 9.516926242741898e-05, "loss": 1.4769, "step": 23605 }, { "epoch": 1.86, "learning_rate": 9.515775823526166e-05, "loss": 1.4415, "step": 23606 }, { "epoch": 1.86, "learning_rate": 9.514625441545288e-05, "loss": 1.5127, "step": 23607 }, { "epoch": 1.86, "learning_rate": 9.513475096807081e-05, "loss": 1.476, "step": 23608 }, { "epoch": 1.86, "learning_rate": 9.512324789319347e-05, "loss": 1.4854, "step": 23609 }, { "epoch": 1.86, "learning_rate": 9.511174519089904e-05, "loss": 1.4735, "step": 23610 }, { "epoch": 1.86, "learning_rate": 9.51002428612655e-05, "loss": 1.5474, "step": 23611 }, { "epoch": 1.86, "learning_rate": 9.508874090437105e-05, "loss": 1.4386, "step": 23612 }, { "epoch": 1.86, "learning_rate": 9.507723932029376e-05, "loss": 1.4908, "step": 23613 }, { "epoch": 1.86, "learning_rate": 9.506573810911164e-05, "loss": 1.4969, "step": 23614 }, { "epoch": 1.86, "learning_rate": 9.50542372709029e-05, "loss": 1.4543, "step": 23615 }, { "epoch": 1.86, "learning_rate": 9.504273680574554e-05, "loss": 1.4916, "step": 23616 }, { "epoch": 1.86, "learning_rate": 9.503123671371772e-05, "loss": 1.4834, "step": 23617 }, { "epoch": 1.86, "learning_rate": 9.501973699489742e-05, "loss": 1.4565, "step": 23618 }, { "epoch": 1.86, "learning_rate": 9.500823764936276e-05, "loss": 1.5081, "step": 23619 }, { "epoch": 1.86, "learning_rate": 9.499673867719188e-05, "loss": 1.4898, "step": 23620 }, { "epoch": 1.86, "learning_rate": 9.498524007846274e-05, "loss": 1.467, "step": 23621 }, { "epoch": 1.86, "learning_rate": 9.497374185325348e-05, "loss": 1.5156, "step": 23622 }, { "epoch": 1.86, "learning_rate": 9.496224400164212e-05, "loss": 1.4746, "step": 23623 }, { "epoch": 1.86, "learning_rate": 9.495074652370677e-05, "loss": 1.4703, "step": 23624 }, { "epoch": 1.86, "learning_rate": 9.49392494195255e-05, "loss": 1.4819, "step": 23625 }, { "epoch": 1.86, "learning_rate": 9.492775268917631e-05, "loss": 1.5061, "step": 23626 }, { "epoch": 1.86, "learning_rate": 9.49162563327373e-05, "loss": 1.47, "step": 23627 }, { "epoch": 1.86, "learning_rate": 9.49047603502865e-05, "loss": 1.483, "step": 23628 }, { "epoch": 1.86, "learning_rate": 9.489326474190196e-05, "loss": 1.4706, "step": 23629 }, { "epoch": 1.86, "learning_rate": 9.488176950766173e-05, "loss": 1.5115, "step": 23630 }, { "epoch": 1.86, "learning_rate": 9.487027464764389e-05, "loss": 1.5075, "step": 23631 }, { "epoch": 1.86, "learning_rate": 9.485878016192648e-05, "loss": 1.4894, "step": 23632 }, { "epoch": 1.86, "learning_rate": 9.484728605058752e-05, "loss": 1.5018, "step": 23633 }, { "epoch": 1.86, "learning_rate": 9.483579231370505e-05, "loss": 1.4826, "step": 23634 }, { "epoch": 1.86, "learning_rate": 9.48242989513571e-05, "loss": 1.5101, "step": 23635 }, { "epoch": 1.86, "learning_rate": 9.481280596362171e-05, "loss": 1.527, "step": 23636 }, { "epoch": 1.86, "learning_rate": 9.480131335057693e-05, "loss": 1.5015, "step": 23637 }, { "epoch": 1.86, "learning_rate": 9.478982111230076e-05, "loss": 1.5156, "step": 23638 }, { "epoch": 1.86, "learning_rate": 9.477832924887127e-05, "loss": 1.5122, "step": 23639 }, { "epoch": 1.86, "learning_rate": 9.47668377603664e-05, "loss": 1.4471, "step": 23640 }, { "epoch": 1.86, "learning_rate": 9.475534664686423e-05, "loss": 1.5034, "step": 23641 }, { "epoch": 1.86, "learning_rate": 9.474385590844279e-05, "loss": 1.5269, "step": 23642 }, { "epoch": 1.86, "learning_rate": 9.473236554518005e-05, "loss": 1.5017, "step": 23643 }, { "epoch": 1.86, "learning_rate": 9.472087555715407e-05, "loss": 1.5045, "step": 23644 }, { "epoch": 1.86, "learning_rate": 9.470938594444279e-05, "loss": 1.4714, "step": 23645 }, { "epoch": 1.86, "learning_rate": 9.469789670712432e-05, "loss": 1.4572, "step": 23646 }, { "epoch": 1.86, "learning_rate": 9.468640784527657e-05, "loss": 1.4937, "step": 23647 }, { "epoch": 1.86, "learning_rate": 9.467491935897763e-05, "loss": 1.4554, "step": 23648 }, { "epoch": 1.86, "learning_rate": 9.466343124830546e-05, "loss": 1.4765, "step": 23649 }, { "epoch": 1.86, "learning_rate": 9.465194351333803e-05, "loss": 1.4685, "step": 23650 }, { "epoch": 1.86, "learning_rate": 9.464045615415338e-05, "loss": 1.503, "step": 23651 }, { "epoch": 1.86, "learning_rate": 9.462896917082948e-05, "loss": 1.468, "step": 23652 }, { "epoch": 1.86, "learning_rate": 9.46174825634443e-05, "loss": 1.5024, "step": 23653 }, { "epoch": 1.86, "learning_rate": 9.460599633207588e-05, "loss": 1.5179, "step": 23654 }, { "epoch": 1.86, "learning_rate": 9.459451047680216e-05, "loss": 1.4898, "step": 23655 }, { "epoch": 1.86, "learning_rate": 9.458302499770116e-05, "loss": 1.4681, "step": 23656 }, { "epoch": 1.86, "learning_rate": 9.45715398948508e-05, "loss": 1.474, "step": 23657 }, { "epoch": 1.86, "learning_rate": 9.456005516832911e-05, "loss": 1.4729, "step": 23658 }, { "epoch": 1.86, "learning_rate": 9.454857081821408e-05, "loss": 1.5008, "step": 23659 }, { "epoch": 1.86, "learning_rate": 9.453708684458361e-05, "loss": 1.4698, "step": 23660 }, { "epoch": 1.86, "learning_rate": 9.45256032475157e-05, "loss": 1.5035, "step": 23661 }, { "epoch": 1.86, "learning_rate": 9.451412002708835e-05, "loss": 1.4384, "step": 23662 }, { "epoch": 1.86, "learning_rate": 9.450263718337954e-05, "loss": 1.4966, "step": 23663 }, { "epoch": 1.86, "learning_rate": 9.449115471646718e-05, "loss": 1.5169, "step": 23664 }, { "epoch": 1.86, "learning_rate": 9.447967262642922e-05, "loss": 1.4934, "step": 23665 }, { "epoch": 1.86, "learning_rate": 9.44681909133437e-05, "loss": 1.4796, "step": 23666 }, { "epoch": 1.86, "learning_rate": 9.445670957728848e-05, "loss": 1.4497, "step": 23667 }, { "epoch": 1.86, "learning_rate": 9.444522861834158e-05, "loss": 1.5203, "step": 23668 }, { "epoch": 1.86, "learning_rate": 9.443374803658087e-05, "loss": 1.5002, "step": 23669 }, { "epoch": 1.86, "learning_rate": 9.442226783208438e-05, "loss": 1.4514, "step": 23670 }, { "epoch": 1.86, "learning_rate": 9.441078800493002e-05, "loss": 1.4279, "step": 23671 }, { "epoch": 1.86, "learning_rate": 9.439930855519572e-05, "loss": 1.4601, "step": 23672 }, { "epoch": 1.86, "learning_rate": 9.438782948295944e-05, "loss": 1.5167, "step": 23673 }, { "epoch": 1.86, "learning_rate": 9.437635078829914e-05, "loss": 1.4628, "step": 23674 }, { "epoch": 1.86, "learning_rate": 9.436487247129266e-05, "loss": 1.483, "step": 23675 }, { "epoch": 1.86, "learning_rate": 9.435339453201805e-05, "loss": 1.4381, "step": 23676 }, { "epoch": 1.86, "learning_rate": 9.434191697055309e-05, "loss": 1.5191, "step": 23677 }, { "epoch": 1.86, "learning_rate": 9.433043978697589e-05, "loss": 1.4998, "step": 23678 }, { "epoch": 1.86, "learning_rate": 9.431896298136425e-05, "loss": 1.5158, "step": 23679 }, { "epoch": 1.86, "learning_rate": 9.430748655379616e-05, "loss": 1.5019, "step": 23680 }, { "epoch": 1.86, "learning_rate": 9.429601050434946e-05, "loss": 1.496, "step": 23681 }, { "epoch": 1.86, "learning_rate": 9.428453483310212e-05, "loss": 1.4946, "step": 23682 }, { "epoch": 1.86, "learning_rate": 9.427305954013206e-05, "loss": 1.48, "step": 23683 }, { "epoch": 1.86, "learning_rate": 9.426158462551716e-05, "loss": 1.4658, "step": 23684 }, { "epoch": 1.86, "learning_rate": 9.425011008933531e-05, "loss": 1.5141, "step": 23685 }, { "epoch": 1.86, "learning_rate": 9.423863593166452e-05, "loss": 1.4942, "step": 23686 }, { "epoch": 1.86, "learning_rate": 9.422716215258256e-05, "loss": 1.5162, "step": 23687 }, { "epoch": 1.86, "learning_rate": 9.421568875216745e-05, "loss": 1.5083, "step": 23688 }, { "epoch": 1.86, "learning_rate": 9.420421573049696e-05, "loss": 1.506, "step": 23689 }, { "epoch": 1.86, "learning_rate": 9.419274308764907e-05, "loss": 1.5304, "step": 23690 }, { "epoch": 1.86, "learning_rate": 9.418127082370169e-05, "loss": 1.4864, "step": 23691 }, { "epoch": 1.86, "learning_rate": 9.416979893873262e-05, "loss": 1.5016, "step": 23692 }, { "epoch": 1.86, "learning_rate": 9.415832743281985e-05, "loss": 1.5017, "step": 23693 }, { "epoch": 1.86, "learning_rate": 9.41468563060412e-05, "loss": 1.4913, "step": 23694 }, { "epoch": 1.86, "learning_rate": 9.413538555847461e-05, "loss": 1.4618, "step": 23695 }, { "epoch": 1.86, "learning_rate": 9.41239151901979e-05, "loss": 1.4556, "step": 23696 }, { "epoch": 1.86, "learning_rate": 9.411244520128898e-05, "loss": 1.4496, "step": 23697 }, { "epoch": 1.86, "learning_rate": 9.41009755918257e-05, "loss": 1.4804, "step": 23698 }, { "epoch": 1.86, "learning_rate": 9.408950636188595e-05, "loss": 1.5475, "step": 23699 }, { "epoch": 1.86, "learning_rate": 9.407803751154762e-05, "loss": 1.4681, "step": 23700 }, { "epoch": 1.86, "learning_rate": 9.406656904088854e-05, "loss": 1.4479, "step": 23701 }, { "epoch": 1.86, "learning_rate": 9.405510094998658e-05, "loss": 1.4703, "step": 23702 }, { "epoch": 1.86, "learning_rate": 9.404363323891964e-05, "loss": 1.4669, "step": 23703 }, { "epoch": 1.87, "learning_rate": 9.403216590776554e-05, "loss": 1.5315, "step": 23704 }, { "epoch": 1.87, "learning_rate": 9.402069895660215e-05, "loss": 1.4958, "step": 23705 }, { "epoch": 1.87, "learning_rate": 9.40092323855073e-05, "loss": 1.4878, "step": 23706 }, { "epoch": 1.87, "learning_rate": 9.399776619455886e-05, "loss": 1.5716, "step": 23707 }, { "epoch": 1.87, "learning_rate": 9.398630038383466e-05, "loss": 1.457, "step": 23708 }, { "epoch": 1.87, "learning_rate": 9.397483495341263e-05, "loss": 1.4601, "step": 23709 }, { "epoch": 1.87, "learning_rate": 9.396336990337053e-05, "loss": 1.464, "step": 23710 }, { "epoch": 1.87, "learning_rate": 9.39519052337862e-05, "loss": 1.4566, "step": 23711 }, { "epoch": 1.87, "learning_rate": 9.394044094473756e-05, "loss": 1.5046, "step": 23712 }, { "epoch": 1.87, "learning_rate": 9.392897703630235e-05, "loss": 1.5005, "step": 23713 }, { "epoch": 1.87, "learning_rate": 9.391751350855843e-05, "loss": 1.5003, "step": 23714 }, { "epoch": 1.87, "learning_rate": 9.39060503615837e-05, "loss": 1.4742, "step": 23715 }, { "epoch": 1.87, "learning_rate": 9.38945875954559e-05, "loss": 1.4918, "step": 23716 }, { "epoch": 1.87, "learning_rate": 9.38831252102529e-05, "loss": 1.4754, "step": 23717 }, { "epoch": 1.87, "learning_rate": 9.387166320605249e-05, "loss": 1.5211, "step": 23718 }, { "epoch": 1.87, "learning_rate": 9.386020158293253e-05, "loss": 1.4687, "step": 23719 }, { "epoch": 1.87, "learning_rate": 9.384874034097083e-05, "loss": 1.4933, "step": 23720 }, { "epoch": 1.87, "learning_rate": 9.383727948024516e-05, "loss": 1.5117, "step": 23721 }, { "epoch": 1.87, "learning_rate": 9.38258190008334e-05, "loss": 1.5352, "step": 23722 }, { "epoch": 1.87, "learning_rate": 9.381435890281332e-05, "loss": 1.5244, "step": 23723 }, { "epoch": 1.87, "learning_rate": 9.38028991862627e-05, "loss": 1.4292, "step": 23724 }, { "epoch": 1.87, "learning_rate": 9.37914398512594e-05, "loss": 1.4568, "step": 23725 }, { "epoch": 1.87, "learning_rate": 9.377998089788126e-05, "loss": 1.461, "step": 23726 }, { "epoch": 1.87, "learning_rate": 9.376852232620597e-05, "loss": 1.468, "step": 23727 }, { "epoch": 1.87, "learning_rate": 9.37570641363114e-05, "loss": 1.4589, "step": 23728 }, { "epoch": 1.87, "learning_rate": 9.374560632827535e-05, "loss": 1.4847, "step": 23729 }, { "epoch": 1.87, "learning_rate": 9.373414890217554e-05, "loss": 1.5068, "step": 23730 }, { "epoch": 1.87, "learning_rate": 9.372269185808983e-05, "loss": 1.4905, "step": 23731 }, { "epoch": 1.87, "learning_rate": 9.371123519609602e-05, "loss": 1.5539, "step": 23732 }, { "epoch": 1.87, "learning_rate": 9.369977891627183e-05, "loss": 1.496, "step": 23733 }, { "epoch": 1.87, "learning_rate": 9.368832301869507e-05, "loss": 1.4659, "step": 23734 }, { "epoch": 1.87, "learning_rate": 9.367686750344354e-05, "loss": 1.4869, "step": 23735 }, { "epoch": 1.87, "learning_rate": 9.366541237059498e-05, "loss": 1.4965, "step": 23736 }, { "epoch": 1.87, "learning_rate": 9.365395762022721e-05, "loss": 1.4868, "step": 23737 }, { "epoch": 1.87, "learning_rate": 9.364250325241792e-05, "loss": 1.5095, "step": 23738 }, { "epoch": 1.87, "learning_rate": 9.3631049267245e-05, "loss": 1.4701, "step": 23739 }, { "epoch": 1.87, "learning_rate": 9.361959566478602e-05, "loss": 1.4996, "step": 23740 }, { "epoch": 1.87, "learning_rate": 9.360814244511899e-05, "loss": 1.5192, "step": 23741 }, { "epoch": 1.87, "learning_rate": 9.359668960832153e-05, "loss": 1.5127, "step": 23742 }, { "epoch": 1.87, "learning_rate": 9.35852371544714e-05, "loss": 1.4697, "step": 23743 }, { "epoch": 1.87, "learning_rate": 9.35737850836464e-05, "loss": 1.5386, "step": 23744 }, { "epoch": 1.87, "learning_rate": 9.356233339592425e-05, "loss": 1.5076, "step": 23745 }, { "epoch": 1.87, "learning_rate": 9.355088209138275e-05, "loss": 1.5276, "step": 23746 }, { "epoch": 1.87, "learning_rate": 9.353943117009957e-05, "loss": 1.4573, "step": 23747 }, { "epoch": 1.87, "learning_rate": 9.352798063215248e-05, "loss": 1.4793, "step": 23748 }, { "epoch": 1.87, "learning_rate": 9.351653047761929e-05, "loss": 1.4331, "step": 23749 }, { "epoch": 1.87, "learning_rate": 9.350508070657764e-05, "loss": 1.5628, "step": 23750 }, { "epoch": 1.87, "learning_rate": 9.349363131910534e-05, "loss": 1.4968, "step": 23751 }, { "epoch": 1.87, "learning_rate": 9.348218231528011e-05, "loss": 1.5699, "step": 23752 }, { "epoch": 1.87, "learning_rate": 9.347073369517963e-05, "loss": 1.4692, "step": 23753 }, { "epoch": 1.87, "learning_rate": 9.345928545888171e-05, "loss": 1.4807, "step": 23754 }, { "epoch": 1.87, "learning_rate": 9.3447837606464e-05, "loss": 1.5306, "step": 23755 }, { "epoch": 1.87, "learning_rate": 9.343639013800429e-05, "loss": 1.4465, "step": 23756 }, { "epoch": 1.87, "learning_rate": 9.342494305358026e-05, "loss": 1.4665, "step": 23757 }, { "epoch": 1.87, "learning_rate": 9.34134963532697e-05, "loss": 1.4899, "step": 23758 }, { "epoch": 1.87, "learning_rate": 9.340205003715022e-05, "loss": 1.4399, "step": 23759 }, { "epoch": 1.87, "learning_rate": 9.33906041052996e-05, "loss": 1.4809, "step": 23760 }, { "epoch": 1.87, "learning_rate": 9.337915855779556e-05, "loss": 1.4921, "step": 23761 }, { "epoch": 1.87, "learning_rate": 9.336771339471577e-05, "loss": 1.4811, "step": 23762 }, { "epoch": 1.87, "learning_rate": 9.335626861613798e-05, "loss": 1.5417, "step": 23763 }, { "epoch": 1.87, "learning_rate": 9.334482422213982e-05, "loss": 1.4367, "step": 23764 }, { "epoch": 1.87, "learning_rate": 9.333338021279905e-05, "loss": 1.478, "step": 23765 }, { "epoch": 1.87, "learning_rate": 9.332193658819338e-05, "loss": 1.4487, "step": 23766 }, { "epoch": 1.87, "learning_rate": 9.331049334840048e-05, "loss": 1.4496, "step": 23767 }, { "epoch": 1.87, "learning_rate": 9.329905049349802e-05, "loss": 1.5131, "step": 23768 }, { "epoch": 1.87, "learning_rate": 9.328760802356375e-05, "loss": 1.4727, "step": 23769 }, { "epoch": 1.87, "learning_rate": 9.327616593867532e-05, "loss": 1.5027, "step": 23770 }, { "epoch": 1.87, "learning_rate": 9.326472423891035e-05, "loss": 1.5027, "step": 23771 }, { "epoch": 1.87, "learning_rate": 9.325328292434665e-05, "loss": 1.5356, "step": 23772 }, { "epoch": 1.87, "learning_rate": 9.324184199506186e-05, "loss": 1.5191, "step": 23773 }, { "epoch": 1.87, "learning_rate": 9.323040145113362e-05, "loss": 1.4605, "step": 23774 }, { "epoch": 1.87, "learning_rate": 9.321896129263966e-05, "loss": 1.4655, "step": 23775 }, { "epoch": 1.87, "learning_rate": 9.32075215196576e-05, "loss": 1.4509, "step": 23776 }, { "epoch": 1.87, "learning_rate": 9.31960821322651e-05, "loss": 1.484, "step": 23777 }, { "epoch": 1.87, "learning_rate": 9.318464313053989e-05, "loss": 1.4689, "step": 23778 }, { "epoch": 1.87, "learning_rate": 9.317320451455958e-05, "loss": 1.526, "step": 23779 }, { "epoch": 1.87, "learning_rate": 9.316176628440188e-05, "loss": 1.4229, "step": 23780 }, { "epoch": 1.87, "learning_rate": 9.315032844014439e-05, "loss": 1.4469, "step": 23781 }, { "epoch": 1.87, "learning_rate": 9.31388909818648e-05, "loss": 1.5076, "step": 23782 }, { "epoch": 1.87, "learning_rate": 9.312745390964078e-05, "loss": 1.4774, "step": 23783 }, { "epoch": 1.87, "learning_rate": 9.311601722354996e-05, "loss": 1.4736, "step": 23784 }, { "epoch": 1.87, "learning_rate": 9.310458092366996e-05, "loss": 1.4782, "step": 23785 }, { "epoch": 1.87, "learning_rate": 9.30931450100785e-05, "loss": 1.5026, "step": 23786 }, { "epoch": 1.87, "learning_rate": 9.308170948285312e-05, "loss": 1.4867, "step": 23787 }, { "epoch": 1.87, "learning_rate": 9.307027434207156e-05, "loss": 1.5132, "step": 23788 }, { "epoch": 1.87, "learning_rate": 9.305883958781141e-05, "loss": 1.5112, "step": 23789 }, { "epoch": 1.87, "learning_rate": 9.304740522015035e-05, "loss": 1.4623, "step": 23790 }, { "epoch": 1.87, "learning_rate": 9.303597123916596e-05, "loss": 1.4409, "step": 23791 }, { "epoch": 1.87, "learning_rate": 9.30245376449359e-05, "loss": 1.5075, "step": 23792 }, { "epoch": 1.87, "learning_rate": 9.301310443753777e-05, "loss": 1.5217, "step": 23793 }, { "epoch": 1.87, "learning_rate": 9.300167161704922e-05, "loss": 1.4766, "step": 23794 }, { "epoch": 1.87, "learning_rate": 9.299023918354789e-05, "loss": 1.5221, "step": 23795 }, { "epoch": 1.87, "learning_rate": 9.297880713711134e-05, "loss": 1.4978, "step": 23796 }, { "epoch": 1.87, "learning_rate": 9.296737547781723e-05, "loss": 1.4537, "step": 23797 }, { "epoch": 1.87, "learning_rate": 9.295594420574321e-05, "loss": 1.5163, "step": 23798 }, { "epoch": 1.87, "learning_rate": 9.294451332096678e-05, "loss": 1.5412, "step": 23799 }, { "epoch": 1.87, "learning_rate": 9.293308282356567e-05, "loss": 1.4259, "step": 23800 }, { "epoch": 1.87, "learning_rate": 9.292165271361741e-05, "loss": 1.4663, "step": 23801 }, { "epoch": 1.87, "learning_rate": 9.29102229911996e-05, "loss": 1.497, "step": 23802 }, { "epoch": 1.87, "learning_rate": 9.289879365638989e-05, "loss": 1.4627, "step": 23803 }, { "epoch": 1.87, "learning_rate": 9.288736470926593e-05, "loss": 1.4462, "step": 23804 }, { "epoch": 1.87, "learning_rate": 9.287593614990516e-05, "loss": 1.4496, "step": 23805 }, { "epoch": 1.87, "learning_rate": 9.286450797838529e-05, "loss": 1.479, "step": 23806 }, { "epoch": 1.87, "learning_rate": 9.285308019478389e-05, "loss": 1.501, "step": 23807 }, { "epoch": 1.87, "learning_rate": 9.284165279917855e-05, "loss": 1.4425, "step": 23808 }, { "epoch": 1.87, "learning_rate": 9.283022579164684e-05, "loss": 1.4799, "step": 23809 }, { "epoch": 1.87, "learning_rate": 9.28187991722663e-05, "loss": 1.4861, "step": 23810 }, { "epoch": 1.87, "learning_rate": 9.28073729411146e-05, "loss": 1.4645, "step": 23811 }, { "epoch": 1.87, "learning_rate": 9.279594709826931e-05, "loss": 1.4083, "step": 23812 }, { "epoch": 1.87, "learning_rate": 9.278452164380791e-05, "loss": 1.4579, "step": 23813 }, { "epoch": 1.87, "learning_rate": 9.277309657780805e-05, "loss": 1.4722, "step": 23814 }, { "epoch": 1.87, "learning_rate": 9.27616719003473e-05, "loss": 1.4563, "step": 23815 }, { "epoch": 1.87, "learning_rate": 9.27502476115032e-05, "loss": 1.4633, "step": 23816 }, { "epoch": 1.87, "learning_rate": 9.273882371135335e-05, "loss": 1.5143, "step": 23817 }, { "epoch": 1.87, "learning_rate": 9.272740019997519e-05, "loss": 1.4736, "step": 23818 }, { "epoch": 1.87, "learning_rate": 9.27159770774465e-05, "loss": 1.5386, "step": 23819 }, { "epoch": 1.87, "learning_rate": 9.270455434384463e-05, "loss": 1.4594, "step": 23820 }, { "epoch": 1.87, "learning_rate": 9.269313199924728e-05, "loss": 1.5193, "step": 23821 }, { "epoch": 1.87, "learning_rate": 9.268171004373189e-05, "loss": 1.4662, "step": 23822 }, { "epoch": 1.87, "learning_rate": 9.267028847737608e-05, "loss": 1.4491, "step": 23823 }, { "epoch": 1.87, "learning_rate": 9.265886730025739e-05, "loss": 1.5192, "step": 23824 }, { "epoch": 1.87, "learning_rate": 9.264744651245334e-05, "loss": 1.4667, "step": 23825 }, { "epoch": 1.87, "learning_rate": 9.263602611404146e-05, "loss": 1.4898, "step": 23826 }, { "epoch": 1.87, "learning_rate": 9.262460610509932e-05, "loss": 1.4932, "step": 23827 }, { "epoch": 1.87, "learning_rate": 9.261318648570444e-05, "loss": 1.4804, "step": 23828 }, { "epoch": 1.87, "learning_rate": 9.260176725593438e-05, "loss": 1.459, "step": 23829 }, { "epoch": 1.87, "learning_rate": 9.259034841586661e-05, "loss": 1.5337, "step": 23830 }, { "epoch": 1.88, "learning_rate": 9.257892996557869e-05, "loss": 1.4955, "step": 23831 }, { "epoch": 1.88, "learning_rate": 9.256751190514818e-05, "loss": 1.5221, "step": 23832 }, { "epoch": 1.88, "learning_rate": 9.255609423465255e-05, "loss": 1.4736, "step": 23833 }, { "epoch": 1.88, "learning_rate": 9.254467695416929e-05, "loss": 1.4622, "step": 23834 }, { "epoch": 1.88, "learning_rate": 9.2533260063776e-05, "loss": 1.4668, "step": 23835 }, { "epoch": 1.88, "learning_rate": 9.252184356355021e-05, "loss": 1.5239, "step": 23836 }, { "epoch": 1.88, "learning_rate": 9.251042745356933e-05, "loss": 1.4742, "step": 23837 }, { "epoch": 1.88, "learning_rate": 9.249901173391099e-05, "loss": 1.5122, "step": 23838 }, { "epoch": 1.88, "learning_rate": 9.248759640465258e-05, "loss": 1.4742, "step": 23839 }, { "epoch": 1.88, "learning_rate": 9.247618146587164e-05, "loss": 1.5387, "step": 23840 }, { "epoch": 1.88, "learning_rate": 9.246476691764571e-05, "loss": 1.4543, "step": 23841 }, { "epoch": 1.88, "learning_rate": 9.245335276005224e-05, "loss": 1.4745, "step": 23842 }, { "epoch": 1.88, "learning_rate": 9.244193899316876e-05, "loss": 1.4979, "step": 23843 }, { "epoch": 1.88, "learning_rate": 9.243052561707277e-05, "loss": 1.4632, "step": 23844 }, { "epoch": 1.88, "learning_rate": 9.24191126318417e-05, "loss": 1.5334, "step": 23845 }, { "epoch": 1.88, "learning_rate": 9.240770003755312e-05, "loss": 1.4532, "step": 23846 }, { "epoch": 1.88, "learning_rate": 9.239628783428446e-05, "loss": 1.4758, "step": 23847 }, { "epoch": 1.88, "learning_rate": 9.23848760221132e-05, "loss": 1.5103, "step": 23848 }, { "epoch": 1.88, "learning_rate": 9.237346460111687e-05, "loss": 1.4991, "step": 23849 }, { "epoch": 1.88, "learning_rate": 9.236205357137286e-05, "loss": 1.4902, "step": 23850 }, { "epoch": 1.88, "learning_rate": 9.235064293295871e-05, "loss": 1.457, "step": 23851 }, { "epoch": 1.88, "learning_rate": 9.233923268595191e-05, "loss": 1.4968, "step": 23852 }, { "epoch": 1.88, "learning_rate": 9.232782283042992e-05, "loss": 1.4332, "step": 23853 }, { "epoch": 1.88, "learning_rate": 9.231641336647014e-05, "loss": 1.484, "step": 23854 }, { "epoch": 1.88, "learning_rate": 9.230500429415008e-05, "loss": 1.4599, "step": 23855 }, { "epoch": 1.88, "learning_rate": 9.229359561354726e-05, "loss": 1.4621, "step": 23856 }, { "epoch": 1.88, "learning_rate": 9.228218732473904e-05, "loss": 1.4847, "step": 23857 }, { "epoch": 1.88, "learning_rate": 9.227077942780295e-05, "loss": 1.4436, "step": 23858 }, { "epoch": 1.88, "learning_rate": 9.225937192281636e-05, "loss": 1.4831, "step": 23859 }, { "epoch": 1.88, "learning_rate": 9.224796480985678e-05, "loss": 1.5593, "step": 23860 }, { "epoch": 1.88, "learning_rate": 9.223655808900169e-05, "loss": 1.5644, "step": 23861 }, { "epoch": 1.88, "learning_rate": 9.222515176032846e-05, "loss": 1.5173, "step": 23862 }, { "epoch": 1.88, "learning_rate": 9.22137458239146e-05, "loss": 1.4468, "step": 23863 }, { "epoch": 1.88, "learning_rate": 9.220234027983748e-05, "loss": 1.4944, "step": 23864 }, { "epoch": 1.88, "learning_rate": 9.219093512817453e-05, "loss": 1.4428, "step": 23865 }, { "epoch": 1.88, "learning_rate": 9.217953036900327e-05, "loss": 1.5095, "step": 23866 }, { "epoch": 1.88, "learning_rate": 9.21681260024011e-05, "loss": 1.47, "step": 23867 }, { "epoch": 1.88, "learning_rate": 9.215672202844547e-05, "loss": 1.4878, "step": 23868 }, { "epoch": 1.88, "learning_rate": 9.214531844721373e-05, "loss": 1.4404, "step": 23869 }, { "epoch": 1.88, "learning_rate": 9.21339152587834e-05, "loss": 1.5205, "step": 23870 }, { "epoch": 1.88, "learning_rate": 9.212251246323181e-05, "loss": 1.4825, "step": 23871 }, { "epoch": 1.88, "learning_rate": 9.211111006063641e-05, "loss": 1.4892, "step": 23872 }, { "epoch": 1.88, "learning_rate": 9.20997080510747e-05, "loss": 1.495, "step": 23873 }, { "epoch": 1.88, "learning_rate": 9.208830643462395e-05, "loss": 1.5124, "step": 23874 }, { "epoch": 1.88, "learning_rate": 9.207690521136168e-05, "loss": 1.4798, "step": 23875 }, { "epoch": 1.88, "learning_rate": 9.206550438136524e-05, "loss": 1.5016, "step": 23876 }, { "epoch": 1.88, "learning_rate": 9.205410394471205e-05, "loss": 1.5329, "step": 23877 }, { "epoch": 1.88, "learning_rate": 9.204270390147953e-05, "loss": 1.5119, "step": 23878 }, { "epoch": 1.88, "learning_rate": 9.203130425174505e-05, "loss": 1.5135, "step": 23879 }, { "epoch": 1.88, "learning_rate": 9.201990499558604e-05, "loss": 1.4969, "step": 23880 }, { "epoch": 1.88, "learning_rate": 9.200850613307981e-05, "loss": 1.4691, "step": 23881 }, { "epoch": 1.88, "learning_rate": 9.199710766430393e-05, "loss": 1.4822, "step": 23882 }, { "epoch": 1.88, "learning_rate": 9.198570958933561e-05, "loss": 1.5163, "step": 23883 }, { "epoch": 1.88, "learning_rate": 9.197431190825234e-05, "loss": 1.5059, "step": 23884 }, { "epoch": 1.88, "learning_rate": 9.196291462113146e-05, "loss": 1.4289, "step": 23885 }, { "epoch": 1.88, "learning_rate": 9.195151772805036e-05, "loss": 1.5112, "step": 23886 }, { "epoch": 1.88, "learning_rate": 9.194012122908647e-05, "loss": 1.4121, "step": 23887 }, { "epoch": 1.88, "learning_rate": 9.192872512431704e-05, "loss": 1.5058, "step": 23888 }, { "epoch": 1.88, "learning_rate": 9.191732941381957e-05, "loss": 1.4845, "step": 23889 }, { "epoch": 1.88, "learning_rate": 9.190593409767137e-05, "loss": 1.538, "step": 23890 }, { "epoch": 1.88, "learning_rate": 9.189453917594982e-05, "loss": 1.4666, "step": 23891 }, { "epoch": 1.88, "learning_rate": 9.188314464873227e-05, "loss": 1.4324, "step": 23892 }, { "epoch": 1.88, "learning_rate": 9.187175051609609e-05, "loss": 1.4943, "step": 23893 }, { "epoch": 1.88, "learning_rate": 9.186035677811865e-05, "loss": 1.4852, "step": 23894 }, { "epoch": 1.88, "learning_rate": 9.184896343487733e-05, "loss": 1.4973, "step": 23895 }, { "epoch": 1.88, "learning_rate": 9.183757048644943e-05, "loss": 1.476, "step": 23896 }, { "epoch": 1.88, "learning_rate": 9.182617793291231e-05, "loss": 1.556, "step": 23897 }, { "epoch": 1.88, "learning_rate": 9.181478577434336e-05, "loss": 1.504, "step": 23898 }, { "epoch": 1.88, "learning_rate": 9.180339401081993e-05, "loss": 1.4643, "step": 23899 }, { "epoch": 1.88, "learning_rate": 9.17920026424193e-05, "loss": 1.4244, "step": 23900 }, { "epoch": 1.88, "learning_rate": 9.178061166921889e-05, "loss": 1.4973, "step": 23901 }, { "epoch": 1.88, "learning_rate": 9.176922109129597e-05, "loss": 1.4411, "step": 23902 }, { "epoch": 1.88, "learning_rate": 9.175783090872791e-05, "loss": 1.5305, "step": 23903 }, { "epoch": 1.88, "learning_rate": 9.174644112159208e-05, "loss": 1.5078, "step": 23904 }, { "epoch": 1.88, "learning_rate": 9.173505172996573e-05, "loss": 1.4977, "step": 23905 }, { "epoch": 1.88, "learning_rate": 9.172366273392621e-05, "loss": 1.5094, "step": 23906 }, { "epoch": 1.88, "learning_rate": 9.17122741335509e-05, "loss": 1.4453, "step": 23907 }, { "epoch": 1.88, "learning_rate": 9.170088592891704e-05, "loss": 1.5058, "step": 23908 }, { "epoch": 1.88, "learning_rate": 9.1689498120102e-05, "loss": 1.536, "step": 23909 }, { "epoch": 1.88, "learning_rate": 9.167811070718312e-05, "loss": 1.5331, "step": 23910 }, { "epoch": 1.88, "learning_rate": 9.166672369023766e-05, "loss": 1.4465, "step": 23911 }, { "epoch": 1.88, "learning_rate": 9.165533706934293e-05, "loss": 1.4734, "step": 23912 }, { "epoch": 1.88, "learning_rate": 9.164395084457628e-05, "loss": 1.4782, "step": 23913 }, { "epoch": 1.88, "learning_rate": 9.163256501601503e-05, "loss": 1.5023, "step": 23914 }, { "epoch": 1.88, "learning_rate": 9.162117958373643e-05, "loss": 1.4937, "step": 23915 }, { "epoch": 1.88, "learning_rate": 9.160979454781782e-05, "loss": 1.4907, "step": 23916 }, { "epoch": 1.88, "learning_rate": 9.15984099083365e-05, "loss": 1.4839, "step": 23917 }, { "epoch": 1.88, "learning_rate": 9.15870256653697e-05, "loss": 1.5095, "step": 23918 }, { "epoch": 1.88, "learning_rate": 9.15756418189948e-05, "loss": 1.4809, "step": 23919 }, { "epoch": 1.88, "learning_rate": 9.156425836928902e-05, "loss": 1.4629, "step": 23920 }, { "epoch": 1.88, "learning_rate": 9.155287531632972e-05, "loss": 1.4828, "step": 23921 }, { "epoch": 1.88, "learning_rate": 9.15414926601941e-05, "loss": 1.5247, "step": 23922 }, { "epoch": 1.88, "learning_rate": 9.153011040095949e-05, "loss": 1.4758, "step": 23923 }, { "epoch": 1.88, "learning_rate": 9.151872853870319e-05, "loss": 1.475, "step": 23924 }, { "epoch": 1.88, "learning_rate": 9.150734707350243e-05, "loss": 1.5095, "step": 23925 }, { "epoch": 1.88, "learning_rate": 9.14959660054345e-05, "loss": 1.507, "step": 23926 }, { "epoch": 1.88, "learning_rate": 9.148458533457671e-05, "loss": 1.4804, "step": 23927 }, { "epoch": 1.88, "learning_rate": 9.147320506100624e-05, "loss": 1.4402, "step": 23928 }, { "epoch": 1.88, "learning_rate": 9.146182518480041e-05, "loss": 1.4994, "step": 23929 }, { "epoch": 1.88, "learning_rate": 9.145044570603652e-05, "loss": 1.4882, "step": 23930 }, { "epoch": 1.88, "learning_rate": 9.143906662479179e-05, "loss": 1.5402, "step": 23931 }, { "epoch": 1.88, "learning_rate": 9.142768794114348e-05, "loss": 1.473, "step": 23932 }, { "epoch": 1.88, "learning_rate": 9.141630965516886e-05, "loss": 1.4819, "step": 23933 }, { "epoch": 1.88, "learning_rate": 9.140493176694514e-05, "loss": 1.5005, "step": 23934 }, { "epoch": 1.88, "learning_rate": 9.13935542765496e-05, "loss": 1.533, "step": 23935 }, { "epoch": 1.88, "learning_rate": 9.138217718405953e-05, "loss": 1.4831, "step": 23936 }, { "epoch": 1.88, "learning_rate": 9.137080048955206e-05, "loss": 1.489, "step": 23937 }, { "epoch": 1.88, "learning_rate": 9.135942419310453e-05, "loss": 1.5341, "step": 23938 }, { "epoch": 1.88, "learning_rate": 9.134804829479417e-05, "loss": 1.4614, "step": 23939 }, { "epoch": 1.88, "learning_rate": 9.133667279469819e-05, "loss": 1.4967, "step": 23940 }, { "epoch": 1.88, "learning_rate": 9.132529769289382e-05, "loss": 1.4846, "step": 23941 }, { "epoch": 1.88, "learning_rate": 9.131392298945827e-05, "loss": 1.4762, "step": 23942 }, { "epoch": 1.88, "learning_rate": 9.130254868446883e-05, "loss": 1.5195, "step": 23943 }, { "epoch": 1.88, "learning_rate": 9.129117477800264e-05, "loss": 1.5096, "step": 23944 }, { "epoch": 1.88, "learning_rate": 9.127980127013704e-05, "loss": 1.5297, "step": 23945 }, { "epoch": 1.88, "learning_rate": 9.126842816094915e-05, "loss": 1.4609, "step": 23946 }, { "epoch": 1.88, "learning_rate": 9.125705545051622e-05, "loss": 1.4828, "step": 23947 }, { "epoch": 1.88, "learning_rate": 9.124568313891552e-05, "loss": 1.4889, "step": 23948 }, { "epoch": 1.88, "learning_rate": 9.123431122622416e-05, "loss": 1.4879, "step": 23949 }, { "epoch": 1.88, "learning_rate": 9.12229397125194e-05, "loss": 1.4758, "step": 23950 }, { "epoch": 1.88, "learning_rate": 9.121156859787848e-05, "loss": 1.4925, "step": 23951 }, { "epoch": 1.88, "learning_rate": 9.120019788237853e-05, "loss": 1.4751, "step": 23952 }, { "epoch": 1.88, "learning_rate": 9.118882756609681e-05, "loss": 1.491, "step": 23953 }, { "epoch": 1.88, "learning_rate": 9.117745764911049e-05, "loss": 1.4986, "step": 23954 }, { "epoch": 1.88, "learning_rate": 9.116608813149674e-05, "loss": 1.4934, "step": 23955 }, { "epoch": 1.88, "learning_rate": 9.115471901333284e-05, "loss": 1.4749, "step": 23956 }, { "epoch": 1.88, "learning_rate": 9.114335029469588e-05, "loss": 1.5112, "step": 23957 }, { "epoch": 1.89, "learning_rate": 9.113198197566312e-05, "loss": 1.4979, "step": 23958 }, { "epoch": 1.89, "learning_rate": 9.11206140563117e-05, "loss": 1.4843, "step": 23959 }, { "epoch": 1.89, "learning_rate": 9.110924653671879e-05, "loss": 1.484, "step": 23960 }, { "epoch": 1.89, "learning_rate": 9.10978794169616e-05, "loss": 1.4861, "step": 23961 }, { "epoch": 1.89, "learning_rate": 9.108651269711735e-05, "loss": 1.5132, "step": 23962 }, { "epoch": 1.89, "learning_rate": 9.107514637726315e-05, "loss": 1.4995, "step": 23963 }, { "epoch": 1.89, "learning_rate": 9.106378045747617e-05, "loss": 1.5152, "step": 23964 }, { "epoch": 1.89, "learning_rate": 9.105241493783363e-05, "loss": 1.4364, "step": 23965 }, { "epoch": 1.89, "learning_rate": 9.104104981841266e-05, "loss": 1.511, "step": 23966 }, { "epoch": 1.89, "learning_rate": 9.102968509929038e-05, "loss": 1.4797, "step": 23967 }, { "epoch": 1.89, "learning_rate": 9.101832078054406e-05, "loss": 1.4761, "step": 23968 }, { "epoch": 1.89, "learning_rate": 9.100695686225075e-05, "loss": 1.5036, "step": 23969 }, { "epoch": 1.89, "learning_rate": 9.099559334448767e-05, "loss": 1.4583, "step": 23970 }, { "epoch": 1.89, "learning_rate": 9.098423022733194e-05, "loss": 1.5036, "step": 23971 }, { "epoch": 1.89, "learning_rate": 9.097286751086071e-05, "loss": 1.5441, "step": 23972 }, { "epoch": 1.89, "learning_rate": 9.096150519515117e-05, "loss": 1.5074, "step": 23973 }, { "epoch": 1.89, "learning_rate": 9.09501432802804e-05, "loss": 1.5034, "step": 23974 }, { "epoch": 1.89, "learning_rate": 9.093878176632553e-05, "loss": 1.4477, "step": 23975 }, { "epoch": 1.89, "learning_rate": 9.092742065336376e-05, "loss": 1.4769, "step": 23976 }, { "epoch": 1.89, "learning_rate": 9.091605994147226e-05, "loss": 1.5192, "step": 23977 }, { "epoch": 1.89, "learning_rate": 9.090469963072806e-05, "loss": 1.4702, "step": 23978 }, { "epoch": 1.89, "learning_rate": 9.089333972120836e-05, "loss": 1.4311, "step": 23979 }, { "epoch": 1.89, "learning_rate": 9.088198021299026e-05, "loss": 1.5035, "step": 23980 }, { "epoch": 1.89, "learning_rate": 9.087062110615089e-05, "loss": 1.518, "step": 23981 }, { "epoch": 1.89, "learning_rate": 9.085926240076738e-05, "loss": 1.4625, "step": 23982 }, { "epoch": 1.89, "learning_rate": 9.084790409691684e-05, "loss": 1.51, "step": 23983 }, { "epoch": 1.89, "learning_rate": 9.083654619467637e-05, "loss": 1.4675, "step": 23984 }, { "epoch": 1.89, "learning_rate": 9.082518869412314e-05, "loss": 1.4465, "step": 23985 }, { "epoch": 1.89, "learning_rate": 9.081383159533419e-05, "loss": 1.4992, "step": 23986 }, { "epoch": 1.89, "learning_rate": 9.080247489838668e-05, "loss": 1.4512, "step": 23987 }, { "epoch": 1.89, "learning_rate": 9.079111860335769e-05, "loss": 1.4538, "step": 23988 }, { "epoch": 1.89, "learning_rate": 9.077976271032431e-05, "loss": 1.5056, "step": 23989 }, { "epoch": 1.89, "learning_rate": 9.076840721936371e-05, "loss": 1.4619, "step": 23990 }, { "epoch": 1.89, "learning_rate": 9.075705213055286e-05, "loss": 1.4871, "step": 23991 }, { "epoch": 1.89, "learning_rate": 9.074569744396896e-05, "loss": 1.4958, "step": 23992 }, { "epoch": 1.89, "learning_rate": 9.07343431596891e-05, "loss": 1.4515, "step": 23993 }, { "epoch": 1.89, "learning_rate": 9.072298927779036e-05, "loss": 1.4322, "step": 23994 }, { "epoch": 1.89, "learning_rate": 9.071163579834977e-05, "loss": 1.4871, "step": 23995 }, { "epoch": 1.89, "learning_rate": 9.070028272144448e-05, "loss": 1.4984, "step": 23996 }, { "epoch": 1.89, "learning_rate": 9.068893004715155e-05, "loss": 1.4409, "step": 23997 }, { "epoch": 1.89, "learning_rate": 9.067757777554805e-05, "loss": 1.4564, "step": 23998 }, { "epoch": 1.89, "learning_rate": 9.066622590671108e-05, "loss": 1.4936, "step": 23999 }, { "epoch": 1.89, "learning_rate": 9.065487444071766e-05, "loss": 1.4891, "step": 24000 }, { "epoch": 1.89, "learning_rate": 9.064352337764487e-05, "loss": 1.5119, "step": 24001 }, { "epoch": 1.89, "learning_rate": 9.063217271756986e-05, "loss": 1.4685, "step": 24002 }, { "epoch": 1.89, "learning_rate": 9.062082246056962e-05, "loss": 1.4967, "step": 24003 }, { "epoch": 1.89, "learning_rate": 9.060947260672123e-05, "loss": 1.5252, "step": 24004 }, { "epoch": 1.89, "learning_rate": 9.05981231561017e-05, "loss": 1.473, "step": 24005 }, { "epoch": 1.89, "learning_rate": 9.058677410878818e-05, "loss": 1.4425, "step": 24006 }, { "epoch": 1.89, "learning_rate": 9.057542546485762e-05, "loss": 1.5045, "step": 24007 }, { "epoch": 1.89, "learning_rate": 9.056407722438716e-05, "loss": 1.4706, "step": 24008 }, { "epoch": 1.89, "learning_rate": 9.055272938745385e-05, "loss": 1.4383, "step": 24009 }, { "epoch": 1.89, "learning_rate": 9.054138195413467e-05, "loss": 1.497, "step": 24010 }, { "epoch": 1.89, "learning_rate": 9.053003492450672e-05, "loss": 1.5409, "step": 24011 }, { "epoch": 1.89, "learning_rate": 9.051868829864698e-05, "loss": 1.4933, "step": 24012 }, { "epoch": 1.89, "learning_rate": 9.050734207663253e-05, "loss": 1.5171, "step": 24013 }, { "epoch": 1.89, "learning_rate": 9.049599625854043e-05, "loss": 1.5332, "step": 24014 }, { "epoch": 1.89, "learning_rate": 9.048465084444765e-05, "loss": 1.4475, "step": 24015 }, { "epoch": 1.89, "learning_rate": 9.047330583443127e-05, "loss": 1.4653, "step": 24016 }, { "epoch": 1.89, "learning_rate": 9.046196122856827e-05, "loss": 1.4629, "step": 24017 }, { "epoch": 1.89, "learning_rate": 9.04506170269357e-05, "loss": 1.4827, "step": 24018 }, { "epoch": 1.89, "learning_rate": 9.043927322961059e-05, "loss": 1.4931, "step": 24019 }, { "epoch": 1.89, "learning_rate": 9.042792983666993e-05, "loss": 1.4209, "step": 24020 }, { "epoch": 1.89, "learning_rate": 9.041658684819074e-05, "loss": 1.516, "step": 24021 }, { "epoch": 1.89, "learning_rate": 9.040524426425003e-05, "loss": 1.476, "step": 24022 }, { "epoch": 1.89, "learning_rate": 9.039390208492488e-05, "loss": 1.4628, "step": 24023 }, { "epoch": 1.89, "learning_rate": 9.038256031029221e-05, "loss": 1.4772, "step": 24024 }, { "epoch": 1.89, "learning_rate": 9.037121894042905e-05, "loss": 1.4913, "step": 24025 }, { "epoch": 1.89, "learning_rate": 9.035987797541246e-05, "loss": 1.5127, "step": 24026 }, { "epoch": 1.89, "learning_rate": 9.034853741531933e-05, "loss": 1.5762, "step": 24027 }, { "epoch": 1.89, "learning_rate": 9.033719726022676e-05, "loss": 1.4936, "step": 24028 }, { "epoch": 1.89, "learning_rate": 9.032585751021166e-05, "loss": 1.4939, "step": 24029 }, { "epoch": 1.89, "learning_rate": 9.031451816535106e-05, "loss": 1.4577, "step": 24030 }, { "epoch": 1.89, "learning_rate": 9.030317922572196e-05, "loss": 1.5092, "step": 24031 }, { "epoch": 1.89, "learning_rate": 9.029184069140131e-05, "loss": 1.4612, "step": 24032 }, { "epoch": 1.89, "learning_rate": 9.028050256246615e-05, "loss": 1.5588, "step": 24033 }, { "epoch": 1.89, "learning_rate": 9.026916483899338e-05, "loss": 1.4946, "step": 24034 }, { "epoch": 1.89, "learning_rate": 9.025782752106002e-05, "loss": 1.4503, "step": 24035 }, { "epoch": 1.89, "learning_rate": 9.024649060874309e-05, "loss": 1.4781, "step": 24036 }, { "epoch": 1.89, "learning_rate": 9.023515410211944e-05, "loss": 1.4777, "step": 24037 }, { "epoch": 1.89, "learning_rate": 9.022381800126612e-05, "loss": 1.5185, "step": 24038 }, { "epoch": 1.89, "learning_rate": 9.021248230626013e-05, "loss": 1.445, "step": 24039 }, { "epoch": 1.89, "learning_rate": 9.020114701717839e-05, "loss": 1.4879, "step": 24040 }, { "epoch": 1.89, "learning_rate": 9.018981213409785e-05, "loss": 1.4154, "step": 24041 }, { "epoch": 1.89, "learning_rate": 9.017847765709545e-05, "loss": 1.4389, "step": 24042 }, { "epoch": 1.89, "learning_rate": 9.016714358624824e-05, "loss": 1.5091, "step": 24043 }, { "epoch": 1.89, "learning_rate": 9.015580992163306e-05, "loss": 1.4793, "step": 24044 }, { "epoch": 1.89, "learning_rate": 9.014447666332694e-05, "loss": 1.4628, "step": 24045 }, { "epoch": 1.89, "learning_rate": 9.013314381140677e-05, "loss": 1.4901, "step": 24046 }, { "epoch": 1.89, "learning_rate": 9.01218113659495e-05, "loss": 1.4701, "step": 24047 }, { "epoch": 1.89, "learning_rate": 9.011047932703213e-05, "loss": 1.5002, "step": 24048 }, { "epoch": 1.89, "learning_rate": 9.009914769473153e-05, "loss": 1.5172, "step": 24049 }, { "epoch": 1.89, "learning_rate": 9.008781646912466e-05, "loss": 1.4886, "step": 24050 }, { "epoch": 1.89, "learning_rate": 9.007648565028845e-05, "loss": 1.4519, "step": 24051 }, { "epoch": 1.89, "learning_rate": 9.006515523829985e-05, "loss": 1.4335, "step": 24052 }, { "epoch": 1.89, "learning_rate": 9.005382523323576e-05, "loss": 1.5332, "step": 24053 }, { "epoch": 1.89, "learning_rate": 9.004249563517306e-05, "loss": 1.5175, "step": 24054 }, { "epoch": 1.89, "learning_rate": 9.00311664441888e-05, "loss": 1.4868, "step": 24055 }, { "epoch": 1.89, "learning_rate": 9.001983766035981e-05, "loss": 1.5179, "step": 24056 }, { "epoch": 1.89, "learning_rate": 9.000850928376304e-05, "loss": 1.4798, "step": 24057 }, { "epoch": 1.89, "learning_rate": 8.999718131447536e-05, "loss": 1.4414, "step": 24058 }, { "epoch": 1.89, "learning_rate": 8.998585375257371e-05, "loss": 1.5221, "step": 24059 }, { "epoch": 1.89, "learning_rate": 8.997452659813501e-05, "loss": 1.5341, "step": 24060 }, { "epoch": 1.89, "learning_rate": 8.996319985123612e-05, "loss": 1.4804, "step": 24061 }, { "epoch": 1.89, "learning_rate": 8.995187351195399e-05, "loss": 1.4423, "step": 24062 }, { "epoch": 1.89, "learning_rate": 8.994054758036553e-05, "loss": 1.4869, "step": 24063 }, { "epoch": 1.89, "learning_rate": 8.992922205654757e-05, "loss": 1.4883, "step": 24064 }, { "epoch": 1.89, "learning_rate": 8.991789694057707e-05, "loss": 1.5262, "step": 24065 }, { "epoch": 1.89, "learning_rate": 8.990657223253088e-05, "loss": 1.5153, "step": 24066 }, { "epoch": 1.89, "learning_rate": 8.98952479324859e-05, "loss": 1.4889, "step": 24067 }, { "epoch": 1.89, "learning_rate": 8.988392404051902e-05, "loss": 1.5229, "step": 24068 }, { "epoch": 1.89, "learning_rate": 8.987260055670712e-05, "loss": 1.4873, "step": 24069 }, { "epoch": 1.89, "learning_rate": 8.986127748112704e-05, "loss": 1.4684, "step": 24070 }, { "epoch": 1.89, "learning_rate": 8.984995481385573e-05, "loss": 1.4908, "step": 24071 }, { "epoch": 1.89, "learning_rate": 8.983863255497005e-05, "loss": 1.4888, "step": 24072 }, { "epoch": 1.89, "learning_rate": 8.982731070454684e-05, "loss": 1.4786, "step": 24073 }, { "epoch": 1.89, "learning_rate": 8.981598926266302e-05, "loss": 1.4742, "step": 24074 }, { "epoch": 1.89, "learning_rate": 8.980466822939537e-05, "loss": 1.4877, "step": 24075 }, { "epoch": 1.89, "learning_rate": 8.979334760482082e-05, "loss": 1.4301, "step": 24076 }, { "epoch": 1.89, "learning_rate": 8.978202738901624e-05, "loss": 1.4516, "step": 24077 }, { "epoch": 1.89, "learning_rate": 8.977070758205845e-05, "loss": 1.471, "step": 24078 }, { "epoch": 1.89, "learning_rate": 8.975938818402428e-05, "loss": 1.4707, "step": 24079 }, { "epoch": 1.89, "learning_rate": 8.974806919499069e-05, "loss": 1.4295, "step": 24080 }, { "epoch": 1.89, "learning_rate": 8.97367506150344e-05, "loss": 1.4508, "step": 24081 }, { "epoch": 1.89, "learning_rate": 8.972543244423236e-05, "loss": 1.4577, "step": 24082 }, { "epoch": 1.89, "learning_rate": 8.971411468266136e-05, "loss": 1.4563, "step": 24083 }, { "epoch": 1.89, "learning_rate": 8.970279733039823e-05, "loss": 1.4694, "step": 24084 }, { "epoch": 1.9, "learning_rate": 8.969148038751981e-05, "loss": 1.4914, "step": 24085 }, { "epoch": 1.9, "learning_rate": 8.968016385410301e-05, "loss": 1.5038, "step": 24086 }, { "epoch": 1.9, "learning_rate": 8.966884773022458e-05, "loss": 1.4647, "step": 24087 }, { "epoch": 1.9, "learning_rate": 8.96575320159614e-05, "loss": 1.4883, "step": 24088 }, { "epoch": 1.9, "learning_rate": 8.964621671139029e-05, "loss": 1.4838, "step": 24089 }, { "epoch": 1.9, "learning_rate": 8.963490181658803e-05, "loss": 1.5443, "step": 24090 }, { "epoch": 1.9, "learning_rate": 8.962358733163148e-05, "loss": 1.4505, "step": 24091 }, { "epoch": 1.9, "learning_rate": 8.961227325659748e-05, "loss": 1.4497, "step": 24092 }, { "epoch": 1.9, "learning_rate": 8.96009595915628e-05, "loss": 1.4848, "step": 24093 }, { "epoch": 1.9, "learning_rate": 8.958964633660429e-05, "loss": 1.5056, "step": 24094 }, { "epoch": 1.9, "learning_rate": 8.957833349179871e-05, "loss": 1.5048, "step": 24095 }, { "epoch": 1.9, "learning_rate": 8.956702105722293e-05, "loss": 1.5127, "step": 24096 }, { "epoch": 1.9, "learning_rate": 8.955570903295373e-05, "loss": 1.4919, "step": 24097 }, { "epoch": 1.9, "learning_rate": 8.95443974190679e-05, "loss": 1.4467, "step": 24098 }, { "epoch": 1.9, "learning_rate": 8.953308621564226e-05, "loss": 1.4803, "step": 24099 }, { "epoch": 1.9, "learning_rate": 8.952177542275357e-05, "loss": 1.492, "step": 24100 }, { "epoch": 1.9, "learning_rate": 8.951046504047863e-05, "loss": 1.4445, "step": 24101 }, { "epoch": 1.9, "learning_rate": 8.949915506889428e-05, "loss": 1.5179, "step": 24102 }, { "epoch": 1.9, "learning_rate": 8.948784550807731e-05, "loss": 1.5102, "step": 24103 }, { "epoch": 1.9, "learning_rate": 8.947653635810444e-05, "loss": 1.4911, "step": 24104 }, { "epoch": 1.9, "learning_rate": 8.946522761905248e-05, "loss": 1.5527, "step": 24105 }, { "epoch": 1.9, "learning_rate": 8.945391929099828e-05, "loss": 1.4633, "step": 24106 }, { "epoch": 1.9, "learning_rate": 8.94426113740185e-05, "loss": 1.4792, "step": 24107 }, { "epoch": 1.9, "learning_rate": 8.943130386818999e-05, "loss": 1.5127, "step": 24108 }, { "epoch": 1.9, "learning_rate": 8.94199967735895e-05, "loss": 1.5, "step": 24109 }, { "epoch": 1.9, "learning_rate": 8.94086900902938e-05, "loss": 1.5141, "step": 24110 }, { "epoch": 1.9, "learning_rate": 8.939738381837966e-05, "loss": 1.4688, "step": 24111 }, { "epoch": 1.9, "learning_rate": 8.938607795792384e-05, "loss": 1.4375, "step": 24112 }, { "epoch": 1.9, "learning_rate": 8.937477250900308e-05, "loss": 1.4993, "step": 24113 }, { "epoch": 1.9, "learning_rate": 8.93634674716942e-05, "loss": 1.4501, "step": 24114 }, { "epoch": 1.9, "learning_rate": 8.935216284607389e-05, "loss": 1.5125, "step": 24115 }, { "epoch": 1.9, "learning_rate": 8.934085863221894e-05, "loss": 1.5187, "step": 24116 }, { "epoch": 1.9, "learning_rate": 8.9329554830206e-05, "loss": 1.4809, "step": 24117 }, { "epoch": 1.9, "learning_rate": 8.9318251440112e-05, "loss": 1.4737, "step": 24118 }, { "epoch": 1.9, "learning_rate": 8.930694846201355e-05, "loss": 1.5312, "step": 24119 }, { "epoch": 1.9, "learning_rate": 8.929564589598743e-05, "loss": 1.5136, "step": 24120 }, { "epoch": 1.9, "learning_rate": 8.928434374211039e-05, "loss": 1.4486, "step": 24121 }, { "epoch": 1.9, "learning_rate": 8.927304200045915e-05, "loss": 1.4801, "step": 24122 }, { "epoch": 1.9, "learning_rate": 8.926174067111043e-05, "loss": 1.4748, "step": 24123 }, { "epoch": 1.9, "learning_rate": 8.9250439754141e-05, "loss": 1.5004, "step": 24124 }, { "epoch": 1.9, "learning_rate": 8.923913924962751e-05, "loss": 1.4864, "step": 24125 }, { "epoch": 1.9, "learning_rate": 8.922783915764678e-05, "loss": 1.4961, "step": 24126 }, { "epoch": 1.9, "learning_rate": 8.921653947827545e-05, "loss": 1.4617, "step": 24127 }, { "epoch": 1.9, "learning_rate": 8.920524021159031e-05, "loss": 1.5361, "step": 24128 }, { "epoch": 1.9, "learning_rate": 8.919394135766803e-05, "loss": 1.4682, "step": 24129 }, { "epoch": 1.9, "learning_rate": 8.918264291658531e-05, "loss": 1.5132, "step": 24130 }, { "epoch": 1.9, "learning_rate": 8.917134488841891e-05, "loss": 1.513, "step": 24131 }, { "epoch": 1.9, "learning_rate": 8.916004727324545e-05, "loss": 1.4824, "step": 24132 }, { "epoch": 1.9, "learning_rate": 8.914875007114173e-05, "loss": 1.4616, "step": 24133 }, { "epoch": 1.9, "learning_rate": 8.913745328218444e-05, "loss": 1.504, "step": 24134 }, { "epoch": 1.9, "learning_rate": 8.912615690645024e-05, "loss": 1.466, "step": 24135 }, { "epoch": 1.9, "learning_rate": 8.911486094401584e-05, "loss": 1.4754, "step": 24136 }, { "epoch": 1.9, "learning_rate": 8.910356539495792e-05, "loss": 1.5432, "step": 24137 }, { "epoch": 1.9, "learning_rate": 8.909227025935323e-05, "loss": 1.4662, "step": 24138 }, { "epoch": 1.9, "learning_rate": 8.908097553727838e-05, "loss": 1.4872, "step": 24139 }, { "epoch": 1.9, "learning_rate": 8.906968122881013e-05, "loss": 1.5041, "step": 24140 }, { "epoch": 1.9, "learning_rate": 8.905838733402507e-05, "loss": 1.5077, "step": 24141 }, { "epoch": 1.9, "learning_rate": 8.904709385299993e-05, "loss": 1.4851, "step": 24142 }, { "epoch": 1.9, "learning_rate": 8.903580078581142e-05, "loss": 1.4696, "step": 24143 }, { "epoch": 1.9, "learning_rate": 8.902450813253615e-05, "loss": 1.4654, "step": 24144 }, { "epoch": 1.9, "learning_rate": 8.901321589325082e-05, "loss": 1.5286, "step": 24145 }, { "epoch": 1.9, "learning_rate": 8.900192406803215e-05, "loss": 1.516, "step": 24146 }, { "epoch": 1.9, "learning_rate": 8.89906326569567e-05, "loss": 1.5013, "step": 24147 }, { "epoch": 1.9, "learning_rate": 8.897934166010116e-05, "loss": 1.476, "step": 24148 }, { "epoch": 1.9, "learning_rate": 8.896805107754225e-05, "loss": 1.474, "step": 24149 }, { "epoch": 1.9, "learning_rate": 8.895676090935662e-05, "loss": 1.57, "step": 24150 }, { "epoch": 1.9, "learning_rate": 8.894547115562088e-05, "loss": 1.5029, "step": 24151 }, { "epoch": 1.9, "learning_rate": 8.893418181641171e-05, "loss": 1.4511, "step": 24152 }, { "epoch": 1.9, "learning_rate": 8.892289289180573e-05, "loss": 1.502, "step": 24153 }, { "epoch": 1.9, "learning_rate": 8.891160438187957e-05, "loss": 1.4996, "step": 24154 }, { "epoch": 1.9, "learning_rate": 8.890031628670998e-05, "loss": 1.4952, "step": 24155 }, { "epoch": 1.9, "learning_rate": 8.888902860637346e-05, "loss": 1.5299, "step": 24156 }, { "epoch": 1.9, "learning_rate": 8.887774134094677e-05, "loss": 1.488, "step": 24157 }, { "epoch": 1.9, "learning_rate": 8.886645449050643e-05, "loss": 1.4931, "step": 24158 }, { "epoch": 1.9, "learning_rate": 8.885516805512914e-05, "loss": 1.4803, "step": 24159 }, { "epoch": 1.9, "learning_rate": 8.884388203489157e-05, "loss": 1.4876, "step": 24160 }, { "epoch": 1.9, "learning_rate": 8.883259642987023e-05, "loss": 1.4319, "step": 24161 }, { "epoch": 1.9, "learning_rate": 8.88213112401418e-05, "loss": 1.4927, "step": 24162 }, { "epoch": 1.9, "learning_rate": 8.881002646578297e-05, "loss": 1.4841, "step": 24163 }, { "epoch": 1.9, "learning_rate": 8.879874210687022e-05, "loss": 1.4905, "step": 24164 }, { "epoch": 1.9, "learning_rate": 8.878745816348025e-05, "loss": 1.4925, "step": 24165 }, { "epoch": 1.9, "learning_rate": 8.877617463568966e-05, "loss": 1.4587, "step": 24166 }, { "epoch": 1.9, "learning_rate": 8.87648915235751e-05, "loss": 1.4487, "step": 24167 }, { "epoch": 1.9, "learning_rate": 8.875360882721311e-05, "loss": 1.4251, "step": 24168 }, { "epoch": 1.9, "learning_rate": 8.874232654668033e-05, "loss": 1.5304, "step": 24169 }, { "epoch": 1.9, "learning_rate": 8.873104468205335e-05, "loss": 1.5663, "step": 24170 }, { "epoch": 1.9, "learning_rate": 8.871976323340873e-05, "loss": 1.525, "step": 24171 }, { "epoch": 1.9, "learning_rate": 8.870848220082314e-05, "loss": 1.5112, "step": 24172 }, { "epoch": 1.9, "learning_rate": 8.86972015843731e-05, "loss": 1.4883, "step": 24173 }, { "epoch": 1.9, "learning_rate": 8.868592138413524e-05, "loss": 1.4824, "step": 24174 }, { "epoch": 1.9, "learning_rate": 8.867464160018617e-05, "loss": 1.5145, "step": 24175 }, { "epoch": 1.9, "learning_rate": 8.866336223260242e-05, "loss": 1.4521, "step": 24176 }, { "epoch": 1.9, "learning_rate": 8.865208328146059e-05, "loss": 1.4846, "step": 24177 }, { "epoch": 1.9, "learning_rate": 8.864080474683726e-05, "loss": 1.5179, "step": 24178 }, { "epoch": 1.9, "learning_rate": 8.8629526628809e-05, "loss": 1.523, "step": 24179 }, { "epoch": 1.9, "learning_rate": 8.861824892745235e-05, "loss": 1.4261, "step": 24180 }, { "epoch": 1.9, "learning_rate": 8.860697164284397e-05, "loss": 1.4949, "step": 24181 }, { "epoch": 1.9, "learning_rate": 8.859569477506035e-05, "loss": 1.5082, "step": 24182 }, { "epoch": 1.9, "learning_rate": 8.858441832417809e-05, "loss": 1.5369, "step": 24183 }, { "epoch": 1.9, "learning_rate": 8.857314229027374e-05, "loss": 1.505, "step": 24184 }, { "epoch": 1.9, "learning_rate": 8.856186667342383e-05, "loss": 1.5105, "step": 24185 }, { "epoch": 1.9, "learning_rate": 8.8550591473705e-05, "loss": 1.4519, "step": 24186 }, { "epoch": 1.9, "learning_rate": 8.85393166911937e-05, "loss": 1.4614, "step": 24187 }, { "epoch": 1.9, "learning_rate": 8.852804232596652e-05, "loss": 1.4924, "step": 24188 }, { "epoch": 1.9, "learning_rate": 8.851676837810003e-05, "loss": 1.5013, "step": 24189 }, { "epoch": 1.9, "learning_rate": 8.850549484767073e-05, "loss": 1.5413, "step": 24190 }, { "epoch": 1.9, "learning_rate": 8.849422173475519e-05, "loss": 1.5119, "step": 24191 }, { "epoch": 1.9, "learning_rate": 8.848294903942997e-05, "loss": 1.4676, "step": 24192 }, { "epoch": 1.9, "learning_rate": 8.847167676177154e-05, "loss": 1.49, "step": 24193 }, { "epoch": 1.9, "learning_rate": 8.84604049018565e-05, "loss": 1.4887, "step": 24194 }, { "epoch": 1.9, "learning_rate": 8.844913345976127e-05, "loss": 1.4882, "step": 24195 }, { "epoch": 1.9, "learning_rate": 8.843786243556256e-05, "loss": 1.482, "step": 24196 }, { "epoch": 1.9, "learning_rate": 8.842659182933673e-05, "loss": 1.4918, "step": 24197 }, { "epoch": 1.9, "learning_rate": 8.841532164116041e-05, "loss": 1.4517, "step": 24198 }, { "epoch": 1.9, "learning_rate": 8.840405187111004e-05, "loss": 1.4837, "step": 24199 }, { "epoch": 1.9, "learning_rate": 8.839278251926217e-05, "loss": 1.4377, "step": 24200 }, { "epoch": 1.9, "learning_rate": 8.838151358569333e-05, "loss": 1.427, "step": 24201 }, { "epoch": 1.9, "learning_rate": 8.837024507047999e-05, "loss": 1.5423, "step": 24202 }, { "epoch": 1.9, "learning_rate": 8.835897697369866e-05, "loss": 1.4865, "step": 24203 }, { "epoch": 1.9, "learning_rate": 8.83477092954259e-05, "loss": 1.4584, "step": 24204 }, { "epoch": 1.9, "learning_rate": 8.833644203573815e-05, "loss": 1.4953, "step": 24205 }, { "epoch": 1.9, "learning_rate": 8.832517519471195e-05, "loss": 1.4728, "step": 24206 }, { "epoch": 1.9, "learning_rate": 8.831390877242375e-05, "loss": 1.477, "step": 24207 }, { "epoch": 1.9, "learning_rate": 8.830264276895005e-05, "loss": 1.4474, "step": 24208 }, { "epoch": 1.9, "learning_rate": 8.829137718436741e-05, "loss": 1.4784, "step": 24209 }, { "epoch": 1.9, "learning_rate": 8.828011201875224e-05, "loss": 1.4759, "step": 24210 }, { "epoch": 1.9, "learning_rate": 8.826884727218099e-05, "loss": 1.4727, "step": 24211 }, { "epoch": 1.91, "learning_rate": 8.825758294473025e-05, "loss": 1.4902, "step": 24212 }, { "epoch": 1.91, "learning_rate": 8.824631903647647e-05, "loss": 1.5376, "step": 24213 }, { "epoch": 1.91, "learning_rate": 8.823505554749608e-05, "loss": 1.4215, "step": 24214 }, { "epoch": 1.91, "learning_rate": 8.822379247786562e-05, "loss": 1.4649, "step": 24215 }, { "epoch": 1.91, "learning_rate": 8.821252982766148e-05, "loss": 1.4872, "step": 24216 }, { "epoch": 1.91, "learning_rate": 8.820126759696017e-05, "loss": 1.4778, "step": 24217 }, { "epoch": 1.91, "learning_rate": 8.819000578583817e-05, "loss": 1.5351, "step": 24218 }, { "epoch": 1.91, "learning_rate": 8.81787443943719e-05, "loss": 1.4541, "step": 24219 }, { "epoch": 1.91, "learning_rate": 8.816748342263783e-05, "loss": 1.553, "step": 24220 }, { "epoch": 1.91, "learning_rate": 8.815622287071247e-05, "loss": 1.4637, "step": 24221 }, { "epoch": 1.91, "learning_rate": 8.814496273867219e-05, "loss": 1.519, "step": 24222 }, { "epoch": 1.91, "learning_rate": 8.81337030265935e-05, "loss": 1.4798, "step": 24223 }, { "epoch": 1.91, "learning_rate": 8.81224437345528e-05, "loss": 1.4856, "step": 24224 }, { "epoch": 1.91, "learning_rate": 8.811118486262656e-05, "loss": 1.444, "step": 24225 }, { "epoch": 1.91, "learning_rate": 8.809992641089126e-05, "loss": 1.5221, "step": 24226 }, { "epoch": 1.91, "learning_rate": 8.808866837942325e-05, "loss": 1.4696, "step": 24227 }, { "epoch": 1.91, "learning_rate": 8.8077410768299e-05, "loss": 1.533, "step": 24228 }, { "epoch": 1.91, "learning_rate": 8.8066153577595e-05, "loss": 1.4718, "step": 24229 }, { "epoch": 1.91, "learning_rate": 8.805489680738766e-05, "loss": 1.488, "step": 24230 }, { "epoch": 1.91, "learning_rate": 8.804364045775337e-05, "loss": 1.4706, "step": 24231 }, { "epoch": 1.91, "learning_rate": 8.803238452876857e-05, "loss": 1.4831, "step": 24232 }, { "epoch": 1.91, "learning_rate": 8.802112902050968e-05, "loss": 1.4621, "step": 24233 }, { "epoch": 1.91, "learning_rate": 8.800987393305311e-05, "loss": 1.5091, "step": 24234 }, { "epoch": 1.91, "learning_rate": 8.799861926647532e-05, "loss": 1.5367, "step": 24235 }, { "epoch": 1.91, "learning_rate": 8.798736502085265e-05, "loss": 1.4395, "step": 24236 }, { "epoch": 1.91, "learning_rate": 8.797611119626156e-05, "loss": 1.4836, "step": 24237 }, { "epoch": 1.91, "learning_rate": 8.796485779277849e-05, "loss": 1.4785, "step": 24238 }, { "epoch": 1.91, "learning_rate": 8.795360481047975e-05, "loss": 1.4857, "step": 24239 }, { "epoch": 1.91, "learning_rate": 8.794235224944183e-05, "loss": 1.5083, "step": 24240 }, { "epoch": 1.91, "learning_rate": 8.793110010974108e-05, "loss": 1.4951, "step": 24241 }, { "epoch": 1.91, "learning_rate": 8.791984839145385e-05, "loss": 1.4795, "step": 24242 }, { "epoch": 1.91, "learning_rate": 8.790859709465664e-05, "loss": 1.5029, "step": 24243 }, { "epoch": 1.91, "learning_rate": 8.789734621942578e-05, "loss": 1.5129, "step": 24244 }, { "epoch": 1.91, "learning_rate": 8.788609576583769e-05, "loss": 1.4797, "step": 24245 }, { "epoch": 1.91, "learning_rate": 8.787484573396873e-05, "loss": 1.5111, "step": 24246 }, { "epoch": 1.91, "learning_rate": 8.786359612389528e-05, "loss": 1.5351, "step": 24247 }, { "epoch": 1.91, "learning_rate": 8.785234693569371e-05, "loss": 1.4886, "step": 24248 }, { "epoch": 1.91, "learning_rate": 8.78410981694404e-05, "loss": 1.4581, "step": 24249 }, { "epoch": 1.91, "learning_rate": 8.782984982521178e-05, "loss": 1.4729, "step": 24250 }, { "epoch": 1.91, "learning_rate": 8.781860190308414e-05, "loss": 1.4775, "step": 24251 }, { "epoch": 1.91, "learning_rate": 8.78073544031339e-05, "loss": 1.4553, "step": 24252 }, { "epoch": 1.91, "learning_rate": 8.779610732543735e-05, "loss": 1.5403, "step": 24253 }, { "epoch": 1.91, "learning_rate": 8.778486067007094e-05, "loss": 1.468, "step": 24254 }, { "epoch": 1.91, "learning_rate": 8.777361443711101e-05, "loss": 1.4837, "step": 24255 }, { "epoch": 1.91, "learning_rate": 8.776236862663386e-05, "loss": 1.4533, "step": 24256 }, { "epoch": 1.91, "learning_rate": 8.77511232387159e-05, "loss": 1.4878, "step": 24257 }, { "epoch": 1.91, "learning_rate": 8.773987827343341e-05, "loss": 1.515, "step": 24258 }, { "epoch": 1.91, "learning_rate": 8.772863373086287e-05, "loss": 1.4717, "step": 24259 }, { "epoch": 1.91, "learning_rate": 8.77173896110805e-05, "loss": 1.4985, "step": 24260 }, { "epoch": 1.91, "learning_rate": 8.770614591416269e-05, "loss": 1.4528, "step": 24261 }, { "epoch": 1.91, "learning_rate": 8.769490264018579e-05, "loss": 1.45, "step": 24262 }, { "epoch": 1.91, "learning_rate": 8.76836597892261e-05, "loss": 1.4852, "step": 24263 }, { "epoch": 1.91, "learning_rate": 8.767241736136e-05, "loss": 1.5282, "step": 24264 }, { "epoch": 1.91, "learning_rate": 8.766117535666376e-05, "loss": 1.4585, "step": 24265 }, { "epoch": 1.91, "learning_rate": 8.764993377521374e-05, "loss": 1.4559, "step": 24266 }, { "epoch": 1.91, "learning_rate": 8.763869261708629e-05, "loss": 1.4526, "step": 24267 }, { "epoch": 1.91, "learning_rate": 8.762745188235766e-05, "loss": 1.483, "step": 24268 }, { "epoch": 1.91, "learning_rate": 8.761621157110426e-05, "loss": 1.4916, "step": 24269 }, { "epoch": 1.91, "learning_rate": 8.760497168340232e-05, "loss": 1.4741, "step": 24270 }, { "epoch": 1.91, "learning_rate": 8.759373221932819e-05, "loss": 1.5096, "step": 24271 }, { "epoch": 1.91, "learning_rate": 8.758249317895822e-05, "loss": 1.513, "step": 24272 }, { "epoch": 1.91, "learning_rate": 8.757125456236863e-05, "loss": 1.4871, "step": 24273 }, { "epoch": 1.91, "learning_rate": 8.756001636963576e-05, "loss": 1.4279, "step": 24274 }, { "epoch": 1.91, "learning_rate": 8.754877860083597e-05, "loss": 1.5045, "step": 24275 }, { "epoch": 1.91, "learning_rate": 8.753754125604543e-05, "loss": 1.4854, "step": 24276 }, { "epoch": 1.91, "learning_rate": 8.752630433534061e-05, "loss": 1.4405, "step": 24277 }, { "epoch": 1.91, "learning_rate": 8.75150678387977e-05, "loss": 1.5058, "step": 24278 }, { "epoch": 1.91, "learning_rate": 8.750383176649291e-05, "loss": 1.4845, "step": 24279 }, { "epoch": 1.91, "learning_rate": 8.749259611850269e-05, "loss": 1.4817, "step": 24280 }, { "epoch": 1.91, "learning_rate": 8.748136089490325e-05, "loss": 1.4792, "step": 24281 }, { "epoch": 1.91, "learning_rate": 8.747012609577082e-05, "loss": 1.5027, "step": 24282 }, { "epoch": 1.91, "learning_rate": 8.745889172118177e-05, "loss": 1.5188, "step": 24283 }, { "epoch": 1.91, "learning_rate": 8.744765777121235e-05, "loss": 1.4977, "step": 24284 }, { "epoch": 1.91, "learning_rate": 8.74364242459388e-05, "loss": 1.5101, "step": 24285 }, { "epoch": 1.91, "learning_rate": 8.742519114543735e-05, "loss": 1.4758, "step": 24286 }, { "epoch": 1.91, "learning_rate": 8.741395846978439e-05, "loss": 1.4678, "step": 24287 }, { "epoch": 1.91, "learning_rate": 8.74027262190561e-05, "loss": 1.5102, "step": 24288 }, { "epoch": 1.91, "learning_rate": 8.739149439332868e-05, "loss": 1.4579, "step": 24289 }, { "epoch": 1.91, "learning_rate": 8.738026299267849e-05, "loss": 1.4929, "step": 24290 }, { "epoch": 1.91, "learning_rate": 8.736903201718179e-05, "loss": 1.4606, "step": 24291 }, { "epoch": 1.91, "learning_rate": 8.735780146691485e-05, "loss": 1.4884, "step": 24292 }, { "epoch": 1.91, "learning_rate": 8.734657134195376e-05, "loss": 1.5173, "step": 24293 }, { "epoch": 1.91, "learning_rate": 8.733534164237496e-05, "loss": 1.5334, "step": 24294 }, { "epoch": 1.91, "learning_rate": 8.73241123682546e-05, "loss": 1.4909, "step": 24295 }, { "epoch": 1.91, "learning_rate": 8.731288351966888e-05, "loss": 1.4448, "step": 24296 }, { "epoch": 1.91, "learning_rate": 8.730165509669413e-05, "loss": 1.4828, "step": 24297 }, { "epoch": 1.91, "learning_rate": 8.729042709940654e-05, "loss": 1.4922, "step": 24298 }, { "epoch": 1.91, "learning_rate": 8.727919952788231e-05, "loss": 1.4059, "step": 24299 }, { "epoch": 1.91, "learning_rate": 8.726797238219775e-05, "loss": 1.4244, "step": 24300 }, { "epoch": 1.91, "learning_rate": 8.725674566242904e-05, "loss": 1.4391, "step": 24301 }, { "epoch": 1.91, "learning_rate": 8.72455193686524e-05, "loss": 1.4566, "step": 24302 }, { "epoch": 1.91, "learning_rate": 8.723429350094398e-05, "loss": 1.4875, "step": 24303 }, { "epoch": 1.91, "learning_rate": 8.722306805938014e-05, "loss": 1.4921, "step": 24304 }, { "epoch": 1.91, "learning_rate": 8.721184304403697e-05, "loss": 1.4189, "step": 24305 }, { "epoch": 1.91, "learning_rate": 8.72006184549908e-05, "loss": 1.5493, "step": 24306 }, { "epoch": 1.91, "learning_rate": 8.71893942923177e-05, "loss": 1.4602, "step": 24307 }, { "epoch": 1.91, "learning_rate": 8.717817055609401e-05, "loss": 1.506, "step": 24308 }, { "epoch": 1.91, "learning_rate": 8.716694724639589e-05, "loss": 1.5242, "step": 24309 }, { "epoch": 1.91, "learning_rate": 8.715572436329946e-05, "loss": 1.5221, "step": 24310 }, { "epoch": 1.91, "learning_rate": 8.714450190688104e-05, "loss": 1.5043, "step": 24311 }, { "epoch": 1.91, "learning_rate": 8.713327987721677e-05, "loss": 1.4906, "step": 24312 }, { "epoch": 1.91, "learning_rate": 8.712205827438277e-05, "loss": 1.4725, "step": 24313 }, { "epoch": 1.91, "learning_rate": 8.711083709845534e-05, "loss": 1.4664, "step": 24314 }, { "epoch": 1.91, "learning_rate": 8.709961634951064e-05, "loss": 1.4454, "step": 24315 }, { "epoch": 1.91, "learning_rate": 8.708839602762477e-05, "loss": 1.4767, "step": 24316 }, { "epoch": 1.91, "learning_rate": 8.707717613287407e-05, "loss": 1.4569, "step": 24317 }, { "epoch": 1.91, "learning_rate": 8.706595666533456e-05, "loss": 1.4442, "step": 24318 }, { "epoch": 1.91, "learning_rate": 8.705473762508244e-05, "loss": 1.5116, "step": 24319 }, { "epoch": 1.91, "learning_rate": 8.704351901219398e-05, "loss": 1.5092, "step": 24320 }, { "epoch": 1.91, "learning_rate": 8.703230082674523e-05, "loss": 1.499, "step": 24321 }, { "epoch": 1.91, "learning_rate": 8.702108306881244e-05, "loss": 1.487, "step": 24322 }, { "epoch": 1.91, "learning_rate": 8.700986573847171e-05, "loss": 1.5369, "step": 24323 }, { "epoch": 1.91, "learning_rate": 8.699864883579928e-05, "loss": 1.5105, "step": 24324 }, { "epoch": 1.91, "learning_rate": 8.698743236087125e-05, "loss": 1.511, "step": 24325 }, { "epoch": 1.91, "learning_rate": 8.697621631376378e-05, "loss": 1.461, "step": 24326 }, { "epoch": 1.91, "learning_rate": 8.6965000694553e-05, "loss": 1.5106, "step": 24327 }, { "epoch": 1.91, "learning_rate": 8.695378550331508e-05, "loss": 1.5158, "step": 24328 }, { "epoch": 1.91, "learning_rate": 8.694257074012622e-05, "loss": 1.4911, "step": 24329 }, { "epoch": 1.91, "learning_rate": 8.693135640506242e-05, "loss": 1.4849, "step": 24330 }, { "epoch": 1.91, "learning_rate": 8.692014249819995e-05, "loss": 1.4602, "step": 24331 }, { "epoch": 1.91, "learning_rate": 8.690892901961491e-05, "loss": 1.4484, "step": 24332 }, { "epoch": 1.91, "learning_rate": 8.689771596938338e-05, "loss": 1.5066, "step": 24333 }, { "epoch": 1.91, "learning_rate": 8.68865033475816e-05, "loss": 1.454, "step": 24334 }, { "epoch": 1.91, "learning_rate": 8.687529115428563e-05, "loss": 1.4626, "step": 24335 }, { "epoch": 1.91, "learning_rate": 8.686407938957152e-05, "loss": 1.4992, "step": 24336 }, { "epoch": 1.91, "learning_rate": 8.685286805351549e-05, "loss": 1.4525, "step": 24337 }, { "epoch": 1.91, "learning_rate": 8.68416571461937e-05, "loss": 1.4694, "step": 24338 }, { "epoch": 1.92, "learning_rate": 8.683044666768218e-05, "loss": 1.5133, "step": 24339 }, { "epoch": 1.92, "learning_rate": 8.681923661805701e-05, "loss": 1.4637, "step": 24340 }, { "epoch": 1.92, "learning_rate": 8.680802699739443e-05, "loss": 1.4798, "step": 24341 }, { "epoch": 1.92, "learning_rate": 8.679681780577046e-05, "loss": 1.5459, "step": 24342 }, { "epoch": 1.92, "learning_rate": 8.678560904326125e-05, "loss": 1.5057, "step": 24343 }, { "epoch": 1.92, "learning_rate": 8.677440070994279e-05, "loss": 1.4671, "step": 24344 }, { "epoch": 1.92, "learning_rate": 8.676319280589134e-05, "loss": 1.4705, "step": 24345 }, { "epoch": 1.92, "learning_rate": 8.675198533118288e-05, "loss": 1.4514, "step": 24346 }, { "epoch": 1.92, "learning_rate": 8.67407782858935e-05, "loss": 1.483, "step": 24347 }, { "epoch": 1.92, "learning_rate": 8.672957167009936e-05, "loss": 1.5204, "step": 24348 }, { "epoch": 1.92, "learning_rate": 8.671836548387654e-05, "loss": 1.5205, "step": 24349 }, { "epoch": 1.92, "learning_rate": 8.670715972730101e-05, "loss": 1.4852, "step": 24350 }, { "epoch": 1.92, "learning_rate": 8.669595440044902e-05, "loss": 1.5154, "step": 24351 }, { "epoch": 1.92, "learning_rate": 8.66847495033965e-05, "loss": 1.4997, "step": 24352 }, { "epoch": 1.92, "learning_rate": 8.667354503621965e-05, "loss": 1.4806, "step": 24353 }, { "epoch": 1.92, "learning_rate": 8.666234099899443e-05, "loss": 1.4809, "step": 24354 }, { "epoch": 1.92, "learning_rate": 8.665113739179702e-05, "loss": 1.4653, "step": 24355 }, { "epoch": 1.92, "learning_rate": 8.663993421470342e-05, "loss": 1.4524, "step": 24356 }, { "epoch": 1.92, "learning_rate": 8.662873146778963e-05, "loss": 1.4529, "step": 24357 }, { "epoch": 1.92, "learning_rate": 8.661752915113188e-05, "loss": 1.4768, "step": 24358 }, { "epoch": 1.92, "learning_rate": 8.660632726480609e-05, "loss": 1.4512, "step": 24359 }, { "epoch": 1.92, "learning_rate": 8.659512580888837e-05, "loss": 1.4284, "step": 24360 }, { "epoch": 1.92, "learning_rate": 8.65839247834547e-05, "loss": 1.4714, "step": 24361 }, { "epoch": 1.92, "learning_rate": 8.657272418858124e-05, "loss": 1.4866, "step": 24362 }, { "epoch": 1.92, "learning_rate": 8.656152402434398e-05, "loss": 1.5329, "step": 24363 }, { "epoch": 1.92, "learning_rate": 8.655032429081892e-05, "loss": 1.5069, "step": 24364 }, { "epoch": 1.92, "learning_rate": 8.653912498808219e-05, "loss": 1.4516, "step": 24365 }, { "epoch": 1.92, "learning_rate": 8.652792611620977e-05, "loss": 1.445, "step": 24366 }, { "epoch": 1.92, "learning_rate": 8.651672767527767e-05, "loss": 1.4797, "step": 24367 }, { "epoch": 1.92, "learning_rate": 8.650552966536193e-05, "loss": 1.4556, "step": 24368 }, { "epoch": 1.92, "learning_rate": 8.649433208653869e-05, "loss": 1.4417, "step": 24369 }, { "epoch": 1.92, "learning_rate": 8.648313493888386e-05, "loss": 1.4703, "step": 24370 }, { "epoch": 1.92, "learning_rate": 8.647193822247345e-05, "loss": 1.5135, "step": 24371 }, { "epoch": 1.92, "learning_rate": 8.64607419373836e-05, "loss": 1.4897, "step": 24372 }, { "epoch": 1.92, "learning_rate": 8.64495460836902e-05, "loss": 1.4699, "step": 24373 }, { "epoch": 1.92, "learning_rate": 8.643835066146928e-05, "loss": 1.4763, "step": 24374 }, { "epoch": 1.92, "learning_rate": 8.642715567079695e-05, "loss": 1.4843, "step": 24375 }, { "epoch": 1.92, "learning_rate": 8.641596111174915e-05, "loss": 1.5064, "step": 24376 }, { "epoch": 1.92, "learning_rate": 8.640476698440182e-05, "loss": 1.5138, "step": 24377 }, { "epoch": 1.92, "learning_rate": 8.639357328883108e-05, "loss": 1.4565, "step": 24378 }, { "epoch": 1.92, "learning_rate": 8.63823800251129e-05, "loss": 1.4456, "step": 24379 }, { "epoch": 1.92, "learning_rate": 8.637118719332322e-05, "loss": 1.4876, "step": 24380 }, { "epoch": 1.92, "learning_rate": 8.635999479353801e-05, "loss": 1.4865, "step": 24381 }, { "epoch": 1.92, "learning_rate": 8.634880282583341e-05, "loss": 1.4697, "step": 24382 }, { "epoch": 1.92, "learning_rate": 8.633761129028527e-05, "loss": 1.5188, "step": 24383 }, { "epoch": 1.92, "learning_rate": 8.632642018696958e-05, "loss": 1.5105, "step": 24384 }, { "epoch": 1.92, "learning_rate": 8.631522951596236e-05, "loss": 1.4762, "step": 24385 }, { "epoch": 1.92, "learning_rate": 8.630403927733966e-05, "loss": 1.4361, "step": 24386 }, { "epoch": 1.92, "learning_rate": 8.629284947117737e-05, "loss": 1.4885, "step": 24387 }, { "epoch": 1.92, "learning_rate": 8.62816600975514e-05, "loss": 1.5013, "step": 24388 }, { "epoch": 1.92, "learning_rate": 8.627047115653787e-05, "loss": 1.52, "step": 24389 }, { "epoch": 1.92, "learning_rate": 8.625928264821268e-05, "loss": 1.5271, "step": 24390 }, { "epoch": 1.92, "learning_rate": 8.624809457265172e-05, "loss": 1.465, "step": 24391 }, { "epoch": 1.92, "learning_rate": 8.623690692993105e-05, "loss": 1.5275, "step": 24392 }, { "epoch": 1.92, "learning_rate": 8.622571972012662e-05, "loss": 1.4936, "step": 24393 }, { "epoch": 1.92, "learning_rate": 8.62145329433143e-05, "loss": 1.4868, "step": 24394 }, { "epoch": 1.92, "learning_rate": 8.620334659957016e-05, "loss": 1.4612, "step": 24395 }, { "epoch": 1.92, "learning_rate": 8.619216068897008e-05, "loss": 1.4762, "step": 24396 }, { "epoch": 1.92, "learning_rate": 8.618097521159005e-05, "loss": 1.4826, "step": 24397 }, { "epoch": 1.92, "learning_rate": 8.616979016750588e-05, "loss": 1.4713, "step": 24398 }, { "epoch": 1.92, "learning_rate": 8.61586055567937e-05, "loss": 1.5297, "step": 24399 }, { "epoch": 1.92, "learning_rate": 8.614742137952928e-05, "loss": 1.4539, "step": 24400 }, { "epoch": 1.92, "learning_rate": 8.613623763578868e-05, "loss": 1.5199, "step": 24401 }, { "epoch": 1.92, "learning_rate": 8.612505432564775e-05, "loss": 1.4291, "step": 24402 }, { "epoch": 1.92, "learning_rate": 8.61138714491825e-05, "loss": 1.5116, "step": 24403 }, { "epoch": 1.92, "learning_rate": 8.610268900646879e-05, "loss": 1.4627, "step": 24404 }, { "epoch": 1.92, "learning_rate": 8.609150699758252e-05, "loss": 1.5116, "step": 24405 }, { "epoch": 1.92, "learning_rate": 8.608032542259972e-05, "loss": 1.4942, "step": 24406 }, { "epoch": 1.92, "learning_rate": 8.606914428159624e-05, "loss": 1.508, "step": 24407 }, { "epoch": 1.92, "learning_rate": 8.60579635746479e-05, "loss": 1.5098, "step": 24408 }, { "epoch": 1.92, "learning_rate": 8.604678330183078e-05, "loss": 1.4495, "step": 24409 }, { "epoch": 1.92, "learning_rate": 8.60356034632207e-05, "loss": 1.5136, "step": 24410 }, { "epoch": 1.92, "learning_rate": 8.602442405889354e-05, "loss": 1.4576, "step": 24411 }, { "epoch": 1.92, "learning_rate": 8.601324508892525e-05, "loss": 1.4636, "step": 24412 }, { "epoch": 1.92, "learning_rate": 8.600206655339175e-05, "loss": 1.4539, "step": 24413 }, { "epoch": 1.92, "learning_rate": 8.59908884523689e-05, "loss": 1.4487, "step": 24414 }, { "epoch": 1.92, "learning_rate": 8.597971078593246e-05, "loss": 1.4628, "step": 24415 }, { "epoch": 1.92, "learning_rate": 8.596853355415859e-05, "loss": 1.4629, "step": 24416 }, { "epoch": 1.92, "learning_rate": 8.595735675712302e-05, "loss": 1.5184, "step": 24417 }, { "epoch": 1.92, "learning_rate": 8.594618039490167e-05, "loss": 1.4827, "step": 24418 }, { "epoch": 1.92, "learning_rate": 8.593500446757035e-05, "loss": 1.4581, "step": 24419 }, { "epoch": 1.92, "learning_rate": 8.592382897520506e-05, "loss": 1.4833, "step": 24420 }, { "epoch": 1.92, "learning_rate": 8.59126539178816e-05, "loss": 1.4539, "step": 24421 }, { "epoch": 1.92, "learning_rate": 8.59014792956758e-05, "loss": 1.477, "step": 24422 }, { "epoch": 1.92, "learning_rate": 8.589030510866363e-05, "loss": 1.5956, "step": 24423 }, { "epoch": 1.92, "learning_rate": 8.587913135692093e-05, "loss": 1.5056, "step": 24424 }, { "epoch": 1.92, "learning_rate": 8.586795804052346e-05, "loss": 1.4961, "step": 24425 }, { "epoch": 1.92, "learning_rate": 8.585678515954724e-05, "loss": 1.4755, "step": 24426 }, { "epoch": 1.92, "learning_rate": 8.584561271406804e-05, "loss": 1.4612, "step": 24427 }, { "epoch": 1.92, "learning_rate": 8.583444070416169e-05, "loss": 1.4737, "step": 24428 }, { "epoch": 1.92, "learning_rate": 8.582326912990412e-05, "loss": 1.4962, "step": 24429 }, { "epoch": 1.92, "learning_rate": 8.581209799137113e-05, "loss": 1.4896, "step": 24430 }, { "epoch": 1.92, "learning_rate": 8.580092728863853e-05, "loss": 1.4408, "step": 24431 }, { "epoch": 1.92, "learning_rate": 8.578975702178219e-05, "loss": 1.4853, "step": 24432 }, { "epoch": 1.92, "learning_rate": 8.577858719087805e-05, "loss": 1.5112, "step": 24433 }, { "epoch": 1.92, "learning_rate": 8.576741779600185e-05, "loss": 1.5085, "step": 24434 }, { "epoch": 1.92, "learning_rate": 8.575624883722937e-05, "loss": 1.4877, "step": 24435 }, { "epoch": 1.92, "learning_rate": 8.574508031463655e-05, "loss": 1.4706, "step": 24436 }, { "epoch": 1.92, "learning_rate": 8.573391222829919e-05, "loss": 1.4606, "step": 24437 }, { "epoch": 1.92, "learning_rate": 8.572274457829312e-05, "loss": 1.4738, "step": 24438 }, { "epoch": 1.92, "learning_rate": 8.571157736469408e-05, "loss": 1.4838, "step": 24439 }, { "epoch": 1.92, "learning_rate": 8.5700410587578e-05, "loss": 1.4535, "step": 24440 }, { "epoch": 1.92, "learning_rate": 8.568924424702065e-05, "loss": 1.529, "step": 24441 }, { "epoch": 1.92, "learning_rate": 8.567807834309777e-05, "loss": 1.4576, "step": 24442 }, { "epoch": 1.92, "learning_rate": 8.566691287588535e-05, "loss": 1.4757, "step": 24443 }, { "epoch": 1.92, "learning_rate": 8.565574784545904e-05, "loss": 1.4405, "step": 24444 }, { "epoch": 1.92, "learning_rate": 8.564458325189464e-05, "loss": 1.4963, "step": 24445 }, { "epoch": 1.92, "learning_rate": 8.563341909526808e-05, "loss": 1.4074, "step": 24446 }, { "epoch": 1.92, "learning_rate": 8.562225537565502e-05, "loss": 1.5201, "step": 24447 }, { "epoch": 1.92, "learning_rate": 8.561109209313138e-05, "loss": 1.4842, "step": 24448 }, { "epoch": 1.92, "learning_rate": 8.559992924777284e-05, "loss": 1.5003, "step": 24449 }, { "epoch": 1.92, "learning_rate": 8.558876683965529e-05, "loss": 1.4728, "step": 24450 }, { "epoch": 1.92, "learning_rate": 8.557760486885446e-05, "loss": 1.4921, "step": 24451 }, { "epoch": 1.92, "learning_rate": 8.556644333544609e-05, "loss": 1.5321, "step": 24452 }, { "epoch": 1.92, "learning_rate": 8.555528223950608e-05, "loss": 1.5264, "step": 24453 }, { "epoch": 1.92, "learning_rate": 8.554412158111014e-05, "loss": 1.5158, "step": 24454 }, { "epoch": 1.92, "learning_rate": 8.553296136033404e-05, "loss": 1.5238, "step": 24455 }, { "epoch": 1.92, "learning_rate": 8.552180157725348e-05, "loss": 1.4768, "step": 24456 }, { "epoch": 1.92, "learning_rate": 8.55106422319444e-05, "loss": 1.5274, "step": 24457 }, { "epoch": 1.92, "learning_rate": 8.549948332448244e-05, "loss": 1.4896, "step": 24458 }, { "epoch": 1.92, "learning_rate": 8.548832485494334e-05, "loss": 1.4735, "step": 24459 }, { "epoch": 1.92, "learning_rate": 8.547716682340297e-05, "loss": 1.4561, "step": 24460 }, { "epoch": 1.92, "learning_rate": 8.546600922993706e-05, "loss": 1.5455, "step": 24461 }, { "epoch": 1.92, "learning_rate": 8.545485207462125e-05, "loss": 1.5336, "step": 24462 }, { "epoch": 1.92, "learning_rate": 8.544369535753138e-05, "loss": 1.5397, "step": 24463 }, { "epoch": 1.92, "learning_rate": 8.543253907874326e-05, "loss": 1.5343, "step": 24464 }, { "epoch": 1.92, "learning_rate": 8.542138323833256e-05, "loss": 1.5033, "step": 24465 }, { "epoch": 1.93, "learning_rate": 8.541022783637498e-05, "loss": 1.486, "step": 24466 }, { "epoch": 1.93, "learning_rate": 8.539907287294635e-05, "loss": 1.4765, "step": 24467 }, { "epoch": 1.93, "learning_rate": 8.538791834812237e-05, "loss": 1.4641, "step": 24468 }, { "epoch": 1.93, "learning_rate": 8.537676426197873e-05, "loss": 1.5246, "step": 24469 }, { "epoch": 1.93, "learning_rate": 8.536561061459125e-05, "loss": 1.4893, "step": 24470 }, { "epoch": 1.93, "learning_rate": 8.53544574060356e-05, "loss": 1.5128, "step": 24471 }, { "epoch": 1.93, "learning_rate": 8.534330463638749e-05, "loss": 1.5002, "step": 24472 }, { "epoch": 1.93, "learning_rate": 8.533215230572263e-05, "loss": 1.475, "step": 24473 }, { "epoch": 1.93, "learning_rate": 8.532100041411683e-05, "loss": 1.4912, "step": 24474 }, { "epoch": 1.93, "learning_rate": 8.530984896164573e-05, "loss": 1.526, "step": 24475 }, { "epoch": 1.93, "learning_rate": 8.5298697948385e-05, "loss": 1.4937, "step": 24476 }, { "epoch": 1.93, "learning_rate": 8.528754737441047e-05, "loss": 1.5134, "step": 24477 }, { "epoch": 1.93, "learning_rate": 8.527639723979773e-05, "loss": 1.4982, "step": 24478 }, { "epoch": 1.93, "learning_rate": 8.526524754462257e-05, "loss": 1.502, "step": 24479 }, { "epoch": 1.93, "learning_rate": 8.525409828896061e-05, "loss": 1.5067, "step": 24480 }, { "epoch": 1.93, "learning_rate": 8.524294947288765e-05, "loss": 1.4666, "step": 24481 }, { "epoch": 1.93, "learning_rate": 8.523180109647932e-05, "loss": 1.5086, "step": 24482 }, { "epoch": 1.93, "learning_rate": 8.522065315981127e-05, "loss": 1.5035, "step": 24483 }, { "epoch": 1.93, "learning_rate": 8.52095056629593e-05, "loss": 1.4904, "step": 24484 }, { "epoch": 1.93, "learning_rate": 8.519835860599903e-05, "loss": 1.4743, "step": 24485 }, { "epoch": 1.93, "learning_rate": 8.518721198900608e-05, "loss": 1.5155, "step": 24486 }, { "epoch": 1.93, "learning_rate": 8.517606581205624e-05, "loss": 1.5025, "step": 24487 }, { "epoch": 1.93, "learning_rate": 8.516492007522517e-05, "loss": 1.5239, "step": 24488 }, { "epoch": 1.93, "learning_rate": 8.515377477858844e-05, "loss": 1.4433, "step": 24489 }, { "epoch": 1.93, "learning_rate": 8.514262992222185e-05, "loss": 1.4885, "step": 24490 }, { "epoch": 1.93, "learning_rate": 8.513148550620102e-05, "loss": 1.464, "step": 24491 }, { "epoch": 1.93, "learning_rate": 8.512034153060161e-05, "loss": 1.4675, "step": 24492 }, { "epoch": 1.93, "learning_rate": 8.51091979954992e-05, "loss": 1.4353, "step": 24493 }, { "epoch": 1.93, "learning_rate": 8.509805490096953e-05, "loss": 1.4863, "step": 24494 }, { "epoch": 1.93, "learning_rate": 8.508691224708833e-05, "loss": 1.4849, "step": 24495 }, { "epoch": 1.93, "learning_rate": 8.507577003393117e-05, "loss": 1.4707, "step": 24496 }, { "epoch": 1.93, "learning_rate": 8.506462826157362e-05, "loss": 1.492, "step": 24497 }, { "epoch": 1.93, "learning_rate": 8.505348693009149e-05, "loss": 1.4896, "step": 24498 }, { "epoch": 1.93, "learning_rate": 8.504234603956034e-05, "loss": 1.5383, "step": 24499 }, { "epoch": 1.93, "learning_rate": 8.503120559005574e-05, "loss": 1.4668, "step": 24500 }, { "epoch": 1.93, "learning_rate": 8.502006558165347e-05, "loss": 1.4953, "step": 24501 }, { "epoch": 1.93, "learning_rate": 8.500892601442911e-05, "loss": 1.5142, "step": 24502 }, { "epoch": 1.93, "learning_rate": 8.49977868884582e-05, "loss": 1.4841, "step": 24503 }, { "epoch": 1.93, "learning_rate": 8.49866482038165e-05, "loss": 1.4614, "step": 24504 }, { "epoch": 1.93, "learning_rate": 8.497550996057959e-05, "loss": 1.461, "step": 24505 }, { "epoch": 1.93, "learning_rate": 8.496437215882304e-05, "loss": 1.4719, "step": 24506 }, { "epoch": 1.93, "learning_rate": 8.495323479862256e-05, "loss": 1.4903, "step": 24507 }, { "epoch": 1.93, "learning_rate": 8.49420978800537e-05, "loss": 1.499, "step": 24508 }, { "epoch": 1.93, "learning_rate": 8.493096140319213e-05, "loss": 1.4909, "step": 24509 }, { "epoch": 1.93, "learning_rate": 8.491982536811328e-05, "loss": 1.5116, "step": 24510 }, { "epoch": 1.93, "learning_rate": 8.490868977489303e-05, "loss": 1.456, "step": 24511 }, { "epoch": 1.93, "learning_rate": 8.489755462360686e-05, "loss": 1.4749, "step": 24512 }, { "epoch": 1.93, "learning_rate": 8.488641991433034e-05, "loss": 1.472, "step": 24513 }, { "epoch": 1.93, "learning_rate": 8.487528564713908e-05, "loss": 1.4975, "step": 24514 }, { "epoch": 1.93, "learning_rate": 8.486415182210871e-05, "loss": 1.4654, "step": 24515 }, { "epoch": 1.93, "learning_rate": 8.485301843931484e-05, "loss": 1.4562, "step": 24516 }, { "epoch": 1.93, "learning_rate": 8.484188549883295e-05, "loss": 1.5077, "step": 24517 }, { "epoch": 1.93, "learning_rate": 8.483075300073876e-05, "loss": 1.412, "step": 24518 }, { "epoch": 1.93, "learning_rate": 8.481962094510778e-05, "loss": 1.5125, "step": 24519 }, { "epoch": 1.93, "learning_rate": 8.480848933201557e-05, "loss": 1.4663, "step": 24520 }, { "epoch": 1.93, "learning_rate": 8.479735816153779e-05, "loss": 1.5914, "step": 24521 }, { "epoch": 1.93, "learning_rate": 8.478622743374996e-05, "loss": 1.4844, "step": 24522 }, { "epoch": 1.93, "learning_rate": 8.477509714872761e-05, "loss": 1.5142, "step": 24523 }, { "epoch": 1.93, "learning_rate": 8.47639673065464e-05, "loss": 1.4877, "step": 24524 }, { "epoch": 1.93, "learning_rate": 8.475283790728178e-05, "loss": 1.4603, "step": 24525 }, { "epoch": 1.93, "learning_rate": 8.474170895100949e-05, "loss": 1.5629, "step": 24526 }, { "epoch": 1.93, "learning_rate": 8.473058043780489e-05, "loss": 1.5086, "step": 24527 }, { "epoch": 1.93, "learning_rate": 8.47194523677437e-05, "loss": 1.4801, "step": 24528 }, { "epoch": 1.93, "learning_rate": 8.470832474090141e-05, "loss": 1.4893, "step": 24529 }, { "epoch": 1.93, "learning_rate": 8.469719755735348e-05, "loss": 1.4938, "step": 24530 }, { "epoch": 1.93, "learning_rate": 8.468607081717562e-05, "loss": 1.4954, "step": 24531 }, { "epoch": 1.93, "learning_rate": 8.46749445204433e-05, "loss": 1.5123, "step": 24532 }, { "epoch": 1.93, "learning_rate": 8.466381866723205e-05, "loss": 1.52, "step": 24533 }, { "epoch": 1.93, "learning_rate": 8.465269325761736e-05, "loss": 1.4975, "step": 24534 }, { "epoch": 1.93, "learning_rate": 8.464156829167487e-05, "loss": 1.4705, "step": 24535 }, { "epoch": 1.93, "learning_rate": 8.463044376948006e-05, "loss": 1.4506, "step": 24536 }, { "epoch": 1.93, "learning_rate": 8.461931969110842e-05, "loss": 1.3977, "step": 24537 }, { "epoch": 1.93, "learning_rate": 8.460819605663558e-05, "loss": 1.4798, "step": 24538 }, { "epoch": 1.93, "learning_rate": 8.459707286613701e-05, "loss": 1.4787, "step": 24539 }, { "epoch": 1.93, "learning_rate": 8.458595011968813e-05, "loss": 1.4565, "step": 24540 }, { "epoch": 1.93, "learning_rate": 8.457482781736458e-05, "loss": 1.4901, "step": 24541 }, { "epoch": 1.93, "learning_rate": 8.45637059592419e-05, "loss": 1.529, "step": 24542 }, { "epoch": 1.93, "learning_rate": 8.455258454539553e-05, "loss": 1.4855, "step": 24543 }, { "epoch": 1.93, "learning_rate": 8.454146357590095e-05, "loss": 1.4821, "step": 24544 }, { "epoch": 1.93, "learning_rate": 8.453034305083374e-05, "loss": 1.499, "step": 24545 }, { "epoch": 1.93, "learning_rate": 8.451922297026941e-05, "loss": 1.4936, "step": 24546 }, { "epoch": 1.93, "learning_rate": 8.450810333428335e-05, "loss": 1.4394, "step": 24547 }, { "epoch": 1.93, "learning_rate": 8.449698414295119e-05, "loss": 1.5055, "step": 24548 }, { "epoch": 1.93, "learning_rate": 8.448586539634833e-05, "loss": 1.512, "step": 24549 }, { "epoch": 1.93, "learning_rate": 8.447474709455032e-05, "loss": 1.4699, "step": 24550 }, { "epoch": 1.93, "learning_rate": 8.446362923763255e-05, "loss": 1.4795, "step": 24551 }, { "epoch": 1.93, "learning_rate": 8.445251182567063e-05, "loss": 1.4733, "step": 24552 }, { "epoch": 1.93, "learning_rate": 8.444139485874e-05, "loss": 1.4559, "step": 24553 }, { "epoch": 1.93, "learning_rate": 8.443027833691603e-05, "loss": 1.4838, "step": 24554 }, { "epoch": 1.93, "learning_rate": 8.441916226027437e-05, "loss": 1.4793, "step": 24555 }, { "epoch": 1.93, "learning_rate": 8.440804662889039e-05, "loss": 1.4772, "step": 24556 }, { "epoch": 1.93, "learning_rate": 8.439693144283952e-05, "loss": 1.463, "step": 24557 }, { "epoch": 1.93, "learning_rate": 8.43858167021973e-05, "loss": 1.4683, "step": 24558 }, { "epoch": 1.93, "learning_rate": 8.437470240703922e-05, "loss": 1.4572, "step": 24559 }, { "epoch": 1.93, "learning_rate": 8.43635885574407e-05, "loss": 1.4492, "step": 24560 }, { "epoch": 1.93, "learning_rate": 8.435247515347712e-05, "loss": 1.4399, "step": 24561 }, { "epoch": 1.93, "learning_rate": 8.434136219522409e-05, "loss": 1.4708, "step": 24562 }, { "epoch": 1.93, "learning_rate": 8.433024968275697e-05, "loss": 1.4803, "step": 24563 }, { "epoch": 1.93, "learning_rate": 8.431913761615113e-05, "loss": 1.4835, "step": 24564 }, { "epoch": 1.93, "learning_rate": 8.430802599548218e-05, "loss": 1.494, "step": 24565 }, { "epoch": 1.93, "learning_rate": 8.42969148208255e-05, "loss": 1.4551, "step": 24566 }, { "epoch": 1.93, "learning_rate": 8.428580409225648e-05, "loss": 1.5268, "step": 24567 }, { "epoch": 1.93, "learning_rate": 8.427469380985054e-05, "loss": 1.4841, "step": 24568 }, { "epoch": 1.93, "learning_rate": 8.426358397368322e-05, "loss": 1.4949, "step": 24569 }, { "epoch": 1.93, "learning_rate": 8.425247458382988e-05, "loss": 1.5569, "step": 24570 }, { "epoch": 1.93, "learning_rate": 8.42413656403659e-05, "loss": 1.497, "step": 24571 }, { "epoch": 1.93, "learning_rate": 8.423025714336677e-05, "loss": 1.5112, "step": 24572 }, { "epoch": 1.93, "learning_rate": 8.421914909290794e-05, "loss": 1.4912, "step": 24573 }, { "epoch": 1.93, "learning_rate": 8.420804148906479e-05, "loss": 1.4912, "step": 24574 }, { "epoch": 1.93, "learning_rate": 8.419693433191269e-05, "loss": 1.4865, "step": 24575 }, { "epoch": 1.93, "learning_rate": 8.418582762152712e-05, "loss": 1.4507, "step": 24576 }, { "epoch": 1.93, "learning_rate": 8.417472135798349e-05, "loss": 1.467, "step": 24577 }, { "epoch": 1.93, "learning_rate": 8.416361554135712e-05, "loss": 1.4702, "step": 24578 }, { "epoch": 1.93, "learning_rate": 8.41525101717235e-05, "loss": 1.5322, "step": 24579 }, { "epoch": 1.93, "learning_rate": 8.414140524915802e-05, "loss": 1.4698, "step": 24580 }, { "epoch": 1.93, "learning_rate": 8.413030077373599e-05, "loss": 1.4756, "step": 24581 }, { "epoch": 1.93, "learning_rate": 8.411919674553292e-05, "loss": 1.4884, "step": 24582 }, { "epoch": 1.93, "learning_rate": 8.410809316462416e-05, "loss": 1.4701, "step": 24583 }, { "epoch": 1.93, "learning_rate": 8.409699003108507e-05, "loss": 1.5337, "step": 24584 }, { "epoch": 1.93, "learning_rate": 8.408588734499102e-05, "loss": 1.4231, "step": 24585 }, { "epoch": 1.93, "learning_rate": 8.407478510641744e-05, "loss": 1.5133, "step": 24586 }, { "epoch": 1.93, "learning_rate": 8.406368331543971e-05, "loss": 1.4489, "step": 24587 }, { "epoch": 1.93, "learning_rate": 8.405258197213306e-05, "loss": 1.4733, "step": 24588 }, { "epoch": 1.93, "learning_rate": 8.404148107657311e-05, "loss": 1.5271, "step": 24589 }, { "epoch": 1.93, "learning_rate": 8.403038062883511e-05, "loss": 1.5109, "step": 24590 }, { "epoch": 1.93, "learning_rate": 8.401928062899442e-05, "loss": 1.4761, "step": 24591 }, { "epoch": 1.93, "learning_rate": 8.400818107712633e-05, "loss": 1.4621, "step": 24592 }, { "epoch": 1.94, "learning_rate": 8.399708197330635e-05, "loss": 1.4828, "step": 24593 }, { "epoch": 1.94, "learning_rate": 8.398598331760974e-05, "loss": 1.5569, "step": 24594 }, { "epoch": 1.94, "learning_rate": 8.397488511011184e-05, "loss": 1.4669, "step": 24595 }, { "epoch": 1.94, "learning_rate": 8.396378735088806e-05, "loss": 1.4675, "step": 24596 }, { "epoch": 1.94, "learning_rate": 8.395269004001375e-05, "loss": 1.4428, "step": 24597 }, { "epoch": 1.94, "learning_rate": 8.394159317756414e-05, "loss": 1.4379, "step": 24598 }, { "epoch": 1.94, "learning_rate": 8.393049676361476e-05, "loss": 1.4338, "step": 24599 }, { "epoch": 1.94, "learning_rate": 8.39194007982408e-05, "loss": 1.4989, "step": 24600 }, { "epoch": 1.94, "learning_rate": 8.390830528151759e-05, "loss": 1.5298, "step": 24601 }, { "epoch": 1.94, "learning_rate": 8.389721021352062e-05, "loss": 1.5006, "step": 24602 }, { "epoch": 1.94, "learning_rate": 8.388611559432506e-05, "loss": 1.4844, "step": 24603 }, { "epoch": 1.94, "learning_rate": 8.387502142400625e-05, "loss": 1.4804, "step": 24604 }, { "epoch": 1.94, "learning_rate": 8.386392770263958e-05, "loss": 1.4562, "step": 24605 }, { "epoch": 1.94, "learning_rate": 8.385283443030036e-05, "loss": 1.5214, "step": 24606 }, { "epoch": 1.94, "learning_rate": 8.384174160706391e-05, "loss": 1.4607, "step": 24607 }, { "epoch": 1.94, "learning_rate": 8.383064923300555e-05, "loss": 1.5175, "step": 24608 }, { "epoch": 1.94, "learning_rate": 8.381955730820048e-05, "loss": 1.4732, "step": 24609 }, { "epoch": 1.94, "learning_rate": 8.380846583272416e-05, "loss": 1.521, "step": 24610 }, { "epoch": 1.94, "learning_rate": 8.379737480665182e-05, "loss": 1.4893, "step": 24611 }, { "epoch": 1.94, "learning_rate": 8.378628423005872e-05, "loss": 1.4692, "step": 24612 }, { "epoch": 1.94, "learning_rate": 8.377519410302027e-05, "loss": 1.5134, "step": 24613 }, { "epoch": 1.94, "learning_rate": 8.37641044256117e-05, "loss": 1.4698, "step": 24614 }, { "epoch": 1.94, "learning_rate": 8.375301519790825e-05, "loss": 1.4911, "step": 24615 }, { "epoch": 1.94, "learning_rate": 8.374192641998533e-05, "loss": 1.4516, "step": 24616 }, { "epoch": 1.94, "learning_rate": 8.373083809191818e-05, "loss": 1.5276, "step": 24617 }, { "epoch": 1.94, "learning_rate": 8.371975021378198e-05, "loss": 1.4931, "step": 24618 }, { "epoch": 1.94, "learning_rate": 8.37086627856522e-05, "loss": 1.431, "step": 24619 }, { "epoch": 1.94, "learning_rate": 8.369757580760393e-05, "loss": 1.5126, "step": 24620 }, { "epoch": 1.94, "learning_rate": 8.368648927971258e-05, "loss": 1.4654, "step": 24621 }, { "epoch": 1.94, "learning_rate": 8.367540320205334e-05, "loss": 1.5655, "step": 24622 }, { "epoch": 1.94, "learning_rate": 8.366431757470157e-05, "loss": 1.5196, "step": 24623 }, { "epoch": 1.94, "learning_rate": 8.365323239773245e-05, "loss": 1.4472, "step": 24624 }, { "epoch": 1.94, "learning_rate": 8.36421476712213e-05, "loss": 1.5191, "step": 24625 }, { "epoch": 1.94, "learning_rate": 8.363106339524326e-05, "loss": 1.4978, "step": 24626 }, { "epoch": 1.94, "learning_rate": 8.361997956987376e-05, "loss": 1.5089, "step": 24627 }, { "epoch": 1.94, "learning_rate": 8.360889619518796e-05, "loss": 1.5283, "step": 24628 }, { "epoch": 1.94, "learning_rate": 8.359781327126104e-05, "loss": 1.4427, "step": 24629 }, { "epoch": 1.94, "learning_rate": 8.35867307981684e-05, "loss": 1.5161, "step": 24630 }, { "epoch": 1.94, "learning_rate": 8.357564877598522e-05, "loss": 1.4508, "step": 24631 }, { "epoch": 1.94, "learning_rate": 8.356456720478665e-05, "loss": 1.5265, "step": 24632 }, { "epoch": 1.94, "learning_rate": 8.355348608464807e-05, "loss": 1.5449, "step": 24633 }, { "epoch": 1.94, "learning_rate": 8.354240541564464e-05, "loss": 1.4073, "step": 24634 }, { "epoch": 1.94, "learning_rate": 8.353132519785155e-05, "loss": 1.5154, "step": 24635 }, { "epoch": 1.94, "learning_rate": 8.35202454313441e-05, "loss": 1.5087, "step": 24636 }, { "epoch": 1.94, "learning_rate": 8.350916611619753e-05, "loss": 1.5139, "step": 24637 }, { "epoch": 1.94, "learning_rate": 8.349808725248705e-05, "loss": 1.43, "step": 24638 }, { "epoch": 1.94, "learning_rate": 8.348700884028779e-05, "loss": 1.4967, "step": 24639 }, { "epoch": 1.94, "learning_rate": 8.34759308796751e-05, "loss": 1.4859, "step": 24640 }, { "epoch": 1.94, "learning_rate": 8.34648533707241e-05, "loss": 1.4615, "step": 24641 }, { "epoch": 1.94, "learning_rate": 8.345377631351e-05, "loss": 1.5272, "step": 24642 }, { "epoch": 1.94, "learning_rate": 8.34426997081081e-05, "loss": 1.426, "step": 24643 }, { "epoch": 1.94, "learning_rate": 8.343162355459353e-05, "loss": 1.508, "step": 24644 }, { "epoch": 1.94, "learning_rate": 8.34205478530415e-05, "loss": 1.4745, "step": 24645 }, { "epoch": 1.94, "learning_rate": 8.340947260352714e-05, "loss": 1.501, "step": 24646 }, { "epoch": 1.94, "learning_rate": 8.339839780612577e-05, "loss": 1.5126, "step": 24647 }, { "epoch": 1.94, "learning_rate": 8.338732346091253e-05, "loss": 1.5188, "step": 24648 }, { "epoch": 1.94, "learning_rate": 8.337624956796258e-05, "loss": 1.4789, "step": 24649 }, { "epoch": 1.94, "learning_rate": 8.336517612735115e-05, "loss": 1.4718, "step": 24650 }, { "epoch": 1.94, "learning_rate": 8.335410313915335e-05, "loss": 1.4366, "step": 24651 }, { "epoch": 1.94, "learning_rate": 8.334303060344447e-05, "loss": 1.4403, "step": 24652 }, { "epoch": 1.94, "learning_rate": 8.333195852029957e-05, "loss": 1.4752, "step": 24653 }, { "epoch": 1.94, "learning_rate": 8.332088688979393e-05, "loss": 1.4804, "step": 24654 }, { "epoch": 1.94, "learning_rate": 8.330981571200268e-05, "loss": 1.5492, "step": 24655 }, { "epoch": 1.94, "learning_rate": 8.329874498700092e-05, "loss": 1.4849, "step": 24656 }, { "epoch": 1.94, "learning_rate": 8.328767471486394e-05, "loss": 1.4908, "step": 24657 }, { "epoch": 1.94, "learning_rate": 8.327660489566682e-05, "loss": 1.4579, "step": 24658 }, { "epoch": 1.94, "learning_rate": 8.326553552948469e-05, "loss": 1.4746, "step": 24659 }, { "epoch": 1.94, "learning_rate": 8.32544666163928e-05, "loss": 1.5145, "step": 24660 }, { "epoch": 1.94, "learning_rate": 8.324339815646623e-05, "loss": 1.4774, "step": 24661 }, { "epoch": 1.94, "learning_rate": 8.323233014978017e-05, "loss": 1.4864, "step": 24662 }, { "epoch": 1.94, "learning_rate": 8.322126259640967e-05, "loss": 1.5234, "step": 24663 }, { "epoch": 1.94, "learning_rate": 8.321019549643001e-05, "loss": 1.5105, "step": 24664 }, { "epoch": 1.94, "learning_rate": 8.319912884991627e-05, "loss": 1.4761, "step": 24665 }, { "epoch": 1.94, "learning_rate": 8.318806265694351e-05, "loss": 1.4973, "step": 24666 }, { "epoch": 1.94, "learning_rate": 8.317699691758695e-05, "loss": 1.5222, "step": 24667 }, { "epoch": 1.94, "learning_rate": 8.316593163192175e-05, "loss": 1.4805, "step": 24668 }, { "epoch": 1.94, "learning_rate": 8.315486680002299e-05, "loss": 1.4751, "step": 24669 }, { "epoch": 1.94, "learning_rate": 8.314380242196576e-05, "loss": 1.4896, "step": 24670 }, { "epoch": 1.94, "learning_rate": 8.313273849782525e-05, "loss": 1.452, "step": 24671 }, { "epoch": 1.94, "learning_rate": 8.312167502767656e-05, "loss": 1.4394, "step": 24672 }, { "epoch": 1.94, "learning_rate": 8.311061201159473e-05, "loss": 1.4811, "step": 24673 }, { "epoch": 1.94, "learning_rate": 8.309954944965499e-05, "loss": 1.4447, "step": 24674 }, { "epoch": 1.94, "learning_rate": 8.308848734193238e-05, "loss": 1.4867, "step": 24675 }, { "epoch": 1.94, "learning_rate": 8.307742568850196e-05, "loss": 1.4764, "step": 24676 }, { "epoch": 1.94, "learning_rate": 8.306636448943896e-05, "loss": 1.5224, "step": 24677 }, { "epoch": 1.94, "learning_rate": 8.30553037448184e-05, "loss": 1.5034, "step": 24678 }, { "epoch": 1.94, "learning_rate": 8.304424345471539e-05, "loss": 1.5122, "step": 24679 }, { "epoch": 1.94, "learning_rate": 8.303318361920495e-05, "loss": 1.4684, "step": 24680 }, { "epoch": 1.94, "learning_rate": 8.30221242383623e-05, "loss": 1.5178, "step": 24681 }, { "epoch": 1.94, "learning_rate": 8.301106531226242e-05, "loss": 1.4731, "step": 24682 }, { "epoch": 1.94, "learning_rate": 8.300000684098047e-05, "loss": 1.5086, "step": 24683 }, { "epoch": 1.94, "learning_rate": 8.298894882459146e-05, "loss": 1.4167, "step": 24684 }, { "epoch": 1.94, "learning_rate": 8.297789126317055e-05, "loss": 1.4997, "step": 24685 }, { "epoch": 1.94, "learning_rate": 8.29668341567928e-05, "loss": 1.5192, "step": 24686 }, { "epoch": 1.94, "learning_rate": 8.295577750553318e-05, "loss": 1.4342, "step": 24687 }, { "epoch": 1.94, "learning_rate": 8.29447213094669e-05, "loss": 1.4956, "step": 24688 }, { "epoch": 1.94, "learning_rate": 8.293366556866894e-05, "loss": 1.4549, "step": 24689 }, { "epoch": 1.94, "learning_rate": 8.292261028321433e-05, "loss": 1.4558, "step": 24690 }, { "epoch": 1.94, "learning_rate": 8.291155545317825e-05, "loss": 1.5062, "step": 24691 }, { "epoch": 1.94, "learning_rate": 8.290050107863568e-05, "loss": 1.4312, "step": 24692 }, { "epoch": 1.94, "learning_rate": 8.288944715966162e-05, "loss": 1.5185, "step": 24693 }, { "epoch": 1.94, "learning_rate": 8.287839369633121e-05, "loss": 1.4898, "step": 24694 }, { "epoch": 1.94, "learning_rate": 8.286734068871951e-05, "loss": 1.4675, "step": 24695 }, { "epoch": 1.94, "learning_rate": 8.285628813690144e-05, "loss": 1.5362, "step": 24696 }, { "epoch": 1.94, "learning_rate": 8.284523604095218e-05, "loss": 1.4953, "step": 24697 }, { "epoch": 1.94, "learning_rate": 8.283418440094663e-05, "loss": 1.5193, "step": 24698 }, { "epoch": 1.94, "learning_rate": 8.282313321696e-05, "loss": 1.5529, "step": 24699 }, { "epoch": 1.94, "learning_rate": 8.281208248906715e-05, "loss": 1.4971, "step": 24700 }, { "epoch": 1.94, "learning_rate": 8.280103221734324e-05, "loss": 1.4502, "step": 24701 }, { "epoch": 1.94, "learning_rate": 8.278998240186322e-05, "loss": 1.4745, "step": 24702 }, { "epoch": 1.94, "learning_rate": 8.277893304270215e-05, "loss": 1.4998, "step": 24703 }, { "epoch": 1.94, "learning_rate": 8.276788413993499e-05, "loss": 1.4461, "step": 24704 }, { "epoch": 1.94, "learning_rate": 8.27568356936368e-05, "loss": 1.5116, "step": 24705 }, { "epoch": 1.94, "learning_rate": 8.274578770388263e-05, "loss": 1.4892, "step": 24706 }, { "epoch": 1.94, "learning_rate": 8.273474017074738e-05, "loss": 1.5141, "step": 24707 }, { "epoch": 1.94, "learning_rate": 8.272369309430618e-05, "loss": 1.4426, "step": 24708 }, { "epoch": 1.94, "learning_rate": 8.271264647463399e-05, "loss": 1.459, "step": 24709 }, { "epoch": 1.94, "learning_rate": 8.270160031180571e-05, "loss": 1.4993, "step": 24710 }, { "epoch": 1.94, "learning_rate": 8.269055460589652e-05, "loss": 1.456, "step": 24711 }, { "epoch": 1.94, "learning_rate": 8.26795093569813e-05, "loss": 1.4784, "step": 24712 }, { "epoch": 1.94, "learning_rate": 8.266846456513499e-05, "loss": 1.4794, "step": 24713 }, { "epoch": 1.94, "learning_rate": 8.265742023043266e-05, "loss": 1.4085, "step": 24714 }, { "epoch": 1.94, "learning_rate": 8.264637635294936e-05, "loss": 1.4605, "step": 24715 }, { "epoch": 1.94, "learning_rate": 8.263533293275999e-05, "loss": 1.4929, "step": 24716 }, { "epoch": 1.94, "learning_rate": 8.262428996993944e-05, "loss": 1.5038, "step": 24717 }, { "epoch": 1.94, "learning_rate": 8.261324746456288e-05, "loss": 1.5064, "step": 24718 }, { "epoch": 1.94, "learning_rate": 8.260220541670516e-05, "loss": 1.5084, "step": 24719 }, { "epoch": 1.95, "learning_rate": 8.259116382644127e-05, "loss": 1.5164, "step": 24720 }, { "epoch": 1.95, "learning_rate": 8.258012269384614e-05, "loss": 1.4367, "step": 24721 }, { "epoch": 1.95, "learning_rate": 8.256908201899481e-05, "loss": 1.4902, "step": 24722 }, { "epoch": 1.95, "learning_rate": 8.255804180196222e-05, "loss": 1.516, "step": 24723 }, { "epoch": 1.95, "learning_rate": 8.254700204282325e-05, "loss": 1.4842, "step": 24724 }, { "epoch": 1.95, "learning_rate": 8.253596274165295e-05, "loss": 1.4824, "step": 24725 }, { "epoch": 1.95, "learning_rate": 8.252492389852626e-05, "loss": 1.4827, "step": 24726 }, { "epoch": 1.95, "learning_rate": 8.251388551351804e-05, "loss": 1.4663, "step": 24727 }, { "epoch": 1.95, "learning_rate": 8.250284758670334e-05, "loss": 1.5492, "step": 24728 }, { "epoch": 1.95, "learning_rate": 8.249181011815705e-05, "loss": 1.4963, "step": 24729 }, { "epoch": 1.95, "learning_rate": 8.248077310795406e-05, "loss": 1.503, "step": 24730 }, { "epoch": 1.95, "learning_rate": 8.246973655616937e-05, "loss": 1.4848, "step": 24731 }, { "epoch": 1.95, "learning_rate": 8.245870046287796e-05, "loss": 1.4653, "step": 24732 }, { "epoch": 1.95, "learning_rate": 8.244766482815469e-05, "loss": 1.4725, "step": 24733 }, { "epoch": 1.95, "learning_rate": 8.243662965207447e-05, "loss": 1.5281, "step": 24734 }, { "epoch": 1.95, "learning_rate": 8.242559493471226e-05, "loss": 1.5073, "step": 24735 }, { "epoch": 1.95, "learning_rate": 8.241456067614302e-05, "loss": 1.4896, "step": 24736 }, { "epoch": 1.95, "learning_rate": 8.240352687644157e-05, "loss": 1.4791, "step": 24737 }, { "epoch": 1.95, "learning_rate": 8.239249353568284e-05, "loss": 1.5123, "step": 24738 }, { "epoch": 1.95, "learning_rate": 8.238146065394181e-05, "loss": 1.5267, "step": 24739 }, { "epoch": 1.95, "learning_rate": 8.237042823129337e-05, "loss": 1.4647, "step": 24740 }, { "epoch": 1.95, "learning_rate": 8.235939626781233e-05, "loss": 1.5042, "step": 24741 }, { "epoch": 1.95, "learning_rate": 8.234836476357372e-05, "loss": 1.4953, "step": 24742 }, { "epoch": 1.95, "learning_rate": 8.23373337186524e-05, "loss": 1.5021, "step": 24743 }, { "epoch": 1.95, "learning_rate": 8.232630313312316e-05, "loss": 1.4386, "step": 24744 }, { "epoch": 1.95, "learning_rate": 8.231527300706098e-05, "loss": 1.4448, "step": 24745 }, { "epoch": 1.95, "learning_rate": 8.23042433405408e-05, "loss": 1.5312, "step": 24746 }, { "epoch": 1.95, "learning_rate": 8.229321413363746e-05, "loss": 1.4863, "step": 24747 }, { "epoch": 1.95, "learning_rate": 8.228218538642578e-05, "loss": 1.4751, "step": 24748 }, { "epoch": 1.95, "learning_rate": 8.227115709898076e-05, "loss": 1.4852, "step": 24749 }, { "epoch": 1.95, "learning_rate": 8.226012927137716e-05, "loss": 1.4725, "step": 24750 }, { "epoch": 1.95, "learning_rate": 8.224910190368988e-05, "loss": 1.4664, "step": 24751 }, { "epoch": 1.95, "learning_rate": 8.223807499599387e-05, "loss": 1.5074, "step": 24752 }, { "epoch": 1.95, "learning_rate": 8.222704854836392e-05, "loss": 1.462, "step": 24753 }, { "epoch": 1.95, "learning_rate": 8.221602256087487e-05, "loss": 1.509, "step": 24754 }, { "epoch": 1.95, "learning_rate": 8.220499703360165e-05, "loss": 1.4378, "step": 24755 }, { "epoch": 1.95, "learning_rate": 8.21939719666191e-05, "loss": 1.506, "step": 24756 }, { "epoch": 1.95, "learning_rate": 8.218294736000207e-05, "loss": 1.5219, "step": 24757 }, { "epoch": 1.95, "learning_rate": 8.217192321382536e-05, "loss": 1.4759, "step": 24758 }, { "epoch": 1.95, "learning_rate": 8.21608995281639e-05, "loss": 1.5087, "step": 24759 }, { "epoch": 1.95, "learning_rate": 8.214987630309248e-05, "loss": 1.4552, "step": 24760 }, { "epoch": 1.95, "learning_rate": 8.213885353868592e-05, "loss": 1.4799, "step": 24761 }, { "epoch": 1.95, "learning_rate": 8.21278312350191e-05, "loss": 1.4389, "step": 24762 }, { "epoch": 1.95, "learning_rate": 8.211680939216691e-05, "loss": 1.4592, "step": 24763 }, { "epoch": 1.95, "learning_rate": 8.21057880102041e-05, "loss": 1.4935, "step": 24764 }, { "epoch": 1.95, "learning_rate": 8.209476708920547e-05, "loss": 1.4832, "step": 24765 }, { "epoch": 1.95, "learning_rate": 8.208374662924596e-05, "loss": 1.5011, "step": 24766 }, { "epoch": 1.95, "learning_rate": 8.207272663040034e-05, "loss": 1.4857, "step": 24767 }, { "epoch": 1.95, "learning_rate": 8.206170709274337e-05, "loss": 1.4961, "step": 24768 }, { "epoch": 1.95, "learning_rate": 8.205068801634994e-05, "loss": 1.474, "step": 24769 }, { "epoch": 1.95, "learning_rate": 8.203966940129487e-05, "loss": 1.4309, "step": 24770 }, { "epoch": 1.95, "learning_rate": 8.202865124765287e-05, "loss": 1.5028, "step": 24771 }, { "epoch": 1.95, "learning_rate": 8.20176335554989e-05, "loss": 1.498, "step": 24772 }, { "epoch": 1.95, "learning_rate": 8.200661632490767e-05, "loss": 1.5187, "step": 24773 }, { "epoch": 1.95, "learning_rate": 8.199559955595397e-05, "loss": 1.4755, "step": 24774 }, { "epoch": 1.95, "learning_rate": 8.19845832487126e-05, "loss": 1.495, "step": 24775 }, { "epoch": 1.95, "learning_rate": 8.197356740325841e-05, "loss": 1.4728, "step": 24776 }, { "epoch": 1.95, "learning_rate": 8.19625520196661e-05, "loss": 1.5097, "step": 24777 }, { "epoch": 1.95, "learning_rate": 8.195153709801059e-05, "loss": 1.4798, "step": 24778 }, { "epoch": 1.95, "learning_rate": 8.194052263836651e-05, "loss": 1.4704, "step": 24779 }, { "epoch": 1.95, "learning_rate": 8.19295086408088e-05, "loss": 1.4801, "step": 24780 }, { "epoch": 1.95, "learning_rate": 8.191849510541215e-05, "loss": 1.4422, "step": 24781 }, { "epoch": 1.95, "learning_rate": 8.190748203225129e-05, "loss": 1.468, "step": 24782 }, { "epoch": 1.95, "learning_rate": 8.189646942140113e-05, "loss": 1.4987, "step": 24783 }, { "epoch": 1.95, "learning_rate": 8.188545727293632e-05, "loss": 1.4856, "step": 24784 }, { "epoch": 1.95, "learning_rate": 8.187444558693165e-05, "loss": 1.4465, "step": 24785 }, { "epoch": 1.95, "learning_rate": 8.186343436346192e-05, "loss": 1.4383, "step": 24786 }, { "epoch": 1.95, "learning_rate": 8.185242360260189e-05, "loss": 1.4398, "step": 24787 }, { "epoch": 1.95, "learning_rate": 8.184141330442622e-05, "loss": 1.4521, "step": 24788 }, { "epoch": 1.95, "learning_rate": 8.183040346900984e-05, "loss": 1.4778, "step": 24789 }, { "epoch": 1.95, "learning_rate": 8.181939409642738e-05, "loss": 1.4978, "step": 24790 }, { "epoch": 1.95, "learning_rate": 8.180838518675359e-05, "loss": 1.5029, "step": 24791 }, { "epoch": 1.95, "learning_rate": 8.179737674006314e-05, "loss": 1.5342, "step": 24792 }, { "epoch": 1.95, "learning_rate": 8.178636875643098e-05, "loss": 1.499, "step": 24793 }, { "epoch": 1.95, "learning_rate": 8.177536123593172e-05, "loss": 1.5218, "step": 24794 }, { "epoch": 1.95, "learning_rate": 8.176435417864012e-05, "loss": 1.4489, "step": 24795 }, { "epoch": 1.95, "learning_rate": 8.175334758463082e-05, "loss": 1.4946, "step": 24796 }, { "epoch": 1.95, "learning_rate": 8.174234145397872e-05, "loss": 1.501, "step": 24797 }, { "epoch": 1.95, "learning_rate": 8.173133578675842e-05, "loss": 1.5398, "step": 24798 }, { "epoch": 1.95, "learning_rate": 8.172033058304465e-05, "loss": 1.5122, "step": 24799 }, { "epoch": 1.95, "learning_rate": 8.17093258429122e-05, "loss": 1.4852, "step": 24800 }, { "epoch": 1.95, "learning_rate": 8.169832156643573e-05, "loss": 1.4959, "step": 24801 }, { "epoch": 1.95, "learning_rate": 8.168731775368993e-05, "loss": 1.499, "step": 24802 }, { "epoch": 1.95, "learning_rate": 8.167631440474957e-05, "loss": 1.4888, "step": 24803 }, { "epoch": 1.95, "learning_rate": 8.166531151968936e-05, "loss": 1.4914, "step": 24804 }, { "epoch": 1.95, "learning_rate": 8.16543090985839e-05, "loss": 1.4974, "step": 24805 }, { "epoch": 1.95, "learning_rate": 8.164330714150805e-05, "loss": 1.4868, "step": 24806 }, { "epoch": 1.95, "learning_rate": 8.16323056485364e-05, "loss": 1.5187, "step": 24807 }, { "epoch": 1.95, "learning_rate": 8.16213046197436e-05, "loss": 1.5439, "step": 24808 }, { "epoch": 1.95, "learning_rate": 8.161030405520441e-05, "loss": 1.4919, "step": 24809 }, { "epoch": 1.95, "learning_rate": 8.159930395499357e-05, "loss": 1.5032, "step": 24810 }, { "epoch": 1.95, "learning_rate": 8.158830431918574e-05, "loss": 1.4903, "step": 24811 }, { "epoch": 1.95, "learning_rate": 8.157730514785547e-05, "loss": 1.5184, "step": 24812 }, { "epoch": 1.95, "learning_rate": 8.156630644107762e-05, "loss": 1.4459, "step": 24813 }, { "epoch": 1.95, "learning_rate": 8.155530819892679e-05, "loss": 1.4975, "step": 24814 }, { "epoch": 1.95, "learning_rate": 8.154431042147764e-05, "loss": 1.4657, "step": 24815 }, { "epoch": 1.95, "learning_rate": 8.153331310880477e-05, "loss": 1.5288, "step": 24816 }, { "epoch": 1.95, "learning_rate": 8.152231626098303e-05, "loss": 1.5515, "step": 24817 }, { "epoch": 1.95, "learning_rate": 8.151131987808694e-05, "loss": 1.4937, "step": 24818 }, { "epoch": 1.95, "learning_rate": 8.150032396019111e-05, "loss": 1.4541, "step": 24819 }, { "epoch": 1.95, "learning_rate": 8.148932850737037e-05, "loss": 1.4667, "step": 24820 }, { "epoch": 1.95, "learning_rate": 8.147833351969928e-05, "loss": 1.5124, "step": 24821 }, { "epoch": 1.95, "learning_rate": 8.146733899725243e-05, "loss": 1.4315, "step": 24822 }, { "epoch": 1.95, "learning_rate": 8.145634494010457e-05, "loss": 1.4396, "step": 24823 }, { "epoch": 1.95, "learning_rate": 8.144535134833026e-05, "loss": 1.481, "step": 24824 }, { "epoch": 1.95, "learning_rate": 8.143435822200423e-05, "loss": 1.463, "step": 24825 }, { "epoch": 1.95, "learning_rate": 8.142336556120104e-05, "loss": 1.4774, "step": 24826 }, { "epoch": 1.95, "learning_rate": 8.141237336599539e-05, "loss": 1.506, "step": 24827 }, { "epoch": 1.95, "learning_rate": 8.140138163646188e-05, "loss": 1.4168, "step": 24828 }, { "epoch": 1.95, "learning_rate": 8.139039037267507e-05, "loss": 1.4765, "step": 24829 }, { "epoch": 1.95, "learning_rate": 8.13793995747097e-05, "loss": 1.4955, "step": 24830 }, { "epoch": 1.95, "learning_rate": 8.136840924264036e-05, "loss": 1.49, "step": 24831 }, { "epoch": 1.95, "learning_rate": 8.135741937654163e-05, "loss": 1.5049, "step": 24832 }, { "epoch": 1.95, "learning_rate": 8.134642997648809e-05, "loss": 1.5028, "step": 24833 }, { "epoch": 1.95, "learning_rate": 8.133544104255447e-05, "loss": 1.504, "step": 24834 }, { "epoch": 1.95, "learning_rate": 8.132445257481531e-05, "loss": 1.4524, "step": 24835 }, { "epoch": 1.95, "learning_rate": 8.131346457334514e-05, "loss": 1.4728, "step": 24836 }, { "epoch": 1.95, "learning_rate": 8.130247703821872e-05, "loss": 1.4982, "step": 24837 }, { "epoch": 1.95, "learning_rate": 8.129148996951057e-05, "loss": 1.4377, "step": 24838 }, { "epoch": 1.95, "learning_rate": 8.128050336729521e-05, "loss": 1.4682, "step": 24839 }, { "epoch": 1.95, "learning_rate": 8.126951723164733e-05, "loss": 1.4707, "step": 24840 }, { "epoch": 1.95, "learning_rate": 8.125853156264156e-05, "loss": 1.4586, "step": 24841 }, { "epoch": 1.95, "learning_rate": 8.124754636035242e-05, "loss": 1.444, "step": 24842 }, { "epoch": 1.95, "learning_rate": 8.123656162485443e-05, "loss": 1.4993, "step": 24843 }, { "epoch": 1.95, "learning_rate": 8.12255773562223e-05, "loss": 1.4362, "step": 24844 }, { "epoch": 1.95, "learning_rate": 8.121459355453056e-05, "loss": 1.4526, "step": 24845 }, { "epoch": 1.95, "learning_rate": 8.120361021985371e-05, "loss": 1.4666, "step": 24846 }, { "epoch": 1.95, "learning_rate": 8.119262735226643e-05, "loss": 1.5049, "step": 24847 }, { "epoch": 1.96, "learning_rate": 8.118164495184325e-05, "loss": 1.4569, "step": 24848 }, { "epoch": 1.96, "learning_rate": 8.117066301865872e-05, "loss": 1.466, "step": 24849 }, { "epoch": 1.96, "learning_rate": 8.115968155278735e-05, "loss": 1.458, "step": 24850 }, { "epoch": 1.96, "learning_rate": 8.11487005543038e-05, "loss": 1.4699, "step": 24851 }, { "epoch": 1.96, "learning_rate": 8.11377200232826e-05, "loss": 1.4838, "step": 24852 }, { "epoch": 1.96, "learning_rate": 8.11267399597982e-05, "loss": 1.5357, "step": 24853 }, { "epoch": 1.96, "learning_rate": 8.111576036392528e-05, "loss": 1.4824, "step": 24854 }, { "epoch": 1.96, "learning_rate": 8.110478123573828e-05, "loss": 1.4863, "step": 24855 }, { "epoch": 1.96, "learning_rate": 8.109380257531186e-05, "loss": 1.4894, "step": 24856 }, { "epoch": 1.96, "learning_rate": 8.108282438272046e-05, "loss": 1.4678, "step": 24857 }, { "epoch": 1.96, "learning_rate": 8.107184665803868e-05, "loss": 1.5087, "step": 24858 }, { "epoch": 1.96, "learning_rate": 8.106086940134103e-05, "loss": 1.5185, "step": 24859 }, { "epoch": 1.96, "learning_rate": 8.104989261270198e-05, "loss": 1.4499, "step": 24860 }, { "epoch": 1.96, "learning_rate": 8.103891629219616e-05, "loss": 1.4939, "step": 24861 }, { "epoch": 1.96, "learning_rate": 8.102794043989804e-05, "loss": 1.4894, "step": 24862 }, { "epoch": 1.96, "learning_rate": 8.101696505588209e-05, "loss": 1.4834, "step": 24863 }, { "epoch": 1.96, "learning_rate": 8.100599014022295e-05, "loss": 1.5038, "step": 24864 }, { "epoch": 1.96, "learning_rate": 8.099501569299503e-05, "loss": 1.523, "step": 24865 }, { "epoch": 1.96, "learning_rate": 8.098404171427285e-05, "loss": 1.4926, "step": 24866 }, { "epoch": 1.96, "learning_rate": 8.097306820413098e-05, "loss": 1.4669, "step": 24867 }, { "epoch": 1.96, "learning_rate": 8.096209516264388e-05, "loss": 1.5244, "step": 24868 }, { "epoch": 1.96, "learning_rate": 8.095112258988608e-05, "loss": 1.515, "step": 24869 }, { "epoch": 1.96, "learning_rate": 8.094015048593199e-05, "loss": 1.4859, "step": 24870 }, { "epoch": 1.96, "learning_rate": 8.092917885085615e-05, "loss": 1.5003, "step": 24871 }, { "epoch": 1.96, "learning_rate": 8.091820768473314e-05, "loss": 1.4707, "step": 24872 }, { "epoch": 1.96, "learning_rate": 8.090723698763738e-05, "loss": 1.4805, "step": 24873 }, { "epoch": 1.96, "learning_rate": 8.089626675964326e-05, "loss": 1.4601, "step": 24874 }, { "epoch": 1.96, "learning_rate": 8.088529700082545e-05, "loss": 1.4812, "step": 24875 }, { "epoch": 1.96, "learning_rate": 8.087432771125832e-05, "loss": 1.4545, "step": 24876 }, { "epoch": 1.96, "learning_rate": 8.08633588910163e-05, "loss": 1.5027, "step": 24877 }, { "epoch": 1.96, "learning_rate": 8.085239054017398e-05, "loss": 1.5181, "step": 24878 }, { "epoch": 1.96, "learning_rate": 8.084142265880578e-05, "loss": 1.5154, "step": 24879 }, { "epoch": 1.96, "learning_rate": 8.083045524698607e-05, "loss": 1.4605, "step": 24880 }, { "epoch": 1.96, "learning_rate": 8.081948830478948e-05, "loss": 1.4951, "step": 24881 }, { "epoch": 1.96, "learning_rate": 8.080852183229038e-05, "loss": 1.5145, "step": 24882 }, { "epoch": 1.96, "learning_rate": 8.079755582956318e-05, "loss": 1.5038, "step": 24883 }, { "epoch": 1.96, "learning_rate": 8.078659029668243e-05, "loss": 1.5011, "step": 24884 }, { "epoch": 1.96, "learning_rate": 8.077562523372255e-05, "loss": 1.434, "step": 24885 }, { "epoch": 1.96, "learning_rate": 8.076466064075799e-05, "loss": 1.4669, "step": 24886 }, { "epoch": 1.96, "learning_rate": 8.075369651786303e-05, "loss": 1.4929, "step": 24887 }, { "epoch": 1.96, "learning_rate": 8.074273286511238e-05, "loss": 1.4241, "step": 24888 }, { "epoch": 1.96, "learning_rate": 8.073176968258038e-05, "loss": 1.5414, "step": 24889 }, { "epoch": 1.96, "learning_rate": 8.07208069703414e-05, "loss": 1.4899, "step": 24890 }, { "epoch": 1.96, "learning_rate": 8.070984472846986e-05, "loss": 1.4402, "step": 24891 }, { "epoch": 1.96, "learning_rate": 8.069888295704032e-05, "loss": 1.5003, "step": 24892 }, { "epoch": 1.96, "learning_rate": 8.068792165612709e-05, "loss": 1.4341, "step": 24893 }, { "epoch": 1.96, "learning_rate": 8.067696082580459e-05, "loss": 1.5233, "step": 24894 }, { "epoch": 1.96, "learning_rate": 8.066600046614733e-05, "loss": 1.4825, "step": 24895 }, { "epoch": 1.96, "learning_rate": 8.065504057722965e-05, "loss": 1.4365, "step": 24896 }, { "epoch": 1.96, "learning_rate": 8.064408115912591e-05, "loss": 1.5282, "step": 24897 }, { "epoch": 1.96, "learning_rate": 8.063312221191066e-05, "loss": 1.4551, "step": 24898 }, { "epoch": 1.96, "learning_rate": 8.062216373565821e-05, "loss": 1.4453, "step": 24899 }, { "epoch": 1.96, "learning_rate": 8.061120573044297e-05, "loss": 1.4783, "step": 24900 }, { "epoch": 1.96, "learning_rate": 8.060024819633937e-05, "loss": 1.5411, "step": 24901 }, { "epoch": 1.96, "learning_rate": 8.058929113342174e-05, "loss": 1.4527, "step": 24902 }, { "epoch": 1.96, "learning_rate": 8.057833454176457e-05, "loss": 1.4717, "step": 24903 }, { "epoch": 1.96, "learning_rate": 8.056737842144215e-05, "loss": 1.4616, "step": 24904 }, { "epoch": 1.96, "learning_rate": 8.055642277252897e-05, "loss": 1.4379, "step": 24905 }, { "epoch": 1.96, "learning_rate": 8.054546759509935e-05, "loss": 1.465, "step": 24906 }, { "epoch": 1.96, "learning_rate": 8.053451288922763e-05, "loss": 1.443, "step": 24907 }, { "epoch": 1.96, "learning_rate": 8.052355865498828e-05, "loss": 1.5032, "step": 24908 }, { "epoch": 1.96, "learning_rate": 8.051260489245564e-05, "loss": 1.5013, "step": 24909 }, { "epoch": 1.96, "learning_rate": 8.050165160170405e-05, "loss": 1.511, "step": 24910 }, { "epoch": 1.96, "learning_rate": 8.049069878280783e-05, "loss": 1.4917, "step": 24911 }, { "epoch": 1.96, "learning_rate": 8.047974643584148e-05, "loss": 1.5094, "step": 24912 }, { "epoch": 1.96, "learning_rate": 8.04687945608793e-05, "loss": 1.5044, "step": 24913 }, { "epoch": 1.96, "learning_rate": 8.045784315799556e-05, "loss": 1.5312, "step": 24914 }, { "epoch": 1.96, "learning_rate": 8.044689222726475e-05, "loss": 1.4927, "step": 24915 }, { "epoch": 1.96, "learning_rate": 8.043594176876117e-05, "loss": 1.5044, "step": 24916 }, { "epoch": 1.96, "learning_rate": 8.042499178255909e-05, "loss": 1.4747, "step": 24917 }, { "epoch": 1.96, "learning_rate": 8.04140422687329e-05, "loss": 1.5439, "step": 24918 }, { "epoch": 1.96, "learning_rate": 8.040309322735705e-05, "loss": 1.4821, "step": 24919 }, { "epoch": 1.96, "learning_rate": 8.039214465850578e-05, "loss": 1.474, "step": 24920 }, { "epoch": 1.96, "learning_rate": 8.038119656225339e-05, "loss": 1.4552, "step": 24921 }, { "epoch": 1.96, "learning_rate": 8.037024893867427e-05, "loss": 1.451, "step": 24922 }, { "epoch": 1.96, "learning_rate": 8.035930178784278e-05, "loss": 1.4318, "step": 24923 }, { "epoch": 1.96, "learning_rate": 8.034835510983312e-05, "loss": 1.484, "step": 24924 }, { "epoch": 1.96, "learning_rate": 8.033740890471976e-05, "loss": 1.4711, "step": 24925 }, { "epoch": 1.96, "learning_rate": 8.032646317257694e-05, "loss": 1.496, "step": 24926 }, { "epoch": 1.96, "learning_rate": 8.031551791347901e-05, "loss": 1.4872, "step": 24927 }, { "epoch": 1.96, "learning_rate": 8.030457312750018e-05, "loss": 1.468, "step": 24928 }, { "epoch": 1.96, "learning_rate": 8.02936288147149e-05, "loss": 1.5012, "step": 24929 }, { "epoch": 1.96, "learning_rate": 8.02826849751974e-05, "loss": 1.4654, "step": 24930 }, { "epoch": 1.96, "learning_rate": 8.027174160902195e-05, "loss": 1.4274, "step": 24931 }, { "epoch": 1.96, "learning_rate": 8.026079871626296e-05, "loss": 1.4545, "step": 24932 }, { "epoch": 1.96, "learning_rate": 8.024985629699465e-05, "loss": 1.4421, "step": 24933 }, { "epoch": 1.96, "learning_rate": 8.023891435129128e-05, "loss": 1.4662, "step": 24934 }, { "epoch": 1.96, "learning_rate": 8.022797287922717e-05, "loss": 1.4223, "step": 24935 }, { "epoch": 1.96, "learning_rate": 8.021703188087668e-05, "loss": 1.4426, "step": 24936 }, { "epoch": 1.96, "learning_rate": 8.020609135631404e-05, "loss": 1.4912, "step": 24937 }, { "epoch": 1.96, "learning_rate": 8.019515130561347e-05, "loss": 1.4966, "step": 24938 }, { "epoch": 1.96, "learning_rate": 8.018421172884935e-05, "loss": 1.4538, "step": 24939 }, { "epoch": 1.96, "learning_rate": 8.017327262609591e-05, "loss": 1.4903, "step": 24940 }, { "epoch": 1.96, "learning_rate": 8.016233399742735e-05, "loss": 1.4715, "step": 24941 }, { "epoch": 1.96, "learning_rate": 8.015139584291808e-05, "loss": 1.4538, "step": 24942 }, { "epoch": 1.96, "learning_rate": 8.014045816264225e-05, "loss": 1.4344, "step": 24943 }, { "epoch": 1.96, "learning_rate": 8.01295209566742e-05, "loss": 1.4437, "step": 24944 }, { "epoch": 1.96, "learning_rate": 8.011858422508806e-05, "loss": 1.4897, "step": 24945 }, { "epoch": 1.96, "learning_rate": 8.010764796795823e-05, "loss": 1.4458, "step": 24946 }, { "epoch": 1.96, "learning_rate": 8.00967121853589e-05, "loss": 1.4712, "step": 24947 }, { "epoch": 1.96, "learning_rate": 8.008577687736427e-05, "loss": 1.4729, "step": 24948 }, { "epoch": 1.96, "learning_rate": 8.007484204404868e-05, "loss": 1.4657, "step": 24949 }, { "epoch": 1.96, "learning_rate": 8.006390768548628e-05, "loss": 1.4942, "step": 24950 }, { "epoch": 1.96, "learning_rate": 8.00529738017514e-05, "loss": 1.4284, "step": 24951 }, { "epoch": 1.96, "learning_rate": 8.004204039291818e-05, "loss": 1.44, "step": 24952 }, { "epoch": 1.96, "learning_rate": 8.003110745906096e-05, "loss": 1.4763, "step": 24953 }, { "epoch": 1.96, "learning_rate": 8.00201750002539e-05, "loss": 1.5157, "step": 24954 }, { "epoch": 1.96, "learning_rate": 8.000924301657117e-05, "loss": 1.4433, "step": 24955 }, { "epoch": 1.96, "learning_rate": 7.999831150808712e-05, "loss": 1.4663, "step": 24956 }, { "epoch": 1.96, "learning_rate": 7.99873804748759e-05, "loss": 1.4931, "step": 24957 }, { "epoch": 1.96, "learning_rate": 7.997644991701168e-05, "loss": 1.4993, "step": 24958 }, { "epoch": 1.96, "learning_rate": 7.996551983456877e-05, "loss": 1.4665, "step": 24959 }, { "epoch": 1.96, "learning_rate": 7.995459022762135e-05, "loss": 1.4746, "step": 24960 }, { "epoch": 1.96, "learning_rate": 7.994366109624359e-05, "loss": 1.504, "step": 24961 }, { "epoch": 1.96, "learning_rate": 7.993273244050967e-05, "loss": 1.4871, "step": 24962 }, { "epoch": 1.96, "learning_rate": 7.992180426049388e-05, "loss": 1.434, "step": 24963 }, { "epoch": 1.96, "learning_rate": 7.991087655627036e-05, "loss": 1.4342, "step": 24964 }, { "epoch": 1.96, "learning_rate": 7.98999493279132e-05, "loss": 1.4622, "step": 24965 }, { "epoch": 1.96, "learning_rate": 7.988902257549682e-05, "loss": 1.4675, "step": 24966 }, { "epoch": 1.96, "learning_rate": 7.987809629909527e-05, "loss": 1.4345, "step": 24967 }, { "epoch": 1.96, "learning_rate": 7.986717049878276e-05, "loss": 1.4862, "step": 24968 }, { "epoch": 1.96, "learning_rate": 7.98562451746334e-05, "loss": 1.5122, "step": 24969 }, { "epoch": 1.96, "learning_rate": 7.98453203267215e-05, "loss": 1.4841, "step": 24970 }, { "epoch": 1.96, "learning_rate": 7.983439595512114e-05, "loss": 1.4973, "step": 24971 }, { "epoch": 1.96, "learning_rate": 7.982347205990646e-05, "loss": 1.4665, "step": 24972 }, { "epoch": 1.96, "learning_rate": 7.981254864115176e-05, "loss": 1.4969, "step": 24973 }, { "epoch": 1.96, "learning_rate": 7.980162569893107e-05, "loss": 1.4697, "step": 24974 }, { "epoch": 1.97, "learning_rate": 7.979070323331858e-05, "loss": 1.4711, "step": 24975 }, { "epoch": 1.97, "learning_rate": 7.977978124438854e-05, "loss": 1.4903, "step": 24976 }, { "epoch": 1.97, "learning_rate": 7.976885973221501e-05, "loss": 1.5597, "step": 24977 }, { "epoch": 1.97, "learning_rate": 7.975793869687212e-05, "loss": 1.554, "step": 24978 }, { "epoch": 1.97, "learning_rate": 7.974701813843411e-05, "loss": 1.49, "step": 24979 }, { "epoch": 1.97, "learning_rate": 7.973609805697508e-05, "loss": 1.5278, "step": 24980 }, { "epoch": 1.97, "learning_rate": 7.972517845256913e-05, "loss": 1.5028, "step": 24981 }, { "epoch": 1.97, "learning_rate": 7.971425932529041e-05, "loss": 1.4653, "step": 24982 }, { "epoch": 1.97, "learning_rate": 7.970334067521316e-05, "loss": 1.4727, "step": 24983 }, { "epoch": 1.97, "learning_rate": 7.969242250241142e-05, "loss": 1.536, "step": 24984 }, { "epoch": 1.97, "learning_rate": 7.968150480695935e-05, "loss": 1.4957, "step": 24985 }, { "epoch": 1.97, "learning_rate": 7.967058758893099e-05, "loss": 1.5061, "step": 24986 }, { "epoch": 1.97, "learning_rate": 7.965967084840057e-05, "loss": 1.4968, "step": 24987 }, { "epoch": 1.97, "learning_rate": 7.964875458544219e-05, "loss": 1.5345, "step": 24988 }, { "epoch": 1.97, "learning_rate": 7.963783880012988e-05, "loss": 1.4997, "step": 24989 }, { "epoch": 1.97, "learning_rate": 7.962692349253787e-05, "loss": 1.4967, "step": 24990 }, { "epoch": 1.97, "learning_rate": 7.961600866274022e-05, "loss": 1.4537, "step": 24991 }, { "epoch": 1.97, "learning_rate": 7.960509431081099e-05, "loss": 1.4477, "step": 24992 }, { "epoch": 1.97, "learning_rate": 7.959418043682433e-05, "loss": 1.4486, "step": 24993 }, { "epoch": 1.97, "learning_rate": 7.958326704085437e-05, "loss": 1.497, "step": 24994 }, { "epoch": 1.97, "learning_rate": 7.957235412297511e-05, "loss": 1.4635, "step": 24995 }, { "epoch": 1.97, "learning_rate": 7.956144168326073e-05, "loss": 1.4733, "step": 24996 }, { "epoch": 1.97, "learning_rate": 7.955052972178526e-05, "loss": 1.494, "step": 24997 }, { "epoch": 1.97, "learning_rate": 7.953961823862287e-05, "loss": 1.415, "step": 24998 }, { "epoch": 1.97, "learning_rate": 7.952870723384754e-05, "loss": 1.5518, "step": 24999 }, { "epoch": 1.97, "learning_rate": 7.951779670753342e-05, "loss": 1.4617, "step": 25000 }, { "epoch": 1.97, "learning_rate": 7.950688665975459e-05, "loss": 1.5204, "step": 25001 }, { "epoch": 1.97, "learning_rate": 7.94959770905851e-05, "loss": 1.4948, "step": 25002 }, { "epoch": 1.97, "learning_rate": 7.948506800009895e-05, "loss": 1.5018, "step": 25003 }, { "epoch": 1.97, "learning_rate": 7.947415938837035e-05, "loss": 1.576, "step": 25004 }, { "epoch": 1.97, "learning_rate": 7.946325125547328e-05, "loss": 1.5086, "step": 25005 }, { "epoch": 1.97, "learning_rate": 7.945234360148175e-05, "loss": 1.455, "step": 25006 }, { "epoch": 1.97, "learning_rate": 7.944143642646993e-05, "loss": 1.5447, "step": 25007 }, { "epoch": 1.97, "learning_rate": 7.943052973051183e-05, "loss": 1.4051, "step": 25008 }, { "epoch": 1.97, "learning_rate": 7.941962351368142e-05, "loss": 1.4728, "step": 25009 }, { "epoch": 1.97, "learning_rate": 7.940871777605285e-05, "loss": 1.4996, "step": 25010 }, { "epoch": 1.97, "learning_rate": 7.939781251770017e-05, "loss": 1.4473, "step": 25011 }, { "epoch": 1.97, "learning_rate": 7.938690773869732e-05, "loss": 1.4776, "step": 25012 }, { "epoch": 1.97, "learning_rate": 7.93760034391184e-05, "loss": 1.4887, "step": 25013 }, { "epoch": 1.97, "learning_rate": 7.936509961903748e-05, "loss": 1.5109, "step": 25014 }, { "epoch": 1.97, "learning_rate": 7.935419627852857e-05, "loss": 1.5318, "step": 25015 }, { "epoch": 1.97, "learning_rate": 7.934329341766561e-05, "loss": 1.499, "step": 25016 }, { "epoch": 1.97, "learning_rate": 7.933239103652276e-05, "loss": 1.4553, "step": 25017 }, { "epoch": 1.97, "learning_rate": 7.932148913517398e-05, "loss": 1.5047, "step": 25018 }, { "epoch": 1.97, "learning_rate": 7.931058771369323e-05, "loss": 1.5009, "step": 25019 }, { "epoch": 1.97, "learning_rate": 7.929968677215464e-05, "loss": 1.4822, "step": 25020 }, { "epoch": 1.97, "learning_rate": 7.928878631063217e-05, "loss": 1.4867, "step": 25021 }, { "epoch": 1.97, "learning_rate": 7.92778863291998e-05, "loss": 1.4973, "step": 25022 }, { "epoch": 1.97, "learning_rate": 7.92669868279315e-05, "loss": 1.4553, "step": 25023 }, { "epoch": 1.97, "learning_rate": 7.925608780690139e-05, "loss": 1.4719, "step": 25024 }, { "epoch": 1.97, "learning_rate": 7.92451892661834e-05, "loss": 1.4339, "step": 25025 }, { "epoch": 1.97, "learning_rate": 7.923429120585147e-05, "loss": 1.4384, "step": 25026 }, { "epoch": 1.97, "learning_rate": 7.922339362597971e-05, "loss": 1.4817, "step": 25027 }, { "epoch": 1.97, "learning_rate": 7.921249652664197e-05, "loss": 1.4585, "step": 25028 }, { "epoch": 1.97, "learning_rate": 7.920159990791241e-05, "loss": 1.5015, "step": 25029 }, { "epoch": 1.97, "learning_rate": 7.919070376986485e-05, "loss": 1.5304, "step": 25030 }, { "epoch": 1.97, "learning_rate": 7.917980811257338e-05, "loss": 1.5347, "step": 25031 }, { "epoch": 1.97, "learning_rate": 7.916891293611195e-05, "loss": 1.4879, "step": 25032 }, { "epoch": 1.97, "learning_rate": 7.915801824055444e-05, "loss": 1.4903, "step": 25033 }, { "epoch": 1.97, "learning_rate": 7.914712402597493e-05, "loss": 1.5098, "step": 25034 }, { "epoch": 1.97, "learning_rate": 7.91362302924474e-05, "loss": 1.444, "step": 25035 }, { "epoch": 1.97, "learning_rate": 7.912533704004568e-05, "loss": 1.5125, "step": 25036 }, { "epoch": 1.97, "learning_rate": 7.911444426884384e-05, "loss": 1.4706, "step": 25037 }, { "epoch": 1.97, "learning_rate": 7.910355197891584e-05, "loss": 1.4917, "step": 25038 }, { "epoch": 1.97, "learning_rate": 7.909266017033559e-05, "loss": 1.4719, "step": 25039 }, { "epoch": 1.97, "learning_rate": 7.908176884317697e-05, "loss": 1.4603, "step": 25040 }, { "epoch": 1.97, "learning_rate": 7.907087799751409e-05, "loss": 1.4608, "step": 25041 }, { "epoch": 1.97, "learning_rate": 7.905998763342078e-05, "loss": 1.4743, "step": 25042 }, { "epoch": 1.97, "learning_rate": 7.904909775097097e-05, "loss": 1.4596, "step": 25043 }, { "epoch": 1.97, "learning_rate": 7.903820835023863e-05, "loss": 1.453, "step": 25044 }, { "epoch": 1.97, "learning_rate": 7.902731943129774e-05, "loss": 1.4713, "step": 25045 }, { "epoch": 1.97, "learning_rate": 7.901643099422221e-05, "loss": 1.4846, "step": 25046 }, { "epoch": 1.97, "learning_rate": 7.900554303908585e-05, "loss": 1.4436, "step": 25047 }, { "epoch": 1.97, "learning_rate": 7.899465556596274e-05, "loss": 1.5001, "step": 25048 }, { "epoch": 1.97, "learning_rate": 7.898376857492674e-05, "loss": 1.4753, "step": 25049 }, { "epoch": 1.97, "learning_rate": 7.897288206605171e-05, "loss": 1.4864, "step": 25050 }, { "epoch": 1.97, "learning_rate": 7.896199603941168e-05, "loss": 1.5096, "step": 25051 }, { "epoch": 1.97, "learning_rate": 7.895111049508049e-05, "loss": 1.4879, "step": 25052 }, { "epoch": 1.97, "learning_rate": 7.894022543313199e-05, "loss": 1.5133, "step": 25053 }, { "epoch": 1.97, "learning_rate": 7.89293408536402e-05, "loss": 1.4839, "step": 25054 }, { "epoch": 1.97, "learning_rate": 7.891845675667897e-05, "loss": 1.5014, "step": 25055 }, { "epoch": 1.97, "learning_rate": 7.890757314232217e-05, "loss": 1.4807, "step": 25056 }, { "epoch": 1.97, "learning_rate": 7.889669001064369e-05, "loss": 1.479, "step": 25057 }, { "epoch": 1.97, "learning_rate": 7.888580736171748e-05, "loss": 1.5129, "step": 25058 }, { "epoch": 1.97, "learning_rate": 7.887492519561742e-05, "loss": 1.495, "step": 25059 }, { "epoch": 1.97, "learning_rate": 7.88640435124173e-05, "loss": 1.52, "step": 25060 }, { "epoch": 1.97, "learning_rate": 7.885316231219104e-05, "loss": 1.4975, "step": 25061 }, { "epoch": 1.97, "learning_rate": 7.884228159501264e-05, "loss": 1.4118, "step": 25062 }, { "epoch": 1.97, "learning_rate": 7.883140136095588e-05, "loss": 1.4446, "step": 25063 }, { "epoch": 1.97, "learning_rate": 7.882052161009456e-05, "loss": 1.451, "step": 25064 }, { "epoch": 1.97, "learning_rate": 7.880964234250267e-05, "loss": 1.4647, "step": 25065 }, { "epoch": 1.97, "learning_rate": 7.879876355825402e-05, "loss": 1.4757, "step": 25066 }, { "epoch": 1.97, "learning_rate": 7.878788525742244e-05, "loss": 1.4794, "step": 25067 }, { "epoch": 1.97, "learning_rate": 7.877700744008186e-05, "loss": 1.4373, "step": 25068 }, { "epoch": 1.97, "learning_rate": 7.87661301063061e-05, "loss": 1.4839, "step": 25069 }, { "epoch": 1.97, "learning_rate": 7.875525325616895e-05, "loss": 1.4959, "step": 25070 }, { "epoch": 1.97, "learning_rate": 7.874437688974437e-05, "loss": 1.5081, "step": 25071 }, { "epoch": 1.97, "learning_rate": 7.873350100710614e-05, "loss": 1.4821, "step": 25072 }, { "epoch": 1.97, "learning_rate": 7.872262560832808e-05, "loss": 1.457, "step": 25073 }, { "epoch": 1.97, "learning_rate": 7.871175069348409e-05, "loss": 1.405, "step": 25074 }, { "epoch": 1.97, "learning_rate": 7.870087626264793e-05, "loss": 1.4248, "step": 25075 }, { "epoch": 1.97, "learning_rate": 7.869000231589351e-05, "loss": 1.4594, "step": 25076 }, { "epoch": 1.97, "learning_rate": 7.867912885329458e-05, "loss": 1.4895, "step": 25077 }, { "epoch": 1.97, "learning_rate": 7.866825587492506e-05, "loss": 1.5107, "step": 25078 }, { "epoch": 1.97, "learning_rate": 7.865738338085873e-05, "loss": 1.4781, "step": 25079 }, { "epoch": 1.97, "learning_rate": 7.864651137116937e-05, "loss": 1.4916, "step": 25080 }, { "epoch": 1.97, "learning_rate": 7.863563984593079e-05, "loss": 1.4333, "step": 25081 }, { "epoch": 1.97, "learning_rate": 7.862476880521687e-05, "loss": 1.4691, "step": 25082 }, { "epoch": 1.97, "learning_rate": 7.861389824910142e-05, "loss": 1.4587, "step": 25083 }, { "epoch": 1.97, "learning_rate": 7.860302817765812e-05, "loss": 1.5424, "step": 25084 }, { "epoch": 1.97, "learning_rate": 7.85921585909609e-05, "loss": 1.4613, "step": 25085 }, { "epoch": 1.97, "learning_rate": 7.858128948908354e-05, "loss": 1.4871, "step": 25086 }, { "epoch": 1.97, "learning_rate": 7.857042087209977e-05, "loss": 1.4898, "step": 25087 }, { "epoch": 1.97, "learning_rate": 7.855955274008346e-05, "loss": 1.4853, "step": 25088 }, { "epoch": 1.97, "learning_rate": 7.854868509310836e-05, "loss": 1.4447, "step": 25089 }, { "epoch": 1.97, "learning_rate": 7.853781793124821e-05, "loss": 1.4637, "step": 25090 }, { "epoch": 1.97, "learning_rate": 7.852695125457683e-05, "loss": 1.5162, "step": 25091 }, { "epoch": 1.97, "learning_rate": 7.851608506316809e-05, "loss": 1.4581, "step": 25092 }, { "epoch": 1.97, "learning_rate": 7.850521935709566e-05, "loss": 1.4937, "step": 25093 }, { "epoch": 1.97, "learning_rate": 7.849435413643328e-05, "loss": 1.4906, "step": 25094 }, { "epoch": 1.97, "learning_rate": 7.848348940125485e-05, "loss": 1.4908, "step": 25095 }, { "epoch": 1.97, "learning_rate": 7.847262515163405e-05, "loss": 1.4943, "step": 25096 }, { "epoch": 1.97, "learning_rate": 7.846176138764466e-05, "loss": 1.4467, "step": 25097 }, { "epoch": 1.97, "learning_rate": 7.845089810936036e-05, "loss": 1.4734, "step": 25098 }, { "epoch": 1.97, "learning_rate": 7.844003531685506e-05, "loss": 1.4948, "step": 25099 }, { "epoch": 1.97, "learning_rate": 7.84291730102024e-05, "loss": 1.5258, "step": 25100 }, { "epoch": 1.97, "learning_rate": 7.841831118947612e-05, "loss": 1.4547, "step": 25101 }, { "epoch": 1.98, "learning_rate": 7.840744985475005e-05, "loss": 1.5625, "step": 25102 }, { "epoch": 1.98, "learning_rate": 7.839658900609791e-05, "loss": 1.4507, "step": 25103 }, { "epoch": 1.98, "learning_rate": 7.838572864359333e-05, "loss": 1.4444, "step": 25104 }, { "epoch": 1.98, "learning_rate": 7.83748687673102e-05, "loss": 1.5009, "step": 25105 }, { "epoch": 1.98, "learning_rate": 7.83640093773222e-05, "loss": 1.4546, "step": 25106 }, { "epoch": 1.98, "learning_rate": 7.835315047370297e-05, "loss": 1.5167, "step": 25107 }, { "epoch": 1.98, "learning_rate": 7.834229205652632e-05, "loss": 1.4891, "step": 25108 }, { "epoch": 1.98, "learning_rate": 7.833143412586603e-05, "loss": 1.4903, "step": 25109 }, { "epoch": 1.98, "learning_rate": 7.832057668179572e-05, "loss": 1.4552, "step": 25110 }, { "epoch": 1.98, "learning_rate": 7.830971972438911e-05, "loss": 1.4879, "step": 25111 }, { "epoch": 1.98, "learning_rate": 7.829886325371999e-05, "loss": 1.4963, "step": 25112 }, { "epoch": 1.98, "learning_rate": 7.828800726986203e-05, "loss": 1.5218, "step": 25113 }, { "epoch": 1.98, "learning_rate": 7.82771517728889e-05, "loss": 1.4182, "step": 25114 }, { "epoch": 1.98, "learning_rate": 7.826629676287428e-05, "loss": 1.4855, "step": 25115 }, { "epoch": 1.98, "learning_rate": 7.825544223989201e-05, "loss": 1.4761, "step": 25116 }, { "epoch": 1.98, "learning_rate": 7.824458820401565e-05, "loss": 1.4586, "step": 25117 }, { "epoch": 1.98, "learning_rate": 7.82337346553189e-05, "loss": 1.519, "step": 25118 }, { "epoch": 1.98, "learning_rate": 7.822288159387555e-05, "loss": 1.5131, "step": 25119 }, { "epoch": 1.98, "learning_rate": 7.821202901975921e-05, "loss": 1.5283, "step": 25120 }, { "epoch": 1.98, "learning_rate": 7.820117693304355e-05, "loss": 1.5091, "step": 25121 }, { "epoch": 1.98, "learning_rate": 7.81903253338023e-05, "loss": 1.4657, "step": 25122 }, { "epoch": 1.98, "learning_rate": 7.817947422210909e-05, "loss": 1.516, "step": 25123 }, { "epoch": 1.98, "learning_rate": 7.816862359803764e-05, "loss": 1.5357, "step": 25124 }, { "epoch": 1.98, "learning_rate": 7.815777346166154e-05, "loss": 1.4981, "step": 25125 }, { "epoch": 1.98, "learning_rate": 7.814692381305461e-05, "loss": 1.5009, "step": 25126 }, { "epoch": 1.98, "learning_rate": 7.813607465229037e-05, "loss": 1.4655, "step": 25127 }, { "epoch": 1.98, "learning_rate": 7.812522597944249e-05, "loss": 1.4645, "step": 25128 }, { "epoch": 1.98, "learning_rate": 7.811437779458471e-05, "loss": 1.4632, "step": 25129 }, { "epoch": 1.98, "learning_rate": 7.810353009779064e-05, "loss": 1.4929, "step": 25130 }, { "epoch": 1.98, "learning_rate": 7.809268288913387e-05, "loss": 1.4943, "step": 25131 }, { "epoch": 1.98, "learning_rate": 7.808183616868815e-05, "loss": 1.4765, "step": 25132 }, { "epoch": 1.98, "learning_rate": 7.807098993652707e-05, "loss": 1.4472, "step": 25133 }, { "epoch": 1.98, "learning_rate": 7.80601441927243e-05, "loss": 1.4586, "step": 25134 }, { "epoch": 1.98, "learning_rate": 7.804929893735338e-05, "loss": 1.4697, "step": 25135 }, { "epoch": 1.98, "learning_rate": 7.803845417048806e-05, "loss": 1.4842, "step": 25136 }, { "epoch": 1.98, "learning_rate": 7.802760989220194e-05, "loss": 1.4554, "step": 25137 }, { "epoch": 1.98, "learning_rate": 7.801676610256858e-05, "loss": 1.5311, "step": 25138 }, { "epoch": 1.98, "learning_rate": 7.800592280166165e-05, "loss": 1.5016, "step": 25139 }, { "epoch": 1.98, "learning_rate": 7.79950799895548e-05, "loss": 1.4656, "step": 25140 }, { "epoch": 1.98, "learning_rate": 7.798423766632165e-05, "loss": 1.4857, "step": 25141 }, { "epoch": 1.98, "learning_rate": 7.797339583203574e-05, "loss": 1.4896, "step": 25142 }, { "epoch": 1.98, "learning_rate": 7.796255448677076e-05, "loss": 1.509, "step": 25143 }, { "epoch": 1.98, "learning_rate": 7.795171363060029e-05, "loss": 1.4526, "step": 25144 }, { "epoch": 1.98, "learning_rate": 7.794087326359787e-05, "loss": 1.4752, "step": 25145 }, { "epoch": 1.98, "learning_rate": 7.79300333858372e-05, "loss": 1.4536, "step": 25146 }, { "epoch": 1.98, "learning_rate": 7.791919399739185e-05, "loss": 1.5175, "step": 25147 }, { "epoch": 1.98, "learning_rate": 7.790835509833531e-05, "loss": 1.524, "step": 25148 }, { "epoch": 1.98, "learning_rate": 7.789751668874134e-05, "loss": 1.5371, "step": 25149 }, { "epoch": 1.98, "learning_rate": 7.788667876868342e-05, "loss": 1.4484, "step": 25150 }, { "epoch": 1.98, "learning_rate": 7.787584133823517e-05, "loss": 1.4567, "step": 25151 }, { "epoch": 1.98, "learning_rate": 7.78650043974701e-05, "loss": 1.5116, "step": 25152 }, { "epoch": 1.98, "learning_rate": 7.78541679464619e-05, "loss": 1.5152, "step": 25153 }, { "epoch": 1.98, "learning_rate": 7.784333198528402e-05, "loss": 1.4682, "step": 25154 }, { "epoch": 1.98, "learning_rate": 7.783249651401017e-05, "loss": 1.4881, "step": 25155 }, { "epoch": 1.98, "learning_rate": 7.782166153271377e-05, "loss": 1.4666, "step": 25156 }, { "epoch": 1.98, "learning_rate": 7.781082704146853e-05, "loss": 1.5137, "step": 25157 }, { "epoch": 1.98, "learning_rate": 7.779999304034791e-05, "loss": 1.506, "step": 25158 }, { "epoch": 1.98, "learning_rate": 7.778915952942545e-05, "loss": 1.4769, "step": 25159 }, { "epoch": 1.98, "learning_rate": 7.777832650877482e-05, "loss": 1.4989, "step": 25160 }, { "epoch": 1.98, "learning_rate": 7.776749397846949e-05, "loss": 1.4513, "step": 25161 }, { "epoch": 1.98, "learning_rate": 7.775666193858295e-05, "loss": 1.4672, "step": 25162 }, { "epoch": 1.98, "learning_rate": 7.774583038918887e-05, "loss": 1.4929, "step": 25163 }, { "epoch": 1.98, "learning_rate": 7.773499933036072e-05, "loss": 1.4486, "step": 25164 }, { "epoch": 1.98, "learning_rate": 7.772416876217199e-05, "loss": 1.419, "step": 25165 }, { "epoch": 1.98, "learning_rate": 7.771333868469633e-05, "loss": 1.457, "step": 25166 }, { "epoch": 1.98, "learning_rate": 7.770250909800722e-05, "loss": 1.488, "step": 25167 }, { "epoch": 1.98, "learning_rate": 7.769168000217817e-05, "loss": 1.4768, "step": 25168 }, { "epoch": 1.98, "learning_rate": 7.768085139728263e-05, "loss": 1.4259, "step": 25169 }, { "epoch": 1.98, "learning_rate": 7.767002328339425e-05, "loss": 1.4983, "step": 25170 }, { "epoch": 1.98, "learning_rate": 7.765919566058652e-05, "loss": 1.4699, "step": 25171 }, { "epoch": 1.98, "learning_rate": 7.764836852893293e-05, "loss": 1.5045, "step": 25172 }, { "epoch": 1.98, "learning_rate": 7.763754188850696e-05, "loss": 1.4686, "step": 25173 }, { "epoch": 1.98, "learning_rate": 7.762671573938217e-05, "loss": 1.4847, "step": 25174 }, { "epoch": 1.98, "learning_rate": 7.761589008163204e-05, "loss": 1.4633, "step": 25175 }, { "epoch": 1.98, "learning_rate": 7.760506491533003e-05, "loss": 1.461, "step": 25176 }, { "epoch": 1.98, "learning_rate": 7.759424024054973e-05, "loss": 1.5068, "step": 25177 }, { "epoch": 1.98, "learning_rate": 7.758341605736459e-05, "loss": 1.4997, "step": 25178 }, { "epoch": 1.98, "learning_rate": 7.757259236584803e-05, "loss": 1.4476, "step": 25179 }, { "epoch": 1.98, "learning_rate": 7.756176916607365e-05, "loss": 1.531, "step": 25180 }, { "epoch": 1.98, "learning_rate": 7.75509464581149e-05, "loss": 1.4764, "step": 25181 }, { "epoch": 1.98, "learning_rate": 7.754012424204518e-05, "loss": 1.4561, "step": 25182 }, { "epoch": 1.98, "learning_rate": 7.752930251793808e-05, "loss": 1.4754, "step": 25183 }, { "epoch": 1.98, "learning_rate": 7.751848128586703e-05, "loss": 1.4961, "step": 25184 }, { "epoch": 1.98, "learning_rate": 7.750766054590544e-05, "loss": 1.4701, "step": 25185 }, { "epoch": 1.98, "learning_rate": 7.749684029812681e-05, "loss": 1.4425, "step": 25186 }, { "epoch": 1.98, "learning_rate": 7.74860205426047e-05, "loss": 1.4797, "step": 25187 }, { "epoch": 1.98, "learning_rate": 7.747520127941249e-05, "loss": 1.4909, "step": 25188 }, { "epoch": 1.98, "learning_rate": 7.746438250862357e-05, "loss": 1.4964, "step": 25189 }, { "epoch": 1.98, "learning_rate": 7.745356423031153e-05, "loss": 1.5383, "step": 25190 }, { "epoch": 1.98, "learning_rate": 7.744274644454977e-05, "loss": 1.4683, "step": 25191 }, { "epoch": 1.98, "learning_rate": 7.74319291514117e-05, "loss": 1.4974, "step": 25192 }, { "epoch": 1.98, "learning_rate": 7.742111235097072e-05, "loss": 1.4823, "step": 25193 }, { "epoch": 1.98, "learning_rate": 7.741029604330043e-05, "loss": 1.4918, "step": 25194 }, { "epoch": 1.98, "learning_rate": 7.739948022847414e-05, "loss": 1.4528, "step": 25195 }, { "epoch": 1.98, "learning_rate": 7.738866490656527e-05, "loss": 1.4413, "step": 25196 }, { "epoch": 1.98, "learning_rate": 7.737785007764735e-05, "loss": 1.5039, "step": 25197 }, { "epoch": 1.98, "learning_rate": 7.736703574179375e-05, "loss": 1.4558, "step": 25198 }, { "epoch": 1.98, "learning_rate": 7.735622189907786e-05, "loss": 1.4677, "step": 25199 }, { "epoch": 1.98, "learning_rate": 7.734540854957316e-05, "loss": 1.5574, "step": 25200 }, { "epoch": 1.98, "learning_rate": 7.733459569335299e-05, "loss": 1.4782, "step": 25201 }, { "epoch": 1.98, "learning_rate": 7.732378333049088e-05, "loss": 1.4317, "step": 25202 }, { "epoch": 1.98, "learning_rate": 7.731297146106011e-05, "loss": 1.4661, "step": 25203 }, { "epoch": 1.98, "learning_rate": 7.730216008513422e-05, "loss": 1.5075, "step": 25204 }, { "epoch": 1.98, "learning_rate": 7.729134920278654e-05, "loss": 1.4705, "step": 25205 }, { "epoch": 1.98, "learning_rate": 7.728053881409042e-05, "loss": 1.4719, "step": 25206 }, { "epoch": 1.98, "learning_rate": 7.726972891911937e-05, "loss": 1.432, "step": 25207 }, { "epoch": 1.98, "learning_rate": 7.725891951794671e-05, "loss": 1.5253, "step": 25208 }, { "epoch": 1.98, "learning_rate": 7.724811061064586e-05, "loss": 1.5127, "step": 25209 }, { "epoch": 1.98, "learning_rate": 7.723730219729013e-05, "loss": 1.491, "step": 25210 }, { "epoch": 1.98, "learning_rate": 7.722649427795302e-05, "loss": 1.47, "step": 25211 }, { "epoch": 1.98, "learning_rate": 7.721568685270786e-05, "loss": 1.4503, "step": 25212 }, { "epoch": 1.98, "learning_rate": 7.720487992162795e-05, "loss": 1.4797, "step": 25213 }, { "epoch": 1.98, "learning_rate": 7.71940734847868e-05, "loss": 1.4921, "step": 25214 }, { "epoch": 1.98, "learning_rate": 7.718326754225773e-05, "loss": 1.4928, "step": 25215 }, { "epoch": 1.98, "learning_rate": 7.7172462094114e-05, "loss": 1.5168, "step": 25216 }, { "epoch": 1.98, "learning_rate": 7.716165714042908e-05, "loss": 1.4833, "step": 25217 }, { "epoch": 1.98, "learning_rate": 7.715085268127638e-05, "loss": 1.4932, "step": 25218 }, { "epoch": 1.98, "learning_rate": 7.714004871672917e-05, "loss": 1.434, "step": 25219 }, { "epoch": 1.98, "learning_rate": 7.712924524686077e-05, "loss": 1.4779, "step": 25220 }, { "epoch": 1.98, "learning_rate": 7.711844227174463e-05, "loss": 1.4955, "step": 25221 }, { "epoch": 1.98, "learning_rate": 7.710763979145407e-05, "loss": 1.4896, "step": 25222 }, { "epoch": 1.98, "learning_rate": 7.709683780606234e-05, "loss": 1.4792, "step": 25223 }, { "epoch": 1.98, "learning_rate": 7.708603631564292e-05, "loss": 1.4406, "step": 25224 }, { "epoch": 1.98, "learning_rate": 7.707523532026907e-05, "loss": 1.528, "step": 25225 }, { "epoch": 1.98, "learning_rate": 7.706443482001412e-05, "loss": 1.4696, "step": 25226 }, { "epoch": 1.98, "learning_rate": 7.705363481495135e-05, "loss": 1.5323, "step": 25227 }, { "epoch": 1.98, "learning_rate": 7.70428353051542e-05, "loss": 1.4984, "step": 25228 }, { "epoch": 1.99, "learning_rate": 7.703203629069594e-05, "loss": 1.4819, "step": 25229 }, { "epoch": 1.99, "learning_rate": 7.702123777164984e-05, "loss": 1.5227, "step": 25230 }, { "epoch": 1.99, "learning_rate": 7.701043974808931e-05, "loss": 1.4708, "step": 25231 }, { "epoch": 1.99, "learning_rate": 7.699964222008762e-05, "loss": 1.4783, "step": 25232 }, { "epoch": 1.99, "learning_rate": 7.6988845187718e-05, "loss": 1.4189, "step": 25233 }, { "epoch": 1.99, "learning_rate": 7.697804865105384e-05, "loss": 1.5195, "step": 25234 }, { "epoch": 1.99, "learning_rate": 7.696725261016851e-05, "loss": 1.4891, "step": 25235 }, { "epoch": 1.99, "learning_rate": 7.695645706513522e-05, "loss": 1.4975, "step": 25236 }, { "epoch": 1.99, "learning_rate": 7.69456620160272e-05, "loss": 1.5652, "step": 25237 }, { "epoch": 1.99, "learning_rate": 7.693486746291791e-05, "loss": 1.5403, "step": 25238 }, { "epoch": 1.99, "learning_rate": 7.692407340588055e-05, "loss": 1.4889, "step": 25239 }, { "epoch": 1.99, "learning_rate": 7.691327984498831e-05, "loss": 1.4567, "step": 25240 }, { "epoch": 1.99, "learning_rate": 7.690248678031466e-05, "loss": 1.4342, "step": 25241 }, { "epoch": 1.99, "learning_rate": 7.689169421193276e-05, "loss": 1.4459, "step": 25242 }, { "epoch": 1.99, "learning_rate": 7.68809021399159e-05, "loss": 1.4673, "step": 25243 }, { "epoch": 1.99, "learning_rate": 7.687011056433738e-05, "loss": 1.4811, "step": 25244 }, { "epoch": 1.99, "learning_rate": 7.685931948527045e-05, "loss": 1.4633, "step": 25245 }, { "epoch": 1.99, "learning_rate": 7.68485289027884e-05, "loss": 1.476, "step": 25246 }, { "epoch": 1.99, "learning_rate": 7.683773881696439e-05, "loss": 1.4704, "step": 25247 }, { "epoch": 1.99, "learning_rate": 7.682694922787177e-05, "loss": 1.4711, "step": 25248 }, { "epoch": 1.99, "learning_rate": 7.681616013558386e-05, "loss": 1.4594, "step": 25249 }, { "epoch": 1.99, "learning_rate": 7.680537154017382e-05, "loss": 1.5027, "step": 25250 }, { "epoch": 1.99, "learning_rate": 7.679458344171485e-05, "loss": 1.4405, "step": 25251 }, { "epoch": 1.99, "learning_rate": 7.678379584028033e-05, "loss": 1.4908, "step": 25252 }, { "epoch": 1.99, "learning_rate": 7.677300873594342e-05, "loss": 1.4903, "step": 25253 }, { "epoch": 1.99, "learning_rate": 7.676222212877732e-05, "loss": 1.4573, "step": 25254 }, { "epoch": 1.99, "learning_rate": 7.675143601885538e-05, "loss": 1.4124, "step": 25255 }, { "epoch": 1.99, "learning_rate": 7.674065040625076e-05, "loss": 1.4727, "step": 25256 }, { "epoch": 1.99, "learning_rate": 7.672986529103665e-05, "loss": 1.5006, "step": 25257 }, { "epoch": 1.99, "learning_rate": 7.671908067328636e-05, "loss": 1.4864, "step": 25258 }, { "epoch": 1.99, "learning_rate": 7.670829655307308e-05, "loss": 1.483, "step": 25259 }, { "epoch": 1.99, "learning_rate": 7.669751293046996e-05, "loss": 1.4344, "step": 25260 }, { "epoch": 1.99, "learning_rate": 7.668672980555033e-05, "loss": 1.4854, "step": 25261 }, { "epoch": 1.99, "learning_rate": 7.667594717838737e-05, "loss": 1.4861, "step": 25262 }, { "epoch": 1.99, "learning_rate": 7.666516504905426e-05, "loss": 1.5601, "step": 25263 }, { "epoch": 1.99, "learning_rate": 7.665438341762408e-05, "loss": 1.4948, "step": 25264 }, { "epoch": 1.99, "learning_rate": 7.664360228417027e-05, "loss": 1.4551, "step": 25265 }, { "epoch": 1.99, "learning_rate": 7.663282164876593e-05, "loss": 1.5351, "step": 25266 }, { "epoch": 1.99, "learning_rate": 7.662204151148424e-05, "loss": 1.4679, "step": 25267 }, { "epoch": 1.99, "learning_rate": 7.661126187239836e-05, "loss": 1.4718, "step": 25268 }, { "epoch": 1.99, "learning_rate": 7.660048273158155e-05, "loss": 1.5264, "step": 25269 }, { "epoch": 1.99, "learning_rate": 7.658970408910696e-05, "loss": 1.4802, "step": 25270 }, { "epoch": 1.99, "learning_rate": 7.657892594504771e-05, "loss": 1.4474, "step": 25271 }, { "epoch": 1.99, "learning_rate": 7.656814829947707e-05, "loss": 1.476, "step": 25272 }, { "epoch": 1.99, "learning_rate": 7.655737115246822e-05, "loss": 1.5106, "step": 25273 }, { "epoch": 1.99, "learning_rate": 7.654659450409421e-05, "loss": 1.4868, "step": 25274 }, { "epoch": 1.99, "learning_rate": 7.653581835442834e-05, "loss": 1.4914, "step": 25275 }, { "epoch": 1.99, "learning_rate": 7.652504270354375e-05, "loss": 1.4402, "step": 25276 }, { "epoch": 1.99, "learning_rate": 7.65142675515135e-05, "loss": 1.4882, "step": 25277 }, { "epoch": 1.99, "learning_rate": 7.650349289841087e-05, "loss": 1.4531, "step": 25278 }, { "epoch": 1.99, "learning_rate": 7.649271874430898e-05, "loss": 1.5186, "step": 25279 }, { "epoch": 1.99, "learning_rate": 7.648194508928091e-05, "loss": 1.4983, "step": 25280 }, { "epoch": 1.99, "learning_rate": 7.647117193339984e-05, "loss": 1.4389, "step": 25281 }, { "epoch": 1.99, "learning_rate": 7.6460399276739e-05, "loss": 1.4981, "step": 25282 }, { "epoch": 1.99, "learning_rate": 7.644962711937147e-05, "loss": 1.4729, "step": 25283 }, { "epoch": 1.99, "learning_rate": 7.643885546137032e-05, "loss": 1.4666, "step": 25284 }, { "epoch": 1.99, "learning_rate": 7.642808430280883e-05, "loss": 1.5055, "step": 25285 }, { "epoch": 1.99, "learning_rate": 7.641731364376001e-05, "loss": 1.5396, "step": 25286 }, { "epoch": 1.99, "learning_rate": 7.640654348429705e-05, "loss": 1.5375, "step": 25287 }, { "epoch": 1.99, "learning_rate": 7.639577382449298e-05, "loss": 1.5267, "step": 25288 }, { "epoch": 1.99, "learning_rate": 7.638500466442105e-05, "loss": 1.4763, "step": 25289 }, { "epoch": 1.99, "learning_rate": 7.637423600415433e-05, "loss": 1.4718, "step": 25290 }, { "epoch": 1.99, "learning_rate": 7.636346784376583e-05, "loss": 1.4899, "step": 25291 }, { "epoch": 1.99, "learning_rate": 7.635270018332883e-05, "loss": 1.494, "step": 25292 }, { "epoch": 1.99, "learning_rate": 7.634193302291633e-05, "loss": 1.5126, "step": 25293 }, { "epoch": 1.99, "learning_rate": 7.633116636260141e-05, "loss": 1.533, "step": 25294 }, { "epoch": 1.99, "learning_rate": 7.632040020245722e-05, "loss": 1.4756, "step": 25295 }, { "epoch": 1.99, "learning_rate": 7.63096345425569e-05, "loss": 1.5112, "step": 25296 }, { "epoch": 1.99, "learning_rate": 7.629886938297351e-05, "loss": 1.4836, "step": 25297 }, { "epoch": 1.99, "learning_rate": 7.628810472378005e-05, "loss": 1.4841, "step": 25298 }, { "epoch": 1.99, "learning_rate": 7.627734056504976e-05, "loss": 1.4758, "step": 25299 }, { "epoch": 1.99, "learning_rate": 7.626657690685565e-05, "loss": 1.4317, "step": 25300 }, { "epoch": 1.99, "learning_rate": 7.62558137492707e-05, "loss": 1.417, "step": 25301 }, { "epoch": 1.99, "learning_rate": 7.624505109236816e-05, "loss": 1.473, "step": 25302 }, { "epoch": 1.99, "learning_rate": 7.623428893622103e-05, "loss": 1.5357, "step": 25303 }, { "epoch": 1.99, "learning_rate": 7.622352728090235e-05, "loss": 1.5497, "step": 25304 }, { "epoch": 1.99, "learning_rate": 7.621276612648516e-05, "loss": 1.5127, "step": 25305 }, { "epoch": 1.99, "learning_rate": 7.620200547304263e-05, "loss": 1.531, "step": 25306 }, { "epoch": 1.99, "learning_rate": 7.619124532064775e-05, "loss": 1.4997, "step": 25307 }, { "epoch": 1.99, "learning_rate": 7.618048566937351e-05, "loss": 1.4252, "step": 25308 }, { "epoch": 1.99, "learning_rate": 7.616972651929311e-05, "loss": 1.4869, "step": 25309 }, { "epoch": 1.99, "learning_rate": 7.615896787047955e-05, "loss": 1.48, "step": 25310 }, { "epoch": 1.99, "learning_rate": 7.614820972300574e-05, "loss": 1.4416, "step": 25311 }, { "epoch": 1.99, "learning_rate": 7.613745207694488e-05, "loss": 1.5106, "step": 25312 }, { "epoch": 1.99, "learning_rate": 7.612669493236999e-05, "loss": 1.4593, "step": 25313 }, { "epoch": 1.99, "learning_rate": 7.611593828935409e-05, "loss": 1.4944, "step": 25314 }, { "epoch": 1.99, "learning_rate": 7.61051821479701e-05, "loss": 1.5605, "step": 25315 }, { "epoch": 1.99, "learning_rate": 7.609442650829126e-05, "loss": 1.4944, "step": 25316 }, { "epoch": 1.99, "learning_rate": 7.608367137039044e-05, "loss": 1.4829, "step": 25317 }, { "epoch": 1.99, "learning_rate": 7.607291673434066e-05, "loss": 1.4577, "step": 25318 }, { "epoch": 1.99, "learning_rate": 7.606216260021502e-05, "loss": 1.4931, "step": 25319 }, { "epoch": 1.99, "learning_rate": 7.605140896808651e-05, "loss": 1.4941, "step": 25320 }, { "epoch": 1.99, "learning_rate": 7.604065583802812e-05, "loss": 1.4737, "step": 25321 }, { "epoch": 1.99, "learning_rate": 7.602990321011281e-05, "loss": 1.4343, "step": 25322 }, { "epoch": 1.99, "learning_rate": 7.601915108441369e-05, "loss": 1.4614, "step": 25323 }, { "epoch": 1.99, "learning_rate": 7.60083994610037e-05, "loss": 1.482, "step": 25324 }, { "epoch": 1.99, "learning_rate": 7.599764833995579e-05, "loss": 1.4988, "step": 25325 }, { "epoch": 1.99, "learning_rate": 7.598689772134309e-05, "loss": 1.4314, "step": 25326 }, { "epoch": 1.99, "learning_rate": 7.597614760523842e-05, "loss": 1.5217, "step": 25327 }, { "epoch": 1.99, "learning_rate": 7.596539799171494e-05, "loss": 1.4392, "step": 25328 }, { "epoch": 1.99, "learning_rate": 7.595464888084547e-05, "loss": 1.4859, "step": 25329 }, { "epoch": 1.99, "learning_rate": 7.594390027270316e-05, "loss": 1.5125, "step": 25330 }, { "epoch": 1.99, "learning_rate": 7.593315216736088e-05, "loss": 1.4937, "step": 25331 }, { "epoch": 1.99, "learning_rate": 7.592240456489157e-05, "loss": 1.4727, "step": 25332 }, { "epoch": 1.99, "learning_rate": 7.591165746536832e-05, "loss": 1.4502, "step": 25333 }, { "epoch": 1.99, "learning_rate": 7.5900910868864e-05, "loss": 1.5005, "step": 25334 }, { "epoch": 1.99, "learning_rate": 7.589016477545158e-05, "loss": 1.4758, "step": 25335 }, { "epoch": 1.99, "learning_rate": 7.587941918520411e-05, "loss": 1.4586, "step": 25336 }, { "epoch": 1.99, "learning_rate": 7.586867409819445e-05, "loss": 1.4434, "step": 25337 }, { "epoch": 1.99, "learning_rate": 7.585792951449558e-05, "loss": 1.5349, "step": 25338 }, { "epoch": 1.99, "learning_rate": 7.584718543418043e-05, "loss": 1.4463, "step": 25339 }, { "epoch": 1.99, "learning_rate": 7.583644185732201e-05, "loss": 1.5021, "step": 25340 }, { "epoch": 1.99, "learning_rate": 7.582569878399321e-05, "loss": 1.5014, "step": 25341 }, { "epoch": 1.99, "learning_rate": 7.581495621426694e-05, "loss": 1.4699, "step": 25342 }, { "epoch": 1.99, "learning_rate": 7.580421414821618e-05, "loss": 1.491, "step": 25343 }, { "epoch": 1.99, "learning_rate": 7.579347258591391e-05, "loss": 1.5199, "step": 25344 }, { "epoch": 1.99, "learning_rate": 7.578273152743302e-05, "loss": 1.4161, "step": 25345 }, { "epoch": 1.99, "learning_rate": 7.577199097284636e-05, "loss": 1.4492, "step": 25346 }, { "epoch": 1.99, "learning_rate": 7.576125092222697e-05, "loss": 1.4535, "step": 25347 }, { "epoch": 1.99, "learning_rate": 7.575051137564774e-05, "loss": 1.5033, "step": 25348 }, { "epoch": 1.99, "learning_rate": 7.573977233318149e-05, "loss": 1.449, "step": 25349 }, { "epoch": 1.99, "learning_rate": 7.572903379490126e-05, "loss": 1.5124, "step": 25350 }, { "epoch": 1.99, "learning_rate": 7.571829576087992e-05, "loss": 1.4637, "step": 25351 }, { "epoch": 1.99, "learning_rate": 7.57075582311903e-05, "loss": 1.5026, "step": 25352 }, { "epoch": 1.99, "learning_rate": 7.56968212059054e-05, "loss": 1.4991, "step": 25353 }, { "epoch": 1.99, "learning_rate": 7.568608468509809e-05, "loss": 1.4946, "step": 25354 }, { "epoch": 1.99, "learning_rate": 7.567534866884122e-05, "loss": 1.5085, "step": 25355 }, { "epoch": 2.0, "learning_rate": 7.566461315720776e-05, "loss": 1.4212, "step": 25356 }, { "epoch": 2.0, "learning_rate": 7.565387815027055e-05, "loss": 1.4722, "step": 25357 }, { "epoch": 2.0, "learning_rate": 7.56431436481024e-05, "loss": 1.4951, "step": 25358 }, { "epoch": 2.0, "learning_rate": 7.563240965077631e-05, "loss": 1.4738, "step": 25359 }, { "epoch": 2.0, "learning_rate": 7.562167615836517e-05, "loss": 1.4781, "step": 25360 }, { "epoch": 2.0, "learning_rate": 7.561094317094177e-05, "loss": 1.5354, "step": 25361 }, { "epoch": 2.0, "learning_rate": 7.560021068857905e-05, "loss": 1.5004, "step": 25362 }, { "epoch": 2.0, "learning_rate": 7.558947871134976e-05, "loss": 1.5234, "step": 25363 }, { "epoch": 2.0, "learning_rate": 7.557874723932693e-05, "loss": 1.4401, "step": 25364 }, { "epoch": 2.0, "learning_rate": 7.556801627258332e-05, "loss": 1.4448, "step": 25365 }, { "epoch": 2.0, "learning_rate": 7.555728581119175e-05, "loss": 1.4828, "step": 25366 }, { "epoch": 2.0, "learning_rate": 7.554655585522518e-05, "loss": 1.4493, "step": 25367 }, { "epoch": 2.0, "learning_rate": 7.553582640475642e-05, "loss": 1.4499, "step": 25368 }, { "epoch": 2.0, "learning_rate": 7.552509745985825e-05, "loss": 1.4675, "step": 25369 }, { "epoch": 2.0, "learning_rate": 7.551436902060362e-05, "loss": 1.463, "step": 25370 }, { "epoch": 2.0, "learning_rate": 7.550364108706532e-05, "loss": 1.4647, "step": 25371 }, { "epoch": 2.0, "learning_rate": 7.549291365931612e-05, "loss": 1.4297, "step": 25372 }, { "epoch": 2.0, "learning_rate": 7.548218673742901e-05, "loss": 1.4531, "step": 25373 }, { "epoch": 2.0, "learning_rate": 7.547146032147664e-05, "loss": 1.4719, "step": 25374 }, { "epoch": 2.0, "learning_rate": 7.5460734411532e-05, "loss": 1.5098, "step": 25375 }, { "epoch": 2.0, "learning_rate": 7.545000900766776e-05, "loss": 1.4535, "step": 25376 }, { "epoch": 2.0, "learning_rate": 7.54392841099569e-05, "loss": 1.5275, "step": 25377 }, { "epoch": 2.0, "learning_rate": 7.542855971847214e-05, "loss": 1.5099, "step": 25378 }, { "epoch": 2.0, "learning_rate": 7.54178358332863e-05, "loss": 1.4374, "step": 25379 }, { "epoch": 2.0, "learning_rate": 7.540711245447216e-05, "loss": 1.466, "step": 25380 }, { "epoch": 2.0, "learning_rate": 7.539638958210263e-05, "loss": 1.5151, "step": 25381 }, { "epoch": 2.0, "learning_rate": 7.538566721625043e-05, "loss": 1.4558, "step": 25382 }, { "epoch": 2.0, "learning_rate": 7.53749453569883e-05, "loss": 1.4859, "step": 25383 }, { "epoch": 2.0, "learning_rate": 7.536422400438918e-05, "loss": 1.5211, "step": 25384 }, { "epoch": 2.0, "learning_rate": 7.53535031585258e-05, "loss": 1.4729, "step": 25385 }, { "epoch": 2.0, "learning_rate": 7.534278281947088e-05, "loss": 1.4581, "step": 25386 }, { "epoch": 2.0, "learning_rate": 7.533206298729732e-05, "loss": 1.509, "step": 25387 }, { "epoch": 2.0, "learning_rate": 7.532134366207786e-05, "loss": 1.5061, "step": 25388 }, { "epoch": 2.0, "learning_rate": 7.531062484388519e-05, "loss": 1.4433, "step": 25389 }, { "epoch": 2.0, "learning_rate": 7.529990653279215e-05, "loss": 1.4436, "step": 25390 }, { "epoch": 2.0, "learning_rate": 7.52891887288716e-05, "loss": 1.5279, "step": 25391 }, { "epoch": 2.0, "learning_rate": 7.527847143219623e-05, "loss": 1.5053, "step": 25392 }, { "epoch": 2.0, "learning_rate": 7.526775464283873e-05, "loss": 1.455, "step": 25393 }, { "epoch": 2.0, "learning_rate": 7.5257038360872e-05, "loss": 1.4662, "step": 25394 }, { "epoch": 2.0, "learning_rate": 7.524632258636874e-05, "loss": 1.4996, "step": 25395 }, { "epoch": 2.0, "learning_rate": 7.523560731940163e-05, "loss": 1.502, "step": 25396 }, { "epoch": 2.0, "learning_rate": 7.522489256004357e-05, "loss": 1.4563, "step": 25397 }, { "epoch": 2.0, "learning_rate": 7.52141783083672e-05, "loss": 1.4695, "step": 25398 }, { "epoch": 2.0, "learning_rate": 7.520346456444531e-05, "loss": 1.4768, "step": 25399 }, { "epoch": 2.0, "learning_rate": 7.519275132835052e-05, "loss": 1.4876, "step": 25400 }, { "epoch": 2.0, "learning_rate": 7.518203860015576e-05, "loss": 1.5487, "step": 25401 }, { "epoch": 2.0, "learning_rate": 7.517132637993366e-05, "loss": 1.5039, "step": 25402 }, { "epoch": 2.0, "learning_rate": 7.51606146677569e-05, "loss": 1.4435, "step": 25403 }, { "epoch": 2.0, "learning_rate": 7.514990346369833e-05, "loss": 1.4866, "step": 25404 }, { "epoch": 2.0, "learning_rate": 7.513919276783055e-05, "loss": 1.4878, "step": 25405 }, { "epoch": 2.0, "learning_rate": 7.51284825802264e-05, "loss": 1.5251, "step": 25406 }, { "epoch": 2.0, "learning_rate": 7.511777290095848e-05, "loss": 1.4809, "step": 25407 }, { "epoch": 2.0, "learning_rate": 7.51070637300996e-05, "loss": 1.4381, "step": 25408 }, { "epoch": 2.0, "learning_rate": 7.509635506772244e-05, "loss": 1.5179, "step": 25409 }, { "epoch": 2.0, "learning_rate": 7.508564691389964e-05, "loss": 1.4522, "step": 25410 }, { "epoch": 2.0, "learning_rate": 7.507493926870403e-05, "loss": 1.4848, "step": 25411 }, { "epoch": 2.0, "learning_rate": 7.50642321322082e-05, "loss": 1.5028, "step": 25412 }, { "epoch": 2.0, "learning_rate": 7.505352550448483e-05, "loss": 1.5235, "step": 25413 }, { "epoch": 2.0, "learning_rate": 7.504281938560673e-05, "loss": 1.5265, "step": 25414 }, { "epoch": 2.0, "learning_rate": 7.503211377564652e-05, "loss": 1.425, "step": 25415 }, { "epoch": 2.0, "learning_rate": 7.50214086746769e-05, "loss": 1.4788, "step": 25416 }, { "epoch": 2.0, "learning_rate": 7.501070408277047e-05, "loss": 1.5071, "step": 25417 }, { "epoch": 2.0, "learning_rate": 7.500000000000002e-05, "loss": 1.4764, "step": 25418 }, { "epoch": 2.0, "learning_rate": 7.49892964264382e-05, "loss": 1.4458, "step": 25419 }, { "epoch": 2.0, "learning_rate": 7.497859336215758e-05, "loss": 1.4265, "step": 25420 }, { "epoch": 2.0, "learning_rate": 7.496789080723093e-05, "loss": 1.4619, "step": 25421 }, { "epoch": 2.0, "learning_rate": 7.495718876173097e-05, "loss": 1.4466, "step": 25422 }, { "epoch": 2.0, "learning_rate": 7.494648722573027e-05, "loss": 1.4412, "step": 25423 }, { "epoch": 2.0, "learning_rate": 7.493578619930145e-05, "loss": 1.4859, "step": 25424 }, { "epoch": 2.0, "learning_rate": 7.492508568251727e-05, "loss": 1.4936, "step": 25425 }, { "epoch": 2.0, "learning_rate": 7.491438567545032e-05, "loss": 1.4631, "step": 25426 }, { "epoch": 2.0, "learning_rate": 7.490368617817321e-05, "loss": 1.4498, "step": 25427 }, { "epoch": 2.0, "learning_rate": 7.489298719075869e-05, "loss": 1.4615, "step": 25428 }, { "epoch": 2.0, "learning_rate": 7.488228871327934e-05, "loss": 1.4935, "step": 25429 }, { "epoch": 2.0, "learning_rate": 7.487159074580772e-05, "loss": 1.4953, "step": 25430 }, { "epoch": 2.0, "learning_rate": 7.486089328841661e-05, "loss": 1.5141, "step": 25431 }, { "epoch": 2.0, "learning_rate": 7.485019634117858e-05, "loss": 1.4864, "step": 25432 }, { "epoch": 2.0, "learning_rate": 7.483949990416622e-05, "loss": 1.4298, "step": 25433 }, { "epoch": 2.0, "learning_rate": 7.482880397745214e-05, "loss": 1.4744, "step": 25434 }, { "epoch": 2.0, "learning_rate": 7.481810856110905e-05, "loss": 1.4144, "step": 25435 }, { "epoch": 2.0, "learning_rate": 7.480741365520951e-05, "loss": 1.4703, "step": 25436 }, { "epoch": 2.0, "learning_rate": 7.479671925982609e-05, "loss": 1.4394, "step": 25437 }, { "epoch": 2.0, "learning_rate": 7.478602537503143e-05, "loss": 1.4375, "step": 25438 }, { "epoch": 2.0, "learning_rate": 7.477533200089822e-05, "loss": 1.438, "step": 25439 }, { "epoch": 2.0, "learning_rate": 7.4764639137499e-05, "loss": 1.457, "step": 25440 }, { "epoch": 2.0, "learning_rate": 7.47539467849063e-05, "loss": 1.4576, "step": 25441 }, { "epoch": 2.0, "learning_rate": 7.474325494319283e-05, "loss": 1.3786, "step": 25442 }, { "epoch": 2.0, "learning_rate": 7.473256361243113e-05, "loss": 1.4951, "step": 25443 }, { "epoch": 2.0, "learning_rate": 7.472187279269373e-05, "loss": 1.4086, "step": 25444 }, { "epoch": 2.0, "learning_rate": 7.471118248405334e-05, "loss": 1.4588, "step": 25445 }, { "epoch": 2.0, "learning_rate": 7.470049268658246e-05, "loss": 1.4566, "step": 25446 }, { "epoch": 2.0, "learning_rate": 7.468980340035361e-05, "loss": 1.5186, "step": 25447 }, { "epoch": 2.0, "learning_rate": 7.46791146254395e-05, "loss": 1.486, "step": 25448 }, { "epoch": 2.0, "learning_rate": 7.466842636191266e-05, "loss": 1.4317, "step": 25449 }, { "epoch": 2.0, "learning_rate": 7.465773860984557e-05, "loss": 1.5232, "step": 25450 }, { "epoch": 2.0, "learning_rate": 7.46470513693109e-05, "loss": 1.4619, "step": 25451 }, { "epoch": 2.0, "learning_rate": 7.463636464038116e-05, "loss": 1.4651, "step": 25452 }, { "epoch": 2.0, "learning_rate": 7.462567842312887e-05, "loss": 1.4532, "step": 25453 }, { "epoch": 2.0, "learning_rate": 7.461499271762664e-05, "loss": 1.4271, "step": 25454 }, { "epoch": 2.0, "learning_rate": 7.460430752394706e-05, "loss": 1.4377, "step": 25455 }, { "epoch": 2.0, "learning_rate": 7.459362284216262e-05, "loss": 1.4718, "step": 25456 }, { "epoch": 2.0, "learning_rate": 7.458293867234588e-05, "loss": 1.5016, "step": 25457 }, { "epoch": 2.0, "learning_rate": 7.457225501456928e-05, "loss": 1.4499, "step": 25458 }, { "epoch": 2.0, "learning_rate": 7.456157186890554e-05, "loss": 1.4567, "step": 25459 }, { "epoch": 2.0, "learning_rate": 7.455088923542707e-05, "loss": 1.4928, "step": 25460 }, { "epoch": 2.0, "learning_rate": 7.454020711420636e-05, "loss": 1.503, "step": 25461 }, { "epoch": 2.0, "learning_rate": 7.452952550531608e-05, "loss": 1.4927, "step": 25462 }, { "epoch": 2.0, "learning_rate": 7.451884440882867e-05, "loss": 1.4439, "step": 25463 }, { "epoch": 2.0, "learning_rate": 7.45081638248166e-05, "loss": 1.4673, "step": 25464 }, { "epoch": 2.0, "learning_rate": 7.449748375335248e-05, "loss": 1.426, "step": 25465 }, { "epoch": 2.0, "learning_rate": 7.448680419450879e-05, "loss": 1.4719, "step": 25466 }, { "epoch": 2.0, "learning_rate": 7.447612514835797e-05, "loss": 1.4429, "step": 25467 }, { "epoch": 2.0, "learning_rate": 7.446544661497258e-05, "loss": 1.4619, "step": 25468 }, { "epoch": 2.0, "learning_rate": 7.445476859442518e-05, "loss": 1.4708, "step": 25469 }, { "epoch": 2.0, "learning_rate": 7.444409108678823e-05, "loss": 1.433, "step": 25470 }, { "epoch": 2.0, "learning_rate": 7.443341409213413e-05, "loss": 1.4392, "step": 25471 }, { "epoch": 2.0, "learning_rate": 7.44227376105355e-05, "loss": 1.4889, "step": 25472 }, { "epoch": 2.0, "learning_rate": 7.441206164206479e-05, "loss": 1.4777, "step": 25473 }, { "epoch": 2.0, "learning_rate": 7.440138618679447e-05, "loss": 1.5297, "step": 25474 }, { "epoch": 2.0, "learning_rate": 7.439071124479693e-05, "loss": 1.4538, "step": 25475 }, { "epoch": 2.0, "learning_rate": 7.438003681614482e-05, "loss": 1.4196, "step": 25476 }, { "epoch": 2.0, "learning_rate": 7.436936290091053e-05, "loss": 1.4915, "step": 25477 }, { "epoch": 2.0, "learning_rate": 7.435868949916648e-05, "loss": 1.3885, "step": 25478 }, { "epoch": 2.0, "learning_rate": 7.434801661098522e-05, "loss": 1.4428, "step": 25479 }, { "epoch": 2.0, "learning_rate": 7.43373442364392e-05, "loss": 1.4019, "step": 25480 }, { "epoch": 2.0, "learning_rate": 7.432667237560079e-05, "loss": 1.46, "step": 25481 }, { "epoch": 2.0, "learning_rate": 7.431600102854258e-05, "loss": 1.4531, "step": 25482 }, { "epoch": 2.01, "learning_rate": 7.430533019533695e-05, "loss": 1.4691, "step": 25483 }, { "epoch": 2.01, "learning_rate": 7.42946598760563e-05, "loss": 1.4919, "step": 25484 }, { "epoch": 2.01, "learning_rate": 7.428399007077312e-05, "loss": 1.4711, "step": 25485 }, { "epoch": 2.01, "learning_rate": 7.427332077955994e-05, "loss": 1.4623, "step": 25486 }, { "epoch": 2.01, "learning_rate": 7.426265200248912e-05, "loss": 1.467, "step": 25487 }, { "epoch": 2.01, "learning_rate": 7.425198373963304e-05, "loss": 1.4705, "step": 25488 }, { "epoch": 2.01, "learning_rate": 7.424131599106423e-05, "loss": 1.4447, "step": 25489 }, { "epoch": 2.01, "learning_rate": 7.42306487568551e-05, "loss": 1.443, "step": 25490 }, { "epoch": 2.01, "learning_rate": 7.421998203707803e-05, "loss": 1.4364, "step": 25491 }, { "epoch": 2.01, "learning_rate": 7.420931583180542e-05, "loss": 1.4071, "step": 25492 }, { "epoch": 2.01, "learning_rate": 7.419865014110978e-05, "loss": 1.4394, "step": 25493 }, { "epoch": 2.01, "learning_rate": 7.418798496506349e-05, "loss": 1.4694, "step": 25494 }, { "epoch": 2.01, "learning_rate": 7.417732030373889e-05, "loss": 1.4471, "step": 25495 }, { "epoch": 2.01, "learning_rate": 7.416665615720848e-05, "loss": 1.4432, "step": 25496 }, { "epoch": 2.01, "learning_rate": 7.415599252554462e-05, "loss": 1.4213, "step": 25497 }, { "epoch": 2.01, "learning_rate": 7.414532940881968e-05, "loss": 1.3855, "step": 25498 }, { "epoch": 2.01, "learning_rate": 7.413466680710615e-05, "loss": 1.4836, "step": 25499 }, { "epoch": 2.01, "learning_rate": 7.41240047204763e-05, "loss": 1.4737, "step": 25500 }, { "epoch": 2.01, "learning_rate": 7.411334314900263e-05, "loss": 1.4467, "step": 25501 }, { "epoch": 2.01, "learning_rate": 7.410268209275747e-05, "loss": 1.515, "step": 25502 }, { "epoch": 2.01, "learning_rate": 7.409202155181324e-05, "loss": 1.4501, "step": 25503 }, { "epoch": 2.01, "learning_rate": 7.408136152624229e-05, "loss": 1.4327, "step": 25504 }, { "epoch": 2.01, "learning_rate": 7.407070201611695e-05, "loss": 1.4359, "step": 25505 }, { "epoch": 2.01, "learning_rate": 7.40600430215097e-05, "loss": 1.4623, "step": 25506 }, { "epoch": 2.01, "learning_rate": 7.404938454249285e-05, "loss": 1.4047, "step": 25507 }, { "epoch": 2.01, "learning_rate": 7.40387265791387e-05, "loss": 1.454, "step": 25508 }, { "epoch": 2.01, "learning_rate": 7.402806913151977e-05, "loss": 1.4623, "step": 25509 }, { "epoch": 2.01, "learning_rate": 7.401741219970829e-05, "loss": 1.4582, "step": 25510 }, { "epoch": 2.01, "learning_rate": 7.400675578377665e-05, "loss": 1.544, "step": 25511 }, { "epoch": 2.01, "learning_rate": 7.399609988379716e-05, "loss": 1.3921, "step": 25512 }, { "epoch": 2.01, "learning_rate": 7.398544449984228e-05, "loss": 1.4797, "step": 25513 }, { "epoch": 2.01, "learning_rate": 7.397478963198425e-05, "loss": 1.4547, "step": 25514 }, { "epoch": 2.01, "learning_rate": 7.39641352802954e-05, "loss": 1.4739, "step": 25515 }, { "epoch": 2.01, "learning_rate": 7.395348144484811e-05, "loss": 1.4869, "step": 25516 }, { "epoch": 2.01, "learning_rate": 7.394282812571479e-05, "loss": 1.469, "step": 25517 }, { "epoch": 2.01, "learning_rate": 7.393217532296769e-05, "loss": 1.447, "step": 25518 }, { "epoch": 2.01, "learning_rate": 7.392152303667907e-05, "loss": 1.478, "step": 25519 }, { "epoch": 2.01, "learning_rate": 7.391087126692139e-05, "loss": 1.4297, "step": 25520 }, { "epoch": 2.01, "learning_rate": 7.39002200137669e-05, "loss": 1.4587, "step": 25521 }, { "epoch": 2.01, "learning_rate": 7.388956927728786e-05, "loss": 1.4586, "step": 25522 }, { "epoch": 2.01, "learning_rate": 7.387891905755672e-05, "loss": 1.4655, "step": 25523 }, { "epoch": 2.01, "learning_rate": 7.386826935464569e-05, "loss": 1.5097, "step": 25524 }, { "epoch": 2.01, "learning_rate": 7.385762016862705e-05, "loss": 1.4864, "step": 25525 }, { "epoch": 2.01, "learning_rate": 7.384697149957321e-05, "loss": 1.4541, "step": 25526 }, { "epoch": 2.01, "learning_rate": 7.383632334755642e-05, "loss": 1.4268, "step": 25527 }, { "epoch": 2.01, "learning_rate": 7.382567571264894e-05, "loss": 1.4596, "step": 25528 }, { "epoch": 2.01, "learning_rate": 7.381502859492303e-05, "loss": 1.4632, "step": 25529 }, { "epoch": 2.01, "learning_rate": 7.380438199445111e-05, "loss": 1.4786, "step": 25530 }, { "epoch": 2.01, "learning_rate": 7.379373591130533e-05, "loss": 1.3976, "step": 25531 }, { "epoch": 2.01, "learning_rate": 7.378309034555807e-05, "loss": 1.4404, "step": 25532 }, { "epoch": 2.01, "learning_rate": 7.377244529728151e-05, "loss": 1.4617, "step": 25533 }, { "epoch": 2.01, "learning_rate": 7.376180076654804e-05, "loss": 1.484, "step": 25534 }, { "epoch": 2.01, "learning_rate": 7.375115675342988e-05, "loss": 1.4699, "step": 25535 }, { "epoch": 2.01, "learning_rate": 7.374051325799923e-05, "loss": 1.4598, "step": 25536 }, { "epoch": 2.01, "learning_rate": 7.372987028032846e-05, "loss": 1.4687, "step": 25537 }, { "epoch": 2.01, "learning_rate": 7.371922782048979e-05, "loss": 1.4898, "step": 25538 }, { "epoch": 2.01, "learning_rate": 7.370858587855541e-05, "loss": 1.446, "step": 25539 }, { "epoch": 2.01, "learning_rate": 7.369794445459768e-05, "loss": 1.4283, "step": 25540 }, { "epoch": 2.01, "learning_rate": 7.36873035486888e-05, "loss": 1.4489, "step": 25541 }, { "epoch": 2.01, "learning_rate": 7.367666316090097e-05, "loss": 1.5041, "step": 25542 }, { "epoch": 2.01, "learning_rate": 7.366602329130653e-05, "loss": 1.4633, "step": 25543 }, { "epoch": 2.01, "learning_rate": 7.365538393997767e-05, "loss": 1.4591, "step": 25544 }, { "epoch": 2.01, "learning_rate": 7.364474510698661e-05, "loss": 1.4809, "step": 25545 }, { "epoch": 2.01, "learning_rate": 7.363410679240556e-05, "loss": 1.4371, "step": 25546 }, { "epoch": 2.01, "learning_rate": 7.362346899630675e-05, "loss": 1.4839, "step": 25547 }, { "epoch": 2.01, "learning_rate": 7.361283171876252e-05, "loss": 1.457, "step": 25548 }, { "epoch": 2.01, "learning_rate": 7.360219495984494e-05, "loss": 1.471, "step": 25549 }, { "epoch": 2.01, "learning_rate": 7.359155871962637e-05, "loss": 1.4229, "step": 25550 }, { "epoch": 2.01, "learning_rate": 7.358092299817894e-05, "loss": 1.449, "step": 25551 }, { "epoch": 2.01, "learning_rate": 7.357028779557488e-05, "loss": 1.4792, "step": 25552 }, { "epoch": 2.01, "learning_rate": 7.355965311188631e-05, "loss": 1.5017, "step": 25553 }, { "epoch": 2.01, "learning_rate": 7.354901894718559e-05, "loss": 1.4585, "step": 25554 }, { "epoch": 2.01, "learning_rate": 7.353838530154483e-05, "loss": 1.4424, "step": 25555 }, { "epoch": 2.01, "learning_rate": 7.352775217503618e-05, "loss": 1.5119, "step": 25556 }, { "epoch": 2.01, "learning_rate": 7.351711956773196e-05, "loss": 1.4173, "step": 25557 }, { "epoch": 2.01, "learning_rate": 7.350648747970428e-05, "loss": 1.5272, "step": 25558 }, { "epoch": 2.01, "learning_rate": 7.349585591102528e-05, "loss": 1.4983, "step": 25559 }, { "epoch": 2.01, "learning_rate": 7.348522486176727e-05, "loss": 1.4607, "step": 25560 }, { "epoch": 2.01, "learning_rate": 7.347459433200235e-05, "loss": 1.4413, "step": 25561 }, { "epoch": 2.01, "learning_rate": 7.346396432180267e-05, "loss": 1.4333, "step": 25562 }, { "epoch": 2.01, "learning_rate": 7.34533348312404e-05, "loss": 1.4416, "step": 25563 }, { "epoch": 2.01, "learning_rate": 7.344270586038782e-05, "loss": 1.4779, "step": 25564 }, { "epoch": 2.01, "learning_rate": 7.343207740931702e-05, "loss": 1.4792, "step": 25565 }, { "epoch": 2.01, "learning_rate": 7.34214494781001e-05, "loss": 1.4726, "step": 25566 }, { "epoch": 2.01, "learning_rate": 7.341082206680932e-05, "loss": 1.4527, "step": 25567 }, { "epoch": 2.01, "learning_rate": 7.340019517551682e-05, "loss": 1.4756, "step": 25568 }, { "epoch": 2.01, "learning_rate": 7.338956880429472e-05, "loss": 1.4614, "step": 25569 }, { "epoch": 2.01, "learning_rate": 7.337894295321509e-05, "loss": 1.4881, "step": 25570 }, { "epoch": 2.01, "learning_rate": 7.336831762235023e-05, "loss": 1.4561, "step": 25571 }, { "epoch": 2.01, "learning_rate": 7.335769281177221e-05, "loss": 1.4298, "step": 25572 }, { "epoch": 2.01, "learning_rate": 7.334706852155308e-05, "loss": 1.4599, "step": 25573 }, { "epoch": 2.01, "learning_rate": 7.333644475176514e-05, "loss": 1.4919, "step": 25574 }, { "epoch": 2.01, "learning_rate": 7.332582150248041e-05, "loss": 1.3991, "step": 25575 }, { "epoch": 2.01, "learning_rate": 7.331519877377099e-05, "loss": 1.4343, "step": 25576 }, { "epoch": 2.01, "learning_rate": 7.330457656570912e-05, "loss": 1.4527, "step": 25577 }, { "epoch": 2.01, "learning_rate": 7.329395487836678e-05, "loss": 1.465, "step": 25578 }, { "epoch": 2.01, "learning_rate": 7.328333371181623e-05, "loss": 1.4584, "step": 25579 }, { "epoch": 2.01, "learning_rate": 7.327271306612944e-05, "loss": 1.4699, "step": 25580 }, { "epoch": 2.01, "learning_rate": 7.326209294137864e-05, "loss": 1.5, "step": 25581 }, { "epoch": 2.01, "learning_rate": 7.325147333763589e-05, "loss": 1.4528, "step": 25582 }, { "epoch": 2.01, "learning_rate": 7.324085425497321e-05, "loss": 1.4377, "step": 25583 }, { "epoch": 2.01, "learning_rate": 7.323023569346285e-05, "loss": 1.4389, "step": 25584 }, { "epoch": 2.01, "learning_rate": 7.32196176531768e-05, "loss": 1.4083, "step": 25585 }, { "epoch": 2.01, "learning_rate": 7.32090001341872e-05, "loss": 1.4255, "step": 25586 }, { "epoch": 2.01, "learning_rate": 7.319838313656605e-05, "loss": 1.462, "step": 25587 }, { "epoch": 2.01, "learning_rate": 7.318776666038556e-05, "loss": 1.4521, "step": 25588 }, { "epoch": 2.01, "learning_rate": 7.317715070571772e-05, "loss": 1.4287, "step": 25589 }, { "epoch": 2.01, "learning_rate": 7.316653527263459e-05, "loss": 1.4599, "step": 25590 }, { "epoch": 2.01, "learning_rate": 7.315592036120835e-05, "loss": 1.4481, "step": 25591 }, { "epoch": 2.01, "learning_rate": 7.314530597151098e-05, "loss": 1.4732, "step": 25592 }, { "epoch": 2.01, "learning_rate": 7.313469210361453e-05, "loss": 1.4625, "step": 25593 }, { "epoch": 2.01, "learning_rate": 7.31240787575911e-05, "loss": 1.4449, "step": 25594 }, { "epoch": 2.01, "learning_rate": 7.31134659335128e-05, "loss": 1.3664, "step": 25595 }, { "epoch": 2.01, "learning_rate": 7.310285363145166e-05, "loss": 1.4845, "step": 25596 }, { "epoch": 2.01, "learning_rate": 7.309224185147965e-05, "loss": 1.4782, "step": 25597 }, { "epoch": 2.01, "learning_rate": 7.308163059366892e-05, "loss": 1.4752, "step": 25598 }, { "epoch": 2.01, "learning_rate": 7.307101985809147e-05, "loss": 1.4511, "step": 25599 }, { "epoch": 2.01, "learning_rate": 7.30604096448193e-05, "loss": 1.4439, "step": 25600 }, { "epoch": 2.01, "learning_rate": 7.304979995392452e-05, "loss": 1.4516, "step": 25601 }, { "epoch": 2.01, "learning_rate": 7.303919078547915e-05, "loss": 1.4269, "step": 25602 }, { "epoch": 2.01, "learning_rate": 7.30285821395552e-05, "loss": 1.4856, "step": 25603 }, { "epoch": 2.01, "learning_rate": 7.301797401622465e-05, "loss": 1.4494, "step": 25604 }, { "epoch": 2.01, "learning_rate": 7.300736641555962e-05, "loss": 1.4761, "step": 25605 }, { "epoch": 2.01, "learning_rate": 7.29967593376321e-05, "loss": 1.4595, "step": 25606 }, { "epoch": 2.01, "learning_rate": 7.298615278251403e-05, "loss": 1.4629, "step": 25607 }, { "epoch": 2.01, "learning_rate": 7.297554675027754e-05, "loss": 1.4501, "step": 25608 }, { "epoch": 2.01, "learning_rate": 7.296494124099457e-05, "loss": 1.4599, "step": 25609 }, { "epoch": 2.02, "learning_rate": 7.295433625473709e-05, "loss": 1.4238, "step": 25610 }, { "epoch": 2.02, "learning_rate": 7.294373179157715e-05, "loss": 1.4652, "step": 25611 }, { "epoch": 2.02, "learning_rate": 7.29331278515868e-05, "loss": 1.4106, "step": 25612 }, { "epoch": 2.02, "learning_rate": 7.292252443483798e-05, "loss": 1.528, "step": 25613 }, { "epoch": 2.02, "learning_rate": 7.291192154140263e-05, "loss": 1.4875, "step": 25614 }, { "epoch": 2.02, "learning_rate": 7.290131917135284e-05, "loss": 1.4733, "step": 25615 }, { "epoch": 2.02, "learning_rate": 7.289071732476057e-05, "loss": 1.4194, "step": 25616 }, { "epoch": 2.02, "learning_rate": 7.28801160016977e-05, "loss": 1.3963, "step": 25617 }, { "epoch": 2.02, "learning_rate": 7.286951520223637e-05, "loss": 1.5206, "step": 25618 }, { "epoch": 2.02, "learning_rate": 7.285891492644843e-05, "loss": 1.4805, "step": 25619 }, { "epoch": 2.02, "learning_rate": 7.284831517440585e-05, "loss": 1.4337, "step": 25620 }, { "epoch": 2.02, "learning_rate": 7.283771594618068e-05, "loss": 1.4366, "step": 25621 }, { "epoch": 2.02, "learning_rate": 7.282711724184487e-05, "loss": 1.4972, "step": 25622 }, { "epoch": 2.02, "learning_rate": 7.281651906147031e-05, "loss": 1.4362, "step": 25623 }, { "epoch": 2.02, "learning_rate": 7.280592140512894e-05, "loss": 1.4789, "step": 25624 }, { "epoch": 2.02, "learning_rate": 7.279532427289277e-05, "loss": 1.497, "step": 25625 }, { "epoch": 2.02, "learning_rate": 7.27847276648338e-05, "loss": 1.481, "step": 25626 }, { "epoch": 2.02, "learning_rate": 7.277413158102393e-05, "loss": 1.4234, "step": 25627 }, { "epoch": 2.02, "learning_rate": 7.276353602153501e-05, "loss": 1.4565, "step": 25628 }, { "epoch": 2.02, "learning_rate": 7.275294098643914e-05, "loss": 1.4568, "step": 25629 }, { "epoch": 2.02, "learning_rate": 7.274234647580814e-05, "loss": 1.4679, "step": 25630 }, { "epoch": 2.02, "learning_rate": 7.273175248971395e-05, "loss": 1.3814, "step": 25631 }, { "epoch": 2.02, "learning_rate": 7.272115902822857e-05, "loss": 1.4777, "step": 25632 }, { "epoch": 2.02, "learning_rate": 7.271056609142387e-05, "loss": 1.4699, "step": 25633 }, { "epoch": 2.02, "learning_rate": 7.26999736793717e-05, "loss": 1.4173, "step": 25634 }, { "epoch": 2.02, "learning_rate": 7.268938179214412e-05, "loss": 1.4689, "step": 25635 }, { "epoch": 2.02, "learning_rate": 7.267879042981299e-05, "loss": 1.4427, "step": 25636 }, { "epoch": 2.02, "learning_rate": 7.266819959245014e-05, "loss": 1.4895, "step": 25637 }, { "epoch": 2.02, "learning_rate": 7.265760928012758e-05, "loss": 1.425, "step": 25638 }, { "epoch": 2.02, "learning_rate": 7.264701949291718e-05, "loss": 1.4569, "step": 25639 }, { "epoch": 2.02, "learning_rate": 7.263643023089084e-05, "loss": 1.4585, "step": 25640 }, { "epoch": 2.02, "learning_rate": 7.262584149412032e-05, "loss": 1.4744, "step": 25641 }, { "epoch": 2.02, "learning_rate": 7.261525328267776e-05, "loss": 1.4576, "step": 25642 }, { "epoch": 2.02, "learning_rate": 7.260466559663492e-05, "loss": 1.4322, "step": 25643 }, { "epoch": 2.02, "learning_rate": 7.259407843606369e-05, "loss": 1.4269, "step": 25644 }, { "epoch": 2.02, "learning_rate": 7.25834918010359e-05, "loss": 1.4392, "step": 25645 }, { "epoch": 2.02, "learning_rate": 7.257290569162353e-05, "loss": 1.4742, "step": 25646 }, { "epoch": 2.02, "learning_rate": 7.256232010789841e-05, "loss": 1.4805, "step": 25647 }, { "epoch": 2.02, "learning_rate": 7.255173504993234e-05, "loss": 1.4428, "step": 25648 }, { "epoch": 2.02, "learning_rate": 7.254115051779729e-05, "loss": 1.4694, "step": 25649 }, { "epoch": 2.02, "learning_rate": 7.25305665115651e-05, "loss": 1.5048, "step": 25650 }, { "epoch": 2.02, "learning_rate": 7.251998303130756e-05, "loss": 1.4405, "step": 25651 }, { "epoch": 2.02, "learning_rate": 7.250940007709665e-05, "loss": 1.4915, "step": 25652 }, { "epoch": 2.02, "learning_rate": 7.249881764900412e-05, "loss": 1.4996, "step": 25653 }, { "epoch": 2.02, "learning_rate": 7.24882357471018e-05, "loss": 1.496, "step": 25654 }, { "epoch": 2.02, "learning_rate": 7.247765437146166e-05, "loss": 1.4777, "step": 25655 }, { "epoch": 2.02, "learning_rate": 7.246707352215545e-05, "loss": 1.5003, "step": 25656 }, { "epoch": 2.02, "learning_rate": 7.245649319925497e-05, "loss": 1.4728, "step": 25657 }, { "epoch": 2.02, "learning_rate": 7.244591340283209e-05, "loss": 1.4705, "step": 25658 }, { "epoch": 2.02, "learning_rate": 7.243533413295875e-05, "loss": 1.472, "step": 25659 }, { "epoch": 2.02, "learning_rate": 7.242475538970667e-05, "loss": 1.4402, "step": 25660 }, { "epoch": 2.02, "learning_rate": 7.241417717314764e-05, "loss": 1.4634, "step": 25661 }, { "epoch": 2.02, "learning_rate": 7.240359948335357e-05, "loss": 1.4586, "step": 25662 }, { "epoch": 2.02, "learning_rate": 7.239302232039626e-05, "loss": 1.4711, "step": 25663 }, { "epoch": 2.02, "learning_rate": 7.238244568434751e-05, "loss": 1.4888, "step": 25664 }, { "epoch": 2.02, "learning_rate": 7.237186957527904e-05, "loss": 1.4524, "step": 25665 }, { "epoch": 2.02, "learning_rate": 7.23612939932628e-05, "loss": 1.4386, "step": 25666 }, { "epoch": 2.02, "learning_rate": 7.235071893837054e-05, "loss": 1.4343, "step": 25667 }, { "epoch": 2.02, "learning_rate": 7.234014441067399e-05, "loss": 1.4803, "step": 25668 }, { "epoch": 2.02, "learning_rate": 7.232957041024506e-05, "loss": 1.4943, "step": 25669 }, { "epoch": 2.02, "learning_rate": 7.231899693715548e-05, "loss": 1.4393, "step": 25670 }, { "epoch": 2.02, "learning_rate": 7.230842399147698e-05, "loss": 1.4388, "step": 25671 }, { "epoch": 2.02, "learning_rate": 7.229785157328146e-05, "loss": 1.4418, "step": 25672 }, { "epoch": 2.02, "learning_rate": 7.228727968264061e-05, "loss": 1.4973, "step": 25673 }, { "epoch": 2.02, "learning_rate": 7.227670831962628e-05, "loss": 1.4557, "step": 25674 }, { "epoch": 2.02, "learning_rate": 7.226613748431017e-05, "loss": 1.4187, "step": 25675 }, { "epoch": 2.02, "learning_rate": 7.225556717676414e-05, "loss": 1.4516, "step": 25676 }, { "epoch": 2.02, "learning_rate": 7.22449973970599e-05, "loss": 1.4773, "step": 25677 }, { "epoch": 2.02, "learning_rate": 7.223442814526918e-05, "loss": 1.4249, "step": 25678 }, { "epoch": 2.02, "learning_rate": 7.222385942146382e-05, "loss": 1.4939, "step": 25679 }, { "epoch": 2.02, "learning_rate": 7.221329122571553e-05, "loss": 1.4377, "step": 25680 }, { "epoch": 2.02, "learning_rate": 7.220272355809609e-05, "loss": 1.394, "step": 25681 }, { "epoch": 2.02, "learning_rate": 7.219215641867714e-05, "loss": 1.4579, "step": 25682 }, { "epoch": 2.02, "learning_rate": 7.218158980753058e-05, "loss": 1.4871, "step": 25683 }, { "epoch": 2.02, "learning_rate": 7.217102372472807e-05, "loss": 1.4623, "step": 25684 }, { "epoch": 2.02, "learning_rate": 7.216045817034132e-05, "loss": 1.5234, "step": 25685 }, { "epoch": 2.02, "learning_rate": 7.214989314444216e-05, "loss": 1.4961, "step": 25686 }, { "epoch": 2.02, "learning_rate": 7.213932864710227e-05, "loss": 1.4325, "step": 25687 }, { "epoch": 2.02, "learning_rate": 7.21287646783933e-05, "loss": 1.4412, "step": 25688 }, { "epoch": 2.02, "learning_rate": 7.211820123838704e-05, "loss": 1.4579, "step": 25689 }, { "epoch": 2.02, "learning_rate": 7.210763832715527e-05, "loss": 1.425, "step": 25690 }, { "epoch": 2.02, "learning_rate": 7.209707594476966e-05, "loss": 1.4707, "step": 25691 }, { "epoch": 2.02, "learning_rate": 7.208651409130186e-05, "loss": 1.5373, "step": 25692 }, { "epoch": 2.02, "learning_rate": 7.20759527668237e-05, "loss": 1.4229, "step": 25693 }, { "epoch": 2.02, "learning_rate": 7.20653919714068e-05, "loss": 1.4435, "step": 25694 }, { "epoch": 2.02, "learning_rate": 7.205483170512283e-05, "loss": 1.4316, "step": 25695 }, { "epoch": 2.02, "learning_rate": 7.20442719680436e-05, "loss": 1.4458, "step": 25696 }, { "epoch": 2.02, "learning_rate": 7.203371276024074e-05, "loss": 1.4264, "step": 25697 }, { "epoch": 2.02, "learning_rate": 7.202315408178596e-05, "loss": 1.4054, "step": 25698 }, { "epoch": 2.02, "learning_rate": 7.201259593275085e-05, "loss": 1.4303, "step": 25699 }, { "epoch": 2.02, "learning_rate": 7.200203831320724e-05, "loss": 1.5127, "step": 25700 }, { "epoch": 2.02, "learning_rate": 7.199148122322675e-05, "loss": 1.4888, "step": 25701 }, { "epoch": 2.02, "learning_rate": 7.198092466288101e-05, "loss": 1.4918, "step": 25702 }, { "epoch": 2.02, "learning_rate": 7.197036863224177e-05, "loss": 1.5063, "step": 25703 }, { "epoch": 2.02, "learning_rate": 7.195981313138063e-05, "loss": 1.4966, "step": 25704 }, { "epoch": 2.02, "learning_rate": 7.194925816036934e-05, "loss": 1.4378, "step": 25705 }, { "epoch": 2.02, "learning_rate": 7.193870371927946e-05, "loss": 1.4988, "step": 25706 }, { "epoch": 2.02, "learning_rate": 7.192814980818277e-05, "loss": 1.4091, "step": 25707 }, { "epoch": 2.02, "learning_rate": 7.191759642715084e-05, "loss": 1.496, "step": 25708 }, { "epoch": 2.02, "learning_rate": 7.190704357625529e-05, "loss": 1.4721, "step": 25709 }, { "epoch": 2.02, "learning_rate": 7.189649125556789e-05, "loss": 1.389, "step": 25710 }, { "epoch": 2.02, "learning_rate": 7.18859394651602e-05, "loss": 1.5081, "step": 25711 }, { "epoch": 2.02, "learning_rate": 7.187538820510382e-05, "loss": 1.4736, "step": 25712 }, { "epoch": 2.02, "learning_rate": 7.186483747547048e-05, "loss": 1.4592, "step": 25713 }, { "epoch": 2.02, "learning_rate": 7.185428727633181e-05, "loss": 1.5167, "step": 25714 }, { "epoch": 2.02, "learning_rate": 7.184373760775939e-05, "loss": 1.4446, "step": 25715 }, { "epoch": 2.02, "learning_rate": 7.183318846982479e-05, "loss": 1.4521, "step": 25716 }, { "epoch": 2.02, "learning_rate": 7.182263986259979e-05, "loss": 1.4538, "step": 25717 }, { "epoch": 2.02, "learning_rate": 7.18120917861559e-05, "loss": 1.487, "step": 25718 }, { "epoch": 2.02, "learning_rate": 7.180154424056472e-05, "loss": 1.4281, "step": 25719 }, { "epoch": 2.02, "learning_rate": 7.179099722589789e-05, "loss": 1.4646, "step": 25720 }, { "epoch": 2.02, "learning_rate": 7.178045074222708e-05, "loss": 1.419, "step": 25721 }, { "epoch": 2.02, "learning_rate": 7.176990478962385e-05, "loss": 1.4527, "step": 25722 }, { "epoch": 2.02, "learning_rate": 7.175935936815974e-05, "loss": 1.4221, "step": 25723 }, { "epoch": 2.02, "learning_rate": 7.174881447790646e-05, "loss": 1.4528, "step": 25724 }, { "epoch": 2.02, "learning_rate": 7.173827011893554e-05, "loss": 1.4695, "step": 25725 }, { "epoch": 2.02, "learning_rate": 7.172772629131854e-05, "loss": 1.4898, "step": 25726 }, { "epoch": 2.02, "learning_rate": 7.171718299512713e-05, "loss": 1.4519, "step": 25727 }, { "epoch": 2.02, "learning_rate": 7.170664023043284e-05, "loss": 1.4707, "step": 25728 }, { "epoch": 2.02, "learning_rate": 7.169609799730722e-05, "loss": 1.4918, "step": 25729 }, { "epoch": 2.02, "learning_rate": 7.168555629582192e-05, "loss": 1.4569, "step": 25730 }, { "epoch": 2.02, "learning_rate": 7.167501512604848e-05, "loss": 1.4614, "step": 25731 }, { "epoch": 2.02, "learning_rate": 7.166447448805842e-05, "loss": 1.4231, "step": 25732 }, { "epoch": 2.02, "learning_rate": 7.165393438192338e-05, "loss": 1.4738, "step": 25733 }, { "epoch": 2.02, "learning_rate": 7.16433948077149e-05, "loss": 1.4488, "step": 25734 }, { "epoch": 2.02, "learning_rate": 7.163285576550449e-05, "loss": 1.4623, "step": 25735 }, { "epoch": 2.02, "learning_rate": 7.162231725536373e-05, "loss": 1.4966, "step": 25736 }, { "epoch": 2.03, "learning_rate": 7.161177927736423e-05, "loss": 1.4131, "step": 25737 }, { "epoch": 2.03, "learning_rate": 7.16012418315775e-05, "loss": 1.454, "step": 25738 }, { "epoch": 2.03, "learning_rate": 7.159070491807508e-05, "loss": 1.4466, "step": 25739 }, { "epoch": 2.03, "learning_rate": 7.158016853692845e-05, "loss": 1.4596, "step": 25740 }, { "epoch": 2.03, "learning_rate": 7.156963268820924e-05, "loss": 1.4617, "step": 25741 }, { "epoch": 2.03, "learning_rate": 7.155909737198895e-05, "loss": 1.4635, "step": 25742 }, { "epoch": 2.03, "learning_rate": 7.154856258833905e-05, "loss": 1.4729, "step": 25743 }, { "epoch": 2.03, "learning_rate": 7.153802833733117e-05, "loss": 1.4537, "step": 25744 }, { "epoch": 2.03, "learning_rate": 7.152749461903679e-05, "loss": 1.4835, "step": 25745 }, { "epoch": 2.03, "learning_rate": 7.151696143352734e-05, "loss": 1.5135, "step": 25746 }, { "epoch": 2.03, "learning_rate": 7.150642878087447e-05, "loss": 1.3621, "step": 25747 }, { "epoch": 2.03, "learning_rate": 7.149589666114965e-05, "loss": 1.4953, "step": 25748 }, { "epoch": 2.03, "learning_rate": 7.148536507442429e-05, "loss": 1.4256, "step": 25749 }, { "epoch": 2.03, "learning_rate": 7.147483402077004e-05, "loss": 1.4808, "step": 25750 }, { "epoch": 2.03, "learning_rate": 7.146430350025828e-05, "loss": 1.4824, "step": 25751 }, { "epoch": 2.03, "learning_rate": 7.145377351296061e-05, "loss": 1.5191, "step": 25752 }, { "epoch": 2.03, "learning_rate": 7.144324405894843e-05, "loss": 1.4634, "step": 25753 }, { "epoch": 2.03, "learning_rate": 7.143271513829331e-05, "loss": 1.4244, "step": 25754 }, { "epoch": 2.03, "learning_rate": 7.142218675106671e-05, "loss": 1.4745, "step": 25755 }, { "epoch": 2.03, "learning_rate": 7.14116588973401e-05, "loss": 1.446, "step": 25756 }, { "epoch": 2.03, "learning_rate": 7.14011315771849e-05, "loss": 1.423, "step": 25757 }, { "epoch": 2.03, "learning_rate": 7.139060479067268e-05, "loss": 1.4625, "step": 25758 }, { "epoch": 2.03, "learning_rate": 7.138007853787489e-05, "loss": 1.4974, "step": 25759 }, { "epoch": 2.03, "learning_rate": 7.136955281886293e-05, "loss": 1.4551, "step": 25760 }, { "epoch": 2.03, "learning_rate": 7.135902763370836e-05, "loss": 1.432, "step": 25761 }, { "epoch": 2.03, "learning_rate": 7.134850298248259e-05, "loss": 1.5176, "step": 25762 }, { "epoch": 2.03, "learning_rate": 7.133797886525705e-05, "loss": 1.4797, "step": 25763 }, { "epoch": 2.03, "learning_rate": 7.132745528210324e-05, "loss": 1.4493, "step": 25764 }, { "epoch": 2.03, "learning_rate": 7.131693223309262e-05, "loss": 1.4894, "step": 25765 }, { "epoch": 2.03, "learning_rate": 7.130640971829655e-05, "loss": 1.447, "step": 25766 }, { "epoch": 2.03, "learning_rate": 7.129588773778653e-05, "loss": 1.4648, "step": 25767 }, { "epoch": 2.03, "learning_rate": 7.128536629163406e-05, "loss": 1.5388, "step": 25768 }, { "epoch": 2.03, "learning_rate": 7.127484537991052e-05, "loss": 1.444, "step": 25769 }, { "epoch": 2.03, "learning_rate": 7.126432500268727e-05, "loss": 1.4356, "step": 25770 }, { "epoch": 2.03, "learning_rate": 7.125380516003586e-05, "loss": 1.4558, "step": 25771 }, { "epoch": 2.03, "learning_rate": 7.124328585202766e-05, "loss": 1.5186, "step": 25772 }, { "epoch": 2.03, "learning_rate": 7.123276707873403e-05, "loss": 1.4155, "step": 25773 }, { "epoch": 2.03, "learning_rate": 7.12222488402265e-05, "loss": 1.411, "step": 25774 }, { "epoch": 2.03, "learning_rate": 7.121173113657642e-05, "loss": 1.4707, "step": 25775 }, { "epoch": 2.03, "learning_rate": 7.12012139678552e-05, "loss": 1.4687, "step": 25776 }, { "epoch": 2.03, "learning_rate": 7.119069733413422e-05, "loss": 1.451, "step": 25777 }, { "epoch": 2.03, "learning_rate": 7.118018123548495e-05, "loss": 1.4244, "step": 25778 }, { "epoch": 2.03, "learning_rate": 7.116966567197877e-05, "loss": 1.5051, "step": 25779 }, { "epoch": 2.03, "learning_rate": 7.1159150643687e-05, "loss": 1.5087, "step": 25780 }, { "epoch": 2.03, "learning_rate": 7.114863615068114e-05, "loss": 1.4448, "step": 25781 }, { "epoch": 2.03, "learning_rate": 7.113812219303252e-05, "loss": 1.4472, "step": 25782 }, { "epoch": 2.03, "learning_rate": 7.112760877081247e-05, "loss": 1.4368, "step": 25783 }, { "epoch": 2.03, "learning_rate": 7.111709588409244e-05, "loss": 1.4193, "step": 25784 }, { "epoch": 2.03, "learning_rate": 7.110658353294388e-05, "loss": 1.4459, "step": 25785 }, { "epoch": 2.03, "learning_rate": 7.109607171743806e-05, "loss": 1.4799, "step": 25786 }, { "epoch": 2.03, "learning_rate": 7.10855604376463e-05, "loss": 1.4149, "step": 25787 }, { "epoch": 2.03, "learning_rate": 7.107504969364009e-05, "loss": 1.4941, "step": 25788 }, { "epoch": 2.03, "learning_rate": 7.106453948549077e-05, "loss": 1.4078, "step": 25789 }, { "epoch": 2.03, "learning_rate": 7.10540298132696e-05, "loss": 1.4309, "step": 25790 }, { "epoch": 2.03, "learning_rate": 7.104352067704804e-05, "loss": 1.4502, "step": 25791 }, { "epoch": 2.03, "learning_rate": 7.103301207689742e-05, "loss": 1.4461, "step": 25792 }, { "epoch": 2.03, "learning_rate": 7.102250401288905e-05, "loss": 1.4533, "step": 25793 }, { "epoch": 2.03, "learning_rate": 7.101199648509424e-05, "loss": 1.4454, "step": 25794 }, { "epoch": 2.03, "learning_rate": 7.100148949358448e-05, "loss": 1.4757, "step": 25795 }, { "epoch": 2.03, "learning_rate": 7.099098303843098e-05, "loss": 1.4924, "step": 25796 }, { "epoch": 2.03, "learning_rate": 7.098047711970505e-05, "loss": 1.4486, "step": 25797 }, { "epoch": 2.03, "learning_rate": 7.096997173747806e-05, "loss": 1.4792, "step": 25798 }, { "epoch": 2.03, "learning_rate": 7.095946689182142e-05, "loss": 1.4257, "step": 25799 }, { "epoch": 2.03, "learning_rate": 7.094896258280639e-05, "loss": 1.4877, "step": 25800 }, { "epoch": 2.03, "learning_rate": 7.093845881050421e-05, "loss": 1.4687, "step": 25801 }, { "epoch": 2.03, "learning_rate": 7.092795557498633e-05, "loss": 1.4544, "step": 25802 }, { "epoch": 2.03, "learning_rate": 7.0917452876324e-05, "loss": 1.4807, "step": 25803 }, { "epoch": 2.03, "learning_rate": 7.090695071458845e-05, "loss": 1.4266, "step": 25804 }, { "epoch": 2.03, "learning_rate": 7.089644908985114e-05, "loss": 1.4569, "step": 25805 }, { "epoch": 2.03, "learning_rate": 7.088594800218327e-05, "loss": 1.462, "step": 25806 }, { "epoch": 2.03, "learning_rate": 7.087544745165609e-05, "loss": 1.4559, "step": 25807 }, { "epoch": 2.03, "learning_rate": 7.086494743834104e-05, "loss": 1.4754, "step": 25808 }, { "epoch": 2.03, "learning_rate": 7.08544479623093e-05, "loss": 1.4533, "step": 25809 }, { "epoch": 2.03, "learning_rate": 7.084394902363221e-05, "loss": 1.4153, "step": 25810 }, { "epoch": 2.03, "learning_rate": 7.083345062238093e-05, "loss": 1.4445, "step": 25811 }, { "epoch": 2.03, "learning_rate": 7.082295275862691e-05, "loss": 1.4847, "step": 25812 }, { "epoch": 2.03, "learning_rate": 7.081245543244137e-05, "loss": 1.4387, "step": 25813 }, { "epoch": 2.03, "learning_rate": 7.080195864389547e-05, "loss": 1.463, "step": 25814 }, { "epoch": 2.03, "learning_rate": 7.079146239306057e-05, "loss": 1.474, "step": 25815 }, { "epoch": 2.03, "learning_rate": 7.078096668000798e-05, "loss": 1.4346, "step": 25816 }, { "epoch": 2.03, "learning_rate": 7.077047150480893e-05, "loss": 1.497, "step": 25817 }, { "epoch": 2.03, "learning_rate": 7.075997686753458e-05, "loss": 1.4808, "step": 25818 }, { "epoch": 2.03, "learning_rate": 7.074948276825633e-05, "loss": 1.5102, "step": 25819 }, { "epoch": 2.03, "learning_rate": 7.073898920704536e-05, "loss": 1.4362, "step": 25820 }, { "epoch": 2.03, "learning_rate": 7.072849618397285e-05, "loss": 1.4353, "step": 25821 }, { "epoch": 2.03, "learning_rate": 7.071800369911016e-05, "loss": 1.4673, "step": 25822 }, { "epoch": 2.03, "learning_rate": 7.070751175252847e-05, "loss": 1.4632, "step": 25823 }, { "epoch": 2.03, "learning_rate": 7.069702034429898e-05, "loss": 1.4466, "step": 25824 }, { "epoch": 2.03, "learning_rate": 7.0686529474493e-05, "loss": 1.4933, "step": 25825 }, { "epoch": 2.03, "learning_rate": 7.067603914318171e-05, "loss": 1.4707, "step": 25826 }, { "epoch": 2.03, "learning_rate": 7.066554935043629e-05, "loss": 1.4303, "step": 25827 }, { "epoch": 2.03, "learning_rate": 7.065506009632807e-05, "loss": 1.4154, "step": 25828 }, { "epoch": 2.03, "learning_rate": 7.06445713809282e-05, "loss": 1.4603, "step": 25829 }, { "epoch": 2.03, "learning_rate": 7.063408320430784e-05, "loss": 1.4538, "step": 25830 }, { "epoch": 2.03, "learning_rate": 7.062359556653827e-05, "loss": 1.4736, "step": 25831 }, { "epoch": 2.03, "learning_rate": 7.061310846769073e-05, "loss": 1.4753, "step": 25832 }, { "epoch": 2.03, "learning_rate": 7.060262190783637e-05, "loss": 1.4381, "step": 25833 }, { "epoch": 2.03, "learning_rate": 7.059213588704641e-05, "loss": 1.4244, "step": 25834 }, { "epoch": 2.03, "learning_rate": 7.058165040539195e-05, "loss": 1.4805, "step": 25835 }, { "epoch": 2.03, "learning_rate": 7.057116546294432e-05, "loss": 1.4427, "step": 25836 }, { "epoch": 2.03, "learning_rate": 7.056068105977465e-05, "loss": 1.4446, "step": 25837 }, { "epoch": 2.03, "learning_rate": 7.055019719595404e-05, "loss": 1.4871, "step": 25838 }, { "epoch": 2.03, "learning_rate": 7.053971387155383e-05, "loss": 1.3956, "step": 25839 }, { "epoch": 2.03, "learning_rate": 7.052923108664511e-05, "loss": 1.4673, "step": 25840 }, { "epoch": 2.03, "learning_rate": 7.051874884129899e-05, "loss": 1.4426, "step": 25841 }, { "epoch": 2.03, "learning_rate": 7.050826713558676e-05, "loss": 1.4426, "step": 25842 }, { "epoch": 2.03, "learning_rate": 7.049778596957954e-05, "loss": 1.4311, "step": 25843 }, { "epoch": 2.03, "learning_rate": 7.048730534334842e-05, "loss": 1.529, "step": 25844 }, { "epoch": 2.03, "learning_rate": 7.047682525696459e-05, "loss": 1.4293, "step": 25845 }, { "epoch": 2.03, "learning_rate": 7.046634571049933e-05, "loss": 1.4347, "step": 25846 }, { "epoch": 2.03, "learning_rate": 7.045586670402366e-05, "loss": 1.4747, "step": 25847 }, { "epoch": 2.03, "learning_rate": 7.044538823760872e-05, "loss": 1.4982, "step": 25848 }, { "epoch": 2.03, "learning_rate": 7.043491031132575e-05, "loss": 1.4841, "step": 25849 }, { "epoch": 2.03, "learning_rate": 7.042443292524583e-05, "loss": 1.5321, "step": 25850 }, { "epoch": 2.03, "learning_rate": 7.041395607944008e-05, "loss": 1.4863, "step": 25851 }, { "epoch": 2.03, "learning_rate": 7.040347977397962e-05, "loss": 1.5371, "step": 25852 }, { "epoch": 2.03, "learning_rate": 7.039300400893564e-05, "loss": 1.4591, "step": 25853 }, { "epoch": 2.03, "learning_rate": 7.038252878437923e-05, "loss": 1.4261, "step": 25854 }, { "epoch": 2.03, "learning_rate": 7.037205410038148e-05, "loss": 1.4262, "step": 25855 }, { "epoch": 2.03, "learning_rate": 7.036157995701358e-05, "loss": 1.4151, "step": 25856 }, { "epoch": 2.03, "learning_rate": 7.035110635434661e-05, "loss": 1.4823, "step": 25857 }, { "epoch": 2.03, "learning_rate": 7.034063329245162e-05, "loss": 1.4545, "step": 25858 }, { "epoch": 2.03, "learning_rate": 7.033016077139981e-05, "loss": 1.408, "step": 25859 }, { "epoch": 2.03, "learning_rate": 7.031968879126227e-05, "loss": 1.4441, "step": 25860 }, { "epoch": 2.03, "learning_rate": 7.030921735210999e-05, "loss": 1.453, "step": 25861 }, { "epoch": 2.03, "learning_rate": 7.029874645401417e-05, "loss": 1.4474, "step": 25862 }, { "epoch": 2.03, "learning_rate": 7.028827609704593e-05, "loss": 1.431, "step": 25863 }, { "epoch": 2.04, "learning_rate": 7.027780628127629e-05, "loss": 1.4708, "step": 25864 }, { "epoch": 2.04, "learning_rate": 7.02673370067763e-05, "loss": 1.5013, "step": 25865 }, { "epoch": 2.04, "learning_rate": 7.025686827361716e-05, "loss": 1.4712, "step": 25866 }, { "epoch": 2.04, "learning_rate": 7.024640008186987e-05, "loss": 1.5144, "step": 25867 }, { "epoch": 2.04, "learning_rate": 7.023593243160551e-05, "loss": 1.4648, "step": 25868 }, { "epoch": 2.04, "learning_rate": 7.02254653228951e-05, "loss": 1.5248, "step": 25869 }, { "epoch": 2.04, "learning_rate": 7.02149987558098e-05, "loss": 1.4961, "step": 25870 }, { "epoch": 2.04, "learning_rate": 7.020453273042066e-05, "loss": 1.4297, "step": 25871 }, { "epoch": 2.04, "learning_rate": 7.019406724679862e-05, "loss": 1.4886, "step": 25872 }, { "epoch": 2.04, "learning_rate": 7.018360230501489e-05, "loss": 1.5233, "step": 25873 }, { "epoch": 2.04, "learning_rate": 7.017313790514047e-05, "loss": 1.4394, "step": 25874 }, { "epoch": 2.04, "learning_rate": 7.01626740472463e-05, "loss": 1.4879, "step": 25875 }, { "epoch": 2.04, "learning_rate": 7.01522107314036e-05, "loss": 1.4279, "step": 25876 }, { "epoch": 2.04, "learning_rate": 7.014174795768328e-05, "loss": 1.4875, "step": 25877 }, { "epoch": 2.04, "learning_rate": 7.013128572615645e-05, "loss": 1.4773, "step": 25878 }, { "epoch": 2.04, "learning_rate": 7.012082403689407e-05, "loss": 1.4004, "step": 25879 }, { "epoch": 2.04, "learning_rate": 7.011036288996728e-05, "loss": 1.4564, "step": 25880 }, { "epoch": 2.04, "learning_rate": 7.009990228544702e-05, "loss": 1.4713, "step": 25881 }, { "epoch": 2.04, "learning_rate": 7.008944222340427e-05, "loss": 1.419, "step": 25882 }, { "epoch": 2.04, "learning_rate": 7.007898270391019e-05, "loss": 1.4995, "step": 25883 }, { "epoch": 2.04, "learning_rate": 7.006852372703569e-05, "loss": 1.451, "step": 25884 }, { "epoch": 2.04, "learning_rate": 7.005806529285177e-05, "loss": 1.4245, "step": 25885 }, { "epoch": 2.04, "learning_rate": 7.00476074014295e-05, "loss": 1.4836, "step": 25886 }, { "epoch": 2.04, "learning_rate": 7.003715005283988e-05, "loss": 1.4111, "step": 25887 }, { "epoch": 2.04, "learning_rate": 7.002669324715388e-05, "loss": 1.4511, "step": 25888 }, { "epoch": 2.04, "learning_rate": 7.001623698444243e-05, "loss": 1.4586, "step": 25889 }, { "epoch": 2.04, "learning_rate": 7.000578126477667e-05, "loss": 1.4734, "step": 25890 }, { "epoch": 2.04, "learning_rate": 6.99953260882275e-05, "loss": 1.4517, "step": 25891 }, { "epoch": 2.04, "learning_rate": 6.998487145486584e-05, "loss": 1.4721, "step": 25892 }, { "epoch": 2.04, "learning_rate": 6.997441736476278e-05, "loss": 1.4777, "step": 25893 }, { "epoch": 2.04, "learning_rate": 6.996396381798931e-05, "loss": 1.4753, "step": 25894 }, { "epoch": 2.04, "learning_rate": 6.995351081461634e-05, "loss": 1.4614, "step": 25895 }, { "epoch": 2.04, "learning_rate": 6.994305835471481e-05, "loss": 1.4342, "step": 25896 }, { "epoch": 2.04, "learning_rate": 6.99326064383558e-05, "loss": 1.4547, "step": 25897 }, { "epoch": 2.04, "learning_rate": 6.99221550656102e-05, "loss": 1.4338, "step": 25898 }, { "epoch": 2.04, "learning_rate": 6.991170423654892e-05, "loss": 1.4117, "step": 25899 }, { "epoch": 2.04, "learning_rate": 6.990125395124303e-05, "loss": 1.4281, "step": 25900 }, { "epoch": 2.04, "learning_rate": 6.989080420976344e-05, "loss": 1.4132, "step": 25901 }, { "epoch": 2.04, "learning_rate": 6.9880355012181e-05, "loss": 1.483, "step": 25902 }, { "epoch": 2.04, "learning_rate": 6.98699063585668e-05, "loss": 1.3947, "step": 25903 }, { "epoch": 2.04, "learning_rate": 6.985945824899173e-05, "loss": 1.4025, "step": 25904 }, { "epoch": 2.04, "learning_rate": 6.98490106835267e-05, "loss": 1.4375, "step": 25905 }, { "epoch": 2.04, "learning_rate": 6.983856366224259e-05, "loss": 1.463, "step": 25906 }, { "epoch": 2.04, "learning_rate": 6.982811718521047e-05, "loss": 1.4547, "step": 25907 }, { "epoch": 2.04, "learning_rate": 6.981767125250113e-05, "loss": 1.4573, "step": 25908 }, { "epoch": 2.04, "learning_rate": 6.980722586418562e-05, "loss": 1.4404, "step": 25909 }, { "epoch": 2.04, "learning_rate": 6.979678102033472e-05, "loss": 1.4776, "step": 25910 }, { "epoch": 2.04, "learning_rate": 6.978633672101947e-05, "loss": 1.5457, "step": 25911 }, { "epoch": 2.04, "learning_rate": 6.977589296631075e-05, "loss": 1.4307, "step": 25912 }, { "epoch": 2.04, "learning_rate": 6.976544975627937e-05, "loss": 1.4529, "step": 25913 }, { "epoch": 2.04, "learning_rate": 6.975500709099638e-05, "loss": 1.474, "step": 25914 }, { "epoch": 2.04, "learning_rate": 6.974456497053258e-05, "loss": 1.4807, "step": 25915 }, { "epoch": 2.04, "learning_rate": 6.973412339495886e-05, "loss": 1.4945, "step": 25916 }, { "epoch": 2.04, "learning_rate": 6.972368236434622e-05, "loss": 1.4763, "step": 25917 }, { "epoch": 2.04, "learning_rate": 6.971324187876546e-05, "loss": 1.4748, "step": 25918 }, { "epoch": 2.04, "learning_rate": 6.970280193828743e-05, "loss": 1.4539, "step": 25919 }, { "epoch": 2.04, "learning_rate": 6.969236254298311e-05, "loss": 1.4525, "step": 25920 }, { "epoch": 2.04, "learning_rate": 6.968192369292334e-05, "loss": 1.4736, "step": 25921 }, { "epoch": 2.04, "learning_rate": 6.967148538817898e-05, "loss": 1.3753, "step": 25922 }, { "epoch": 2.04, "learning_rate": 6.966104762882085e-05, "loss": 1.4326, "step": 25923 }, { "epoch": 2.04, "learning_rate": 6.965061041491988e-05, "loss": 1.4566, "step": 25924 }, { "epoch": 2.04, "learning_rate": 6.964017374654697e-05, "loss": 1.4421, "step": 25925 }, { "epoch": 2.04, "learning_rate": 6.962973762377287e-05, "loss": 1.4685, "step": 25926 }, { "epoch": 2.04, "learning_rate": 6.961930204666857e-05, "loss": 1.4538, "step": 25927 }, { "epoch": 2.04, "learning_rate": 6.960886701530486e-05, "loss": 1.5333, "step": 25928 }, { "epoch": 2.04, "learning_rate": 6.959843252975255e-05, "loss": 1.4297, "step": 25929 }, { "epoch": 2.04, "learning_rate": 6.95879985900825e-05, "loss": 1.5036, "step": 25930 }, { "epoch": 2.04, "learning_rate": 6.957756519636558e-05, "loss": 1.4404, "step": 25931 }, { "epoch": 2.04, "learning_rate": 6.956713234867262e-05, "loss": 1.4683, "step": 25932 }, { "epoch": 2.04, "learning_rate": 6.955670004707441e-05, "loss": 1.4834, "step": 25933 }, { "epoch": 2.04, "learning_rate": 6.954626829164186e-05, "loss": 1.4481, "step": 25934 }, { "epoch": 2.04, "learning_rate": 6.953583708244574e-05, "loss": 1.4471, "step": 25935 }, { "epoch": 2.04, "learning_rate": 6.952540641955685e-05, "loss": 1.4258, "step": 25936 }, { "epoch": 2.04, "learning_rate": 6.951497630304607e-05, "loss": 1.4187, "step": 25937 }, { "epoch": 2.04, "learning_rate": 6.95045467329842e-05, "loss": 1.4567, "step": 25938 }, { "epoch": 2.04, "learning_rate": 6.949411770944197e-05, "loss": 1.4294, "step": 25939 }, { "epoch": 2.04, "learning_rate": 6.948368923249025e-05, "loss": 1.4855, "step": 25940 }, { "epoch": 2.04, "learning_rate": 6.947326130219992e-05, "loss": 1.4653, "step": 25941 }, { "epoch": 2.04, "learning_rate": 6.946283391864171e-05, "loss": 1.4652, "step": 25942 }, { "epoch": 2.04, "learning_rate": 6.945240708188635e-05, "loss": 1.388, "step": 25943 }, { "epoch": 2.04, "learning_rate": 6.944198079200474e-05, "loss": 1.4378, "step": 25944 }, { "epoch": 2.04, "learning_rate": 6.943155504906764e-05, "loss": 1.4289, "step": 25945 }, { "epoch": 2.04, "learning_rate": 6.942112985314581e-05, "loss": 1.4965, "step": 25946 }, { "epoch": 2.04, "learning_rate": 6.941070520431e-05, "loss": 1.4624, "step": 25947 }, { "epoch": 2.04, "learning_rate": 6.940028110263109e-05, "loss": 1.4134, "step": 25948 }, { "epoch": 2.04, "learning_rate": 6.938985754817977e-05, "loss": 1.4507, "step": 25949 }, { "epoch": 2.04, "learning_rate": 6.937943454102678e-05, "loss": 1.4811, "step": 25950 }, { "epoch": 2.04, "learning_rate": 6.9369012081243e-05, "loss": 1.4628, "step": 25951 }, { "epoch": 2.04, "learning_rate": 6.935859016889914e-05, "loss": 1.4481, "step": 25952 }, { "epoch": 2.04, "learning_rate": 6.934816880406587e-05, "loss": 1.4468, "step": 25953 }, { "epoch": 2.04, "learning_rate": 6.933774798681412e-05, "loss": 1.4927, "step": 25954 }, { "epoch": 2.04, "learning_rate": 6.932732771721446e-05, "loss": 1.4827, "step": 25955 }, { "epoch": 2.04, "learning_rate": 6.93169079953378e-05, "loss": 1.4873, "step": 25956 }, { "epoch": 2.04, "learning_rate": 6.930648882125476e-05, "loss": 1.4484, "step": 25957 }, { "epoch": 2.04, "learning_rate": 6.929607019503617e-05, "loss": 1.4411, "step": 25958 }, { "epoch": 2.04, "learning_rate": 6.928565211675273e-05, "loss": 1.4413, "step": 25959 }, { "epoch": 2.04, "learning_rate": 6.927523458647513e-05, "loss": 1.4456, "step": 25960 }, { "epoch": 2.04, "learning_rate": 6.926481760427417e-05, "loss": 1.4398, "step": 25961 }, { "epoch": 2.04, "learning_rate": 6.925440117022056e-05, "loss": 1.4681, "step": 25962 }, { "epoch": 2.04, "learning_rate": 6.924398528438499e-05, "loss": 1.4609, "step": 25963 }, { "epoch": 2.04, "learning_rate": 6.923356994683816e-05, "loss": 1.4286, "step": 25964 }, { "epoch": 2.04, "learning_rate": 6.922315515765087e-05, "loss": 1.4647, "step": 25965 }, { "epoch": 2.04, "learning_rate": 6.921274091689378e-05, "loss": 1.451, "step": 25966 }, { "epoch": 2.04, "learning_rate": 6.920232722463756e-05, "loss": 1.466, "step": 25967 }, { "epoch": 2.04, "learning_rate": 6.919191408095297e-05, "loss": 1.4741, "step": 25968 }, { "epoch": 2.04, "learning_rate": 6.91815014859107e-05, "loss": 1.4352, "step": 25969 }, { "epoch": 2.04, "learning_rate": 6.917108943958138e-05, "loss": 1.5035, "step": 25970 }, { "epoch": 2.04, "learning_rate": 6.916067794203578e-05, "loss": 1.4443, "step": 25971 }, { "epoch": 2.04, "learning_rate": 6.91502669933446e-05, "loss": 1.4853, "step": 25972 }, { "epoch": 2.04, "learning_rate": 6.91398565935785e-05, "loss": 1.4508, "step": 25973 }, { "epoch": 2.04, "learning_rate": 6.912944674280808e-05, "loss": 1.5069, "step": 25974 }, { "epoch": 2.04, "learning_rate": 6.911903744110417e-05, "loss": 1.4136, "step": 25975 }, { "epoch": 2.04, "learning_rate": 6.910862868853735e-05, "loss": 1.4467, "step": 25976 }, { "epoch": 2.04, "learning_rate": 6.909822048517823e-05, "loss": 1.4702, "step": 25977 }, { "epoch": 2.04, "learning_rate": 6.908781283109762e-05, "loss": 1.4706, "step": 25978 }, { "epoch": 2.04, "learning_rate": 6.907740572636611e-05, "loss": 1.4211, "step": 25979 }, { "epoch": 2.04, "learning_rate": 6.906699917105434e-05, "loss": 1.4809, "step": 25980 }, { "epoch": 2.04, "learning_rate": 6.905659316523295e-05, "loss": 1.4667, "step": 25981 }, { "epoch": 2.04, "learning_rate": 6.904618770897269e-05, "loss": 1.4962, "step": 25982 }, { "epoch": 2.04, "learning_rate": 6.903578280234411e-05, "loss": 1.4829, "step": 25983 }, { "epoch": 2.04, "learning_rate": 6.902537844541785e-05, "loss": 1.4471, "step": 25984 }, { "epoch": 2.04, "learning_rate": 6.901497463826464e-05, "loss": 1.4845, "step": 25985 }, { "epoch": 2.04, "learning_rate": 6.900457138095505e-05, "loss": 1.4566, "step": 25986 }, { "epoch": 2.04, "learning_rate": 6.899416867355967e-05, "loss": 1.4978, "step": 25987 }, { "epoch": 2.04, "learning_rate": 6.898376651614918e-05, "loss": 1.4773, "step": 25988 }, { "epoch": 2.04, "learning_rate": 6.897336490879428e-05, "loss": 1.4773, "step": 25989 }, { "epoch": 2.04, "learning_rate": 6.89629638515655e-05, "loss": 1.4775, "step": 25990 }, { "epoch": 2.05, "learning_rate": 6.895256334453343e-05, "loss": 1.4786, "step": 25991 }, { "epoch": 2.05, "learning_rate": 6.894216338776877e-05, "loss": 1.4518, "step": 25992 }, { "epoch": 2.05, "learning_rate": 6.89317639813421e-05, "loss": 1.4121, "step": 25993 }, { "epoch": 2.05, "learning_rate": 6.892136512532396e-05, "loss": 1.425, "step": 25994 }, { "epoch": 2.05, "learning_rate": 6.891096681978507e-05, "loss": 1.3908, "step": 25995 }, { "epoch": 2.05, "learning_rate": 6.890056906479596e-05, "loss": 1.4114, "step": 25996 }, { "epoch": 2.05, "learning_rate": 6.889017186042717e-05, "loss": 1.4256, "step": 25997 }, { "epoch": 2.05, "learning_rate": 6.887977520674941e-05, "loss": 1.4239, "step": 25998 }, { "epoch": 2.05, "learning_rate": 6.886937910383323e-05, "loss": 1.4334, "step": 25999 }, { "epoch": 2.05, "learning_rate": 6.885898355174917e-05, "loss": 1.5033, "step": 26000 }, { "epoch": 2.05, "learning_rate": 6.884858855056777e-05, "loss": 1.454, "step": 26001 }, { "epoch": 2.05, "learning_rate": 6.883819410035976e-05, "loss": 1.5267, "step": 26002 }, { "epoch": 2.05, "learning_rate": 6.882780020119554e-05, "loss": 1.5105, "step": 26003 }, { "epoch": 2.05, "learning_rate": 6.881740685314583e-05, "loss": 1.4872, "step": 26004 }, { "epoch": 2.05, "learning_rate": 6.880701405628108e-05, "loss": 1.4407, "step": 26005 }, { "epoch": 2.05, "learning_rate": 6.879662181067193e-05, "loss": 1.4771, "step": 26006 }, { "epoch": 2.05, "learning_rate": 6.878623011638893e-05, "loss": 1.4005, "step": 26007 }, { "epoch": 2.05, "learning_rate": 6.877583897350255e-05, "loss": 1.4257, "step": 26008 }, { "epoch": 2.05, "learning_rate": 6.876544838208344e-05, "loss": 1.4975, "step": 26009 }, { "epoch": 2.05, "learning_rate": 6.875505834220212e-05, "loss": 1.4794, "step": 26010 }, { "epoch": 2.05, "learning_rate": 6.874466885392907e-05, "loss": 1.4662, "step": 26011 }, { "epoch": 2.05, "learning_rate": 6.873427991733493e-05, "loss": 1.5118, "step": 26012 }, { "epoch": 2.05, "learning_rate": 6.872389153249017e-05, "loss": 1.4034, "step": 26013 }, { "epoch": 2.05, "learning_rate": 6.87135036994653e-05, "loss": 1.5283, "step": 26014 }, { "epoch": 2.05, "learning_rate": 6.870311641833092e-05, "loss": 1.4087, "step": 26015 }, { "epoch": 2.05, "learning_rate": 6.869272968915751e-05, "loss": 1.4688, "step": 26016 }, { "epoch": 2.05, "learning_rate": 6.868234351201562e-05, "loss": 1.4331, "step": 26017 }, { "epoch": 2.05, "learning_rate": 6.86719578869756e-05, "loss": 1.4642, "step": 26018 }, { "epoch": 2.05, "learning_rate": 6.866157281410825e-05, "loss": 1.465, "step": 26019 }, { "epoch": 2.05, "learning_rate": 6.865118829348392e-05, "loss": 1.445, "step": 26020 }, { "epoch": 2.05, "learning_rate": 6.864080432517312e-05, "loss": 1.4197, "step": 26021 }, { "epoch": 2.05, "learning_rate": 6.863042090924633e-05, "loss": 1.4199, "step": 26022 }, { "epoch": 2.05, "learning_rate": 6.862003804577411e-05, "loss": 1.5118, "step": 26023 }, { "epoch": 2.05, "learning_rate": 6.860965573482693e-05, "loss": 1.4164, "step": 26024 }, { "epoch": 2.05, "learning_rate": 6.859927397647521e-05, "loss": 1.4334, "step": 26025 }, { "epoch": 2.05, "learning_rate": 6.858889277078959e-05, "loss": 1.4825, "step": 26026 }, { "epoch": 2.05, "learning_rate": 6.857851211784042e-05, "loss": 1.4575, "step": 26027 }, { "epoch": 2.05, "learning_rate": 6.856813201769818e-05, "loss": 1.4577, "step": 26028 }, { "epoch": 2.05, "learning_rate": 6.855775247043344e-05, "loss": 1.4431, "step": 26029 }, { "epoch": 2.05, "learning_rate": 6.854737347611662e-05, "loss": 1.434, "step": 26030 }, { "epoch": 2.05, "learning_rate": 6.853699503481813e-05, "loss": 1.481, "step": 26031 }, { "epoch": 2.05, "learning_rate": 6.852661714660854e-05, "loss": 1.4533, "step": 26032 }, { "epoch": 2.05, "learning_rate": 6.851623981155826e-05, "loss": 1.4426, "step": 26033 }, { "epoch": 2.05, "learning_rate": 6.85058630297377e-05, "loss": 1.4354, "step": 26034 }, { "epoch": 2.05, "learning_rate": 6.849548680121735e-05, "loss": 1.4805, "step": 26035 }, { "epoch": 2.05, "learning_rate": 6.84851111260677e-05, "loss": 1.4352, "step": 26036 }, { "epoch": 2.05, "learning_rate": 6.847473600435919e-05, "loss": 1.4807, "step": 26037 }, { "epoch": 2.05, "learning_rate": 6.846436143616217e-05, "loss": 1.45, "step": 26038 }, { "epoch": 2.05, "learning_rate": 6.84539874215472e-05, "loss": 1.4742, "step": 26039 }, { "epoch": 2.05, "learning_rate": 6.844361396058466e-05, "loss": 1.4455, "step": 26040 }, { "epoch": 2.05, "learning_rate": 6.843324105334496e-05, "loss": 1.4964, "step": 26041 }, { "epoch": 2.05, "learning_rate": 6.84228686998985e-05, "loss": 1.4335, "step": 26042 }, { "epoch": 2.05, "learning_rate": 6.841249690031578e-05, "loss": 1.4314, "step": 26043 }, { "epoch": 2.05, "learning_rate": 6.840212565466719e-05, "loss": 1.4899, "step": 26044 }, { "epoch": 2.05, "learning_rate": 6.839175496302309e-05, "loss": 1.3959, "step": 26045 }, { "epoch": 2.05, "learning_rate": 6.838138482545398e-05, "loss": 1.4787, "step": 26046 }, { "epoch": 2.05, "learning_rate": 6.837101524203024e-05, "loss": 1.4529, "step": 26047 }, { "epoch": 2.05, "learning_rate": 6.83606462128222e-05, "loss": 1.4482, "step": 26048 }, { "epoch": 2.05, "learning_rate": 6.835027773790037e-05, "loss": 1.4884, "step": 26049 }, { "epoch": 2.05, "learning_rate": 6.833990981733506e-05, "loss": 1.4727, "step": 26050 }, { "epoch": 2.05, "learning_rate": 6.832954245119673e-05, "loss": 1.5095, "step": 26051 }, { "epoch": 2.05, "learning_rate": 6.83191756395557e-05, "loss": 1.4839, "step": 26052 }, { "epoch": 2.05, "learning_rate": 6.830880938248243e-05, "loss": 1.4489, "step": 26053 }, { "epoch": 2.05, "learning_rate": 6.829844368004727e-05, "loss": 1.4929, "step": 26054 }, { "epoch": 2.05, "learning_rate": 6.828807853232053e-05, "loss": 1.4136, "step": 26055 }, { "epoch": 2.05, "learning_rate": 6.827771393937272e-05, "loss": 1.4893, "step": 26056 }, { "epoch": 2.05, "learning_rate": 6.826734990127412e-05, "loss": 1.4335, "step": 26057 }, { "epoch": 2.05, "learning_rate": 6.825698641809512e-05, "loss": 1.4317, "step": 26058 }, { "epoch": 2.05, "learning_rate": 6.8246623489906e-05, "loss": 1.4726, "step": 26059 }, { "epoch": 2.05, "learning_rate": 6.823626111677726e-05, "loss": 1.4438, "step": 26060 }, { "epoch": 2.05, "learning_rate": 6.822589929877918e-05, "loss": 1.3829, "step": 26061 }, { "epoch": 2.05, "learning_rate": 6.821553803598206e-05, "loss": 1.431, "step": 26062 }, { "epoch": 2.05, "learning_rate": 6.820517732845636e-05, "loss": 1.4387, "step": 26063 }, { "epoch": 2.05, "learning_rate": 6.819481717627237e-05, "loss": 1.4373, "step": 26064 }, { "epoch": 2.05, "learning_rate": 6.818445757950038e-05, "loss": 1.4464, "step": 26065 }, { "epoch": 2.05, "learning_rate": 6.817409853821077e-05, "loss": 1.4599, "step": 26066 }, { "epoch": 2.05, "learning_rate": 6.816374005247392e-05, "loss": 1.4456, "step": 26067 }, { "epoch": 2.05, "learning_rate": 6.815338212236012e-05, "loss": 1.5271, "step": 26068 }, { "epoch": 2.05, "learning_rate": 6.814302474793963e-05, "loss": 1.464, "step": 26069 }, { "epoch": 2.05, "learning_rate": 6.813266792928289e-05, "loss": 1.4442, "step": 26070 }, { "epoch": 2.05, "learning_rate": 6.812231166646017e-05, "loss": 1.4486, "step": 26071 }, { "epoch": 2.05, "learning_rate": 6.811195595954171e-05, "loss": 1.4726, "step": 26072 }, { "epoch": 2.05, "learning_rate": 6.810160080859792e-05, "loss": 1.4587, "step": 26073 }, { "epoch": 2.05, "learning_rate": 6.809124621369907e-05, "loss": 1.4483, "step": 26074 }, { "epoch": 2.05, "learning_rate": 6.808089217491545e-05, "loss": 1.4483, "step": 26075 }, { "epoch": 2.05, "learning_rate": 6.807053869231733e-05, "loss": 1.4724, "step": 26076 }, { "epoch": 2.05, "learning_rate": 6.806018576597508e-05, "loss": 1.4877, "step": 26077 }, { "epoch": 2.05, "learning_rate": 6.804983339595894e-05, "loss": 1.4642, "step": 26078 }, { "epoch": 2.05, "learning_rate": 6.803948158233918e-05, "loss": 1.4479, "step": 26079 }, { "epoch": 2.05, "learning_rate": 6.802913032518614e-05, "loss": 1.4311, "step": 26080 }, { "epoch": 2.05, "learning_rate": 6.801877962457003e-05, "loss": 1.4507, "step": 26081 }, { "epoch": 2.05, "learning_rate": 6.800842948056124e-05, "loss": 1.4733, "step": 26082 }, { "epoch": 2.05, "learning_rate": 6.799807989322988e-05, "loss": 1.3995, "step": 26083 }, { "epoch": 2.05, "learning_rate": 6.798773086264636e-05, "loss": 1.4876, "step": 26084 }, { "epoch": 2.05, "learning_rate": 6.797738238888091e-05, "loss": 1.4281, "step": 26085 }, { "epoch": 2.05, "learning_rate": 6.79670344720037e-05, "loss": 1.4656, "step": 26086 }, { "epoch": 2.05, "learning_rate": 6.795668711208512e-05, "loss": 1.4713, "step": 26087 }, { "epoch": 2.05, "learning_rate": 6.794634030919535e-05, "loss": 1.4225, "step": 26088 }, { "epoch": 2.05, "learning_rate": 6.79359940634046e-05, "loss": 1.4483, "step": 26089 }, { "epoch": 2.05, "learning_rate": 6.792564837478322e-05, "loss": 1.4473, "step": 26090 }, { "epoch": 2.05, "learning_rate": 6.791530324340138e-05, "loss": 1.4795, "step": 26091 }, { "epoch": 2.05, "learning_rate": 6.790495866932935e-05, "loss": 1.4913, "step": 26092 }, { "epoch": 2.05, "learning_rate": 6.78946146526373e-05, "loss": 1.4513, "step": 26093 }, { "epoch": 2.05, "learning_rate": 6.788427119339553e-05, "loss": 1.4874, "step": 26094 }, { "epoch": 2.05, "learning_rate": 6.787392829167426e-05, "loss": 1.4595, "step": 26095 }, { "epoch": 2.05, "learning_rate": 6.786358594754366e-05, "loss": 1.4364, "step": 26096 }, { "epoch": 2.05, "learning_rate": 6.785324416107396e-05, "loss": 1.4727, "step": 26097 }, { "epoch": 2.05, "learning_rate": 6.784290293233546e-05, "loss": 1.4071, "step": 26098 }, { "epoch": 2.05, "learning_rate": 6.783256226139833e-05, "loss": 1.4427, "step": 26099 }, { "epoch": 2.05, "learning_rate": 6.782222214833268e-05, "loss": 1.4601, "step": 26100 }, { "epoch": 2.05, "learning_rate": 6.781188259320885e-05, "loss": 1.4354, "step": 26101 }, { "epoch": 2.05, "learning_rate": 6.780154359609698e-05, "loss": 1.4171, "step": 26102 }, { "epoch": 2.05, "learning_rate": 6.779120515706721e-05, "loss": 1.5357, "step": 26103 }, { "epoch": 2.05, "learning_rate": 6.778086727618987e-05, "loss": 1.4728, "step": 26104 }, { "epoch": 2.05, "learning_rate": 6.777052995353505e-05, "loss": 1.3899, "step": 26105 }, { "epoch": 2.05, "learning_rate": 6.77601931891729e-05, "loss": 1.502, "step": 26106 }, { "epoch": 2.05, "learning_rate": 6.77498569831737e-05, "loss": 1.4607, "step": 26107 }, { "epoch": 2.05, "learning_rate": 6.77395213356076e-05, "loss": 1.4252, "step": 26108 }, { "epoch": 2.05, "learning_rate": 6.77291862465447e-05, "loss": 1.4642, "step": 26109 }, { "epoch": 2.05, "learning_rate": 6.771885171605527e-05, "loss": 1.5097, "step": 26110 }, { "epoch": 2.05, "learning_rate": 6.770851774420944e-05, "loss": 1.4552, "step": 26111 }, { "epoch": 2.05, "learning_rate": 6.769818433107735e-05, "loss": 1.4503, "step": 26112 }, { "epoch": 2.05, "learning_rate": 6.768785147672907e-05, "loss": 1.4049, "step": 26113 }, { "epoch": 2.05, "learning_rate": 6.767751918123497e-05, "loss": 1.445, "step": 26114 }, { "epoch": 2.05, "learning_rate": 6.766718744466507e-05, "loss": 1.3894, "step": 26115 }, { "epoch": 2.05, "learning_rate": 6.765685626708954e-05, "loss": 1.4427, "step": 26116 }, { "epoch": 2.05, "learning_rate": 6.764652564857845e-05, "loss": 1.4671, "step": 26117 }, { "epoch": 2.05, "learning_rate": 6.763619558920208e-05, "loss": 1.4223, "step": 26118 }, { "epoch": 2.06, "learning_rate": 6.762586608903047e-05, "loss": 1.5214, "step": 26119 }, { "epoch": 2.06, "learning_rate": 6.761553714813373e-05, "loss": 1.5216, "step": 26120 }, { "epoch": 2.06, "learning_rate": 6.760520876658208e-05, "loss": 1.436, "step": 26121 }, { "epoch": 2.06, "learning_rate": 6.75948809444456e-05, "loss": 1.4839, "step": 26122 }, { "epoch": 2.06, "learning_rate": 6.758455368179434e-05, "loss": 1.4492, "step": 26123 }, { "epoch": 2.06, "learning_rate": 6.757422697869853e-05, "loss": 1.5067, "step": 26124 }, { "epoch": 2.06, "learning_rate": 6.756390083522823e-05, "loss": 1.4788, "step": 26125 }, { "epoch": 2.06, "learning_rate": 6.755357525145351e-05, "loss": 1.4685, "step": 26126 }, { "epoch": 2.06, "learning_rate": 6.754325022744457e-05, "loss": 1.4321, "step": 26127 }, { "epoch": 2.06, "learning_rate": 6.753292576327138e-05, "loss": 1.4808, "step": 26128 }, { "epoch": 2.06, "learning_rate": 6.75226018590042e-05, "loss": 1.4585, "step": 26129 }, { "epoch": 2.06, "learning_rate": 6.751227851471297e-05, "loss": 1.4671, "step": 26130 }, { "epoch": 2.06, "learning_rate": 6.750195573046791e-05, "loss": 1.447, "step": 26131 }, { "epoch": 2.06, "learning_rate": 6.749163350633903e-05, "loss": 1.417, "step": 26132 }, { "epoch": 2.06, "learning_rate": 6.748131184239646e-05, "loss": 1.492, "step": 26133 }, { "epoch": 2.06, "learning_rate": 6.747099073871015e-05, "loss": 1.4587, "step": 26134 }, { "epoch": 2.06, "learning_rate": 6.746067019535034e-05, "loss": 1.4703, "step": 26135 }, { "epoch": 2.06, "learning_rate": 6.745035021238703e-05, "loss": 1.4649, "step": 26136 }, { "epoch": 2.06, "learning_rate": 6.744003078989025e-05, "loss": 1.4378, "step": 26137 }, { "epoch": 2.06, "learning_rate": 6.742971192793014e-05, "loss": 1.4731, "step": 26138 }, { "epoch": 2.06, "learning_rate": 6.741939362657671e-05, "loss": 1.4417, "step": 26139 }, { "epoch": 2.06, "learning_rate": 6.740907588589997e-05, "loss": 1.4441, "step": 26140 }, { "epoch": 2.06, "learning_rate": 6.73987587059701e-05, "loss": 1.4364, "step": 26141 }, { "epoch": 2.06, "learning_rate": 6.738844208685707e-05, "loss": 1.5313, "step": 26142 }, { "epoch": 2.06, "learning_rate": 6.737812602863087e-05, "loss": 1.4421, "step": 26143 }, { "epoch": 2.06, "learning_rate": 6.736781053136161e-05, "loss": 1.4465, "step": 26144 }, { "epoch": 2.06, "learning_rate": 6.735749559511936e-05, "loss": 1.4235, "step": 26145 }, { "epoch": 2.06, "learning_rate": 6.734718121997412e-05, "loss": 1.4975, "step": 26146 }, { "epoch": 2.06, "learning_rate": 6.733686740599582e-05, "loss": 1.4948, "step": 26147 }, { "epoch": 2.06, "learning_rate": 6.732655415325467e-05, "loss": 1.4126, "step": 26148 }, { "epoch": 2.06, "learning_rate": 6.731624146182057e-05, "loss": 1.4249, "step": 26149 }, { "epoch": 2.06, "learning_rate": 6.730592933176351e-05, "loss": 1.4638, "step": 26150 }, { "epoch": 2.06, "learning_rate": 6.729561776315362e-05, "loss": 1.4253, "step": 26151 }, { "epoch": 2.06, "learning_rate": 6.728530675606085e-05, "loss": 1.414, "step": 26152 }, { "epoch": 2.06, "learning_rate": 6.727499631055518e-05, "loss": 1.454, "step": 26153 }, { "epoch": 2.06, "learning_rate": 6.72646864267066e-05, "loss": 1.4875, "step": 26154 }, { "epoch": 2.06, "learning_rate": 6.725437710458518e-05, "loss": 1.4821, "step": 26155 }, { "epoch": 2.06, "learning_rate": 6.724406834426088e-05, "loss": 1.5272, "step": 26156 }, { "epoch": 2.06, "learning_rate": 6.723376014580364e-05, "loss": 1.4288, "step": 26157 }, { "epoch": 2.06, "learning_rate": 6.722345250928355e-05, "loss": 1.4495, "step": 26158 }, { "epoch": 2.06, "learning_rate": 6.721314543477053e-05, "loss": 1.4774, "step": 26159 }, { "epoch": 2.06, "learning_rate": 6.720283892233451e-05, "loss": 1.4917, "step": 26160 }, { "epoch": 2.06, "learning_rate": 6.719253297204553e-05, "loss": 1.4018, "step": 26161 }, { "epoch": 2.06, "learning_rate": 6.718222758397361e-05, "loss": 1.4474, "step": 26162 }, { "epoch": 2.06, "learning_rate": 6.717192275818865e-05, "loss": 1.4464, "step": 26163 }, { "epoch": 2.06, "learning_rate": 6.716161849476059e-05, "loss": 1.4445, "step": 26164 }, { "epoch": 2.06, "learning_rate": 6.715131479375948e-05, "loss": 1.4748, "step": 26165 }, { "epoch": 2.06, "learning_rate": 6.71410116552552e-05, "loss": 1.4825, "step": 26166 }, { "epoch": 2.06, "learning_rate": 6.713070907931769e-05, "loss": 1.4654, "step": 26167 }, { "epoch": 2.06, "learning_rate": 6.712040706601697e-05, "loss": 1.471, "step": 26168 }, { "epoch": 2.06, "learning_rate": 6.711010561542297e-05, "loss": 1.4617, "step": 26169 }, { "epoch": 2.06, "learning_rate": 6.709980472760561e-05, "loss": 1.45, "step": 26170 }, { "epoch": 2.06, "learning_rate": 6.708950440263477e-05, "loss": 1.4413, "step": 26171 }, { "epoch": 2.06, "learning_rate": 6.70792046405805e-05, "loss": 1.4353, "step": 26172 }, { "epoch": 2.06, "learning_rate": 6.706890544151265e-05, "loss": 1.4654, "step": 26173 }, { "epoch": 2.06, "learning_rate": 6.705860680550112e-05, "loss": 1.5221, "step": 26174 }, { "epoch": 2.06, "learning_rate": 6.70483087326159e-05, "loss": 1.409, "step": 26175 }, { "epoch": 2.06, "learning_rate": 6.703801122292692e-05, "loss": 1.4428, "step": 26176 }, { "epoch": 2.06, "learning_rate": 6.702771427650407e-05, "loss": 1.4111, "step": 26177 }, { "epoch": 2.06, "learning_rate": 6.701741789341719e-05, "loss": 1.4423, "step": 26178 }, { "epoch": 2.06, "learning_rate": 6.700712207373631e-05, "loss": 1.4449, "step": 26179 }, { "epoch": 2.06, "learning_rate": 6.699682681753128e-05, "loss": 1.4889, "step": 26180 }, { "epoch": 2.06, "learning_rate": 6.698653212487192e-05, "loss": 1.4898, "step": 26181 }, { "epoch": 2.06, "learning_rate": 6.697623799582826e-05, "loss": 1.4684, "step": 26182 }, { "epoch": 2.06, "learning_rate": 6.696594443047013e-05, "loss": 1.4335, "step": 26183 }, { "epoch": 2.06, "learning_rate": 6.695565142886735e-05, "loss": 1.4338, "step": 26184 }, { "epoch": 2.06, "learning_rate": 6.694535899108994e-05, "loss": 1.4769, "step": 26185 }, { "epoch": 2.06, "learning_rate": 6.693506711720769e-05, "loss": 1.4645, "step": 26186 }, { "epoch": 2.06, "learning_rate": 6.69247758072905e-05, "loss": 1.4445, "step": 26187 }, { "epoch": 2.06, "learning_rate": 6.69144850614082e-05, "loss": 1.4205, "step": 26188 }, { "epoch": 2.06, "learning_rate": 6.690419487963072e-05, "loss": 1.4481, "step": 26189 }, { "epoch": 2.06, "learning_rate": 6.689390526202793e-05, "loss": 1.5238, "step": 26190 }, { "epoch": 2.06, "learning_rate": 6.68836162086696e-05, "loss": 1.425, "step": 26191 }, { "epoch": 2.06, "learning_rate": 6.687332771962564e-05, "loss": 1.473, "step": 26192 }, { "epoch": 2.06, "learning_rate": 6.686303979496596e-05, "loss": 1.4709, "step": 26193 }, { "epoch": 2.06, "learning_rate": 6.685275243476039e-05, "loss": 1.4425, "step": 26194 }, { "epoch": 2.06, "learning_rate": 6.684246563907867e-05, "loss": 1.5366, "step": 26195 }, { "epoch": 2.06, "learning_rate": 6.683217940799077e-05, "loss": 1.4849, "step": 26196 }, { "epoch": 2.06, "learning_rate": 6.682189374156649e-05, "loss": 1.4908, "step": 26197 }, { "epoch": 2.06, "learning_rate": 6.681160863987558e-05, "loss": 1.4614, "step": 26198 }, { "epoch": 2.06, "learning_rate": 6.680132410298802e-05, "loss": 1.4566, "step": 26199 }, { "epoch": 2.06, "learning_rate": 6.679104013097353e-05, "loss": 1.4538, "step": 26200 }, { "epoch": 2.06, "learning_rate": 6.67807567239019e-05, "loss": 1.4207, "step": 26201 }, { "epoch": 2.06, "learning_rate": 6.677047388184308e-05, "loss": 1.4318, "step": 26202 }, { "epoch": 2.06, "learning_rate": 6.676019160486682e-05, "loss": 1.4274, "step": 26203 }, { "epoch": 2.06, "learning_rate": 6.674990989304286e-05, "loss": 1.4927, "step": 26204 }, { "epoch": 2.06, "learning_rate": 6.673962874644113e-05, "loss": 1.4643, "step": 26205 }, { "epoch": 2.06, "learning_rate": 6.672934816513136e-05, "loss": 1.428, "step": 26206 }, { "epoch": 2.06, "learning_rate": 6.671906814918331e-05, "loss": 1.4009, "step": 26207 }, { "epoch": 2.06, "learning_rate": 6.670878869866684e-05, "loss": 1.4459, "step": 26208 }, { "epoch": 2.06, "learning_rate": 6.669850981365177e-05, "loss": 1.4608, "step": 26209 }, { "epoch": 2.06, "learning_rate": 6.668823149420787e-05, "loss": 1.5082, "step": 26210 }, { "epoch": 2.06, "learning_rate": 6.667795374040489e-05, "loss": 1.4515, "step": 26211 }, { "epoch": 2.06, "learning_rate": 6.666767655231256e-05, "loss": 1.4693, "step": 26212 }, { "epoch": 2.06, "learning_rate": 6.665739993000079e-05, "loss": 1.5056, "step": 26213 }, { "epoch": 2.06, "learning_rate": 6.664712387353928e-05, "loss": 1.5139, "step": 26214 }, { "epoch": 2.06, "learning_rate": 6.663684838299774e-05, "loss": 1.4591, "step": 26215 }, { "epoch": 2.06, "learning_rate": 6.662657345844605e-05, "loss": 1.491, "step": 26216 }, { "epoch": 2.06, "learning_rate": 6.661629909995392e-05, "loss": 1.4686, "step": 26217 }, { "epoch": 2.06, "learning_rate": 6.660602530759104e-05, "loss": 1.4659, "step": 26218 }, { "epoch": 2.06, "learning_rate": 6.659575208142731e-05, "loss": 1.4763, "step": 26219 }, { "epoch": 2.06, "learning_rate": 6.658547942153238e-05, "loss": 1.4842, "step": 26220 }, { "epoch": 2.06, "learning_rate": 6.657520732797596e-05, "loss": 1.4521, "step": 26221 }, { "epoch": 2.06, "learning_rate": 6.65649358008279e-05, "loss": 1.4726, "step": 26222 }, { "epoch": 2.06, "learning_rate": 6.655466484015781e-05, "loss": 1.4544, "step": 26223 }, { "epoch": 2.06, "learning_rate": 6.654439444603557e-05, "loss": 1.4395, "step": 26224 }, { "epoch": 2.06, "learning_rate": 6.653412461853078e-05, "loss": 1.4826, "step": 26225 }, { "epoch": 2.06, "learning_rate": 6.652385535771327e-05, "loss": 1.4637, "step": 26226 }, { "epoch": 2.06, "learning_rate": 6.651358666365273e-05, "loss": 1.4196, "step": 26227 }, { "epoch": 2.06, "learning_rate": 6.650331853641886e-05, "loss": 1.5012, "step": 26228 }, { "epoch": 2.06, "learning_rate": 6.649305097608132e-05, "loss": 1.4882, "step": 26229 }, { "epoch": 2.06, "learning_rate": 6.648278398270995e-05, "loss": 1.4164, "step": 26230 }, { "epoch": 2.06, "learning_rate": 6.647251755637437e-05, "loss": 1.4827, "step": 26231 }, { "epoch": 2.06, "learning_rate": 6.646225169714426e-05, "loss": 1.465, "step": 26232 }, { "epoch": 2.06, "learning_rate": 6.645198640508941e-05, "loss": 1.4334, "step": 26233 }, { "epoch": 2.06, "learning_rate": 6.644172168027947e-05, "loss": 1.4291, "step": 26234 }, { "epoch": 2.06, "learning_rate": 6.643145752278405e-05, "loss": 1.4243, "step": 26235 }, { "epoch": 2.06, "learning_rate": 6.6421193932673e-05, "loss": 1.4189, "step": 26236 }, { "epoch": 2.06, "learning_rate": 6.641093091001591e-05, "loss": 1.4842, "step": 26237 }, { "epoch": 2.06, "learning_rate": 6.640066845488242e-05, "loss": 1.4914, "step": 26238 }, { "epoch": 2.06, "learning_rate": 6.639040656734226e-05, "loss": 1.4629, "step": 26239 }, { "epoch": 2.06, "learning_rate": 6.638014524746515e-05, "loss": 1.4438, "step": 26240 }, { "epoch": 2.06, "learning_rate": 6.636988449532071e-05, "loss": 1.4472, "step": 26241 }, { "epoch": 2.06, "learning_rate": 6.635962431097853e-05, "loss": 1.4722, "step": 26242 }, { "epoch": 2.06, "learning_rate": 6.634936469450844e-05, "loss": 1.4336, "step": 26243 }, { "epoch": 2.06, "learning_rate": 6.633910564597998e-05, "loss": 1.4574, "step": 26244 }, { "epoch": 2.06, "learning_rate": 6.632884716546281e-05, "loss": 1.5092, "step": 26245 }, { "epoch": 2.07, "learning_rate": 6.631858925302654e-05, "loss": 1.4867, "step": 26246 }, { "epoch": 2.07, "learning_rate": 6.630833190874095e-05, "loss": 1.4241, "step": 26247 }, { "epoch": 2.07, "learning_rate": 6.629807513267559e-05, "loss": 1.4798, "step": 26248 }, { "epoch": 2.07, "learning_rate": 6.628781892490004e-05, "loss": 1.4446, "step": 26249 }, { "epoch": 2.07, "learning_rate": 6.627756328548408e-05, "loss": 1.4529, "step": 26250 }, { "epoch": 2.07, "learning_rate": 6.626730821449724e-05, "loss": 1.4349, "step": 26251 }, { "epoch": 2.07, "learning_rate": 6.625705371200915e-05, "loss": 1.452, "step": 26252 }, { "epoch": 2.07, "learning_rate": 6.624679977808947e-05, "loss": 1.4674, "step": 26253 }, { "epoch": 2.07, "learning_rate": 6.623654641280776e-05, "loss": 1.4313, "step": 26254 }, { "epoch": 2.07, "learning_rate": 6.622629361623374e-05, "loss": 1.448, "step": 26255 }, { "epoch": 2.07, "learning_rate": 6.62160413884369e-05, "loss": 1.4419, "step": 26256 }, { "epoch": 2.07, "learning_rate": 6.620578972948693e-05, "loss": 1.4573, "step": 26257 }, { "epoch": 2.07, "learning_rate": 6.619553863945343e-05, "loss": 1.4198, "step": 26258 }, { "epoch": 2.07, "learning_rate": 6.618528811840593e-05, "loss": 1.4476, "step": 26259 }, { "epoch": 2.07, "learning_rate": 6.617503816641412e-05, "loss": 1.4392, "step": 26260 }, { "epoch": 2.07, "learning_rate": 6.616478878354752e-05, "loss": 1.4694, "step": 26261 }, { "epoch": 2.07, "learning_rate": 6.615453996987571e-05, "loss": 1.5072, "step": 26262 }, { "epoch": 2.07, "learning_rate": 6.614429172546835e-05, "loss": 1.4231, "step": 26263 }, { "epoch": 2.07, "learning_rate": 6.613404405039498e-05, "loss": 1.4627, "step": 26264 }, { "epoch": 2.07, "learning_rate": 6.612379694472515e-05, "loss": 1.438, "step": 26265 }, { "epoch": 2.07, "learning_rate": 6.611355040852842e-05, "loss": 1.4924, "step": 26266 }, { "epoch": 2.07, "learning_rate": 6.610330444187443e-05, "loss": 1.4191, "step": 26267 }, { "epoch": 2.07, "learning_rate": 6.609305904483272e-05, "loss": 1.4644, "step": 26268 }, { "epoch": 2.07, "learning_rate": 6.608281421747276e-05, "loss": 1.4805, "step": 26269 }, { "epoch": 2.07, "learning_rate": 6.607256995986419e-05, "loss": 1.4664, "step": 26270 }, { "epoch": 2.07, "learning_rate": 6.606232627207664e-05, "loss": 1.4964, "step": 26271 }, { "epoch": 2.07, "learning_rate": 6.605208315417953e-05, "loss": 1.4618, "step": 26272 }, { "epoch": 2.07, "learning_rate": 6.604184060624242e-05, "loss": 1.5477, "step": 26273 }, { "epoch": 2.07, "learning_rate": 6.603159862833492e-05, "loss": 1.4063, "step": 26274 }, { "epoch": 2.07, "learning_rate": 6.602135722052654e-05, "loss": 1.4427, "step": 26275 }, { "epoch": 2.07, "learning_rate": 6.601111638288674e-05, "loss": 1.4569, "step": 26276 }, { "epoch": 2.07, "learning_rate": 6.600087611548516e-05, "loss": 1.4253, "step": 26277 }, { "epoch": 2.07, "learning_rate": 6.599063641839129e-05, "loss": 1.4607, "step": 26278 }, { "epoch": 2.07, "learning_rate": 6.598039729167456e-05, "loss": 1.4602, "step": 26279 }, { "epoch": 2.07, "learning_rate": 6.597015873540464e-05, "loss": 1.4851, "step": 26280 }, { "epoch": 2.07, "learning_rate": 6.595992074965097e-05, "loss": 1.4738, "step": 26281 }, { "epoch": 2.07, "learning_rate": 6.594968333448306e-05, "loss": 1.4157, "step": 26282 }, { "epoch": 2.07, "learning_rate": 6.593944648997037e-05, "loss": 1.4798, "step": 26283 }, { "epoch": 2.07, "learning_rate": 6.59292102161825e-05, "loss": 1.4843, "step": 26284 }, { "epoch": 2.07, "learning_rate": 6.591897451318884e-05, "loss": 1.4617, "step": 26285 }, { "epoch": 2.07, "learning_rate": 6.590873938105899e-05, "loss": 1.4734, "step": 26286 }, { "epoch": 2.07, "learning_rate": 6.589850481986236e-05, "loss": 1.4679, "step": 26287 }, { "epoch": 2.07, "learning_rate": 6.588827082966851e-05, "loss": 1.484, "step": 26288 }, { "epoch": 2.07, "learning_rate": 6.587803741054689e-05, "loss": 1.428, "step": 26289 }, { "epoch": 2.07, "learning_rate": 6.586780456256692e-05, "loss": 1.3617, "step": 26290 }, { "epoch": 2.07, "learning_rate": 6.585757228579818e-05, "loss": 1.4651, "step": 26291 }, { "epoch": 2.07, "learning_rate": 6.584734058031008e-05, "loss": 1.4827, "step": 26292 }, { "epoch": 2.07, "learning_rate": 6.583710944617206e-05, "loss": 1.444, "step": 26293 }, { "epoch": 2.07, "learning_rate": 6.582687888345367e-05, "loss": 1.466, "step": 26294 }, { "epoch": 2.07, "learning_rate": 6.581664889222433e-05, "loss": 1.4992, "step": 26295 }, { "epoch": 2.07, "learning_rate": 6.580641947255343e-05, "loss": 1.4335, "step": 26296 }, { "epoch": 2.07, "learning_rate": 6.579619062451053e-05, "loss": 1.5327, "step": 26297 }, { "epoch": 2.07, "learning_rate": 6.578596234816503e-05, "loss": 1.4818, "step": 26298 }, { "epoch": 2.07, "learning_rate": 6.577573464358637e-05, "loss": 1.4427, "step": 26299 }, { "epoch": 2.07, "learning_rate": 6.576550751084394e-05, "loss": 1.4502, "step": 26300 }, { "epoch": 2.07, "learning_rate": 6.575528095000723e-05, "loss": 1.4387, "step": 26301 }, { "epoch": 2.07, "learning_rate": 6.574505496114573e-05, "loss": 1.4641, "step": 26302 }, { "epoch": 2.07, "learning_rate": 6.573482954432875e-05, "loss": 1.4392, "step": 26303 }, { "epoch": 2.07, "learning_rate": 6.572460469962583e-05, "loss": 1.4815, "step": 26304 }, { "epoch": 2.07, "learning_rate": 6.571438042710635e-05, "loss": 1.4311, "step": 26305 }, { "epoch": 2.07, "learning_rate": 6.57041567268397e-05, "loss": 1.4725, "step": 26306 }, { "epoch": 2.07, "learning_rate": 6.569393359889526e-05, "loss": 1.4688, "step": 26307 }, { "epoch": 2.07, "learning_rate": 6.568371104334255e-05, "loss": 1.4743, "step": 26308 }, { "epoch": 2.07, "learning_rate": 6.567348906025091e-05, "loss": 1.488, "step": 26309 }, { "epoch": 2.07, "learning_rate": 6.566326764968967e-05, "loss": 1.5141, "step": 26310 }, { "epoch": 2.07, "learning_rate": 6.565304681172837e-05, "loss": 1.4263, "step": 26311 }, { "epoch": 2.07, "learning_rate": 6.564282654643634e-05, "loss": 1.4483, "step": 26312 }, { "epoch": 2.07, "learning_rate": 6.56326068538829e-05, "loss": 1.4142, "step": 26313 }, { "epoch": 2.07, "learning_rate": 6.562238773413755e-05, "loss": 1.4498, "step": 26314 }, { "epoch": 2.07, "learning_rate": 6.561216918726963e-05, "loss": 1.4325, "step": 26315 }, { "epoch": 2.07, "learning_rate": 6.560195121334847e-05, "loss": 1.5254, "step": 26316 }, { "epoch": 2.07, "learning_rate": 6.559173381244348e-05, "loss": 1.4379, "step": 26317 }, { "epoch": 2.07, "learning_rate": 6.55815169846241e-05, "loss": 1.513, "step": 26318 }, { "epoch": 2.07, "learning_rate": 6.557130072995962e-05, "loss": 1.4636, "step": 26319 }, { "epoch": 2.07, "learning_rate": 6.556108504851937e-05, "loss": 1.4356, "step": 26320 }, { "epoch": 2.07, "learning_rate": 6.555086994037281e-05, "loss": 1.4513, "step": 26321 }, { "epoch": 2.07, "learning_rate": 6.554065540558924e-05, "loss": 1.4132, "step": 26322 }, { "epoch": 2.07, "learning_rate": 6.553044144423801e-05, "loss": 1.4608, "step": 26323 }, { "epoch": 2.07, "learning_rate": 6.55202280563884e-05, "loss": 1.4391, "step": 26324 }, { "epoch": 2.07, "learning_rate": 6.551001524210988e-05, "loss": 1.4326, "step": 26325 }, { "epoch": 2.07, "learning_rate": 6.549980300147176e-05, "loss": 1.418, "step": 26326 }, { "epoch": 2.07, "learning_rate": 6.548959133454324e-05, "loss": 1.4353, "step": 26327 }, { "epoch": 2.07, "learning_rate": 6.547938024139386e-05, "loss": 1.4798, "step": 26328 }, { "epoch": 2.07, "learning_rate": 6.546916972209283e-05, "loss": 1.4385, "step": 26329 }, { "epoch": 2.07, "learning_rate": 6.545895977670944e-05, "loss": 1.4806, "step": 26330 }, { "epoch": 2.07, "learning_rate": 6.544875040531311e-05, "loss": 1.4543, "step": 26331 }, { "epoch": 2.07, "learning_rate": 6.54385416079731e-05, "loss": 1.4314, "step": 26332 }, { "epoch": 2.07, "learning_rate": 6.542833338475868e-05, "loss": 1.4503, "step": 26333 }, { "epoch": 2.07, "learning_rate": 6.54181257357392e-05, "loss": 1.3937, "step": 26334 }, { "epoch": 2.07, "learning_rate": 6.540791866098403e-05, "loss": 1.4807, "step": 26335 }, { "epoch": 2.07, "learning_rate": 6.53977121605624e-05, "loss": 1.4547, "step": 26336 }, { "epoch": 2.07, "learning_rate": 6.538750623454359e-05, "loss": 1.4607, "step": 26337 }, { "epoch": 2.07, "learning_rate": 6.537730088299694e-05, "loss": 1.4644, "step": 26338 }, { "epoch": 2.07, "learning_rate": 6.536709610599174e-05, "loss": 1.4869, "step": 26339 }, { "epoch": 2.07, "learning_rate": 6.535689190359724e-05, "loss": 1.507, "step": 26340 }, { "epoch": 2.07, "learning_rate": 6.534668827588268e-05, "loss": 1.4947, "step": 26341 }, { "epoch": 2.07, "learning_rate": 6.533648522291747e-05, "loss": 1.4844, "step": 26342 }, { "epoch": 2.07, "learning_rate": 6.532628274477078e-05, "loss": 1.4696, "step": 26343 }, { "epoch": 2.07, "learning_rate": 6.531608084151185e-05, "loss": 1.4212, "step": 26344 }, { "epoch": 2.07, "learning_rate": 6.530587951321006e-05, "loss": 1.4211, "step": 26345 }, { "epoch": 2.07, "learning_rate": 6.52956787599346e-05, "loss": 1.4767, "step": 26346 }, { "epoch": 2.07, "learning_rate": 6.52854785817547e-05, "loss": 1.4824, "step": 26347 }, { "epoch": 2.07, "learning_rate": 6.527527897873965e-05, "loss": 1.4427, "step": 26348 }, { "epoch": 2.07, "learning_rate": 6.526507995095874e-05, "loss": 1.4708, "step": 26349 }, { "epoch": 2.07, "learning_rate": 6.525488149848117e-05, "loss": 1.4509, "step": 26350 }, { "epoch": 2.07, "learning_rate": 6.524468362137616e-05, "loss": 1.4819, "step": 26351 }, { "epoch": 2.07, "learning_rate": 6.523448631971301e-05, "loss": 1.4269, "step": 26352 }, { "epoch": 2.07, "learning_rate": 6.522428959356093e-05, "loss": 1.4352, "step": 26353 }, { "epoch": 2.07, "learning_rate": 6.521409344298908e-05, "loss": 1.4302, "step": 26354 }, { "epoch": 2.07, "learning_rate": 6.520389786806681e-05, "loss": 1.4406, "step": 26355 }, { "epoch": 2.07, "learning_rate": 6.519370286886327e-05, "loss": 1.4412, "step": 26356 }, { "epoch": 2.07, "learning_rate": 6.518350844544771e-05, "loss": 1.4365, "step": 26357 }, { "epoch": 2.07, "learning_rate": 6.517331459788924e-05, "loss": 1.4405, "step": 26358 }, { "epoch": 2.07, "learning_rate": 6.516312132625723e-05, "loss": 1.4117, "step": 26359 }, { "epoch": 2.07, "learning_rate": 6.51529286306208e-05, "loss": 1.4446, "step": 26360 }, { "epoch": 2.07, "learning_rate": 6.51427365110491e-05, "loss": 1.4802, "step": 26361 }, { "epoch": 2.07, "learning_rate": 6.513254496761143e-05, "loss": 1.4551, "step": 26362 }, { "epoch": 2.07, "learning_rate": 6.512235400037698e-05, "loss": 1.4239, "step": 26363 }, { "epoch": 2.07, "learning_rate": 6.511216360941483e-05, "loss": 1.4168, "step": 26364 }, { "epoch": 2.07, "learning_rate": 6.510197379479426e-05, "loss": 1.5528, "step": 26365 }, { "epoch": 2.07, "learning_rate": 6.509178455658447e-05, "loss": 1.4603, "step": 26366 }, { "epoch": 2.07, "learning_rate": 6.508159589485464e-05, "loss": 1.4949, "step": 26367 }, { "epoch": 2.07, "learning_rate": 6.507140780967382e-05, "loss": 1.5011, "step": 26368 }, { "epoch": 2.07, "learning_rate": 6.506122030111134e-05, "loss": 1.4695, "step": 26369 }, { "epoch": 2.07, "learning_rate": 6.505103336923633e-05, "loss": 1.4851, "step": 26370 }, { "epoch": 2.07, "learning_rate": 6.504084701411783e-05, "loss": 1.4252, "step": 26371 }, { "epoch": 2.07, "learning_rate": 6.503066123582517e-05, "loss": 1.4571, "step": 26372 }, { "epoch": 2.08, "learning_rate": 6.502047603442744e-05, "loss": 1.459, "step": 26373 }, { "epoch": 2.08, "learning_rate": 6.501029140999371e-05, "loss": 1.4432, "step": 26374 }, { "epoch": 2.08, "learning_rate": 6.500010736259326e-05, "loss": 1.521, "step": 26375 }, { "epoch": 2.08, "learning_rate": 6.498992389229517e-05, "loss": 1.3807, "step": 26376 }, { "epoch": 2.08, "learning_rate": 6.497974099916859e-05, "loss": 1.4451, "step": 26377 }, { "epoch": 2.08, "learning_rate": 6.49695586832826e-05, "loss": 1.4208, "step": 26378 }, { "epoch": 2.08, "learning_rate": 6.495937694470643e-05, "loss": 1.4882, "step": 26379 }, { "epoch": 2.08, "learning_rate": 6.49491957835091e-05, "loss": 1.4626, "step": 26380 }, { "epoch": 2.08, "learning_rate": 6.493901519975986e-05, "loss": 1.4922, "step": 26381 }, { "epoch": 2.08, "learning_rate": 6.492883519352771e-05, "loss": 1.4815, "step": 26382 }, { "epoch": 2.08, "learning_rate": 6.491865576488187e-05, "loss": 1.431, "step": 26383 }, { "epoch": 2.08, "learning_rate": 6.490847691389142e-05, "loss": 1.4519, "step": 26384 }, { "epoch": 2.08, "learning_rate": 6.489829864062539e-05, "loss": 1.4798, "step": 26385 }, { "epoch": 2.08, "learning_rate": 6.4888120945153e-05, "loss": 1.4597, "step": 26386 }, { "epoch": 2.08, "learning_rate": 6.487794382754331e-05, "loss": 1.4675, "step": 26387 }, { "epoch": 2.08, "learning_rate": 6.486776728786535e-05, "loss": 1.477, "step": 26388 }, { "epoch": 2.08, "learning_rate": 6.485759132618832e-05, "loss": 1.4888, "step": 26389 }, { "epoch": 2.08, "learning_rate": 6.484741594258127e-05, "loss": 1.4635, "step": 26390 }, { "epoch": 2.08, "learning_rate": 6.483724113711322e-05, "loss": 1.4342, "step": 26391 }, { "epoch": 2.08, "learning_rate": 6.482706690985336e-05, "loss": 1.4566, "step": 26392 }, { "epoch": 2.08, "learning_rate": 6.481689326087069e-05, "loss": 1.4324, "step": 26393 }, { "epoch": 2.08, "learning_rate": 6.480672019023433e-05, "loss": 1.4642, "step": 26394 }, { "epoch": 2.08, "learning_rate": 6.479654769801327e-05, "loss": 1.502, "step": 26395 }, { "epoch": 2.08, "learning_rate": 6.478637578427662e-05, "loss": 1.4974, "step": 26396 }, { "epoch": 2.08, "learning_rate": 6.477620444909351e-05, "loss": 1.4181, "step": 26397 }, { "epoch": 2.08, "learning_rate": 6.476603369253296e-05, "loss": 1.4353, "step": 26398 }, { "epoch": 2.08, "learning_rate": 6.475586351466393e-05, "loss": 1.428, "step": 26399 }, { "epoch": 2.08, "learning_rate": 6.474569391555561e-05, "loss": 1.4565, "step": 26400 }, { "epoch": 2.08, "learning_rate": 6.473552489527699e-05, "loss": 1.4905, "step": 26401 }, { "epoch": 2.08, "learning_rate": 6.472535645389703e-05, "loss": 1.4462, "step": 26402 }, { "epoch": 2.08, "learning_rate": 6.471518859148491e-05, "loss": 1.4283, "step": 26403 }, { "epoch": 2.08, "learning_rate": 6.470502130810959e-05, "loss": 1.4279, "step": 26404 }, { "epoch": 2.08, "learning_rate": 6.469485460384005e-05, "loss": 1.4208, "step": 26405 }, { "epoch": 2.08, "learning_rate": 6.468468847874543e-05, "loss": 1.4453, "step": 26406 }, { "epoch": 2.08, "learning_rate": 6.467452293289468e-05, "loss": 1.4739, "step": 26407 }, { "epoch": 2.08, "learning_rate": 6.466435796635678e-05, "loss": 1.4396, "step": 26408 }, { "epoch": 2.08, "learning_rate": 6.465419357920087e-05, "loss": 1.499, "step": 26409 }, { "epoch": 2.08, "learning_rate": 6.464402977149588e-05, "loss": 1.5256, "step": 26410 }, { "epoch": 2.08, "learning_rate": 6.463386654331077e-05, "loss": 1.4427, "step": 26411 }, { "epoch": 2.08, "learning_rate": 6.462370389471459e-05, "loss": 1.4876, "step": 26412 }, { "epoch": 2.08, "learning_rate": 6.461354182577641e-05, "loss": 1.4515, "step": 26413 }, { "epoch": 2.08, "learning_rate": 6.460338033656516e-05, "loss": 1.4525, "step": 26414 }, { "epoch": 2.08, "learning_rate": 6.459321942714977e-05, "loss": 1.4731, "step": 26415 }, { "epoch": 2.08, "learning_rate": 6.458305909759936e-05, "loss": 1.4902, "step": 26416 }, { "epoch": 2.08, "learning_rate": 6.457289934798282e-05, "loss": 1.497, "step": 26417 }, { "epoch": 2.08, "learning_rate": 6.456274017836917e-05, "loss": 1.4594, "step": 26418 }, { "epoch": 2.08, "learning_rate": 6.45525815888273e-05, "loss": 1.4427, "step": 26419 }, { "epoch": 2.08, "learning_rate": 6.454242357942629e-05, "loss": 1.4492, "step": 26420 }, { "epoch": 2.08, "learning_rate": 6.453226615023508e-05, "loss": 1.4704, "step": 26421 }, { "epoch": 2.08, "learning_rate": 6.452210930132257e-05, "loss": 1.5112, "step": 26422 }, { "epoch": 2.08, "learning_rate": 6.451195303275782e-05, "loss": 1.4572, "step": 26423 }, { "epoch": 2.08, "learning_rate": 6.450179734460971e-05, "loss": 1.4572, "step": 26424 }, { "epoch": 2.08, "learning_rate": 6.449164223694718e-05, "loss": 1.4238, "step": 26425 }, { "epoch": 2.08, "learning_rate": 6.448148770983928e-05, "loss": 1.3934, "step": 26426 }, { "epoch": 2.08, "learning_rate": 6.44713337633548e-05, "loss": 1.484, "step": 26427 }, { "epoch": 2.08, "learning_rate": 6.446118039756283e-05, "loss": 1.402, "step": 26428 }, { "epoch": 2.08, "learning_rate": 6.445102761253218e-05, "loss": 1.4699, "step": 26429 }, { "epoch": 2.08, "learning_rate": 6.444087540833191e-05, "loss": 1.3887, "step": 26430 }, { "epoch": 2.08, "learning_rate": 6.443072378503088e-05, "loss": 1.4023, "step": 26431 }, { "epoch": 2.08, "learning_rate": 6.442057274269796e-05, "loss": 1.4503, "step": 26432 }, { "epoch": 2.08, "learning_rate": 6.441042228140218e-05, "loss": 1.4727, "step": 26433 }, { "epoch": 2.08, "learning_rate": 6.440027240121239e-05, "loss": 1.4256, "step": 26434 }, { "epoch": 2.08, "learning_rate": 6.439012310219752e-05, "loss": 1.3808, "step": 26435 }, { "epoch": 2.08, "learning_rate": 6.437997438442642e-05, "loss": 1.4906, "step": 26436 }, { "epoch": 2.08, "learning_rate": 6.436982624796808e-05, "loss": 1.4619, "step": 26437 }, { "epoch": 2.08, "learning_rate": 6.43596786928914e-05, "loss": 1.4347, "step": 26438 }, { "epoch": 2.08, "learning_rate": 6.434953171926517e-05, "loss": 1.4187, "step": 26439 }, { "epoch": 2.08, "learning_rate": 6.43393853271584e-05, "loss": 1.4466, "step": 26440 }, { "epoch": 2.08, "learning_rate": 6.432923951663993e-05, "loss": 1.4354, "step": 26441 }, { "epoch": 2.08, "learning_rate": 6.43190942877786e-05, "loss": 1.4687, "step": 26442 }, { "epoch": 2.08, "learning_rate": 6.430894964064332e-05, "loss": 1.4173, "step": 26443 }, { "epoch": 2.08, "learning_rate": 6.429880557530308e-05, "loss": 1.4328, "step": 26444 }, { "epoch": 2.08, "learning_rate": 6.428866209182663e-05, "loss": 1.4209, "step": 26445 }, { "epoch": 2.08, "learning_rate": 6.427851919028279e-05, "loss": 1.4644, "step": 26446 }, { "epoch": 2.08, "learning_rate": 6.426837687074058e-05, "loss": 1.4258, "step": 26447 }, { "epoch": 2.08, "learning_rate": 6.425823513326879e-05, "loss": 1.4416, "step": 26448 }, { "epoch": 2.08, "learning_rate": 6.424809397793618e-05, "loss": 1.4342, "step": 26449 }, { "epoch": 2.08, "learning_rate": 6.423795340481178e-05, "loss": 1.4207, "step": 26450 }, { "epoch": 2.08, "learning_rate": 6.422781341396432e-05, "loss": 1.3997, "step": 26451 }, { "epoch": 2.08, "learning_rate": 6.421767400546269e-05, "loss": 1.4456, "step": 26452 }, { "epoch": 2.08, "learning_rate": 6.420753517937566e-05, "loss": 1.4468, "step": 26453 }, { "epoch": 2.08, "learning_rate": 6.419739693577217e-05, "loss": 1.4224, "step": 26454 }, { "epoch": 2.08, "learning_rate": 6.418725927472101e-05, "loss": 1.4713, "step": 26455 }, { "epoch": 2.08, "learning_rate": 6.417712219629095e-05, "loss": 1.514, "step": 26456 }, { "epoch": 2.08, "learning_rate": 6.416698570055091e-05, "loss": 1.4857, "step": 26457 }, { "epoch": 2.08, "learning_rate": 6.415684978756964e-05, "loss": 1.4685, "step": 26458 }, { "epoch": 2.08, "learning_rate": 6.414671445741603e-05, "loss": 1.4729, "step": 26459 }, { "epoch": 2.08, "learning_rate": 6.41365797101588e-05, "loss": 1.463, "step": 26460 }, { "epoch": 2.08, "learning_rate": 6.412644554586685e-05, "loss": 1.494, "step": 26461 }, { "epoch": 2.08, "learning_rate": 6.411631196460897e-05, "loss": 1.4874, "step": 26462 }, { "epoch": 2.08, "learning_rate": 6.410617896645385e-05, "loss": 1.4301, "step": 26463 }, { "epoch": 2.08, "learning_rate": 6.409604655147046e-05, "loss": 1.4839, "step": 26464 }, { "epoch": 2.08, "learning_rate": 6.408591471972749e-05, "loss": 1.4446, "step": 26465 }, { "epoch": 2.08, "learning_rate": 6.407578347129371e-05, "loss": 1.447, "step": 26466 }, { "epoch": 2.08, "learning_rate": 6.406565280623798e-05, "loss": 1.4955, "step": 26467 }, { "epoch": 2.08, "learning_rate": 6.405552272462905e-05, "loss": 1.4422, "step": 26468 }, { "epoch": 2.08, "learning_rate": 6.40453932265357e-05, "loss": 1.4591, "step": 26469 }, { "epoch": 2.08, "learning_rate": 6.403526431202663e-05, "loss": 1.4656, "step": 26470 }, { "epoch": 2.08, "learning_rate": 6.402513598117074e-05, "loss": 1.4817, "step": 26471 }, { "epoch": 2.08, "learning_rate": 6.401500823403675e-05, "loss": 1.4535, "step": 26472 }, { "epoch": 2.08, "learning_rate": 6.400488107069332e-05, "loss": 1.4554, "step": 26473 }, { "epoch": 2.08, "learning_rate": 6.39947544912093e-05, "loss": 1.4653, "step": 26474 }, { "epoch": 2.08, "learning_rate": 6.398462849565349e-05, "loss": 1.4393, "step": 26475 }, { "epoch": 2.08, "learning_rate": 6.397450308409459e-05, "loss": 1.4896, "step": 26476 }, { "epoch": 2.08, "learning_rate": 6.396437825660128e-05, "loss": 1.4492, "step": 26477 }, { "epoch": 2.08, "learning_rate": 6.395425401324241e-05, "loss": 1.4932, "step": 26478 }, { "epoch": 2.08, "learning_rate": 6.394413035408668e-05, "loss": 1.4598, "step": 26479 }, { "epoch": 2.08, "learning_rate": 6.393400727920277e-05, "loss": 1.4415, "step": 26480 }, { "epoch": 2.08, "learning_rate": 6.392388478865951e-05, "loss": 1.4442, "step": 26481 }, { "epoch": 2.08, "learning_rate": 6.391376288252555e-05, "loss": 1.4765, "step": 26482 }, { "epoch": 2.08, "learning_rate": 6.39036415608696e-05, "loss": 1.4451, "step": 26483 }, { "epoch": 2.08, "learning_rate": 6.389352082376045e-05, "loss": 1.4338, "step": 26484 }, { "epoch": 2.08, "learning_rate": 6.388340067126679e-05, "loss": 1.4954, "step": 26485 }, { "epoch": 2.08, "learning_rate": 6.387328110345725e-05, "loss": 1.4807, "step": 26486 }, { "epoch": 2.08, "learning_rate": 6.386316212040068e-05, "loss": 1.4546, "step": 26487 }, { "epoch": 2.08, "learning_rate": 6.385304372216569e-05, "loss": 1.4531, "step": 26488 }, { "epoch": 2.08, "learning_rate": 6.384292590882099e-05, "loss": 1.5048, "step": 26489 }, { "epoch": 2.08, "learning_rate": 6.383280868043516e-05, "loss": 1.4356, "step": 26490 }, { "epoch": 2.08, "learning_rate": 6.382269203707714e-05, "loss": 1.4811, "step": 26491 }, { "epoch": 2.08, "learning_rate": 6.381257597881547e-05, "loss": 1.5132, "step": 26492 }, { "epoch": 2.08, "learning_rate": 6.380246050571885e-05, "loss": 1.487, "step": 26493 }, { "epoch": 2.08, "learning_rate": 6.37923456178559e-05, "loss": 1.4155, "step": 26494 }, { "epoch": 2.08, "learning_rate": 6.378223131529542e-05, "loss": 1.4372, "step": 26495 }, { "epoch": 2.08, "learning_rate": 6.377211759810598e-05, "loss": 1.3723, "step": 26496 }, { "epoch": 2.08, "learning_rate": 6.376200446635624e-05, "loss": 1.4635, "step": 26497 }, { "epoch": 2.08, "learning_rate": 6.375189192011496e-05, "loss": 1.4945, "step": 26498 }, { "epoch": 2.08, "learning_rate": 6.374177995945072e-05, "loss": 1.4555, "step": 26499 }, { "epoch": 2.09, "learning_rate": 6.373166858443217e-05, "loss": 1.4114, "step": 26500 }, { "epoch": 2.09, "learning_rate": 6.3721557795128e-05, "loss": 1.4389, "step": 26501 }, { "epoch": 2.09, "learning_rate": 6.371144759160686e-05, "loss": 1.4728, "step": 26502 }, { "epoch": 2.09, "learning_rate": 6.370133797393732e-05, "loss": 1.4685, "step": 26503 }, { "epoch": 2.09, "learning_rate": 6.369122894218812e-05, "loss": 1.4379, "step": 26504 }, { "epoch": 2.09, "learning_rate": 6.368112049642785e-05, "loss": 1.4723, "step": 26505 }, { "epoch": 2.09, "learning_rate": 6.367101263672506e-05, "loss": 1.4693, "step": 26506 }, { "epoch": 2.09, "learning_rate": 6.366090536314849e-05, "loss": 1.4263, "step": 26507 }, { "epoch": 2.09, "learning_rate": 6.365079867576677e-05, "loss": 1.4467, "step": 26508 }, { "epoch": 2.09, "learning_rate": 6.364069257464846e-05, "loss": 1.4348, "step": 26509 }, { "epoch": 2.09, "learning_rate": 6.36305870598622e-05, "loss": 1.4424, "step": 26510 }, { "epoch": 2.09, "learning_rate": 6.362048213147654e-05, "loss": 1.463, "step": 26511 }, { "epoch": 2.09, "learning_rate": 6.36103777895602e-05, "loss": 1.456, "step": 26512 }, { "epoch": 2.09, "learning_rate": 6.360027403418171e-05, "loss": 1.4555, "step": 26513 }, { "epoch": 2.09, "learning_rate": 6.359017086540962e-05, "loss": 1.4717, "step": 26514 }, { "epoch": 2.09, "learning_rate": 6.358006828331266e-05, "loss": 1.438, "step": 26515 }, { "epoch": 2.09, "learning_rate": 6.356996628795933e-05, "loss": 1.4466, "step": 26516 }, { "epoch": 2.09, "learning_rate": 6.355986487941818e-05, "loss": 1.4667, "step": 26517 }, { "epoch": 2.09, "learning_rate": 6.35497640577579e-05, "loss": 1.41, "step": 26518 }, { "epoch": 2.09, "learning_rate": 6.353966382304702e-05, "loss": 1.4647, "step": 26519 }, { "epoch": 2.09, "learning_rate": 6.352956417535405e-05, "loss": 1.4642, "step": 26520 }, { "epoch": 2.09, "learning_rate": 6.351946511474762e-05, "loss": 1.4593, "step": 26521 }, { "epoch": 2.09, "learning_rate": 6.350936664129636e-05, "loss": 1.4564, "step": 26522 }, { "epoch": 2.09, "learning_rate": 6.349926875506877e-05, "loss": 1.471, "step": 26523 }, { "epoch": 2.09, "learning_rate": 6.348917145613335e-05, "loss": 1.4822, "step": 26524 }, { "epoch": 2.09, "learning_rate": 6.347907474455876e-05, "loss": 1.4553, "step": 26525 }, { "epoch": 2.09, "learning_rate": 6.346897862041353e-05, "loss": 1.4618, "step": 26526 }, { "epoch": 2.09, "learning_rate": 6.345888308376612e-05, "loss": 1.4413, "step": 26527 }, { "epoch": 2.09, "learning_rate": 6.344878813468518e-05, "loss": 1.4842, "step": 26528 }, { "epoch": 2.09, "learning_rate": 6.343869377323921e-05, "loss": 1.4991, "step": 26529 }, { "epoch": 2.09, "learning_rate": 6.342859999949676e-05, "loss": 1.4755, "step": 26530 }, { "epoch": 2.09, "learning_rate": 6.341850681352627e-05, "loss": 1.4877, "step": 26531 }, { "epoch": 2.09, "learning_rate": 6.340841421539638e-05, "loss": 1.4576, "step": 26532 }, { "epoch": 2.09, "learning_rate": 6.33983222051756e-05, "loss": 1.4589, "step": 26533 }, { "epoch": 2.09, "learning_rate": 6.338823078293235e-05, "loss": 1.4139, "step": 26534 }, { "epoch": 2.09, "learning_rate": 6.337813994873527e-05, "loss": 1.4486, "step": 26535 }, { "epoch": 2.09, "learning_rate": 6.336804970265284e-05, "loss": 1.4277, "step": 26536 }, { "epoch": 2.09, "learning_rate": 6.335796004475346e-05, "loss": 1.4469, "step": 26537 }, { "epoch": 2.09, "learning_rate": 6.334787097510575e-05, "loss": 1.4414, "step": 26538 }, { "epoch": 2.09, "learning_rate": 6.33377824937782e-05, "loss": 1.4756, "step": 26539 }, { "epoch": 2.09, "learning_rate": 6.33276946008393e-05, "loss": 1.499, "step": 26540 }, { "epoch": 2.09, "learning_rate": 6.331760729635747e-05, "loss": 1.4157, "step": 26541 }, { "epoch": 2.09, "learning_rate": 6.33075205804013e-05, "loss": 1.4733, "step": 26542 }, { "epoch": 2.09, "learning_rate": 6.329743445303922e-05, "loss": 1.4847, "step": 26543 }, { "epoch": 2.09, "learning_rate": 6.328734891433967e-05, "loss": 1.467, "step": 26544 }, { "epoch": 2.09, "learning_rate": 6.327726396437123e-05, "loss": 1.4654, "step": 26545 }, { "epoch": 2.09, "learning_rate": 6.32671796032023e-05, "loss": 1.4492, "step": 26546 }, { "epoch": 2.09, "learning_rate": 6.325709583090135e-05, "loss": 1.5019, "step": 26547 }, { "epoch": 2.09, "learning_rate": 6.32470126475368e-05, "loss": 1.4385, "step": 26548 }, { "epoch": 2.09, "learning_rate": 6.323693005317722e-05, "loss": 1.473, "step": 26549 }, { "epoch": 2.09, "learning_rate": 6.3226848047891e-05, "loss": 1.4376, "step": 26550 }, { "epoch": 2.09, "learning_rate": 6.321676663174656e-05, "loss": 1.4356, "step": 26551 }, { "epoch": 2.09, "learning_rate": 6.320668580481241e-05, "loss": 1.4879, "step": 26552 }, { "epoch": 2.09, "learning_rate": 6.319660556715692e-05, "loss": 1.4166, "step": 26553 }, { "epoch": 2.09, "learning_rate": 6.318652591884865e-05, "loss": 1.4729, "step": 26554 }, { "epoch": 2.09, "learning_rate": 6.317644685995589e-05, "loss": 1.4785, "step": 26555 }, { "epoch": 2.09, "learning_rate": 6.316636839054719e-05, "loss": 1.4754, "step": 26556 }, { "epoch": 2.09, "learning_rate": 6.315629051069095e-05, "loss": 1.4272, "step": 26557 }, { "epoch": 2.09, "learning_rate": 6.31462132204555e-05, "loss": 1.4426, "step": 26558 }, { "epoch": 2.09, "learning_rate": 6.31361365199094e-05, "loss": 1.4279, "step": 26559 }, { "epoch": 2.09, "learning_rate": 6.312606040912099e-05, "loss": 1.4914, "step": 26560 }, { "epoch": 2.09, "learning_rate": 6.311598488815864e-05, "loss": 1.4263, "step": 26561 }, { "epoch": 2.09, "learning_rate": 6.310590995709085e-05, "loss": 1.4829, "step": 26562 }, { "epoch": 2.09, "learning_rate": 6.3095835615986e-05, "loss": 1.4385, "step": 26563 }, { "epoch": 2.09, "learning_rate": 6.308576186491245e-05, "loss": 1.4924, "step": 26564 }, { "epoch": 2.09, "learning_rate": 6.307568870393855e-05, "loss": 1.4519, "step": 26565 }, { "epoch": 2.09, "learning_rate": 6.306561613313284e-05, "loss": 1.4247, "step": 26566 }, { "epoch": 2.09, "learning_rate": 6.30555441525636e-05, "loss": 1.4832, "step": 26567 }, { "epoch": 2.09, "learning_rate": 6.304547276229919e-05, "loss": 1.4836, "step": 26568 }, { "epoch": 2.09, "learning_rate": 6.303540196240802e-05, "loss": 1.4352, "step": 26569 }, { "epoch": 2.09, "learning_rate": 6.302533175295855e-05, "loss": 1.4801, "step": 26570 }, { "epoch": 2.09, "learning_rate": 6.301526213401907e-05, "loss": 1.4405, "step": 26571 }, { "epoch": 2.09, "learning_rate": 6.300519310565791e-05, "loss": 1.4835, "step": 26572 }, { "epoch": 2.09, "learning_rate": 6.299512466794353e-05, "loss": 1.4599, "step": 26573 }, { "epoch": 2.09, "learning_rate": 6.298505682094425e-05, "loss": 1.5011, "step": 26574 }, { "epoch": 2.09, "learning_rate": 6.297498956472836e-05, "loss": 1.4546, "step": 26575 }, { "epoch": 2.09, "learning_rate": 6.296492289936433e-05, "loss": 1.4233, "step": 26576 }, { "epoch": 2.09, "learning_rate": 6.295485682492042e-05, "loss": 1.4342, "step": 26577 }, { "epoch": 2.09, "learning_rate": 6.294479134146496e-05, "loss": 1.414, "step": 26578 }, { "epoch": 2.09, "learning_rate": 6.293472644906637e-05, "loss": 1.446, "step": 26579 }, { "epoch": 2.09, "learning_rate": 6.292466214779294e-05, "loss": 1.4866, "step": 26580 }, { "epoch": 2.09, "learning_rate": 6.291459843771296e-05, "loss": 1.4418, "step": 26581 }, { "epoch": 2.09, "learning_rate": 6.290453531889484e-05, "loss": 1.464, "step": 26582 }, { "epoch": 2.09, "learning_rate": 6.289447279140687e-05, "loss": 1.4417, "step": 26583 }, { "epoch": 2.09, "learning_rate": 6.288441085531729e-05, "loss": 1.5272, "step": 26584 }, { "epoch": 2.09, "learning_rate": 6.287434951069451e-05, "loss": 1.4491, "step": 26585 }, { "epoch": 2.09, "learning_rate": 6.286428875760686e-05, "loss": 1.5196, "step": 26586 }, { "epoch": 2.09, "learning_rate": 6.285422859612261e-05, "loss": 1.4957, "step": 26587 }, { "epoch": 2.09, "learning_rate": 6.284416902631005e-05, "loss": 1.456, "step": 26588 }, { "epoch": 2.09, "learning_rate": 6.283411004823742e-05, "loss": 1.4395, "step": 26589 }, { "epoch": 2.09, "learning_rate": 6.282405166197314e-05, "loss": 1.4182, "step": 26590 }, { "epoch": 2.09, "learning_rate": 6.281399386758545e-05, "loss": 1.4708, "step": 26591 }, { "epoch": 2.09, "learning_rate": 6.280393666514258e-05, "loss": 1.4247, "step": 26592 }, { "epoch": 2.09, "learning_rate": 6.279388005471291e-05, "loss": 1.4368, "step": 26593 }, { "epoch": 2.09, "learning_rate": 6.278382403636467e-05, "loss": 1.4703, "step": 26594 }, { "epoch": 2.09, "learning_rate": 6.277376861016608e-05, "loss": 1.4238, "step": 26595 }, { "epoch": 2.09, "learning_rate": 6.276371377618552e-05, "loss": 1.4209, "step": 26596 }, { "epoch": 2.09, "learning_rate": 6.27536595344912e-05, "loss": 1.4939, "step": 26597 }, { "epoch": 2.09, "learning_rate": 6.274360588515133e-05, "loss": 1.4689, "step": 26598 }, { "epoch": 2.09, "learning_rate": 6.273355282823429e-05, "loss": 1.4505, "step": 26599 }, { "epoch": 2.09, "learning_rate": 6.272350036380821e-05, "loss": 1.4776, "step": 26600 }, { "epoch": 2.09, "learning_rate": 6.271344849194144e-05, "loss": 1.458, "step": 26601 }, { "epoch": 2.09, "learning_rate": 6.270339721270216e-05, "loss": 1.4187, "step": 26602 }, { "epoch": 2.09, "learning_rate": 6.269334652615866e-05, "loss": 1.4211, "step": 26603 }, { "epoch": 2.09, "learning_rate": 6.268329643237917e-05, "loss": 1.4341, "step": 26604 }, { "epoch": 2.09, "learning_rate": 6.267324693143191e-05, "loss": 1.4239, "step": 26605 }, { "epoch": 2.09, "learning_rate": 6.266319802338506e-05, "loss": 1.4541, "step": 26606 }, { "epoch": 2.09, "learning_rate": 6.265314970830696e-05, "loss": 1.4754, "step": 26607 }, { "epoch": 2.09, "learning_rate": 6.264310198626576e-05, "loss": 1.5246, "step": 26608 }, { "epoch": 2.09, "learning_rate": 6.263305485732964e-05, "loss": 1.4669, "step": 26609 }, { "epoch": 2.09, "learning_rate": 6.262300832156693e-05, "loss": 1.4589, "step": 26610 }, { "epoch": 2.09, "learning_rate": 6.261296237904576e-05, "loss": 1.4393, "step": 26611 }, { "epoch": 2.09, "learning_rate": 6.26029170298343e-05, "loss": 1.4533, "step": 26612 }, { "epoch": 2.09, "learning_rate": 6.259287227400087e-05, "loss": 1.4699, "step": 26613 }, { "epoch": 2.09, "learning_rate": 6.258282811161359e-05, "loss": 1.4854, "step": 26614 }, { "epoch": 2.09, "learning_rate": 6.257278454274061e-05, "loss": 1.4435, "step": 26615 }, { "epoch": 2.09, "learning_rate": 6.256274156745018e-05, "loss": 1.4967, "step": 26616 }, { "epoch": 2.09, "learning_rate": 6.255269918581055e-05, "loss": 1.4652, "step": 26617 }, { "epoch": 2.09, "learning_rate": 6.254265739788981e-05, "loss": 1.4681, "step": 26618 }, { "epoch": 2.09, "learning_rate": 6.253261620375612e-05, "loss": 1.4784, "step": 26619 }, { "epoch": 2.09, "learning_rate": 6.252257560347776e-05, "loss": 1.4865, "step": 26620 }, { "epoch": 2.09, "learning_rate": 6.251253559712283e-05, "loss": 1.4539, "step": 26621 }, { "epoch": 2.09, "learning_rate": 6.250249618475952e-05, "loss": 1.4986, "step": 26622 }, { "epoch": 2.09, "learning_rate": 6.249245736645589e-05, "loss": 1.468, "step": 26623 }, { "epoch": 2.09, "learning_rate": 6.248241914228025e-05, "loss": 1.4742, "step": 26624 }, { "epoch": 2.09, "learning_rate": 6.247238151230071e-05, "loss": 1.4153, "step": 26625 }, { "epoch": 2.09, "learning_rate": 6.246234447658532e-05, "loss": 1.52, "step": 26626 }, { "epoch": 2.1, "learning_rate": 6.245230803520237e-05, "loss": 1.439, "step": 26627 }, { "epoch": 2.1, "learning_rate": 6.244227218821992e-05, "loss": 1.4691, "step": 26628 }, { "epoch": 2.1, "learning_rate": 6.243223693570608e-05, "loss": 1.4878, "step": 26629 }, { "epoch": 2.1, "learning_rate": 6.242220227772908e-05, "loss": 1.4242, "step": 26630 }, { "epoch": 2.1, "learning_rate": 6.241216821435695e-05, "loss": 1.4667, "step": 26631 }, { "epoch": 2.1, "learning_rate": 6.240213474565791e-05, "loss": 1.5085, "step": 26632 }, { "epoch": 2.1, "learning_rate": 6.239210187169997e-05, "loss": 1.4728, "step": 26633 }, { "epoch": 2.1, "learning_rate": 6.238206959255138e-05, "loss": 1.5155, "step": 26634 }, { "epoch": 2.1, "learning_rate": 6.23720379082802e-05, "loss": 1.4723, "step": 26635 }, { "epoch": 2.1, "learning_rate": 6.236200681895446e-05, "loss": 1.437, "step": 26636 }, { "epoch": 2.1, "learning_rate": 6.235197632464236e-05, "loss": 1.4305, "step": 26637 }, { "epoch": 2.1, "learning_rate": 6.2341946425412e-05, "loss": 1.4615, "step": 26638 }, { "epoch": 2.1, "learning_rate": 6.233191712133139e-05, "loss": 1.4464, "step": 26639 }, { "epoch": 2.1, "learning_rate": 6.232188841246874e-05, "loss": 1.4047, "step": 26640 }, { "epoch": 2.1, "learning_rate": 6.231186029889207e-05, "loss": 1.3892, "step": 26641 }, { "epoch": 2.1, "learning_rate": 6.23018327806695e-05, "loss": 1.4781, "step": 26642 }, { "epoch": 2.1, "learning_rate": 6.229180585786902e-05, "loss": 1.3912, "step": 26643 }, { "epoch": 2.1, "learning_rate": 6.228177953055882e-05, "loss": 1.4263, "step": 26644 }, { "epoch": 2.1, "learning_rate": 6.227175379880694e-05, "loss": 1.4277, "step": 26645 }, { "epoch": 2.1, "learning_rate": 6.22617286626814e-05, "loss": 1.4224, "step": 26646 }, { "epoch": 2.1, "learning_rate": 6.225170412225029e-05, "loss": 1.4736, "step": 26647 }, { "epoch": 2.1, "learning_rate": 6.224168017758175e-05, "loss": 1.508, "step": 26648 }, { "epoch": 2.1, "learning_rate": 6.223165682874377e-05, "loss": 1.4517, "step": 26649 }, { "epoch": 2.1, "learning_rate": 6.222163407580434e-05, "loss": 1.4649, "step": 26650 }, { "epoch": 2.1, "learning_rate": 6.221161191883164e-05, "loss": 1.4561, "step": 26651 }, { "epoch": 2.1, "learning_rate": 6.220159035789364e-05, "loss": 1.4369, "step": 26652 }, { "epoch": 2.1, "learning_rate": 6.219156939305835e-05, "loss": 1.477, "step": 26653 }, { "epoch": 2.1, "learning_rate": 6.218154902439388e-05, "loss": 1.4635, "step": 26654 }, { "epoch": 2.1, "learning_rate": 6.217152925196824e-05, "loss": 1.481, "step": 26655 }, { "epoch": 2.1, "learning_rate": 6.216151007584941e-05, "loss": 1.4434, "step": 26656 }, { "epoch": 2.1, "learning_rate": 6.215149149610549e-05, "loss": 1.5031, "step": 26657 }, { "epoch": 2.1, "learning_rate": 6.214147351280447e-05, "loss": 1.4586, "step": 26658 }, { "epoch": 2.1, "learning_rate": 6.213145612601436e-05, "loss": 1.4283, "step": 26659 }, { "epoch": 2.1, "learning_rate": 6.212143933580311e-05, "loss": 1.428, "step": 26660 }, { "epoch": 2.1, "learning_rate": 6.211142314223885e-05, "loss": 1.4065, "step": 26661 }, { "epoch": 2.1, "learning_rate": 6.210140754538955e-05, "loss": 1.4827, "step": 26662 }, { "epoch": 2.1, "learning_rate": 6.209139254532311e-05, "loss": 1.4857, "step": 26663 }, { "epoch": 2.1, "learning_rate": 6.208137814210758e-05, "loss": 1.4977, "step": 26664 }, { "epoch": 2.1, "learning_rate": 6.207136433581107e-05, "loss": 1.4854, "step": 26665 }, { "epoch": 2.1, "learning_rate": 6.206135112650145e-05, "loss": 1.4825, "step": 26666 }, { "epoch": 2.1, "learning_rate": 6.205133851424668e-05, "loss": 1.4165, "step": 26667 }, { "epoch": 2.1, "learning_rate": 6.204132649911484e-05, "loss": 1.412, "step": 26668 }, { "epoch": 2.1, "learning_rate": 6.203131508117386e-05, "loss": 1.4902, "step": 26669 }, { "epoch": 2.1, "learning_rate": 6.202130426049163e-05, "loss": 1.4499, "step": 26670 }, { "epoch": 2.1, "learning_rate": 6.201129403713627e-05, "loss": 1.4473, "step": 26671 }, { "epoch": 2.1, "learning_rate": 6.200128441117566e-05, "loss": 1.4945, "step": 26672 }, { "epoch": 2.1, "learning_rate": 6.199127538267772e-05, "loss": 1.476, "step": 26673 }, { "epoch": 2.1, "learning_rate": 6.198126695171051e-05, "loss": 1.4609, "step": 26674 }, { "epoch": 2.1, "learning_rate": 6.19712591183419e-05, "loss": 1.4535, "step": 26675 }, { "epoch": 2.1, "learning_rate": 6.196125188263988e-05, "loss": 1.4467, "step": 26676 }, { "epoch": 2.1, "learning_rate": 6.195124524467232e-05, "loss": 1.4633, "step": 26677 }, { "epoch": 2.1, "learning_rate": 6.19412392045072e-05, "loss": 1.3969, "step": 26678 }, { "epoch": 2.1, "learning_rate": 6.193123376221256e-05, "loss": 1.4735, "step": 26679 }, { "epoch": 2.1, "learning_rate": 6.192122891785617e-05, "loss": 1.4245, "step": 26680 }, { "epoch": 2.1, "learning_rate": 6.191122467150607e-05, "loss": 1.4597, "step": 26681 }, { "epoch": 2.1, "learning_rate": 6.190122102323016e-05, "loss": 1.5169, "step": 26682 }, { "epoch": 2.1, "learning_rate": 6.189121797309634e-05, "loss": 1.3973, "step": 26683 }, { "epoch": 2.1, "learning_rate": 6.188121552117247e-05, "loss": 1.4557, "step": 26684 }, { "epoch": 2.1, "learning_rate": 6.187121366752657e-05, "loss": 1.4852, "step": 26685 }, { "epoch": 2.1, "learning_rate": 6.18612124122265e-05, "loss": 1.4712, "step": 26686 }, { "epoch": 2.1, "learning_rate": 6.185121175534011e-05, "loss": 1.4117, "step": 26687 }, { "epoch": 2.1, "learning_rate": 6.18412116969354e-05, "loss": 1.4481, "step": 26688 }, { "epoch": 2.1, "learning_rate": 6.183121223708019e-05, "loss": 1.443, "step": 26689 }, { "epoch": 2.1, "learning_rate": 6.182121337584236e-05, "loss": 1.501, "step": 26690 }, { "epoch": 2.1, "learning_rate": 6.181121511328989e-05, "loss": 1.4445, "step": 26691 }, { "epoch": 2.1, "learning_rate": 6.18012174494906e-05, "loss": 1.449, "step": 26692 }, { "epoch": 2.1, "learning_rate": 6.179122038451231e-05, "loss": 1.4963, "step": 26693 }, { "epoch": 2.1, "learning_rate": 6.178122391842296e-05, "loss": 1.4433, "step": 26694 }, { "epoch": 2.1, "learning_rate": 6.177122805129046e-05, "loss": 1.4515, "step": 26695 }, { "epoch": 2.1, "learning_rate": 6.176123278318264e-05, "loss": 1.4362, "step": 26696 }, { "epoch": 2.1, "learning_rate": 6.175123811416731e-05, "loss": 1.4589, "step": 26697 }, { "epoch": 2.1, "learning_rate": 6.174124404431242e-05, "loss": 1.4562, "step": 26698 }, { "epoch": 2.1, "learning_rate": 6.173125057368578e-05, "loss": 1.4746, "step": 26699 }, { "epoch": 2.1, "learning_rate": 6.172125770235524e-05, "loss": 1.4712, "step": 26700 }, { "epoch": 2.1, "learning_rate": 6.171126543038857e-05, "loss": 1.4556, "step": 26701 }, { "epoch": 2.1, "learning_rate": 6.170127375785376e-05, "loss": 1.424, "step": 26702 }, { "epoch": 2.1, "learning_rate": 6.169128268481858e-05, "loss": 1.4521, "step": 26703 }, { "epoch": 2.1, "learning_rate": 6.168129221135079e-05, "loss": 1.4737, "step": 26704 }, { "epoch": 2.1, "learning_rate": 6.167130233751834e-05, "loss": 1.4618, "step": 26705 }, { "epoch": 2.1, "learning_rate": 6.1661313063389e-05, "loss": 1.4364, "step": 26706 }, { "epoch": 2.1, "learning_rate": 6.165132438903055e-05, "loss": 1.4394, "step": 26707 }, { "epoch": 2.1, "learning_rate": 6.164133631451091e-05, "loss": 1.4575, "step": 26708 }, { "epoch": 2.1, "learning_rate": 6.163134883989782e-05, "loss": 1.5167, "step": 26709 }, { "epoch": 2.1, "learning_rate": 6.162136196525907e-05, "loss": 1.4884, "step": 26710 }, { "epoch": 2.1, "learning_rate": 6.16113756906625e-05, "loss": 1.4907, "step": 26711 }, { "epoch": 2.1, "learning_rate": 6.160139001617597e-05, "loss": 1.5291, "step": 26712 }, { "epoch": 2.1, "learning_rate": 6.15914049418672e-05, "loss": 1.5077, "step": 26713 }, { "epoch": 2.1, "learning_rate": 6.158142046780396e-05, "loss": 1.459, "step": 26714 }, { "epoch": 2.1, "learning_rate": 6.157143659405412e-05, "loss": 1.4186, "step": 26715 }, { "epoch": 2.1, "learning_rate": 6.156145332068545e-05, "loss": 1.4651, "step": 26716 }, { "epoch": 2.1, "learning_rate": 6.15514706477657e-05, "loss": 1.4465, "step": 26717 }, { "epoch": 2.1, "learning_rate": 6.154148857536261e-05, "loss": 1.464, "step": 26718 }, { "epoch": 2.1, "learning_rate": 6.153150710354403e-05, "loss": 1.4551, "step": 26719 }, { "epoch": 2.1, "learning_rate": 6.152152623237771e-05, "loss": 1.4867, "step": 26720 }, { "epoch": 2.1, "learning_rate": 6.151154596193133e-05, "loss": 1.4172, "step": 26721 }, { "epoch": 2.1, "learning_rate": 6.150156629227279e-05, "loss": 1.447, "step": 26722 }, { "epoch": 2.1, "learning_rate": 6.149158722346977e-05, "loss": 1.4921, "step": 26723 }, { "epoch": 2.1, "learning_rate": 6.148160875558998e-05, "loss": 1.4365, "step": 26724 }, { "epoch": 2.1, "learning_rate": 6.147163088870127e-05, "loss": 1.4825, "step": 26725 }, { "epoch": 2.1, "learning_rate": 6.146165362287128e-05, "loss": 1.4498, "step": 26726 }, { "epoch": 2.1, "learning_rate": 6.145167695816787e-05, "loss": 1.4566, "step": 26727 }, { "epoch": 2.1, "learning_rate": 6.144170089465865e-05, "loss": 1.4651, "step": 26728 }, { "epoch": 2.1, "learning_rate": 6.143172543241144e-05, "loss": 1.4144, "step": 26729 }, { "epoch": 2.1, "learning_rate": 6.142175057149396e-05, "loss": 1.4563, "step": 26730 }, { "epoch": 2.1, "learning_rate": 6.141177631197385e-05, "loss": 1.4688, "step": 26731 }, { "epoch": 2.1, "learning_rate": 6.140180265391895e-05, "loss": 1.4502, "step": 26732 }, { "epoch": 2.1, "learning_rate": 6.139182959739692e-05, "loss": 1.4782, "step": 26733 }, { "epoch": 2.1, "learning_rate": 6.138185714247545e-05, "loss": 1.4743, "step": 26734 }, { "epoch": 2.1, "learning_rate": 6.137188528922224e-05, "loss": 1.4717, "step": 26735 }, { "epoch": 2.1, "learning_rate": 6.136191403770505e-05, "loss": 1.4026, "step": 26736 }, { "epoch": 2.1, "learning_rate": 6.135194338799156e-05, "loss": 1.4782, "step": 26737 }, { "epoch": 2.1, "learning_rate": 6.13419733401494e-05, "loss": 1.4483, "step": 26738 }, { "epoch": 2.1, "learning_rate": 6.133200389424638e-05, "loss": 1.4046, "step": 26739 }, { "epoch": 2.1, "learning_rate": 6.132203505035011e-05, "loss": 1.4719, "step": 26740 }, { "epoch": 2.1, "learning_rate": 6.131206680852823e-05, "loss": 1.4734, "step": 26741 }, { "epoch": 2.1, "learning_rate": 6.130209916884847e-05, "loss": 1.489, "step": 26742 }, { "epoch": 2.1, "learning_rate": 6.129213213137857e-05, "loss": 1.4175, "step": 26743 }, { "epoch": 2.1, "learning_rate": 6.128216569618614e-05, "loss": 1.4407, "step": 26744 }, { "epoch": 2.1, "learning_rate": 6.12721998633388e-05, "loss": 1.4636, "step": 26745 }, { "epoch": 2.1, "learning_rate": 6.126223463290429e-05, "loss": 1.3967, "step": 26746 }, { "epoch": 2.1, "learning_rate": 6.125227000495027e-05, "loss": 1.4899, "step": 26747 }, { "epoch": 2.1, "learning_rate": 6.12423059795443e-05, "loss": 1.4523, "step": 26748 }, { "epoch": 2.1, "learning_rate": 6.123234255675412e-05, "loss": 1.4773, "step": 26749 }, { "epoch": 2.1, "learning_rate": 6.122237973664736e-05, "loss": 1.4904, "step": 26750 }, { "epoch": 2.1, "learning_rate": 6.12124175192916e-05, "loss": 1.545, "step": 26751 }, { "epoch": 2.1, "learning_rate": 6.12024559047546e-05, "loss": 1.4689, "step": 26752 }, { "epoch": 2.1, "learning_rate": 6.11924948931039e-05, "loss": 1.443, "step": 26753 }, { "epoch": 2.11, "learning_rate": 6.118253448440714e-05, "loss": 1.4758, "step": 26754 }, { "epoch": 2.11, "learning_rate": 6.117257467873193e-05, "loss": 1.4495, "step": 26755 }, { "epoch": 2.11, "learning_rate": 6.116261547614597e-05, "loss": 1.4677, "step": 26756 }, { "epoch": 2.11, "learning_rate": 6.115265687671676e-05, "loss": 1.4371, "step": 26757 }, { "epoch": 2.11, "learning_rate": 6.114269888051203e-05, "loss": 1.4328, "step": 26758 }, { "epoch": 2.11, "learning_rate": 6.11327414875993e-05, "loss": 1.4649, "step": 26759 }, { "epoch": 2.11, "learning_rate": 6.112278469804626e-05, "loss": 1.4364, "step": 26760 }, { "epoch": 2.11, "learning_rate": 6.111282851192048e-05, "loss": 1.4496, "step": 26761 }, { "epoch": 2.11, "learning_rate": 6.110287292928945e-05, "loss": 1.47, "step": 26762 }, { "epoch": 2.11, "learning_rate": 6.109291795022094e-05, "loss": 1.4864, "step": 26763 }, { "epoch": 2.11, "learning_rate": 6.108296357478246e-05, "loss": 1.4426, "step": 26764 }, { "epoch": 2.11, "learning_rate": 6.107300980304153e-05, "loss": 1.4674, "step": 26765 }, { "epoch": 2.11, "learning_rate": 6.106305663506584e-05, "loss": 1.4569, "step": 26766 }, { "epoch": 2.11, "learning_rate": 6.10531040709229e-05, "loss": 1.4797, "step": 26767 }, { "epoch": 2.11, "learning_rate": 6.104315211068027e-05, "loss": 1.4134, "step": 26768 }, { "epoch": 2.11, "learning_rate": 6.103320075440559e-05, "loss": 1.4139, "step": 26769 }, { "epoch": 2.11, "learning_rate": 6.102325000216638e-05, "loss": 1.457, "step": 26770 }, { "epoch": 2.11, "learning_rate": 6.1013299854030196e-05, "loss": 1.4548, "step": 26771 }, { "epoch": 2.11, "learning_rate": 6.1003350310064545e-05, "loss": 1.4527, "step": 26772 }, { "epoch": 2.11, "learning_rate": 6.099340137033704e-05, "loss": 1.4983, "step": 26773 }, { "epoch": 2.11, "learning_rate": 6.0983453034915275e-05, "loss": 1.4195, "step": 26774 }, { "epoch": 2.11, "learning_rate": 6.097350530386674e-05, "loss": 1.4714, "step": 26775 }, { "epoch": 2.11, "learning_rate": 6.096355817725891e-05, "loss": 1.4614, "step": 26776 }, { "epoch": 2.11, "learning_rate": 6.095361165515945e-05, "loss": 1.4223, "step": 26777 }, { "epoch": 2.11, "learning_rate": 6.094366573763583e-05, "loss": 1.4405, "step": 26778 }, { "epoch": 2.11, "learning_rate": 6.093372042475552e-05, "loss": 1.4823, "step": 26779 }, { "epoch": 2.11, "learning_rate": 6.0923775716586146e-05, "loss": 1.4427, "step": 26780 }, { "epoch": 2.11, "learning_rate": 6.0913831613195175e-05, "loss": 1.5158, "step": 26781 }, { "epoch": 2.11, "learning_rate": 6.090388811465009e-05, "loss": 1.4502, "step": 26782 }, { "epoch": 2.11, "learning_rate": 6.0893945221018475e-05, "loss": 1.4586, "step": 26783 }, { "epoch": 2.11, "learning_rate": 6.088400293236781e-05, "loss": 1.4643, "step": 26784 }, { "epoch": 2.11, "learning_rate": 6.087406124876552e-05, "loss": 1.4702, "step": 26785 }, { "epoch": 2.11, "learning_rate": 6.0864120170279223e-05, "loss": 1.4939, "step": 26786 }, { "epoch": 2.11, "learning_rate": 6.085417969697638e-05, "loss": 1.4703, "step": 26787 }, { "epoch": 2.11, "learning_rate": 6.084423982892438e-05, "loss": 1.466, "step": 26788 }, { "epoch": 2.11, "learning_rate": 6.083430056619082e-05, "loss": 1.474, "step": 26789 }, { "epoch": 2.11, "learning_rate": 6.082436190884319e-05, "loss": 1.506, "step": 26790 }, { "epoch": 2.11, "learning_rate": 6.081442385694894e-05, "loss": 1.4333, "step": 26791 }, { "epoch": 2.11, "learning_rate": 6.080448641057547e-05, "loss": 1.4539, "step": 26792 }, { "epoch": 2.11, "learning_rate": 6.079454956979038e-05, "loss": 1.4573, "step": 26793 }, { "epoch": 2.11, "learning_rate": 6.078461333466107e-05, "loss": 1.5236, "step": 26794 }, { "epoch": 2.11, "learning_rate": 6.0774677705255004e-05, "loss": 1.4498, "step": 26795 }, { "epoch": 2.11, "learning_rate": 6.076474268163958e-05, "loss": 1.4796, "step": 26796 }, { "epoch": 2.11, "learning_rate": 6.0754808263882366e-05, "loss": 1.4996, "step": 26797 }, { "epoch": 2.11, "learning_rate": 6.074487445205075e-05, "loss": 1.4523, "step": 26798 }, { "epoch": 2.11, "learning_rate": 6.0734941246212134e-05, "loss": 1.5089, "step": 26799 }, { "epoch": 2.11, "learning_rate": 6.072500864643404e-05, "loss": 1.4338, "step": 26800 }, { "epoch": 2.11, "learning_rate": 6.071507665278389e-05, "loss": 1.4667, "step": 26801 }, { "epoch": 2.11, "learning_rate": 6.070514526532904e-05, "loss": 1.4656, "step": 26802 }, { "epoch": 2.11, "learning_rate": 6.069521448413704e-05, "loss": 1.4841, "step": 26803 }, { "epoch": 2.11, "learning_rate": 6.068528430927518e-05, "loss": 1.5121, "step": 26804 }, { "epoch": 2.11, "learning_rate": 6.067535474081102e-05, "loss": 1.4047, "step": 26805 }, { "epoch": 2.11, "learning_rate": 6.066542577881185e-05, "loss": 1.3924, "step": 26806 }, { "epoch": 2.11, "learning_rate": 6.065549742334519e-05, "loss": 1.4338, "step": 26807 }, { "epoch": 2.11, "learning_rate": 6.06455696744784e-05, "loss": 1.445, "step": 26808 }, { "epoch": 2.11, "learning_rate": 6.0635642532278825e-05, "loss": 1.468, "step": 26809 }, { "epoch": 2.11, "learning_rate": 6.0625715996813986e-05, "loss": 1.4397, "step": 26810 }, { "epoch": 2.11, "learning_rate": 6.0615790068151196e-05, "loss": 1.4909, "step": 26811 }, { "epoch": 2.11, "learning_rate": 6.060586474635789e-05, "loss": 1.4624, "step": 26812 }, { "epoch": 2.11, "learning_rate": 6.0595940031501355e-05, "loss": 1.4446, "step": 26813 }, { "epoch": 2.11, "learning_rate": 6.0586015923649103e-05, "loss": 1.3941, "step": 26814 }, { "epoch": 2.11, "learning_rate": 6.057609242286848e-05, "loss": 1.4836, "step": 26815 }, { "epoch": 2.11, "learning_rate": 6.0566169529226766e-05, "loss": 1.5024, "step": 26816 }, { "epoch": 2.11, "learning_rate": 6.055624724279148e-05, "loss": 1.4696, "step": 26817 }, { "epoch": 2.11, "learning_rate": 6.05463255636299e-05, "loss": 1.4171, "step": 26818 }, { "epoch": 2.11, "learning_rate": 6.053640449180936e-05, "loss": 1.4913, "step": 26819 }, { "epoch": 2.11, "learning_rate": 6.052648402739726e-05, "loss": 1.4111, "step": 26820 }, { "epoch": 2.11, "learning_rate": 6.0516564170461014e-05, "loss": 1.4737, "step": 26821 }, { "epoch": 2.11, "learning_rate": 6.050664492106792e-05, "loss": 1.4494, "step": 26822 }, { "epoch": 2.11, "learning_rate": 6.049672627928526e-05, "loss": 1.4407, "step": 26823 }, { "epoch": 2.11, "learning_rate": 6.0486808245180504e-05, "loss": 1.4775, "step": 26824 }, { "epoch": 2.11, "learning_rate": 6.047689081882091e-05, "loss": 1.4963, "step": 26825 }, { "epoch": 2.11, "learning_rate": 6.046697400027377e-05, "loss": 1.4817, "step": 26826 }, { "epoch": 2.11, "learning_rate": 6.045705778960653e-05, "loss": 1.4151, "step": 26827 }, { "epoch": 2.11, "learning_rate": 6.044714218688644e-05, "loss": 1.457, "step": 26828 }, { "epoch": 2.11, "learning_rate": 6.043722719218085e-05, "loss": 1.4622, "step": 26829 }, { "epoch": 2.11, "learning_rate": 6.0427312805556986e-05, "loss": 1.487, "step": 26830 }, { "epoch": 2.11, "learning_rate": 6.0417399027082326e-05, "loss": 1.4734, "step": 26831 }, { "epoch": 2.11, "learning_rate": 6.040748585682406e-05, "loss": 1.4664, "step": 26832 }, { "epoch": 2.11, "learning_rate": 6.039757329484949e-05, "loss": 1.5012, "step": 26833 }, { "epoch": 2.11, "learning_rate": 6.038766134122599e-05, "loss": 1.4607, "step": 26834 }, { "epoch": 2.11, "learning_rate": 6.037774999602082e-05, "loss": 1.4989, "step": 26835 }, { "epoch": 2.11, "learning_rate": 6.036783925930123e-05, "loss": 1.4779, "step": 26836 }, { "epoch": 2.11, "learning_rate": 6.035792913113454e-05, "loss": 1.463, "step": 26837 }, { "epoch": 2.11, "learning_rate": 6.034801961158808e-05, "loss": 1.4409, "step": 26838 }, { "epoch": 2.11, "learning_rate": 6.033811070072911e-05, "loss": 1.4561, "step": 26839 }, { "epoch": 2.11, "learning_rate": 6.032820239862484e-05, "loss": 1.3805, "step": 26840 }, { "epoch": 2.11, "learning_rate": 6.031829470534263e-05, "loss": 1.4626, "step": 26841 }, { "epoch": 2.11, "learning_rate": 6.030838762094972e-05, "loss": 1.4856, "step": 26842 }, { "epoch": 2.11, "learning_rate": 6.02984811455133e-05, "loss": 1.4212, "step": 26843 }, { "epoch": 2.11, "learning_rate": 6.028857527910076e-05, "loss": 1.4824, "step": 26844 }, { "epoch": 2.11, "learning_rate": 6.027867002177928e-05, "loss": 1.4404, "step": 26845 }, { "epoch": 2.11, "learning_rate": 6.026876537361611e-05, "loss": 1.4337, "step": 26846 }, { "epoch": 2.11, "learning_rate": 6.025886133467845e-05, "loss": 1.4108, "step": 26847 }, { "epoch": 2.11, "learning_rate": 6.0248957905033665e-05, "loss": 1.4438, "step": 26848 }, { "epoch": 2.11, "learning_rate": 6.0239055084748913e-05, "loss": 1.5278, "step": 26849 }, { "epoch": 2.11, "learning_rate": 6.02291528738914e-05, "loss": 1.514, "step": 26850 }, { "epoch": 2.11, "learning_rate": 6.02192512725284e-05, "loss": 1.4844, "step": 26851 }, { "epoch": 2.11, "learning_rate": 6.020935028072719e-05, "loss": 1.4314, "step": 26852 }, { "epoch": 2.11, "learning_rate": 6.019944989855493e-05, "loss": 1.4695, "step": 26853 }, { "epoch": 2.11, "learning_rate": 6.018955012607881e-05, "loss": 1.5043, "step": 26854 }, { "epoch": 2.11, "learning_rate": 6.017965096336613e-05, "loss": 1.4415, "step": 26855 }, { "epoch": 2.11, "learning_rate": 6.0169752410484055e-05, "loss": 1.4453, "step": 26856 }, { "epoch": 2.11, "learning_rate": 6.015985446749973e-05, "loss": 1.4459, "step": 26857 }, { "epoch": 2.11, "learning_rate": 6.014995713448048e-05, "loss": 1.469, "step": 26858 }, { "epoch": 2.11, "learning_rate": 6.0140060411493425e-05, "loss": 1.4246, "step": 26859 }, { "epoch": 2.11, "learning_rate": 6.013016429860572e-05, "loss": 1.4535, "step": 26860 }, { "epoch": 2.11, "learning_rate": 6.0120268795884666e-05, "loss": 1.4324, "step": 26861 }, { "epoch": 2.11, "learning_rate": 6.011037390339738e-05, "loss": 1.3968, "step": 26862 }, { "epoch": 2.11, "learning_rate": 6.0100479621211e-05, "loss": 1.408, "step": 26863 }, { "epoch": 2.11, "learning_rate": 6.009058594939281e-05, "loss": 1.4342, "step": 26864 }, { "epoch": 2.11, "learning_rate": 6.008069288800992e-05, "loss": 1.431, "step": 26865 }, { "epoch": 2.11, "learning_rate": 6.00708004371295e-05, "loss": 1.4649, "step": 26866 }, { "epoch": 2.11, "learning_rate": 6.006090859681862e-05, "loss": 1.4547, "step": 26867 }, { "epoch": 2.11, "learning_rate": 6.0051017367144654e-05, "loss": 1.3959, "step": 26868 }, { "epoch": 2.11, "learning_rate": 6.004112674817462e-05, "loss": 1.4762, "step": 26869 }, { "epoch": 2.11, "learning_rate": 6.003123673997571e-05, "loss": 1.4862, "step": 26870 }, { "epoch": 2.11, "learning_rate": 6.002134734261499e-05, "loss": 1.4487, "step": 26871 }, { "epoch": 2.11, "learning_rate": 6.001145855615972e-05, "loss": 1.4827, "step": 26872 }, { "epoch": 2.11, "learning_rate": 6.000157038067698e-05, "loss": 1.418, "step": 26873 }, { "epoch": 2.11, "learning_rate": 5.9991682816233875e-05, "loss": 1.4418, "step": 26874 }, { "epoch": 2.11, "learning_rate": 5.9981795862897626e-05, "loss": 1.4815, "step": 26875 }, { "epoch": 2.11, "learning_rate": 5.997190952073528e-05, "loss": 1.4397, "step": 26876 }, { "epoch": 2.11, "learning_rate": 5.996202378981397e-05, "loss": 1.3879, "step": 26877 }, { "epoch": 2.11, "learning_rate": 5.9952138670200856e-05, "loss": 1.4393, "step": 26878 }, { "epoch": 2.11, "learning_rate": 5.9942254161963045e-05, "loss": 1.4496, "step": 26879 }, { "epoch": 2.11, "learning_rate": 5.993237026516758e-05, "loss": 1.4736, "step": 26880 }, { "epoch": 2.12, "learning_rate": 5.992248697988166e-05, "loss": 1.4365, "step": 26881 }, { "epoch": 2.12, "learning_rate": 5.991260430617234e-05, "loss": 1.4561, "step": 26882 }, { "epoch": 2.12, "learning_rate": 5.9902722244106674e-05, "loss": 1.4174, "step": 26883 }, { "epoch": 2.12, "learning_rate": 5.989284079375181e-05, "loss": 1.4648, "step": 26884 }, { "epoch": 2.12, "learning_rate": 5.9882959955174874e-05, "loss": 1.4571, "step": 26885 }, { "epoch": 2.12, "learning_rate": 5.987307972844293e-05, "loss": 1.46, "step": 26886 }, { "epoch": 2.12, "learning_rate": 5.9863200113623025e-05, "loss": 1.4948, "step": 26887 }, { "epoch": 2.12, "learning_rate": 5.985332111078218e-05, "loss": 1.4555, "step": 26888 }, { "epoch": 2.12, "learning_rate": 5.984344271998762e-05, "loss": 1.4595, "step": 26889 }, { "epoch": 2.12, "learning_rate": 5.983356494130632e-05, "loss": 1.4406, "step": 26890 }, { "epoch": 2.12, "learning_rate": 5.9823687774805295e-05, "loss": 1.4682, "step": 26891 }, { "epoch": 2.12, "learning_rate": 5.981381122055172e-05, "loss": 1.4646, "step": 26892 }, { "epoch": 2.12, "learning_rate": 5.980393527861261e-05, "loss": 1.496, "step": 26893 }, { "epoch": 2.12, "learning_rate": 5.9794059949054954e-05, "loss": 1.4664, "step": 26894 }, { "epoch": 2.12, "learning_rate": 5.97841852319459e-05, "loss": 1.4553, "step": 26895 }, { "epoch": 2.12, "learning_rate": 5.977431112735243e-05, "loss": 1.5042, "step": 26896 }, { "epoch": 2.12, "learning_rate": 5.976443763534155e-05, "loss": 1.4294, "step": 26897 }, { "epoch": 2.12, "learning_rate": 5.975456475598035e-05, "loss": 1.4579, "step": 26898 }, { "epoch": 2.12, "learning_rate": 5.9744692489335896e-05, "loss": 1.4247, "step": 26899 }, { "epoch": 2.12, "learning_rate": 5.973482083547518e-05, "loss": 1.4495, "step": 26900 }, { "epoch": 2.12, "learning_rate": 5.972494979446516e-05, "loss": 1.5311, "step": 26901 }, { "epoch": 2.12, "learning_rate": 5.9715079366372984e-05, "loss": 1.4634, "step": 26902 }, { "epoch": 2.12, "learning_rate": 5.970520955126557e-05, "loss": 1.4611, "step": 26903 }, { "epoch": 2.12, "learning_rate": 5.969534034920991e-05, "loss": 1.4431, "step": 26904 }, { "epoch": 2.12, "learning_rate": 5.968547176027313e-05, "loss": 1.465, "step": 26905 }, { "epoch": 2.12, "learning_rate": 5.967560378452213e-05, "loss": 1.4335, "step": 26906 }, { "epoch": 2.12, "learning_rate": 5.9665736422023946e-05, "loss": 1.4708, "step": 26907 }, { "epoch": 2.12, "learning_rate": 5.965586967284551e-05, "loss": 1.4932, "step": 26908 }, { "epoch": 2.12, "learning_rate": 5.964600353705391e-05, "loss": 1.482, "step": 26909 }, { "epoch": 2.12, "learning_rate": 5.9636138014716087e-05, "loss": 1.4573, "step": 26910 }, { "epoch": 2.12, "learning_rate": 5.962627310589896e-05, "loss": 1.4864, "step": 26911 }, { "epoch": 2.12, "learning_rate": 5.961640881066963e-05, "loss": 1.4803, "step": 26912 }, { "epoch": 2.12, "learning_rate": 5.960654512909499e-05, "loss": 1.4366, "step": 26913 }, { "epoch": 2.12, "learning_rate": 5.9596682061242e-05, "loss": 1.4655, "step": 26914 }, { "epoch": 2.12, "learning_rate": 5.958681960717763e-05, "loss": 1.4809, "step": 26915 }, { "epoch": 2.12, "learning_rate": 5.957695776696892e-05, "loss": 1.4473, "step": 26916 }, { "epoch": 2.12, "learning_rate": 5.956709654068276e-05, "loss": 1.49, "step": 26917 }, { "epoch": 2.12, "learning_rate": 5.955723592838607e-05, "loss": 1.4787, "step": 26918 }, { "epoch": 2.12, "learning_rate": 5.954737593014588e-05, "loss": 1.4459, "step": 26919 }, { "epoch": 2.12, "learning_rate": 5.95375165460291e-05, "loss": 1.4729, "step": 26920 }, { "epoch": 2.12, "learning_rate": 5.9527657776102596e-05, "loss": 1.4641, "step": 26921 }, { "epoch": 2.12, "learning_rate": 5.951779962043343e-05, "loss": 1.4835, "step": 26922 }, { "epoch": 2.12, "learning_rate": 5.950794207908847e-05, "loss": 1.4582, "step": 26923 }, { "epoch": 2.12, "learning_rate": 5.949808515213465e-05, "loss": 1.4249, "step": 26924 }, { "epoch": 2.12, "learning_rate": 5.948822883963883e-05, "loss": 1.4361, "step": 26925 }, { "epoch": 2.12, "learning_rate": 5.947837314166804e-05, "loss": 1.452, "step": 26926 }, { "epoch": 2.12, "learning_rate": 5.9468518058289146e-05, "loss": 1.4558, "step": 26927 }, { "epoch": 2.12, "learning_rate": 5.945866358956899e-05, "loss": 1.4652, "step": 26928 }, { "epoch": 2.12, "learning_rate": 5.944880973557462e-05, "loss": 1.4397, "step": 26929 }, { "epoch": 2.12, "learning_rate": 5.9438956496372784e-05, "loss": 1.4553, "step": 26930 }, { "epoch": 2.12, "learning_rate": 5.9429103872030534e-05, "loss": 1.4857, "step": 26931 }, { "epoch": 2.12, "learning_rate": 5.941925186261462e-05, "loss": 1.4443, "step": 26932 }, { "epoch": 2.12, "learning_rate": 5.940940046819205e-05, "loss": 1.4266, "step": 26933 }, { "epoch": 2.12, "learning_rate": 5.939954968882966e-05, "loss": 1.401, "step": 26934 }, { "epoch": 2.12, "learning_rate": 5.938969952459429e-05, "loss": 1.4706, "step": 26935 }, { "epoch": 2.12, "learning_rate": 5.93798499755529e-05, "loss": 1.5073, "step": 26936 }, { "epoch": 2.12, "learning_rate": 5.9370001041772316e-05, "loss": 1.4676, "step": 26937 }, { "epoch": 2.12, "learning_rate": 5.936015272331938e-05, "loss": 1.493, "step": 26938 }, { "epoch": 2.12, "learning_rate": 5.935030502026102e-05, "loss": 1.4458, "step": 26939 }, { "epoch": 2.12, "learning_rate": 5.934045793266406e-05, "loss": 1.4494, "step": 26940 }, { "epoch": 2.12, "learning_rate": 5.9330611460595376e-05, "loss": 1.4478, "step": 26941 }, { "epoch": 2.12, "learning_rate": 5.932076560412174e-05, "loss": 1.5166, "step": 26942 }, { "epoch": 2.12, "learning_rate": 5.931092036331012e-05, "loss": 1.4558, "step": 26943 }, { "epoch": 2.12, "learning_rate": 5.930107573822732e-05, "loss": 1.461, "step": 26944 }, { "epoch": 2.12, "learning_rate": 5.9291231728940106e-05, "loss": 1.4722, "step": 26945 }, { "epoch": 2.12, "learning_rate": 5.9281388335515346e-05, "loss": 1.4091, "step": 26946 }, { "epoch": 2.12, "learning_rate": 5.927154555801998e-05, "loss": 1.4797, "step": 26947 }, { "epoch": 2.12, "learning_rate": 5.926170339652073e-05, "loss": 1.4295, "step": 26948 }, { "epoch": 2.12, "learning_rate": 5.92518618510844e-05, "loss": 1.4632, "step": 26949 }, { "epoch": 2.12, "learning_rate": 5.924202092177791e-05, "loss": 1.4639, "step": 26950 }, { "epoch": 2.12, "learning_rate": 5.9232180608667986e-05, "loss": 1.4219, "step": 26951 }, { "epoch": 2.12, "learning_rate": 5.9222340911821433e-05, "loss": 1.4335, "step": 26952 }, { "epoch": 2.12, "learning_rate": 5.921250183130514e-05, "loss": 1.4671, "step": 26953 }, { "epoch": 2.12, "learning_rate": 5.920266336718585e-05, "loss": 1.4107, "step": 26954 }, { "epoch": 2.12, "learning_rate": 5.919282551953034e-05, "loss": 1.5062, "step": 26955 }, { "epoch": 2.12, "learning_rate": 5.918298828840546e-05, "loss": 1.4407, "step": 26956 }, { "epoch": 2.12, "learning_rate": 5.9173151673877983e-05, "loss": 1.4686, "step": 26957 }, { "epoch": 2.12, "learning_rate": 5.916331567601464e-05, "loss": 1.4507, "step": 26958 }, { "epoch": 2.12, "learning_rate": 5.91534802948823e-05, "loss": 1.4667, "step": 26959 }, { "epoch": 2.12, "learning_rate": 5.9143645530547676e-05, "loss": 1.4661, "step": 26960 }, { "epoch": 2.12, "learning_rate": 5.913381138307754e-05, "loss": 1.447, "step": 26961 }, { "epoch": 2.12, "learning_rate": 5.912397785253866e-05, "loss": 1.4467, "step": 26962 }, { "epoch": 2.12, "learning_rate": 5.911414493899787e-05, "loss": 1.5049, "step": 26963 }, { "epoch": 2.12, "learning_rate": 5.910431264252191e-05, "loss": 1.4286, "step": 26964 }, { "epoch": 2.12, "learning_rate": 5.9094480963177475e-05, "loss": 1.4703, "step": 26965 }, { "epoch": 2.12, "learning_rate": 5.908464990103132e-05, "loss": 1.4551, "step": 26966 }, { "epoch": 2.12, "learning_rate": 5.9074819456150265e-05, "loss": 1.4593, "step": 26967 }, { "epoch": 2.12, "learning_rate": 5.906498962860099e-05, "loss": 1.4228, "step": 26968 }, { "epoch": 2.12, "learning_rate": 5.905516041845023e-05, "loss": 1.4302, "step": 26969 }, { "epoch": 2.12, "learning_rate": 5.9045331825764784e-05, "loss": 1.4593, "step": 26970 }, { "epoch": 2.12, "learning_rate": 5.903550385061134e-05, "loss": 1.4495, "step": 26971 }, { "epoch": 2.12, "learning_rate": 5.902567649305658e-05, "loss": 1.5098, "step": 26972 }, { "epoch": 2.12, "learning_rate": 5.901584975316732e-05, "loss": 1.4301, "step": 26973 }, { "epoch": 2.12, "learning_rate": 5.900602363101023e-05, "loss": 1.4585, "step": 26974 }, { "epoch": 2.12, "learning_rate": 5.899619812665197e-05, "loss": 1.403, "step": 26975 }, { "epoch": 2.12, "learning_rate": 5.898637324015936e-05, "loss": 1.478, "step": 26976 }, { "epoch": 2.12, "learning_rate": 5.8976548971599e-05, "loss": 1.4594, "step": 26977 }, { "epoch": 2.12, "learning_rate": 5.89667253210377e-05, "loss": 1.4218, "step": 26978 }, { "epoch": 2.12, "learning_rate": 5.8956902288542034e-05, "loss": 1.468, "step": 26979 }, { "epoch": 2.12, "learning_rate": 5.8947079874178814e-05, "loss": 1.4653, "step": 26980 }, { "epoch": 2.12, "learning_rate": 5.893725807801469e-05, "loss": 1.4963, "step": 26981 }, { "epoch": 2.12, "learning_rate": 5.892743690011631e-05, "loss": 1.4131, "step": 26982 }, { "epoch": 2.12, "learning_rate": 5.8917616340550325e-05, "loss": 1.5062, "step": 26983 }, { "epoch": 2.12, "learning_rate": 5.8907796399383523e-05, "loss": 1.4741, "step": 26984 }, { "epoch": 2.12, "learning_rate": 5.889797707668251e-05, "loss": 1.4978, "step": 26985 }, { "epoch": 2.12, "learning_rate": 5.888815837251391e-05, "loss": 1.3676, "step": 26986 }, { "epoch": 2.12, "learning_rate": 5.88783402869445e-05, "loss": 1.4684, "step": 26987 }, { "epoch": 2.12, "learning_rate": 5.8868522820040854e-05, "loss": 1.508, "step": 26988 }, { "epoch": 2.12, "learning_rate": 5.885870597186959e-05, "loss": 1.5134, "step": 26989 }, { "epoch": 2.12, "learning_rate": 5.884888974249749e-05, "loss": 1.4643, "step": 26990 }, { "epoch": 2.12, "learning_rate": 5.883907413199112e-05, "loss": 1.4652, "step": 26991 }, { "epoch": 2.12, "learning_rate": 5.882925914041708e-05, "loss": 1.4091, "step": 26992 }, { "epoch": 2.12, "learning_rate": 5.881944476784204e-05, "loss": 1.4547, "step": 26993 }, { "epoch": 2.12, "learning_rate": 5.8809631014332724e-05, "loss": 1.4487, "step": 26994 }, { "epoch": 2.12, "learning_rate": 5.879981787995569e-05, "loss": 1.4429, "step": 26995 }, { "epoch": 2.12, "learning_rate": 5.87900053647775e-05, "loss": 1.4331, "step": 26996 }, { "epoch": 2.12, "learning_rate": 5.8780193468864894e-05, "loss": 1.4858, "step": 26997 }, { "epoch": 2.12, "learning_rate": 5.8770382192284454e-05, "loss": 1.4595, "step": 26998 }, { "epoch": 2.12, "learning_rate": 5.8760571535102746e-05, "loss": 1.4911, "step": 26999 }, { "epoch": 2.12, "learning_rate": 5.8750761497386366e-05, "loss": 1.4358, "step": 27000 }, { "epoch": 2.12, "learning_rate": 5.8740952079202033e-05, "loss": 1.4759, "step": 27001 }, { "epoch": 2.12, "learning_rate": 5.873114328061625e-05, "loss": 1.4858, "step": 27002 }, { "epoch": 2.12, "learning_rate": 5.872133510169559e-05, "loss": 1.4655, "step": 27003 }, { "epoch": 2.12, "learning_rate": 5.871152754250674e-05, "loss": 1.4684, "step": 27004 }, { "epoch": 2.12, "learning_rate": 5.870172060311626e-05, "loss": 1.4458, "step": 27005 }, { "epoch": 2.12, "learning_rate": 5.8691914283590654e-05, "loss": 1.3995, "step": 27006 }, { "epoch": 2.12, "learning_rate": 5.86821085839966e-05, "loss": 1.4587, "step": 27007 }, { "epoch": 2.13, "learning_rate": 5.8672303504400604e-05, "loss": 1.465, "step": 27008 }, { "epoch": 2.13, "learning_rate": 5.866249904486931e-05, "loss": 1.4327, "step": 27009 }, { "epoch": 2.13, "learning_rate": 5.865269520546919e-05, "loss": 1.4464, "step": 27010 }, { "epoch": 2.13, "learning_rate": 5.864289198626691e-05, "loss": 1.4797, "step": 27011 }, { "epoch": 2.13, "learning_rate": 5.863308938732897e-05, "loss": 1.458, "step": 27012 }, { "epoch": 2.13, "learning_rate": 5.862328740872191e-05, "loss": 1.4241, "step": 27013 }, { "epoch": 2.13, "learning_rate": 5.861348605051233e-05, "loss": 1.4754, "step": 27014 }, { "epoch": 2.13, "learning_rate": 5.8603685312766755e-05, "loss": 1.4611, "step": 27015 }, { "epoch": 2.13, "learning_rate": 5.8593885195551665e-05, "loss": 1.4739, "step": 27016 }, { "epoch": 2.13, "learning_rate": 5.8584085698933715e-05, "loss": 1.4808, "step": 27017 }, { "epoch": 2.13, "learning_rate": 5.857428682297937e-05, "loss": 1.5123, "step": 27018 }, { "epoch": 2.13, "learning_rate": 5.856448856775515e-05, "loss": 1.4517, "step": 27019 }, { "epoch": 2.13, "learning_rate": 5.855469093332757e-05, "loss": 1.4048, "step": 27020 }, { "epoch": 2.13, "learning_rate": 5.854489391976321e-05, "loss": 1.4372, "step": 27021 }, { "epoch": 2.13, "learning_rate": 5.853509752712855e-05, "loss": 1.4501, "step": 27022 }, { "epoch": 2.13, "learning_rate": 5.8525301755490054e-05, "loss": 1.4744, "step": 27023 }, { "epoch": 2.13, "learning_rate": 5.851550660491428e-05, "loss": 1.3978, "step": 27024 }, { "epoch": 2.13, "learning_rate": 5.850571207546779e-05, "loss": 1.4869, "step": 27025 }, { "epoch": 2.13, "learning_rate": 5.849591816721702e-05, "loss": 1.4823, "step": 27026 }, { "epoch": 2.13, "learning_rate": 5.8486124880228414e-05, "loss": 1.4361, "step": 27027 }, { "epoch": 2.13, "learning_rate": 5.847633221456856e-05, "loss": 1.4536, "step": 27028 }, { "epoch": 2.13, "learning_rate": 5.8466540170303925e-05, "loss": 1.4482, "step": 27029 }, { "epoch": 2.13, "learning_rate": 5.845674874750091e-05, "loss": 1.4559, "step": 27030 }, { "epoch": 2.13, "learning_rate": 5.84469579462261e-05, "loss": 1.5109, "step": 27031 }, { "epoch": 2.13, "learning_rate": 5.8437167766545925e-05, "loss": 1.4894, "step": 27032 }, { "epoch": 2.13, "learning_rate": 5.84273782085268e-05, "loss": 1.4531, "step": 27033 }, { "epoch": 2.13, "learning_rate": 5.8417589272235296e-05, "loss": 1.4589, "step": 27034 }, { "epoch": 2.13, "learning_rate": 5.840780095773782e-05, "loss": 1.5049, "step": 27035 }, { "epoch": 2.13, "learning_rate": 5.839801326510083e-05, "loss": 1.4677, "step": 27036 }, { "epoch": 2.13, "learning_rate": 5.838822619439073e-05, "loss": 1.4951, "step": 27037 }, { "epoch": 2.13, "learning_rate": 5.8378439745674074e-05, "loss": 1.4249, "step": 27038 }, { "epoch": 2.13, "learning_rate": 5.836865391901725e-05, "loss": 1.4443, "step": 27039 }, { "epoch": 2.13, "learning_rate": 5.8358868714486644e-05, "loss": 1.443, "step": 27040 }, { "epoch": 2.13, "learning_rate": 5.834908413214874e-05, "loss": 1.4644, "step": 27041 }, { "epoch": 2.13, "learning_rate": 5.833930017207004e-05, "loss": 1.4403, "step": 27042 }, { "epoch": 2.13, "learning_rate": 5.832951683431692e-05, "loss": 1.4523, "step": 27043 }, { "epoch": 2.13, "learning_rate": 5.831973411895572e-05, "loss": 1.4424, "step": 27044 }, { "epoch": 2.13, "learning_rate": 5.830995202605298e-05, "loss": 1.4776, "step": 27045 }, { "epoch": 2.13, "learning_rate": 5.8300170555675087e-05, "loss": 1.4388, "step": 27046 }, { "epoch": 2.13, "learning_rate": 5.829038970788838e-05, "loss": 1.4373, "step": 27047 }, { "epoch": 2.13, "learning_rate": 5.828060948275935e-05, "loss": 1.4793, "step": 27048 }, { "epoch": 2.13, "learning_rate": 5.8270829880354394e-05, "loss": 1.4632, "step": 27049 }, { "epoch": 2.13, "learning_rate": 5.82610509007398e-05, "loss": 1.4227, "step": 27050 }, { "epoch": 2.13, "learning_rate": 5.8251272543982115e-05, "loss": 1.4793, "step": 27051 }, { "epoch": 2.13, "learning_rate": 5.8241494810147656e-05, "loss": 1.4823, "step": 27052 }, { "epoch": 2.13, "learning_rate": 5.8231717699302805e-05, "loss": 1.4874, "step": 27053 }, { "epoch": 2.13, "learning_rate": 5.822194121151391e-05, "loss": 1.4836, "step": 27054 }, { "epoch": 2.13, "learning_rate": 5.8212165346847424e-05, "loss": 1.5146, "step": 27055 }, { "epoch": 2.13, "learning_rate": 5.8202390105369634e-05, "loss": 1.4302, "step": 27056 }, { "epoch": 2.13, "learning_rate": 5.819261548714696e-05, "loss": 1.4753, "step": 27057 }, { "epoch": 2.13, "learning_rate": 5.818284149224581e-05, "loss": 1.5221, "step": 27058 }, { "epoch": 2.13, "learning_rate": 5.8173068120732505e-05, "loss": 1.3962, "step": 27059 }, { "epoch": 2.13, "learning_rate": 5.816329537267341e-05, "loss": 1.51, "step": 27060 }, { "epoch": 2.13, "learning_rate": 5.815352324813477e-05, "loss": 1.4771, "step": 27061 }, { "epoch": 2.13, "learning_rate": 5.8143751747183094e-05, "loss": 1.5091, "step": 27062 }, { "epoch": 2.13, "learning_rate": 5.813398086988466e-05, "loss": 1.442, "step": 27063 }, { "epoch": 2.13, "learning_rate": 5.812421061630574e-05, "loss": 1.462, "step": 27064 }, { "epoch": 2.13, "learning_rate": 5.8114440986512775e-05, "loss": 1.4809, "step": 27065 }, { "epoch": 2.13, "learning_rate": 5.8104671980572056e-05, "loss": 1.4367, "step": 27066 }, { "epoch": 2.13, "learning_rate": 5.8094903598549855e-05, "loss": 1.5339, "step": 27067 }, { "epoch": 2.13, "learning_rate": 5.808513584051258e-05, "loss": 1.4809, "step": 27068 }, { "epoch": 2.13, "learning_rate": 5.807536870652652e-05, "loss": 1.4545, "step": 27069 }, { "epoch": 2.13, "learning_rate": 5.806560219665792e-05, "loss": 1.4615, "step": 27070 }, { "epoch": 2.13, "learning_rate": 5.805583631097315e-05, "loss": 1.4979, "step": 27071 }, { "epoch": 2.13, "learning_rate": 5.804607104953857e-05, "loss": 1.4864, "step": 27072 }, { "epoch": 2.13, "learning_rate": 5.8036306412420405e-05, "loss": 1.4267, "step": 27073 }, { "epoch": 2.13, "learning_rate": 5.8026542399684936e-05, "loss": 1.4676, "step": 27074 }, { "epoch": 2.13, "learning_rate": 5.801677901139855e-05, "loss": 1.4619, "step": 27075 }, { "epoch": 2.13, "learning_rate": 5.800701624762746e-05, "loss": 1.4532, "step": 27076 }, { "epoch": 2.13, "learning_rate": 5.799725410843796e-05, "loss": 1.4252, "step": 27077 }, { "epoch": 2.13, "learning_rate": 5.7987492593896275e-05, "loss": 1.434, "step": 27078 }, { "epoch": 2.13, "learning_rate": 5.7977731704068806e-05, "loss": 1.4241, "step": 27079 }, { "epoch": 2.13, "learning_rate": 5.796797143902174e-05, "loss": 1.4824, "step": 27080 }, { "epoch": 2.13, "learning_rate": 5.795821179882132e-05, "loss": 1.4433, "step": 27081 }, { "epoch": 2.13, "learning_rate": 5.7948452783533914e-05, "loss": 1.4817, "step": 27082 }, { "epoch": 2.13, "learning_rate": 5.79386943932257e-05, "loss": 1.4245, "step": 27083 }, { "epoch": 2.13, "learning_rate": 5.7928936627962904e-05, "loss": 1.3966, "step": 27084 }, { "epoch": 2.13, "learning_rate": 5.791917948781185e-05, "loss": 1.4252, "step": 27085 }, { "epoch": 2.13, "learning_rate": 5.790942297283878e-05, "loss": 1.4571, "step": 27086 }, { "epoch": 2.13, "learning_rate": 5.789966708310984e-05, "loss": 1.4312, "step": 27087 }, { "epoch": 2.13, "learning_rate": 5.788991181869134e-05, "loss": 1.4545, "step": 27088 }, { "epoch": 2.13, "learning_rate": 5.788015717964956e-05, "loss": 1.4625, "step": 27089 }, { "epoch": 2.13, "learning_rate": 5.7870403166050674e-05, "loss": 1.4477, "step": 27090 }, { "epoch": 2.13, "learning_rate": 5.786064977796085e-05, "loss": 1.4534, "step": 27091 }, { "epoch": 2.13, "learning_rate": 5.785089701544644e-05, "loss": 1.4206, "step": 27092 }, { "epoch": 2.13, "learning_rate": 5.7841144878573565e-05, "loss": 1.4171, "step": 27093 }, { "epoch": 2.13, "learning_rate": 5.783139336740847e-05, "loss": 1.4161, "step": 27094 }, { "epoch": 2.13, "learning_rate": 5.78216424820173e-05, "loss": 1.3806, "step": 27095 }, { "epoch": 2.13, "learning_rate": 5.781189222246637e-05, "loss": 1.4987, "step": 27096 }, { "epoch": 2.13, "learning_rate": 5.7802142588821806e-05, "loss": 1.4425, "step": 27097 }, { "epoch": 2.13, "learning_rate": 5.779239358114976e-05, "loss": 1.4802, "step": 27098 }, { "epoch": 2.13, "learning_rate": 5.778264519951654e-05, "loss": 1.4203, "step": 27099 }, { "epoch": 2.13, "learning_rate": 5.7772897443988266e-05, "loss": 1.4832, "step": 27100 }, { "epoch": 2.13, "learning_rate": 5.776315031463106e-05, "loss": 1.4261, "step": 27101 }, { "epoch": 2.13, "learning_rate": 5.775340381151123e-05, "loss": 1.5116, "step": 27102 }, { "epoch": 2.13, "learning_rate": 5.774365793469482e-05, "loss": 1.4642, "step": 27103 }, { "epoch": 2.13, "learning_rate": 5.7733912684248115e-05, "loss": 1.4629, "step": 27104 }, { "epoch": 2.13, "learning_rate": 5.7724168060237186e-05, "loss": 1.4911, "step": 27105 }, { "epoch": 2.13, "learning_rate": 5.7714424062728275e-05, "loss": 1.4637, "step": 27106 }, { "epoch": 2.13, "learning_rate": 5.77046806917875e-05, "loss": 1.4182, "step": 27107 }, { "epoch": 2.13, "learning_rate": 5.769493794748095e-05, "loss": 1.4455, "step": 27108 }, { "epoch": 2.13, "learning_rate": 5.7685195829874886e-05, "loss": 1.4486, "step": 27109 }, { "epoch": 2.13, "learning_rate": 5.7675454339035414e-05, "loss": 1.442, "step": 27110 }, { "epoch": 2.13, "learning_rate": 5.766571347502865e-05, "loss": 1.4889, "step": 27111 }, { "epoch": 2.13, "learning_rate": 5.765597323792068e-05, "loss": 1.5033, "step": 27112 }, { "epoch": 2.13, "learning_rate": 5.764623362777776e-05, "loss": 1.4208, "step": 27113 }, { "epoch": 2.13, "learning_rate": 5.763649464466593e-05, "loss": 1.4645, "step": 27114 }, { "epoch": 2.13, "learning_rate": 5.7626756288651286e-05, "loss": 1.5335, "step": 27115 }, { "epoch": 2.13, "learning_rate": 5.761701855980004e-05, "loss": 1.4643, "step": 27116 }, { "epoch": 2.13, "learning_rate": 5.7607281458178256e-05, "loss": 1.403, "step": 27117 }, { "epoch": 2.13, "learning_rate": 5.7597544983852e-05, "loss": 1.4031, "step": 27118 }, { "epoch": 2.13, "learning_rate": 5.758780913688742e-05, "loss": 1.4602, "step": 27119 }, { "epoch": 2.13, "learning_rate": 5.757807391735066e-05, "loss": 1.522, "step": 27120 }, { "epoch": 2.13, "learning_rate": 5.756833932530779e-05, "loss": 1.4805, "step": 27121 }, { "epoch": 2.13, "learning_rate": 5.755860536082482e-05, "loss": 1.4152, "step": 27122 }, { "epoch": 2.13, "learning_rate": 5.7548872023967974e-05, "loss": 1.4557, "step": 27123 }, { "epoch": 2.13, "learning_rate": 5.753913931480327e-05, "loss": 1.4562, "step": 27124 }, { "epoch": 2.13, "learning_rate": 5.752940723339672e-05, "loss": 1.4991, "step": 27125 }, { "epoch": 2.13, "learning_rate": 5.751967577981452e-05, "loss": 1.4257, "step": 27126 }, { "epoch": 2.13, "learning_rate": 5.75099449541227e-05, "loss": 1.4941, "step": 27127 }, { "epoch": 2.13, "learning_rate": 5.750021475638725e-05, "loss": 1.5313, "step": 27128 }, { "epoch": 2.13, "learning_rate": 5.7490485186674346e-05, "loss": 1.4647, "step": 27129 }, { "epoch": 2.13, "learning_rate": 5.7480756245050006e-05, "loss": 1.4946, "step": 27130 }, { "epoch": 2.13, "learning_rate": 5.7471027931580266e-05, "loss": 1.4743, "step": 27131 }, { "epoch": 2.13, "learning_rate": 5.746130024633113e-05, "loss": 1.4775, "step": 27132 }, { "epoch": 2.13, "learning_rate": 5.7451573189368774e-05, "loss": 1.4541, "step": 27133 }, { "epoch": 2.13, "learning_rate": 5.744184676075908e-05, "loss": 1.4587, "step": 27134 }, { "epoch": 2.14, "learning_rate": 5.743212096056824e-05, "loss": 1.513, "step": 27135 }, { "epoch": 2.14, "learning_rate": 5.742239578886216e-05, "loss": 1.4379, "step": 27136 }, { "epoch": 2.14, "learning_rate": 5.7412671245706966e-05, "loss": 1.4389, "step": 27137 }, { "epoch": 2.14, "learning_rate": 5.740294733116866e-05, "loss": 1.4523, "step": 27138 }, { "epoch": 2.14, "learning_rate": 5.7393224045313176e-05, "loss": 1.4587, "step": 27139 }, { "epoch": 2.14, "learning_rate": 5.7383501388206645e-05, "loss": 1.4225, "step": 27140 }, { "epoch": 2.14, "learning_rate": 5.7373779359915045e-05, "loss": 1.4708, "step": 27141 }, { "epoch": 2.14, "learning_rate": 5.73640579605043e-05, "loss": 1.4128, "step": 27142 }, { "epoch": 2.14, "learning_rate": 5.735433719004054e-05, "loss": 1.4464, "step": 27143 }, { "epoch": 2.14, "learning_rate": 5.7344617048589706e-05, "loss": 1.4844, "step": 27144 }, { "epoch": 2.14, "learning_rate": 5.7334897536217735e-05, "loss": 1.4422, "step": 27145 }, { "epoch": 2.14, "learning_rate": 5.732517865299073e-05, "loss": 1.4046, "step": 27146 }, { "epoch": 2.14, "learning_rate": 5.73154603989746e-05, "loss": 1.5025, "step": 27147 }, { "epoch": 2.14, "learning_rate": 5.730574277423536e-05, "loss": 1.4554, "step": 27148 }, { "epoch": 2.14, "learning_rate": 5.729602577883893e-05, "loss": 1.4344, "step": 27149 }, { "epoch": 2.14, "learning_rate": 5.7286309412851325e-05, "loss": 1.472, "step": 27150 }, { "epoch": 2.14, "learning_rate": 5.7276593676338563e-05, "loss": 1.4339, "step": 27151 }, { "epoch": 2.14, "learning_rate": 5.726687856936657e-05, "loss": 1.4988, "step": 27152 }, { "epoch": 2.14, "learning_rate": 5.7257164092001235e-05, "loss": 1.4222, "step": 27153 }, { "epoch": 2.14, "learning_rate": 5.7247450244308615e-05, "loss": 1.4461, "step": 27154 }, { "epoch": 2.14, "learning_rate": 5.723773702635465e-05, "loss": 1.4247, "step": 27155 }, { "epoch": 2.14, "learning_rate": 5.7228024438205184e-05, "loss": 1.483, "step": 27156 }, { "epoch": 2.14, "learning_rate": 5.721831247992631e-05, "loss": 1.4499, "step": 27157 }, { "epoch": 2.14, "learning_rate": 5.7208601151583874e-05, "loss": 1.4842, "step": 27158 }, { "epoch": 2.14, "learning_rate": 5.7198890453243784e-05, "loss": 1.4122, "step": 27159 }, { "epoch": 2.14, "learning_rate": 5.718918038497208e-05, "loss": 1.4824, "step": 27160 }, { "epoch": 2.14, "learning_rate": 5.71794709468346e-05, "loss": 1.4745, "step": 27161 }, { "epoch": 2.14, "learning_rate": 5.716976213889726e-05, "loss": 1.4854, "step": 27162 }, { "epoch": 2.14, "learning_rate": 5.7160053961226046e-05, "loss": 1.5423, "step": 27163 }, { "epoch": 2.14, "learning_rate": 5.715034641388684e-05, "loss": 1.4465, "step": 27164 }, { "epoch": 2.14, "learning_rate": 5.714063949694554e-05, "loss": 1.4466, "step": 27165 }, { "epoch": 2.14, "learning_rate": 5.713093321046795e-05, "loss": 1.4263, "step": 27166 }, { "epoch": 2.14, "learning_rate": 5.712122755452018e-05, "loss": 1.4939, "step": 27167 }, { "epoch": 2.14, "learning_rate": 5.711152252916801e-05, "loss": 1.4634, "step": 27168 }, { "epoch": 2.14, "learning_rate": 5.710181813447731e-05, "loss": 1.4487, "step": 27169 }, { "epoch": 2.14, "learning_rate": 5.7092114370514044e-05, "loss": 1.4627, "step": 27170 }, { "epoch": 2.14, "learning_rate": 5.708241123734403e-05, "loss": 1.4376, "step": 27171 }, { "epoch": 2.14, "learning_rate": 5.70727087350332e-05, "loss": 1.482, "step": 27172 }, { "epoch": 2.14, "learning_rate": 5.706300686364731e-05, "loss": 1.4567, "step": 27173 }, { "epoch": 2.14, "learning_rate": 5.70533056232524e-05, "loss": 1.4626, "step": 27174 }, { "epoch": 2.14, "learning_rate": 5.704360501391423e-05, "loss": 1.4547, "step": 27175 }, { "epoch": 2.14, "learning_rate": 5.703390503569865e-05, "loss": 1.444, "step": 27176 }, { "epoch": 2.14, "learning_rate": 5.702420568867158e-05, "loss": 1.4606, "step": 27177 }, { "epoch": 2.14, "learning_rate": 5.701450697289886e-05, "loss": 1.3835, "step": 27178 }, { "epoch": 2.14, "learning_rate": 5.700480888844628e-05, "loss": 1.427, "step": 27179 }, { "epoch": 2.14, "learning_rate": 5.699511143537977e-05, "loss": 1.4621, "step": 27180 }, { "epoch": 2.14, "learning_rate": 5.6985414613765085e-05, "loss": 1.4558, "step": 27181 }, { "epoch": 2.14, "learning_rate": 5.6975718423668153e-05, "loss": 1.3981, "step": 27182 }, { "epoch": 2.14, "learning_rate": 5.696602286515471e-05, "loss": 1.4852, "step": 27183 }, { "epoch": 2.14, "learning_rate": 5.695632793829066e-05, "loss": 1.4367, "step": 27184 }, { "epoch": 2.14, "learning_rate": 5.694663364314183e-05, "loss": 1.4527, "step": 27185 }, { "epoch": 2.14, "learning_rate": 5.693693997977394e-05, "loss": 1.4932, "step": 27186 }, { "epoch": 2.14, "learning_rate": 5.6927246948252915e-05, "loss": 1.4958, "step": 27187 }, { "epoch": 2.14, "learning_rate": 5.691755454864454e-05, "loss": 1.4931, "step": 27188 }, { "epoch": 2.14, "learning_rate": 5.690786278101458e-05, "loss": 1.4834, "step": 27189 }, { "epoch": 2.14, "learning_rate": 5.689817164542883e-05, "loss": 1.4708, "step": 27190 }, { "epoch": 2.14, "learning_rate": 5.688848114195316e-05, "loss": 1.4351, "step": 27191 }, { "epoch": 2.14, "learning_rate": 5.6878791270653316e-05, "loss": 1.4249, "step": 27192 }, { "epoch": 2.14, "learning_rate": 5.686910203159504e-05, "loss": 1.4609, "step": 27193 }, { "epoch": 2.14, "learning_rate": 5.685941342484422e-05, "loss": 1.4299, "step": 27194 }, { "epoch": 2.14, "learning_rate": 5.684972545046659e-05, "loss": 1.5034, "step": 27195 }, { "epoch": 2.14, "learning_rate": 5.6840038108527847e-05, "loss": 1.394, "step": 27196 }, { "epoch": 2.14, "learning_rate": 5.6830351399093854e-05, "loss": 1.4616, "step": 27197 }, { "epoch": 2.14, "learning_rate": 5.682066532223041e-05, "loss": 1.501, "step": 27198 }, { "epoch": 2.14, "learning_rate": 5.681097987800322e-05, "loss": 1.4552, "step": 27199 }, { "epoch": 2.14, "learning_rate": 5.6801295066478006e-05, "loss": 1.4769, "step": 27200 }, { "epoch": 2.14, "learning_rate": 5.6791610887720616e-05, "loss": 1.4454, "step": 27201 }, { "epoch": 2.14, "learning_rate": 5.678192734179676e-05, "loss": 1.403, "step": 27202 }, { "epoch": 2.14, "learning_rate": 5.677224442877211e-05, "loss": 1.4906, "step": 27203 }, { "epoch": 2.14, "learning_rate": 5.676256214871253e-05, "loss": 1.4573, "step": 27204 }, { "epoch": 2.14, "learning_rate": 5.67528805016837e-05, "loss": 1.4453, "step": 27205 }, { "epoch": 2.14, "learning_rate": 5.674319948775136e-05, "loss": 1.4641, "step": 27206 }, { "epoch": 2.14, "learning_rate": 5.6733519106981176e-05, "loss": 1.4609, "step": 27207 }, { "epoch": 2.14, "learning_rate": 5.672383935943898e-05, "loss": 1.4433, "step": 27208 }, { "epoch": 2.14, "learning_rate": 5.6714160245190435e-05, "loss": 1.4501, "step": 27209 }, { "epoch": 2.14, "learning_rate": 5.670448176430123e-05, "loss": 1.4519, "step": 27210 }, { "epoch": 2.14, "learning_rate": 5.669480391683714e-05, "loss": 1.4405, "step": 27211 }, { "epoch": 2.14, "learning_rate": 5.668512670286385e-05, "loss": 1.4193, "step": 27212 }, { "epoch": 2.14, "learning_rate": 5.6675450122446994e-05, "loss": 1.5023, "step": 27213 }, { "epoch": 2.14, "learning_rate": 5.666577417565234e-05, "loss": 1.4784, "step": 27214 }, { "epoch": 2.14, "learning_rate": 5.6656098862545626e-05, "loss": 1.456, "step": 27215 }, { "epoch": 2.14, "learning_rate": 5.664642418319248e-05, "loss": 1.4333, "step": 27216 }, { "epoch": 2.14, "learning_rate": 5.663675013765855e-05, "loss": 1.4918, "step": 27217 }, { "epoch": 2.14, "learning_rate": 5.662707672600961e-05, "loss": 1.3908, "step": 27218 }, { "epoch": 2.14, "learning_rate": 5.66174039483113e-05, "loss": 1.4674, "step": 27219 }, { "epoch": 2.14, "learning_rate": 5.660773180462923e-05, "loss": 1.5126, "step": 27220 }, { "epoch": 2.14, "learning_rate": 5.659806029502918e-05, "loss": 1.4369, "step": 27221 }, { "epoch": 2.14, "learning_rate": 5.6588389419576766e-05, "loss": 1.462, "step": 27222 }, { "epoch": 2.14, "learning_rate": 5.657871917833761e-05, "loss": 1.4628, "step": 27223 }, { "epoch": 2.14, "learning_rate": 5.656904957137737e-05, "loss": 1.4239, "step": 27224 }, { "epoch": 2.14, "learning_rate": 5.655938059876176e-05, "loss": 1.4566, "step": 27225 }, { "epoch": 2.14, "learning_rate": 5.6549712260556406e-05, "loss": 1.4044, "step": 27226 }, { "epoch": 2.14, "learning_rate": 5.6540044556826874e-05, "loss": 1.4386, "step": 27227 }, { "epoch": 2.14, "learning_rate": 5.653037748763886e-05, "loss": 1.5016, "step": 27228 }, { "epoch": 2.14, "learning_rate": 5.652071105305807e-05, "loss": 1.4427, "step": 27229 }, { "epoch": 2.14, "learning_rate": 5.651104525315005e-05, "loss": 1.4709, "step": 27230 }, { "epoch": 2.14, "learning_rate": 5.65013800879804e-05, "loss": 1.5034, "step": 27231 }, { "epoch": 2.14, "learning_rate": 5.649171555761482e-05, "loss": 1.4305, "step": 27232 }, { "epoch": 2.14, "learning_rate": 5.64820516621189e-05, "loss": 1.4265, "step": 27233 }, { "epoch": 2.14, "learning_rate": 5.647238840155818e-05, "loss": 1.4474, "step": 27234 }, { "epoch": 2.14, "learning_rate": 5.6462725775998405e-05, "loss": 1.3929, "step": 27235 }, { "epoch": 2.14, "learning_rate": 5.6453063785505086e-05, "loss": 1.4856, "step": 27236 }, { "epoch": 2.14, "learning_rate": 5.644340243014378e-05, "loss": 1.4374, "step": 27237 }, { "epoch": 2.14, "learning_rate": 5.643374170998021e-05, "loss": 1.46, "step": 27238 }, { "epoch": 2.14, "learning_rate": 5.64240816250799e-05, "loss": 1.4212, "step": 27239 }, { "epoch": 2.14, "learning_rate": 5.641442217550837e-05, "loss": 1.4714, "step": 27240 }, { "epoch": 2.14, "learning_rate": 5.640476336133134e-05, "loss": 1.4772, "step": 27241 }, { "epoch": 2.14, "learning_rate": 5.639510518261431e-05, "loss": 1.4966, "step": 27242 }, { "epoch": 2.14, "learning_rate": 5.638544763942286e-05, "loss": 1.4051, "step": 27243 }, { "epoch": 2.14, "learning_rate": 5.637579073182245e-05, "loss": 1.4229, "step": 27244 }, { "epoch": 2.14, "learning_rate": 5.6366134459878855e-05, "loss": 1.3949, "step": 27245 }, { "epoch": 2.14, "learning_rate": 5.635647882365755e-05, "loss": 1.4815, "step": 27246 }, { "epoch": 2.14, "learning_rate": 5.634682382322406e-05, "loss": 1.4897, "step": 27247 }, { "epoch": 2.14, "learning_rate": 5.6337169458643914e-05, "loss": 1.4694, "step": 27248 }, { "epoch": 2.14, "learning_rate": 5.632751572998275e-05, "loss": 1.4716, "step": 27249 }, { "epoch": 2.14, "learning_rate": 5.631786263730607e-05, "loss": 1.466, "step": 27250 }, { "epoch": 2.14, "learning_rate": 5.6308210180679336e-05, "loss": 1.4731, "step": 27251 }, { "epoch": 2.14, "learning_rate": 5.629855836016821e-05, "loss": 1.4193, "step": 27252 }, { "epoch": 2.14, "learning_rate": 5.628890717583818e-05, "loss": 1.4728, "step": 27253 }, { "epoch": 2.14, "learning_rate": 5.627925662775468e-05, "loss": 1.4568, "step": 27254 }, { "epoch": 2.14, "learning_rate": 5.6269606715983375e-05, "loss": 1.4518, "step": 27255 }, { "epoch": 2.14, "learning_rate": 5.625995744058971e-05, "loss": 1.42, "step": 27256 }, { "epoch": 2.14, "learning_rate": 5.625030880163915e-05, "loss": 1.4628, "step": 27257 }, { "epoch": 2.14, "learning_rate": 5.6240660799197306e-05, "loss": 1.454, "step": 27258 }, { "epoch": 2.14, "learning_rate": 5.6231013433329655e-05, "loss": 1.4587, "step": 27259 }, { "epoch": 2.14, "learning_rate": 5.62213667041016e-05, "loss": 1.437, "step": 27260 }, { "epoch": 2.14, "learning_rate": 5.621172061157873e-05, "loss": 1.5211, "step": 27261 }, { "epoch": 2.15, "learning_rate": 5.620207515582656e-05, "loss": 1.4807, "step": 27262 }, { "epoch": 2.15, "learning_rate": 5.6192430336910556e-05, "loss": 1.4691, "step": 27263 }, { "epoch": 2.15, "learning_rate": 5.6182786154896165e-05, "loss": 1.4273, "step": 27264 }, { "epoch": 2.15, "learning_rate": 5.6173142609848835e-05, "loss": 1.5012, "step": 27265 }, { "epoch": 2.15, "learning_rate": 5.6163499701834135e-05, "loss": 1.4546, "step": 27266 }, { "epoch": 2.15, "learning_rate": 5.615385743091751e-05, "loss": 1.4866, "step": 27267 }, { "epoch": 2.15, "learning_rate": 5.614421579716434e-05, "loss": 1.4893, "step": 27268 }, { "epoch": 2.15, "learning_rate": 5.6134574800640206e-05, "loss": 1.4457, "step": 27269 }, { "epoch": 2.15, "learning_rate": 5.61249344414105e-05, "loss": 1.4062, "step": 27270 }, { "epoch": 2.15, "learning_rate": 5.611529471954063e-05, "loss": 1.4384, "step": 27271 }, { "epoch": 2.15, "learning_rate": 5.610565563509616e-05, "loss": 1.4578, "step": 27272 }, { "epoch": 2.15, "learning_rate": 5.6096017188142477e-05, "loss": 1.4949, "step": 27273 }, { "epoch": 2.15, "learning_rate": 5.6086379378744956e-05, "loss": 1.4693, "step": 27274 }, { "epoch": 2.15, "learning_rate": 5.607674220696915e-05, "loss": 1.413, "step": 27275 }, { "epoch": 2.15, "learning_rate": 5.606710567288039e-05, "loss": 1.4653, "step": 27276 }, { "epoch": 2.15, "learning_rate": 5.605746977654418e-05, "loss": 1.5028, "step": 27277 }, { "epoch": 2.15, "learning_rate": 5.6047834518025864e-05, "loss": 1.4799, "step": 27278 }, { "epoch": 2.15, "learning_rate": 5.603819989739096e-05, "loss": 1.4582, "step": 27279 }, { "epoch": 2.15, "learning_rate": 5.6028565914704834e-05, "loss": 1.5207, "step": 27280 }, { "epoch": 2.15, "learning_rate": 5.601893257003282e-05, "loss": 1.442, "step": 27281 }, { "epoch": 2.15, "learning_rate": 5.6009299863440446e-05, "loss": 1.4587, "step": 27282 }, { "epoch": 2.15, "learning_rate": 5.599966779499307e-05, "loss": 1.4518, "step": 27283 }, { "epoch": 2.15, "learning_rate": 5.5990036364756066e-05, "loss": 1.4481, "step": 27284 }, { "epoch": 2.15, "learning_rate": 5.598040557279477e-05, "loss": 1.4499, "step": 27285 }, { "epoch": 2.15, "learning_rate": 5.597077541917471e-05, "loss": 1.4222, "step": 27286 }, { "epoch": 2.15, "learning_rate": 5.5961145903961196e-05, "loss": 1.4737, "step": 27287 }, { "epoch": 2.15, "learning_rate": 5.595151702721954e-05, "loss": 1.4929, "step": 27288 }, { "epoch": 2.15, "learning_rate": 5.594188878901524e-05, "loss": 1.4386, "step": 27289 }, { "epoch": 2.15, "learning_rate": 5.593226118941361e-05, "loss": 1.4781, "step": 27290 }, { "epoch": 2.15, "learning_rate": 5.592263422847996e-05, "loss": 1.4835, "step": 27291 }, { "epoch": 2.15, "learning_rate": 5.5913007906279714e-05, "loss": 1.4308, "step": 27292 }, { "epoch": 2.15, "learning_rate": 5.5903382222878283e-05, "loss": 1.4292, "step": 27293 }, { "epoch": 2.15, "learning_rate": 5.589375717834095e-05, "loss": 1.4788, "step": 27294 }, { "epoch": 2.15, "learning_rate": 5.588413277273302e-05, "loss": 1.4049, "step": 27295 }, { "epoch": 2.15, "learning_rate": 5.5874509006119935e-05, "loss": 1.4614, "step": 27296 }, { "epoch": 2.15, "learning_rate": 5.5864885878567e-05, "loss": 1.4551, "step": 27297 }, { "epoch": 2.15, "learning_rate": 5.5855263390139485e-05, "loss": 1.4577, "step": 27298 }, { "epoch": 2.15, "learning_rate": 5.5845641540902845e-05, "loss": 1.4628, "step": 27299 }, { "epoch": 2.15, "learning_rate": 5.583602033092233e-05, "loss": 1.4551, "step": 27300 }, { "epoch": 2.15, "learning_rate": 5.5826399760263274e-05, "loss": 1.4584, "step": 27301 }, { "epoch": 2.15, "learning_rate": 5.581677982899095e-05, "loss": 1.4782, "step": 27302 }, { "epoch": 2.15, "learning_rate": 5.5807160537170745e-05, "loss": 1.4218, "step": 27303 }, { "epoch": 2.15, "learning_rate": 5.579754188486797e-05, "loss": 1.4601, "step": 27304 }, { "epoch": 2.15, "learning_rate": 5.5787923872147824e-05, "loss": 1.4116, "step": 27305 }, { "epoch": 2.15, "learning_rate": 5.5778306499075754e-05, "loss": 1.4156, "step": 27306 }, { "epoch": 2.15, "learning_rate": 5.576868976571693e-05, "loss": 1.4388, "step": 27307 }, { "epoch": 2.15, "learning_rate": 5.5759073672136736e-05, "loss": 1.4491, "step": 27308 }, { "epoch": 2.15, "learning_rate": 5.57494582184004e-05, "loss": 1.4842, "step": 27309 }, { "epoch": 2.15, "learning_rate": 5.573984340457326e-05, "loss": 1.4153, "step": 27310 }, { "epoch": 2.15, "learning_rate": 5.573022923072058e-05, "loss": 1.4603, "step": 27311 }, { "epoch": 2.15, "learning_rate": 5.572061569690756e-05, "loss": 1.4564, "step": 27312 }, { "epoch": 2.15, "learning_rate": 5.57110028031996e-05, "loss": 1.4994, "step": 27313 }, { "epoch": 2.15, "learning_rate": 5.5701390549661886e-05, "loss": 1.5029, "step": 27314 }, { "epoch": 2.15, "learning_rate": 5.569177893635965e-05, "loss": 1.4399, "step": 27315 }, { "epoch": 2.15, "learning_rate": 5.568216796335823e-05, "loss": 1.4364, "step": 27316 }, { "epoch": 2.15, "learning_rate": 5.567255763072284e-05, "loss": 1.4718, "step": 27317 }, { "epoch": 2.15, "learning_rate": 5.566294793851874e-05, "loss": 1.462, "step": 27318 }, { "epoch": 2.15, "learning_rate": 5.5653338886811114e-05, "loss": 1.4397, "step": 27319 }, { "epoch": 2.15, "learning_rate": 5.564373047566529e-05, "loss": 1.4298, "step": 27320 }, { "epoch": 2.15, "learning_rate": 5.563412270514647e-05, "loss": 1.4713, "step": 27321 }, { "epoch": 2.15, "learning_rate": 5.5624515575319825e-05, "loss": 1.4292, "step": 27322 }, { "epoch": 2.15, "learning_rate": 5.5614909086250654e-05, "loss": 1.4375, "step": 27323 }, { "epoch": 2.15, "learning_rate": 5.5605303238004206e-05, "loss": 1.4472, "step": 27324 }, { "epoch": 2.15, "learning_rate": 5.559569803064567e-05, "loss": 1.4787, "step": 27325 }, { "epoch": 2.15, "learning_rate": 5.558609346424019e-05, "loss": 1.4614, "step": 27326 }, { "epoch": 2.15, "learning_rate": 5.557648953885308e-05, "loss": 1.4684, "step": 27327 }, { "epoch": 2.15, "learning_rate": 5.5566886254549494e-05, "loss": 1.4495, "step": 27328 }, { "epoch": 2.15, "learning_rate": 5.5557283611394586e-05, "loss": 1.4323, "step": 27329 }, { "epoch": 2.15, "learning_rate": 5.554768160945367e-05, "loss": 1.4648, "step": 27330 }, { "epoch": 2.15, "learning_rate": 5.5538080248791874e-05, "loss": 1.5077, "step": 27331 }, { "epoch": 2.15, "learning_rate": 5.552847952947432e-05, "loss": 1.4622, "step": 27332 }, { "epoch": 2.15, "learning_rate": 5.551887945156632e-05, "loss": 1.4462, "step": 27333 }, { "epoch": 2.15, "learning_rate": 5.550928001513297e-05, "loss": 1.4792, "step": 27334 }, { "epoch": 2.15, "learning_rate": 5.549968122023942e-05, "loss": 1.4569, "step": 27335 }, { "epoch": 2.15, "learning_rate": 5.549008306695095e-05, "loss": 1.4534, "step": 27336 }, { "epoch": 2.15, "learning_rate": 5.548048555533265e-05, "loss": 1.4526, "step": 27337 }, { "epoch": 2.15, "learning_rate": 5.547088868544964e-05, "loss": 1.4382, "step": 27338 }, { "epoch": 2.15, "learning_rate": 5.5461292457367144e-05, "loss": 1.48, "step": 27339 }, { "epoch": 2.15, "learning_rate": 5.545169687115034e-05, "loss": 1.4027, "step": 27340 }, { "epoch": 2.15, "learning_rate": 5.5442101926864344e-05, "loss": 1.4344, "step": 27341 }, { "epoch": 2.15, "learning_rate": 5.543250762457429e-05, "loss": 1.4515, "step": 27342 }, { "epoch": 2.15, "learning_rate": 5.542291396434527e-05, "loss": 1.431, "step": 27343 }, { "epoch": 2.15, "learning_rate": 5.541332094624252e-05, "loss": 1.4797, "step": 27344 }, { "epoch": 2.15, "learning_rate": 5.540372857033114e-05, "loss": 1.4685, "step": 27345 }, { "epoch": 2.15, "learning_rate": 5.539413683667617e-05, "loss": 1.4959, "step": 27346 }, { "epoch": 2.15, "learning_rate": 5.538454574534287e-05, "loss": 1.4794, "step": 27347 }, { "epoch": 2.15, "learning_rate": 5.537495529639629e-05, "loss": 1.4685, "step": 27348 }, { "epoch": 2.15, "learning_rate": 5.536536548990149e-05, "loss": 1.4376, "step": 27349 }, { "epoch": 2.15, "learning_rate": 5.535577632592367e-05, "loss": 1.4847, "step": 27350 }, { "epoch": 2.15, "learning_rate": 5.534618780452793e-05, "loss": 1.4189, "step": 27351 }, { "epoch": 2.15, "learning_rate": 5.5336599925779275e-05, "loss": 1.4838, "step": 27352 }, { "epoch": 2.15, "learning_rate": 5.5327012689742914e-05, "loss": 1.4547, "step": 27353 }, { "epoch": 2.15, "learning_rate": 5.531742609648384e-05, "loss": 1.4357, "step": 27354 }, { "epoch": 2.15, "learning_rate": 5.530784014606724e-05, "loss": 1.4615, "step": 27355 }, { "epoch": 2.15, "learning_rate": 5.529825483855811e-05, "loss": 1.4533, "step": 27356 }, { "epoch": 2.15, "learning_rate": 5.5288670174021614e-05, "loss": 1.4774, "step": 27357 }, { "epoch": 2.15, "learning_rate": 5.5279086152522796e-05, "loss": 1.4859, "step": 27358 }, { "epoch": 2.15, "learning_rate": 5.5269502774126696e-05, "loss": 1.5221, "step": 27359 }, { "epoch": 2.15, "learning_rate": 5.5259920038898346e-05, "loss": 1.428, "step": 27360 }, { "epoch": 2.15, "learning_rate": 5.52503379469029e-05, "loss": 1.491, "step": 27361 }, { "epoch": 2.15, "learning_rate": 5.524075649820539e-05, "loss": 1.4413, "step": 27362 }, { "epoch": 2.15, "learning_rate": 5.52311756928708e-05, "loss": 1.5091, "step": 27363 }, { "epoch": 2.15, "learning_rate": 5.5221595530964256e-05, "loss": 1.3943, "step": 27364 }, { "epoch": 2.15, "learning_rate": 5.521201601255079e-05, "loss": 1.4715, "step": 27365 }, { "epoch": 2.15, "learning_rate": 5.520243713769538e-05, "loss": 1.4315, "step": 27366 }, { "epoch": 2.15, "learning_rate": 5.519285890646316e-05, "loss": 1.467, "step": 27367 }, { "epoch": 2.15, "learning_rate": 5.518328131891911e-05, "loss": 1.4762, "step": 27368 }, { "epoch": 2.15, "learning_rate": 5.5173704375128206e-05, "loss": 1.4535, "step": 27369 }, { "epoch": 2.15, "learning_rate": 5.5164128075155505e-05, "loss": 1.4346, "step": 27370 }, { "epoch": 2.15, "learning_rate": 5.51545524190661e-05, "loss": 1.4603, "step": 27371 }, { "epoch": 2.15, "learning_rate": 5.514497740692494e-05, "loss": 1.4752, "step": 27372 }, { "epoch": 2.15, "learning_rate": 5.5135403038797005e-05, "loss": 1.4203, "step": 27373 }, { "epoch": 2.15, "learning_rate": 5.512582931474736e-05, "loss": 1.4906, "step": 27374 }, { "epoch": 2.15, "learning_rate": 5.511625623484099e-05, "loss": 1.4563, "step": 27375 }, { "epoch": 2.15, "learning_rate": 5.510668379914289e-05, "loss": 1.4425, "step": 27376 }, { "epoch": 2.15, "learning_rate": 5.509711200771797e-05, "loss": 1.4121, "step": 27377 }, { "epoch": 2.15, "learning_rate": 5.5087540860631336e-05, "loss": 1.4374, "step": 27378 }, { "epoch": 2.15, "learning_rate": 5.507797035794793e-05, "loss": 1.4718, "step": 27379 }, { "epoch": 2.15, "learning_rate": 5.506840049973267e-05, "loss": 1.4395, "step": 27380 }, { "epoch": 2.15, "learning_rate": 5.505883128605064e-05, "loss": 1.454, "step": 27381 }, { "epoch": 2.15, "learning_rate": 5.504926271696675e-05, "loss": 1.4069, "step": 27382 }, { "epoch": 2.15, "learning_rate": 5.503969479254592e-05, "loss": 1.4176, "step": 27383 }, { "epoch": 2.15, "learning_rate": 5.503012751285321e-05, "loss": 1.4284, "step": 27384 }, { "epoch": 2.15, "learning_rate": 5.502056087795353e-05, "loss": 1.4809, "step": 27385 }, { "epoch": 2.15, "learning_rate": 5.501099488791177e-05, "loss": 1.4386, "step": 27386 }, { "epoch": 2.15, "learning_rate": 5.500142954279293e-05, "loss": 1.4882, "step": 27387 }, { "epoch": 2.15, "learning_rate": 5.4991864842662006e-05, "loss": 1.4752, "step": 27388 }, { "epoch": 2.16, "learning_rate": 5.49823007875839e-05, "loss": 1.4109, "step": 27389 }, { "epoch": 2.16, "learning_rate": 5.4972737377623494e-05, "loss": 1.415, "step": 27390 }, { "epoch": 2.16, "learning_rate": 5.4963174612845805e-05, "loss": 1.4549, "step": 27391 }, { "epoch": 2.16, "learning_rate": 5.495361249331571e-05, "loss": 1.4512, "step": 27392 }, { "epoch": 2.16, "learning_rate": 5.494405101909808e-05, "loss": 1.4385, "step": 27393 }, { "epoch": 2.16, "learning_rate": 5.493449019025795e-05, "loss": 1.4561, "step": 27394 }, { "epoch": 2.16, "learning_rate": 5.4924930006860156e-05, "loss": 1.3984, "step": 27395 }, { "epoch": 2.16, "learning_rate": 5.491537046896963e-05, "loss": 1.4833, "step": 27396 }, { "epoch": 2.16, "learning_rate": 5.490581157665121e-05, "loss": 1.4905, "step": 27397 }, { "epoch": 2.16, "learning_rate": 5.489625332996992e-05, "loss": 1.4676, "step": 27398 }, { "epoch": 2.16, "learning_rate": 5.488669572899057e-05, "loss": 1.4485, "step": 27399 }, { "epoch": 2.16, "learning_rate": 5.487713877377803e-05, "loss": 1.4694, "step": 27400 }, { "epoch": 2.16, "learning_rate": 5.486758246439721e-05, "loss": 1.4613, "step": 27401 }, { "epoch": 2.16, "learning_rate": 5.485802680091306e-05, "loss": 1.4582, "step": 27402 }, { "epoch": 2.16, "learning_rate": 5.4848471783390404e-05, "loss": 1.4767, "step": 27403 }, { "epoch": 2.16, "learning_rate": 5.483891741189407e-05, "loss": 1.4578, "step": 27404 }, { "epoch": 2.16, "learning_rate": 5.482936368648904e-05, "loss": 1.5014, "step": 27405 }, { "epoch": 2.16, "learning_rate": 5.4819810607240075e-05, "loss": 1.4297, "step": 27406 }, { "epoch": 2.16, "learning_rate": 5.481025817421205e-05, "loss": 1.4921, "step": 27407 }, { "epoch": 2.16, "learning_rate": 5.480070638746987e-05, "loss": 1.505, "step": 27408 }, { "epoch": 2.16, "learning_rate": 5.4791155247078374e-05, "loss": 1.5074, "step": 27409 }, { "epoch": 2.16, "learning_rate": 5.478160475310234e-05, "loss": 1.4732, "step": 27410 }, { "epoch": 2.16, "learning_rate": 5.477205490560672e-05, "loss": 1.422, "step": 27411 }, { "epoch": 2.16, "learning_rate": 5.476250570465629e-05, "loss": 1.474, "step": 27412 }, { "epoch": 2.16, "learning_rate": 5.475295715031588e-05, "loss": 1.4626, "step": 27413 }, { "epoch": 2.16, "learning_rate": 5.47434092426503e-05, "loss": 1.3765, "step": 27414 }, { "epoch": 2.16, "learning_rate": 5.473386198172443e-05, "loss": 1.4467, "step": 27415 }, { "epoch": 2.16, "learning_rate": 5.472431536760309e-05, "loss": 1.4202, "step": 27416 }, { "epoch": 2.16, "learning_rate": 5.4714769400351005e-05, "loss": 1.4298, "step": 27417 }, { "epoch": 2.16, "learning_rate": 5.470522408003306e-05, "loss": 1.4242, "step": 27418 }, { "epoch": 2.16, "learning_rate": 5.4695679406714086e-05, "loss": 1.4702, "step": 27419 }, { "epoch": 2.16, "learning_rate": 5.468613538045888e-05, "loss": 1.4871, "step": 27420 }, { "epoch": 2.16, "learning_rate": 5.467659200133216e-05, "loss": 1.4621, "step": 27421 }, { "epoch": 2.16, "learning_rate": 5.4667049269398826e-05, "loss": 1.4593, "step": 27422 }, { "epoch": 2.16, "learning_rate": 5.465750718472362e-05, "loss": 1.49, "step": 27423 }, { "epoch": 2.16, "learning_rate": 5.4647965747371274e-05, "loss": 1.4442, "step": 27424 }, { "epoch": 2.16, "learning_rate": 5.4638424957406654e-05, "loss": 1.5056, "step": 27425 }, { "epoch": 2.16, "learning_rate": 5.462888481489453e-05, "loss": 1.4293, "step": 27426 }, { "epoch": 2.16, "learning_rate": 5.4619345319899594e-05, "loss": 1.4756, "step": 27427 }, { "epoch": 2.16, "learning_rate": 5.460980647248671e-05, "loss": 1.4764, "step": 27428 }, { "epoch": 2.16, "learning_rate": 5.46002682727206e-05, "loss": 1.4386, "step": 27429 }, { "epoch": 2.16, "learning_rate": 5.459073072066602e-05, "loss": 1.4322, "step": 27430 }, { "epoch": 2.16, "learning_rate": 5.4581193816387674e-05, "loss": 1.4925, "step": 27431 }, { "epoch": 2.16, "learning_rate": 5.457165755995043e-05, "loss": 1.4681, "step": 27432 }, { "epoch": 2.16, "learning_rate": 5.456212195141891e-05, "loss": 1.4558, "step": 27433 }, { "epoch": 2.16, "learning_rate": 5.4552586990857914e-05, "loss": 1.4504, "step": 27434 }, { "epoch": 2.16, "learning_rate": 5.454305267833223e-05, "loss": 1.4685, "step": 27435 }, { "epoch": 2.16, "learning_rate": 5.453351901390654e-05, "loss": 1.4634, "step": 27436 }, { "epoch": 2.16, "learning_rate": 5.4523985997645584e-05, "loss": 1.4212, "step": 27437 }, { "epoch": 2.16, "learning_rate": 5.4514453629614016e-05, "loss": 1.4925, "step": 27438 }, { "epoch": 2.16, "learning_rate": 5.450492190987667e-05, "loss": 1.5116, "step": 27439 }, { "epoch": 2.16, "learning_rate": 5.44953908384982e-05, "loss": 1.4875, "step": 27440 }, { "epoch": 2.16, "learning_rate": 5.448586041554327e-05, "loss": 1.3963, "step": 27441 }, { "epoch": 2.16, "learning_rate": 5.44763306410767e-05, "loss": 1.4292, "step": 27442 }, { "epoch": 2.16, "learning_rate": 5.446680151516312e-05, "loss": 1.445, "step": 27443 }, { "epoch": 2.16, "learning_rate": 5.445727303786719e-05, "loss": 1.4459, "step": 27444 }, { "epoch": 2.16, "learning_rate": 5.4447745209253696e-05, "loss": 1.4724, "step": 27445 }, { "epoch": 2.16, "learning_rate": 5.443821802938729e-05, "loss": 1.45, "step": 27446 }, { "epoch": 2.16, "learning_rate": 5.442869149833261e-05, "loss": 1.4881, "step": 27447 }, { "epoch": 2.16, "learning_rate": 5.441916561615435e-05, "loss": 1.4767, "step": 27448 }, { "epoch": 2.16, "learning_rate": 5.440964038291727e-05, "loss": 1.4391, "step": 27449 }, { "epoch": 2.16, "learning_rate": 5.440011579868599e-05, "loss": 1.4819, "step": 27450 }, { "epoch": 2.16, "learning_rate": 5.439059186352511e-05, "loss": 1.472, "step": 27451 }, { "epoch": 2.16, "learning_rate": 5.4381068577499385e-05, "loss": 1.4174, "step": 27452 }, { "epoch": 2.16, "learning_rate": 5.437154594067346e-05, "loss": 1.4235, "step": 27453 }, { "epoch": 2.16, "learning_rate": 5.436202395311196e-05, "loss": 1.4665, "step": 27454 }, { "epoch": 2.16, "learning_rate": 5.435250261487948e-05, "loss": 1.4331, "step": 27455 }, { "epoch": 2.16, "learning_rate": 5.434298192604078e-05, "loss": 1.4817, "step": 27456 }, { "epoch": 2.16, "learning_rate": 5.4333461886660446e-05, "loss": 1.4969, "step": 27457 }, { "epoch": 2.16, "learning_rate": 5.4323942496803064e-05, "loss": 1.4949, "step": 27458 }, { "epoch": 2.16, "learning_rate": 5.4314423756533365e-05, "loss": 1.4807, "step": 27459 }, { "epoch": 2.16, "learning_rate": 5.430490566591591e-05, "loss": 1.4365, "step": 27460 }, { "epoch": 2.16, "learning_rate": 5.4295388225015315e-05, "loss": 1.4274, "step": 27461 }, { "epoch": 2.16, "learning_rate": 5.4285871433896255e-05, "loss": 1.4686, "step": 27462 }, { "epoch": 2.16, "learning_rate": 5.427635529262331e-05, "loss": 1.5194, "step": 27463 }, { "epoch": 2.16, "learning_rate": 5.4266839801261035e-05, "loss": 1.4439, "step": 27464 }, { "epoch": 2.16, "learning_rate": 5.4257324959874086e-05, "loss": 1.4378, "step": 27465 }, { "epoch": 2.16, "learning_rate": 5.424781076852711e-05, "loss": 1.4533, "step": 27466 }, { "epoch": 2.16, "learning_rate": 5.423829722728467e-05, "loss": 1.503, "step": 27467 }, { "epoch": 2.16, "learning_rate": 5.42287843362113e-05, "loss": 1.4334, "step": 27468 }, { "epoch": 2.16, "learning_rate": 5.421927209537166e-05, "loss": 1.4586, "step": 27469 }, { "epoch": 2.16, "learning_rate": 5.420976050483032e-05, "loss": 1.5076, "step": 27470 }, { "epoch": 2.16, "learning_rate": 5.4200249564651865e-05, "loss": 1.4815, "step": 27471 }, { "epoch": 2.16, "learning_rate": 5.419073927490077e-05, "loss": 1.5408, "step": 27472 }, { "epoch": 2.16, "learning_rate": 5.418122963564175e-05, "loss": 1.4493, "step": 27473 }, { "epoch": 2.16, "learning_rate": 5.4171720646939306e-05, "loss": 1.5015, "step": 27474 }, { "epoch": 2.16, "learning_rate": 5.4162212308857934e-05, "loss": 1.4704, "step": 27475 }, { "epoch": 2.16, "learning_rate": 5.41527046214623e-05, "loss": 1.4095, "step": 27476 }, { "epoch": 2.16, "learning_rate": 5.414319758481692e-05, "loss": 1.4041, "step": 27477 }, { "epoch": 2.16, "learning_rate": 5.4133691198986276e-05, "loss": 1.5019, "step": 27478 }, { "epoch": 2.16, "learning_rate": 5.412418546403502e-05, "loss": 1.4777, "step": 27479 }, { "epoch": 2.16, "learning_rate": 5.411468038002758e-05, "loss": 1.4177, "step": 27480 }, { "epoch": 2.16, "learning_rate": 5.41051759470286e-05, "loss": 1.4639, "step": 27481 }, { "epoch": 2.16, "learning_rate": 5.409567216510249e-05, "loss": 1.3983, "step": 27482 }, { "epoch": 2.16, "learning_rate": 5.40861690343139e-05, "loss": 1.4174, "step": 27483 }, { "epoch": 2.16, "learning_rate": 5.40766665547273e-05, "loss": 1.4702, "step": 27484 }, { "epoch": 2.16, "learning_rate": 5.4067164726407146e-05, "loss": 1.4823, "step": 27485 }, { "epoch": 2.16, "learning_rate": 5.405766354941806e-05, "loss": 1.4728, "step": 27486 }, { "epoch": 2.16, "learning_rate": 5.4048163023824496e-05, "loss": 1.4661, "step": 27487 }, { "epoch": 2.16, "learning_rate": 5.4038663149690936e-05, "loss": 1.4242, "step": 27488 }, { "epoch": 2.16, "learning_rate": 5.402916392708186e-05, "loss": 1.4934, "step": 27489 }, { "epoch": 2.16, "learning_rate": 5.4019665356061844e-05, "loss": 1.4638, "step": 27490 }, { "epoch": 2.16, "learning_rate": 5.4010167436695354e-05, "loss": 1.443, "step": 27491 }, { "epoch": 2.16, "learning_rate": 5.400067016904678e-05, "loss": 1.4559, "step": 27492 }, { "epoch": 2.16, "learning_rate": 5.399117355318073e-05, "loss": 1.4414, "step": 27493 }, { "epoch": 2.16, "learning_rate": 5.398167758916165e-05, "loss": 1.4441, "step": 27494 }, { "epoch": 2.16, "learning_rate": 5.397218227705393e-05, "loss": 1.4193, "step": 27495 }, { "epoch": 2.16, "learning_rate": 5.39626876169221e-05, "loss": 1.3986, "step": 27496 }, { "epoch": 2.16, "learning_rate": 5.395319360883067e-05, "loss": 1.5084, "step": 27497 }, { "epoch": 2.16, "learning_rate": 5.394370025284405e-05, "loss": 1.4682, "step": 27498 }, { "epoch": 2.16, "learning_rate": 5.393420754902664e-05, "loss": 1.4535, "step": 27499 }, { "epoch": 2.16, "learning_rate": 5.392471549744302e-05, "loss": 1.4683, "step": 27500 }, { "epoch": 2.16, "learning_rate": 5.391522409815755e-05, "loss": 1.448, "step": 27501 }, { "epoch": 2.16, "learning_rate": 5.3905733351234624e-05, "loss": 1.4522, "step": 27502 }, { "epoch": 2.16, "learning_rate": 5.3896243256738815e-05, "loss": 1.4302, "step": 27503 }, { "epoch": 2.16, "learning_rate": 5.388675381473446e-05, "loss": 1.4711, "step": 27504 }, { "epoch": 2.16, "learning_rate": 5.387726502528597e-05, "loss": 1.5136, "step": 27505 }, { "epoch": 2.16, "learning_rate": 5.386777688845785e-05, "loss": 1.4327, "step": 27506 }, { "epoch": 2.16, "learning_rate": 5.3858289404314476e-05, "loss": 1.4249, "step": 27507 }, { "epoch": 2.16, "learning_rate": 5.3848802572920255e-05, "loss": 1.4532, "step": 27508 }, { "epoch": 2.16, "learning_rate": 5.383931639433955e-05, "loss": 1.4714, "step": 27509 }, { "epoch": 2.16, "learning_rate": 5.382983086863688e-05, "loss": 1.4858, "step": 27510 }, { "epoch": 2.16, "learning_rate": 5.3820345995876545e-05, "loss": 1.4591, "step": 27511 }, { "epoch": 2.16, "learning_rate": 5.3810861776123025e-05, "loss": 1.448, "step": 27512 }, { "epoch": 2.16, "learning_rate": 5.380137820944062e-05, "loss": 1.4594, "step": 27513 }, { "epoch": 2.16, "learning_rate": 5.3791895295893825e-05, "loss": 1.4655, "step": 27514 }, { "epoch": 2.16, "learning_rate": 5.378241303554696e-05, "loss": 1.4109, "step": 27515 }, { "epoch": 2.16, "learning_rate": 5.377293142846437e-05, "loss": 1.5096, "step": 27516 }, { "epoch": 2.17, "learning_rate": 5.3763450474710526e-05, "loss": 1.4883, "step": 27517 }, { "epoch": 2.17, "learning_rate": 5.375397017434975e-05, "loss": 1.4645, "step": 27518 }, { "epoch": 2.17, "learning_rate": 5.3744490527446345e-05, "loss": 1.4582, "step": 27519 }, { "epoch": 2.17, "learning_rate": 5.373501153406477e-05, "loss": 1.4413, "step": 27520 }, { "epoch": 2.17, "learning_rate": 5.372553319426936e-05, "loss": 1.4711, "step": 27521 }, { "epoch": 2.17, "learning_rate": 5.3716055508124395e-05, "loss": 1.4797, "step": 27522 }, { "epoch": 2.17, "learning_rate": 5.370657847569433e-05, "loss": 1.452, "step": 27523 }, { "epoch": 2.17, "learning_rate": 5.369710209704346e-05, "loss": 1.4673, "step": 27524 }, { "epoch": 2.17, "learning_rate": 5.368762637223612e-05, "loss": 1.4625, "step": 27525 }, { "epoch": 2.17, "learning_rate": 5.367815130133661e-05, "loss": 1.4701, "step": 27526 }, { "epoch": 2.17, "learning_rate": 5.366867688440927e-05, "loss": 1.4386, "step": 27527 }, { "epoch": 2.17, "learning_rate": 5.365920312151853e-05, "loss": 1.4863, "step": 27528 }, { "epoch": 2.17, "learning_rate": 5.3649730012728626e-05, "loss": 1.4436, "step": 27529 }, { "epoch": 2.17, "learning_rate": 5.364025755810383e-05, "loss": 1.4038, "step": 27530 }, { "epoch": 2.17, "learning_rate": 5.3630785757708567e-05, "loss": 1.521, "step": 27531 }, { "epoch": 2.17, "learning_rate": 5.362131461160709e-05, "loss": 1.5084, "step": 27532 }, { "epoch": 2.17, "learning_rate": 5.361184411986363e-05, "loss": 1.4888, "step": 27533 }, { "epoch": 2.17, "learning_rate": 5.360237428254264e-05, "loss": 1.4319, "step": 27534 }, { "epoch": 2.17, "learning_rate": 5.3592905099708314e-05, "loss": 1.4449, "step": 27535 }, { "epoch": 2.17, "learning_rate": 5.3583436571424904e-05, "loss": 1.4624, "step": 27536 }, { "epoch": 2.17, "learning_rate": 5.357396869775682e-05, "loss": 1.4153, "step": 27537 }, { "epoch": 2.17, "learning_rate": 5.3564501478768265e-05, "loss": 1.4584, "step": 27538 }, { "epoch": 2.17, "learning_rate": 5.3555034914523466e-05, "loss": 1.4667, "step": 27539 }, { "epoch": 2.17, "learning_rate": 5.3545569005086825e-05, "loss": 1.4451, "step": 27540 }, { "epoch": 2.17, "learning_rate": 5.353610375052254e-05, "loss": 1.4443, "step": 27541 }, { "epoch": 2.17, "learning_rate": 5.352663915089488e-05, "loss": 1.4587, "step": 27542 }, { "epoch": 2.17, "learning_rate": 5.351717520626799e-05, "loss": 1.4558, "step": 27543 }, { "epoch": 2.17, "learning_rate": 5.3507711916706346e-05, "loss": 1.4671, "step": 27544 }, { "epoch": 2.17, "learning_rate": 5.349824928227408e-05, "loss": 1.4792, "step": 27545 }, { "epoch": 2.17, "learning_rate": 5.34887873030354e-05, "loss": 1.4521, "step": 27546 }, { "epoch": 2.17, "learning_rate": 5.347932597905466e-05, "loss": 1.4865, "step": 27547 }, { "epoch": 2.17, "learning_rate": 5.3469865310396015e-05, "loss": 1.4095, "step": 27548 }, { "epoch": 2.17, "learning_rate": 5.3460405297123716e-05, "loss": 1.4546, "step": 27549 }, { "epoch": 2.17, "learning_rate": 5.3450945939301944e-05, "loss": 1.4733, "step": 27550 }, { "epoch": 2.17, "learning_rate": 5.3441487236995025e-05, "loss": 1.4205, "step": 27551 }, { "epoch": 2.17, "learning_rate": 5.3432029190267126e-05, "loss": 1.4632, "step": 27552 }, { "epoch": 2.17, "learning_rate": 5.342257179918239e-05, "loss": 1.458, "step": 27553 }, { "epoch": 2.17, "learning_rate": 5.341311506380516e-05, "loss": 1.5016, "step": 27554 }, { "epoch": 2.17, "learning_rate": 5.340365898419957e-05, "loss": 1.4691, "step": 27555 }, { "epoch": 2.17, "learning_rate": 5.339420356042978e-05, "loss": 1.5226, "step": 27556 }, { "epoch": 2.17, "learning_rate": 5.338474879256008e-05, "loss": 1.4528, "step": 27557 }, { "epoch": 2.17, "learning_rate": 5.3375294680654576e-05, "loss": 1.4736, "step": 27558 }, { "epoch": 2.17, "learning_rate": 5.336584122477755e-05, "loss": 1.4066, "step": 27559 }, { "epoch": 2.17, "learning_rate": 5.335638842499309e-05, "loss": 1.4075, "step": 27560 }, { "epoch": 2.17, "learning_rate": 5.334693628136546e-05, "loss": 1.5, "step": 27561 }, { "epoch": 2.17, "learning_rate": 5.333748479395881e-05, "loss": 1.4631, "step": 27562 }, { "epoch": 2.17, "learning_rate": 5.332803396283723e-05, "loss": 1.4353, "step": 27563 }, { "epoch": 2.17, "learning_rate": 5.331858378806501e-05, "loss": 1.4869, "step": 27564 }, { "epoch": 2.17, "learning_rate": 5.330913426970625e-05, "loss": 1.4251, "step": 27565 }, { "epoch": 2.17, "learning_rate": 5.329968540782511e-05, "loss": 1.434, "step": 27566 }, { "epoch": 2.17, "learning_rate": 5.3290237202485694e-05, "loss": 1.4219, "step": 27567 }, { "epoch": 2.17, "learning_rate": 5.328078965375224e-05, "loss": 1.4713, "step": 27568 }, { "epoch": 2.17, "learning_rate": 5.327134276168886e-05, "loss": 1.4157, "step": 27569 }, { "epoch": 2.17, "learning_rate": 5.326189652635963e-05, "loss": 1.3995, "step": 27570 }, { "epoch": 2.17, "learning_rate": 5.3252450947828786e-05, "loss": 1.4293, "step": 27571 }, { "epoch": 2.17, "learning_rate": 5.324300602616042e-05, "loss": 1.4555, "step": 27572 }, { "epoch": 2.17, "learning_rate": 5.323356176141858e-05, "loss": 1.418, "step": 27573 }, { "epoch": 2.17, "learning_rate": 5.322411815366747e-05, "loss": 1.4371, "step": 27574 }, { "epoch": 2.17, "learning_rate": 5.321467520297124e-05, "loss": 1.5066, "step": 27575 }, { "epoch": 2.17, "learning_rate": 5.320523290939395e-05, "loss": 1.4834, "step": 27576 }, { "epoch": 2.17, "learning_rate": 5.319579127299967e-05, "loss": 1.4922, "step": 27577 }, { "epoch": 2.17, "learning_rate": 5.3186350293852595e-05, "loss": 1.455, "step": 27578 }, { "epoch": 2.17, "learning_rate": 5.317690997201678e-05, "loss": 1.3756, "step": 27579 }, { "epoch": 2.17, "learning_rate": 5.316747030755625e-05, "loss": 1.4329, "step": 27580 }, { "epoch": 2.17, "learning_rate": 5.315803130053522e-05, "loss": 1.3656, "step": 27581 }, { "epoch": 2.17, "learning_rate": 5.314859295101771e-05, "loss": 1.467, "step": 27582 }, { "epoch": 2.17, "learning_rate": 5.313915525906782e-05, "loss": 1.4049, "step": 27583 }, { "epoch": 2.17, "learning_rate": 5.3129718224749543e-05, "loss": 1.44, "step": 27584 }, { "epoch": 2.17, "learning_rate": 5.312028184812708e-05, "loss": 1.4775, "step": 27585 }, { "epoch": 2.17, "learning_rate": 5.3110846129264443e-05, "loss": 1.3787, "step": 27586 }, { "epoch": 2.17, "learning_rate": 5.310141106822564e-05, "loss": 1.4553, "step": 27587 }, { "epoch": 2.17, "learning_rate": 5.309197666507485e-05, "loss": 1.4108, "step": 27588 }, { "epoch": 2.17, "learning_rate": 5.3082542919876046e-05, "loss": 1.3812, "step": 27589 }, { "epoch": 2.17, "learning_rate": 5.307310983269324e-05, "loss": 1.4989, "step": 27590 }, { "epoch": 2.17, "learning_rate": 5.306367740359052e-05, "loss": 1.4844, "step": 27591 }, { "epoch": 2.17, "learning_rate": 5.305424563263201e-05, "loss": 1.4619, "step": 27592 }, { "epoch": 2.17, "learning_rate": 5.3044814519881666e-05, "loss": 1.4231, "step": 27593 }, { "epoch": 2.17, "learning_rate": 5.3035384065403466e-05, "loss": 1.4489, "step": 27594 }, { "epoch": 2.17, "learning_rate": 5.302595426926156e-05, "loss": 1.4557, "step": 27595 }, { "epoch": 2.17, "learning_rate": 5.3016525131519895e-05, "loss": 1.4104, "step": 27596 }, { "epoch": 2.17, "learning_rate": 5.300709665224247e-05, "loss": 1.4368, "step": 27597 }, { "epoch": 2.17, "learning_rate": 5.299766883149337e-05, "loss": 1.5037, "step": 27598 }, { "epoch": 2.17, "learning_rate": 5.298824166933658e-05, "loss": 1.4026, "step": 27599 }, { "epoch": 2.17, "learning_rate": 5.297881516583609e-05, "loss": 1.4583, "step": 27600 }, { "epoch": 2.17, "learning_rate": 5.296938932105586e-05, "loss": 1.437, "step": 27601 }, { "epoch": 2.17, "learning_rate": 5.2959964135059975e-05, "loss": 1.4798, "step": 27602 }, { "epoch": 2.17, "learning_rate": 5.2950539607912376e-05, "loss": 1.4201, "step": 27603 }, { "epoch": 2.17, "learning_rate": 5.2941115739677025e-05, "loss": 1.4488, "step": 27604 }, { "epoch": 2.17, "learning_rate": 5.2931692530417966e-05, "loss": 1.4353, "step": 27605 }, { "epoch": 2.17, "learning_rate": 5.2922269980199105e-05, "loss": 1.4261, "step": 27606 }, { "epoch": 2.17, "learning_rate": 5.291284808908452e-05, "loss": 1.4965, "step": 27607 }, { "epoch": 2.17, "learning_rate": 5.2903426857138054e-05, "loss": 1.4453, "step": 27608 }, { "epoch": 2.17, "learning_rate": 5.289400628442379e-05, "loss": 1.4281, "step": 27609 }, { "epoch": 2.17, "learning_rate": 5.288458637100564e-05, "loss": 1.4662, "step": 27610 }, { "epoch": 2.17, "learning_rate": 5.2875167116947516e-05, "loss": 1.4321, "step": 27611 }, { "epoch": 2.17, "learning_rate": 5.286574852231344e-05, "loss": 1.4433, "step": 27612 }, { "epoch": 2.17, "learning_rate": 5.285633058716733e-05, "loss": 1.4317, "step": 27613 }, { "epoch": 2.17, "learning_rate": 5.28469133115731e-05, "loss": 1.4623, "step": 27614 }, { "epoch": 2.17, "learning_rate": 5.283749669559474e-05, "loss": 1.4589, "step": 27615 }, { "epoch": 2.17, "learning_rate": 5.282808073929617e-05, "loss": 1.5102, "step": 27616 }, { "epoch": 2.17, "learning_rate": 5.2818665442741256e-05, "loss": 1.4178, "step": 27617 }, { "epoch": 2.17, "learning_rate": 5.2809250805994024e-05, "loss": 1.407, "step": 27618 }, { "epoch": 2.17, "learning_rate": 5.279983682911834e-05, "loss": 1.4291, "step": 27619 }, { "epoch": 2.17, "learning_rate": 5.2790423512178134e-05, "loss": 1.4659, "step": 27620 }, { "epoch": 2.17, "learning_rate": 5.2781010855237196e-05, "loss": 1.4105, "step": 27621 }, { "epoch": 2.17, "learning_rate": 5.277159885835965e-05, "loss": 1.482, "step": 27622 }, { "epoch": 2.17, "learning_rate": 5.27621875216093e-05, "loss": 1.4794, "step": 27623 }, { "epoch": 2.17, "learning_rate": 5.275277684505003e-05, "loss": 1.4431, "step": 27624 }, { "epoch": 2.17, "learning_rate": 5.274336682874568e-05, "loss": 1.4757, "step": 27625 }, { "epoch": 2.17, "learning_rate": 5.273395747276026e-05, "loss": 1.4753, "step": 27626 }, { "epoch": 2.17, "learning_rate": 5.272454877715759e-05, "loss": 1.4287, "step": 27627 }, { "epoch": 2.17, "learning_rate": 5.271514074200151e-05, "loss": 1.4122, "step": 27628 }, { "epoch": 2.17, "learning_rate": 5.2705733367355976e-05, "loss": 1.4596, "step": 27629 }, { "epoch": 2.17, "learning_rate": 5.269632665328483e-05, "loss": 1.4581, "step": 27630 }, { "epoch": 2.17, "learning_rate": 5.268692059985188e-05, "loss": 1.4623, "step": 27631 }, { "epoch": 2.17, "learning_rate": 5.267751520712108e-05, "loss": 1.4574, "step": 27632 }, { "epoch": 2.17, "learning_rate": 5.266811047515625e-05, "loss": 1.4338, "step": 27633 }, { "epoch": 2.17, "learning_rate": 5.265870640402119e-05, "loss": 1.4219, "step": 27634 }, { "epoch": 2.17, "learning_rate": 5.264930299377985e-05, "loss": 1.5054, "step": 27635 }, { "epoch": 2.17, "learning_rate": 5.2639900244496e-05, "loss": 1.5123, "step": 27636 }, { "epoch": 2.17, "learning_rate": 5.263049815623348e-05, "loss": 1.4644, "step": 27637 }, { "epoch": 2.17, "learning_rate": 5.262109672905612e-05, "loss": 1.4973, "step": 27638 }, { "epoch": 2.17, "learning_rate": 5.261169596302783e-05, "loss": 1.4549, "step": 27639 }, { "epoch": 2.17, "learning_rate": 5.260229585821239e-05, "loss": 1.4811, "step": 27640 }, { "epoch": 2.17, "learning_rate": 5.2592896414673604e-05, "loss": 1.4159, "step": 27641 }, { "epoch": 2.17, "learning_rate": 5.258349763247525e-05, "loss": 1.4752, "step": 27642 }, { "epoch": 2.17, "learning_rate": 5.257409951168124e-05, "loss": 1.5128, "step": 27643 }, { "epoch": 2.18, "learning_rate": 5.256470205235533e-05, "loss": 1.3962, "step": 27644 }, { "epoch": 2.18, "learning_rate": 5.2555305254561266e-05, "loss": 1.4772, "step": 27645 }, { "epoch": 2.18, "learning_rate": 5.254590911836296e-05, "loss": 1.4691, "step": 27646 }, { "epoch": 2.18, "learning_rate": 5.253651364382415e-05, "loss": 1.5008, "step": 27647 }, { "epoch": 2.18, "learning_rate": 5.2527118831008585e-05, "loss": 1.4641, "step": 27648 }, { "epoch": 2.18, "learning_rate": 5.2517724679980126e-05, "loss": 1.4415, "step": 27649 }, { "epoch": 2.18, "learning_rate": 5.2508331190802545e-05, "loss": 1.4425, "step": 27650 }, { "epoch": 2.18, "learning_rate": 5.249893836353953e-05, "loss": 1.4503, "step": 27651 }, { "epoch": 2.18, "learning_rate": 5.248954619825498e-05, "loss": 1.4628, "step": 27652 }, { "epoch": 2.18, "learning_rate": 5.248015469501253e-05, "loss": 1.4062, "step": 27653 }, { "epoch": 2.18, "learning_rate": 5.247076385387608e-05, "loss": 1.4401, "step": 27654 }, { "epoch": 2.18, "learning_rate": 5.246137367490927e-05, "loss": 1.4362, "step": 27655 }, { "epoch": 2.18, "learning_rate": 5.245198415817596e-05, "loss": 1.4153, "step": 27656 }, { "epoch": 2.18, "learning_rate": 5.244259530373983e-05, "loss": 1.4375, "step": 27657 }, { "epoch": 2.18, "learning_rate": 5.24332071116646e-05, "loss": 1.4307, "step": 27658 }, { "epoch": 2.18, "learning_rate": 5.242381958201411e-05, "loss": 1.4616, "step": 27659 }, { "epoch": 2.18, "learning_rate": 5.241443271485203e-05, "loss": 1.48, "step": 27660 }, { "epoch": 2.18, "learning_rate": 5.240504651024209e-05, "loss": 1.4385, "step": 27661 }, { "epoch": 2.18, "learning_rate": 5.2395660968248005e-05, "loss": 1.451, "step": 27662 }, { "epoch": 2.18, "learning_rate": 5.2386276088933545e-05, "loss": 1.4887, "step": 27663 }, { "epoch": 2.18, "learning_rate": 5.237689187236241e-05, "loss": 1.4436, "step": 27664 }, { "epoch": 2.18, "learning_rate": 5.236750831859825e-05, "loss": 1.4729, "step": 27665 }, { "epoch": 2.18, "learning_rate": 5.23581254277049e-05, "loss": 1.4838, "step": 27666 }, { "epoch": 2.18, "learning_rate": 5.2348743199745975e-05, "loss": 1.513, "step": 27667 }, { "epoch": 2.18, "learning_rate": 5.2339361634785155e-05, "loss": 1.4655, "step": 27668 }, { "epoch": 2.18, "learning_rate": 5.232998073288617e-05, "loss": 1.4126, "step": 27669 }, { "epoch": 2.18, "learning_rate": 5.232060049411278e-05, "loss": 1.4288, "step": 27670 }, { "epoch": 2.18, "learning_rate": 5.231122091852859e-05, "loss": 1.4427, "step": 27671 }, { "epoch": 2.18, "learning_rate": 5.230184200619727e-05, "loss": 1.4581, "step": 27672 }, { "epoch": 2.18, "learning_rate": 5.2292463757182565e-05, "loss": 1.4542, "step": 27673 }, { "epoch": 2.18, "learning_rate": 5.2283086171548115e-05, "loss": 1.4963, "step": 27674 }, { "epoch": 2.18, "learning_rate": 5.227370924935753e-05, "loss": 1.4741, "step": 27675 }, { "epoch": 2.18, "learning_rate": 5.226433299067458e-05, "loss": 1.4762, "step": 27676 }, { "epoch": 2.18, "learning_rate": 5.225495739556289e-05, "loss": 1.4389, "step": 27677 }, { "epoch": 2.18, "learning_rate": 5.224558246408608e-05, "loss": 1.5038, "step": 27678 }, { "epoch": 2.18, "learning_rate": 5.2236208196307775e-05, "loss": 1.466, "step": 27679 }, { "epoch": 2.18, "learning_rate": 5.2226834592291724e-05, "loss": 1.4866, "step": 27680 }, { "epoch": 2.18, "learning_rate": 5.22174616521015e-05, "loss": 1.5459, "step": 27681 }, { "epoch": 2.18, "learning_rate": 5.2208089375800705e-05, "loss": 1.4999, "step": 27682 }, { "epoch": 2.18, "learning_rate": 5.219871776345307e-05, "loss": 1.4578, "step": 27683 }, { "epoch": 2.18, "learning_rate": 5.2189346815122124e-05, "loss": 1.4662, "step": 27684 }, { "epoch": 2.18, "learning_rate": 5.217997653087157e-05, "loss": 1.4823, "step": 27685 }, { "epoch": 2.18, "learning_rate": 5.2170606910764954e-05, "loss": 1.4267, "step": 27686 }, { "epoch": 2.18, "learning_rate": 5.216123795486598e-05, "loss": 1.4724, "step": 27687 }, { "epoch": 2.18, "learning_rate": 5.215186966323821e-05, "loss": 1.4899, "step": 27688 }, { "epoch": 2.18, "learning_rate": 5.2142502035945195e-05, "loss": 1.428, "step": 27689 }, { "epoch": 2.18, "learning_rate": 5.213313507305065e-05, "loss": 1.4193, "step": 27690 }, { "epoch": 2.18, "learning_rate": 5.2123768774618105e-05, "loss": 1.4726, "step": 27691 }, { "epoch": 2.18, "learning_rate": 5.211440314071109e-05, "loss": 1.451, "step": 27692 }, { "epoch": 2.18, "learning_rate": 5.210503817139333e-05, "loss": 1.4431, "step": 27693 }, { "epoch": 2.18, "learning_rate": 5.2095673866728336e-05, "loss": 1.4823, "step": 27694 }, { "epoch": 2.18, "learning_rate": 5.208631022677968e-05, "loss": 1.4634, "step": 27695 }, { "epoch": 2.18, "learning_rate": 5.20769472516109e-05, "loss": 1.4219, "step": 27696 }, { "epoch": 2.18, "learning_rate": 5.206758494128566e-05, "loss": 1.5075, "step": 27697 }, { "epoch": 2.18, "learning_rate": 5.2058223295867475e-05, "loss": 1.4414, "step": 27698 }, { "epoch": 2.18, "learning_rate": 5.204886231541985e-05, "loss": 1.4392, "step": 27699 }, { "epoch": 2.18, "learning_rate": 5.20395020000064e-05, "loss": 1.4694, "step": 27700 }, { "epoch": 2.18, "learning_rate": 5.203014234969071e-05, "loss": 1.4742, "step": 27701 }, { "epoch": 2.18, "learning_rate": 5.20207833645363e-05, "loss": 1.4623, "step": 27702 }, { "epoch": 2.18, "learning_rate": 5.201142504460666e-05, "loss": 1.4485, "step": 27703 }, { "epoch": 2.18, "learning_rate": 5.20020673899654e-05, "loss": 1.4727, "step": 27704 }, { "epoch": 2.18, "learning_rate": 5.199271040067605e-05, "loss": 1.4331, "step": 27705 }, { "epoch": 2.18, "learning_rate": 5.198335407680203e-05, "loss": 1.4327, "step": 27706 }, { "epoch": 2.18, "learning_rate": 5.197399841840702e-05, "loss": 1.4356, "step": 27707 }, { "epoch": 2.18, "learning_rate": 5.1964643425554447e-05, "loss": 1.4902, "step": 27708 }, { "epoch": 2.18, "learning_rate": 5.195528909830781e-05, "loss": 1.4518, "step": 27709 }, { "epoch": 2.18, "learning_rate": 5.19459354367307e-05, "loss": 1.5232, "step": 27710 }, { "epoch": 2.18, "learning_rate": 5.193658244088658e-05, "loss": 1.4425, "step": 27711 }, { "epoch": 2.18, "learning_rate": 5.1927230110838884e-05, "loss": 1.4312, "step": 27712 }, { "epoch": 2.18, "learning_rate": 5.191787844665124e-05, "loss": 1.4901, "step": 27713 }, { "epoch": 2.18, "learning_rate": 5.1908527448387075e-05, "loss": 1.4617, "step": 27714 }, { "epoch": 2.18, "learning_rate": 5.189917711610988e-05, "loss": 1.4726, "step": 27715 }, { "epoch": 2.18, "learning_rate": 5.188982744988303e-05, "loss": 1.452, "step": 27716 }, { "epoch": 2.18, "learning_rate": 5.18804784497702e-05, "loss": 1.4279, "step": 27717 }, { "epoch": 2.18, "learning_rate": 5.187113011583479e-05, "loss": 1.4469, "step": 27718 }, { "epoch": 2.18, "learning_rate": 5.1861782448140246e-05, "loss": 1.4399, "step": 27719 }, { "epoch": 2.18, "learning_rate": 5.185243544675e-05, "loss": 1.4738, "step": 27720 }, { "epoch": 2.18, "learning_rate": 5.18430891117276e-05, "loss": 1.4296, "step": 27721 }, { "epoch": 2.18, "learning_rate": 5.1833743443136456e-05, "loss": 1.4516, "step": 27722 }, { "epoch": 2.18, "learning_rate": 5.182439844103997e-05, "loss": 1.4424, "step": 27723 }, { "epoch": 2.18, "learning_rate": 5.18150541055017e-05, "loss": 1.4667, "step": 27724 }, { "epoch": 2.18, "learning_rate": 5.180571043658501e-05, "loss": 1.4443, "step": 27725 }, { "epoch": 2.18, "learning_rate": 5.179636743435332e-05, "loss": 1.4871, "step": 27726 }, { "epoch": 2.18, "learning_rate": 5.1787025098870164e-05, "loss": 1.5139, "step": 27727 }, { "epoch": 2.18, "learning_rate": 5.177768343019888e-05, "loss": 1.4379, "step": 27728 }, { "epoch": 2.18, "learning_rate": 5.176834242840291e-05, "loss": 1.4596, "step": 27729 }, { "epoch": 2.18, "learning_rate": 5.1759002093545705e-05, "loss": 1.4512, "step": 27730 }, { "epoch": 2.18, "learning_rate": 5.174966242569062e-05, "loss": 1.4246, "step": 27731 }, { "epoch": 2.18, "learning_rate": 5.174032342490117e-05, "loss": 1.4788, "step": 27732 }, { "epoch": 2.18, "learning_rate": 5.173098509124064e-05, "loss": 1.4471, "step": 27733 }, { "epoch": 2.18, "learning_rate": 5.172164742477255e-05, "loss": 1.4302, "step": 27734 }, { "epoch": 2.18, "learning_rate": 5.171231042556023e-05, "loss": 1.447, "step": 27735 }, { "epoch": 2.18, "learning_rate": 5.170297409366709e-05, "loss": 1.4785, "step": 27736 }, { "epoch": 2.18, "learning_rate": 5.169363842915644e-05, "loss": 1.4824, "step": 27737 }, { "epoch": 2.18, "learning_rate": 5.168430343209181e-05, "loss": 1.469, "step": 27738 }, { "epoch": 2.18, "learning_rate": 5.1674969102536494e-05, "loss": 1.4546, "step": 27739 }, { "epoch": 2.18, "learning_rate": 5.166563544055383e-05, "loss": 1.4133, "step": 27740 }, { "epoch": 2.18, "learning_rate": 5.165630244620729e-05, "loss": 1.4716, "step": 27741 }, { "epoch": 2.18, "learning_rate": 5.164697011956018e-05, "loss": 1.4701, "step": 27742 }, { "epoch": 2.18, "learning_rate": 5.1637638460675815e-05, "loss": 1.4541, "step": 27743 }, { "epoch": 2.18, "learning_rate": 5.162830746961766e-05, "loss": 1.4438, "step": 27744 }, { "epoch": 2.18, "learning_rate": 5.1618977146449e-05, "loss": 1.5184, "step": 27745 }, { "epoch": 2.18, "learning_rate": 5.160964749123316e-05, "loss": 1.4985, "step": 27746 }, { "epoch": 2.18, "learning_rate": 5.1600318504033505e-05, "loss": 1.3676, "step": 27747 }, { "epoch": 2.18, "learning_rate": 5.159099018491344e-05, "loss": 1.4896, "step": 27748 }, { "epoch": 2.18, "learning_rate": 5.158166253393625e-05, "loss": 1.4644, "step": 27749 }, { "epoch": 2.18, "learning_rate": 5.157233555116521e-05, "loss": 1.4595, "step": 27750 }, { "epoch": 2.18, "learning_rate": 5.1563009236663735e-05, "loss": 1.4255, "step": 27751 }, { "epoch": 2.18, "learning_rate": 5.155368359049511e-05, "loss": 1.4832, "step": 27752 }, { "epoch": 2.18, "learning_rate": 5.154435861272264e-05, "loss": 1.4875, "step": 27753 }, { "epoch": 2.18, "learning_rate": 5.1535034303409614e-05, "loss": 1.4609, "step": 27754 }, { "epoch": 2.18, "learning_rate": 5.15257106626194e-05, "loss": 1.4728, "step": 27755 }, { "epoch": 2.18, "learning_rate": 5.151638769041526e-05, "loss": 1.4643, "step": 27756 }, { "epoch": 2.18, "learning_rate": 5.150706538686048e-05, "loss": 1.4467, "step": 27757 }, { "epoch": 2.18, "learning_rate": 5.1497743752018386e-05, "loss": 1.4376, "step": 27758 }, { "epoch": 2.18, "learning_rate": 5.148842278595229e-05, "loss": 1.399, "step": 27759 }, { "epoch": 2.18, "learning_rate": 5.147910248872535e-05, "loss": 1.4039, "step": 27760 }, { "epoch": 2.18, "learning_rate": 5.146978286040102e-05, "loss": 1.4623, "step": 27761 }, { "epoch": 2.18, "learning_rate": 5.1460463901042484e-05, "loss": 1.4046, "step": 27762 }, { "epoch": 2.18, "learning_rate": 5.145114561071295e-05, "loss": 1.4393, "step": 27763 }, { "epoch": 2.18, "learning_rate": 5.144182798947578e-05, "loss": 1.5334, "step": 27764 }, { "epoch": 2.18, "learning_rate": 5.1432511037394244e-05, "loss": 1.4064, "step": 27765 }, { "epoch": 2.18, "learning_rate": 5.1423194754531565e-05, "loss": 1.4187, "step": 27766 }, { "epoch": 2.18, "learning_rate": 5.141387914095095e-05, "loss": 1.4536, "step": 27767 }, { "epoch": 2.18, "learning_rate": 5.140456419671574e-05, "loss": 1.4904, "step": 27768 }, { "epoch": 2.18, "learning_rate": 5.139524992188913e-05, "loss": 1.4809, "step": 27769 }, { "epoch": 2.18, "learning_rate": 5.1385936316534305e-05, "loss": 1.4276, "step": 27770 }, { "epoch": 2.19, "learning_rate": 5.1376623380714606e-05, "loss": 1.4188, "step": 27771 }, { "epoch": 2.19, "learning_rate": 5.1367311114493195e-05, "loss": 1.4623, "step": 27772 }, { "epoch": 2.19, "learning_rate": 5.1357999517933335e-05, "loss": 1.4744, "step": 27773 }, { "epoch": 2.19, "learning_rate": 5.1348688591098147e-05, "loss": 1.4458, "step": 27774 }, { "epoch": 2.19, "learning_rate": 5.1339378334051e-05, "loss": 1.4368, "step": 27775 }, { "epoch": 2.19, "learning_rate": 5.1330068746855015e-05, "loss": 1.4673, "step": 27776 }, { "epoch": 2.19, "learning_rate": 5.132075982957337e-05, "loss": 1.4096, "step": 27777 }, { "epoch": 2.19, "learning_rate": 5.1311451582269344e-05, "loss": 1.4511, "step": 27778 }, { "epoch": 2.19, "learning_rate": 5.130214400500606e-05, "loss": 1.4302, "step": 27779 }, { "epoch": 2.19, "learning_rate": 5.129283709784681e-05, "loss": 1.4507, "step": 27780 }, { "epoch": 2.19, "learning_rate": 5.1283530860854655e-05, "loss": 1.4633, "step": 27781 }, { "epoch": 2.19, "learning_rate": 5.127422529409292e-05, "loss": 1.4984, "step": 27782 }, { "epoch": 2.19, "learning_rate": 5.12649203976247e-05, "loss": 1.3867, "step": 27783 }, { "epoch": 2.19, "learning_rate": 5.125561617151314e-05, "loss": 1.507, "step": 27784 }, { "epoch": 2.19, "learning_rate": 5.124631261582152e-05, "loss": 1.494, "step": 27785 }, { "epoch": 2.19, "learning_rate": 5.123700973061291e-05, "loss": 1.4224, "step": 27786 }, { "epoch": 2.19, "learning_rate": 5.122770751595047e-05, "loss": 1.4046, "step": 27787 }, { "epoch": 2.19, "learning_rate": 5.121840597189743e-05, "loss": 1.4673, "step": 27788 }, { "epoch": 2.19, "learning_rate": 5.1209105098516916e-05, "loss": 1.4744, "step": 27789 }, { "epoch": 2.19, "learning_rate": 5.119980489587205e-05, "loss": 1.4598, "step": 27790 }, { "epoch": 2.19, "learning_rate": 5.1190505364025946e-05, "loss": 1.4553, "step": 27791 }, { "epoch": 2.19, "learning_rate": 5.118120650304183e-05, "loss": 1.5134, "step": 27792 }, { "epoch": 2.19, "learning_rate": 5.117190831298277e-05, "loss": 1.4295, "step": 27793 }, { "epoch": 2.19, "learning_rate": 5.1162610793911884e-05, "loss": 1.4362, "step": 27794 }, { "epoch": 2.19, "learning_rate": 5.115331394589233e-05, "loss": 1.4445, "step": 27795 }, { "epoch": 2.19, "learning_rate": 5.114401776898727e-05, "loss": 1.4254, "step": 27796 }, { "epoch": 2.19, "learning_rate": 5.113472226325977e-05, "loss": 1.4709, "step": 27797 }, { "epoch": 2.19, "learning_rate": 5.11254274287729e-05, "loss": 1.4383, "step": 27798 }, { "epoch": 2.19, "learning_rate": 5.1116133265589864e-05, "loss": 1.4875, "step": 27799 }, { "epoch": 2.19, "learning_rate": 5.110683977377372e-05, "loss": 1.4018, "step": 27800 }, { "epoch": 2.19, "learning_rate": 5.109754695338751e-05, "loss": 1.5055, "step": 27801 }, { "epoch": 2.19, "learning_rate": 5.108825480449442e-05, "loss": 1.4028, "step": 27802 }, { "epoch": 2.19, "learning_rate": 5.107896332715751e-05, "loss": 1.4849, "step": 27803 }, { "epoch": 2.19, "learning_rate": 5.10696725214398e-05, "loss": 1.4359, "step": 27804 }, { "epoch": 2.19, "learning_rate": 5.106038238740446e-05, "loss": 1.4408, "step": 27805 }, { "epoch": 2.19, "learning_rate": 5.105109292511451e-05, "loss": 1.464, "step": 27806 }, { "epoch": 2.19, "learning_rate": 5.1041804134633055e-05, "loss": 1.4176, "step": 27807 }, { "epoch": 2.19, "learning_rate": 5.103251601602308e-05, "loss": 1.489, "step": 27808 }, { "epoch": 2.19, "learning_rate": 5.102322856934777e-05, "loss": 1.4677, "step": 27809 }, { "epoch": 2.19, "learning_rate": 5.1013941794670063e-05, "loss": 1.4712, "step": 27810 }, { "epoch": 2.19, "learning_rate": 5.100465569205306e-05, "loss": 1.4269, "step": 27811 }, { "epoch": 2.19, "learning_rate": 5.099537026155985e-05, "loss": 1.418, "step": 27812 }, { "epoch": 2.19, "learning_rate": 5.098608550325346e-05, "loss": 1.472, "step": 27813 }, { "epoch": 2.19, "learning_rate": 5.097680141719692e-05, "loss": 1.4933, "step": 27814 }, { "epoch": 2.19, "learning_rate": 5.096751800345319e-05, "loss": 1.431, "step": 27815 }, { "epoch": 2.19, "learning_rate": 5.095823526208541e-05, "loss": 1.4859, "step": 27816 }, { "epoch": 2.19, "learning_rate": 5.0948953193156554e-05, "loss": 1.4167, "step": 27817 }, { "epoch": 2.19, "learning_rate": 5.09396717967296e-05, "loss": 1.4347, "step": 27818 }, { "epoch": 2.19, "learning_rate": 5.0930391072867654e-05, "loss": 1.4064, "step": 27819 }, { "epoch": 2.19, "learning_rate": 5.0921111021633695e-05, "loss": 1.4878, "step": 27820 }, { "epoch": 2.19, "learning_rate": 5.091183164309065e-05, "loss": 1.4083, "step": 27821 }, { "epoch": 2.19, "learning_rate": 5.0902552937301646e-05, "loss": 1.4486, "step": 27822 }, { "epoch": 2.19, "learning_rate": 5.089327490432961e-05, "loss": 1.4661, "step": 27823 }, { "epoch": 2.19, "learning_rate": 5.08839975442375e-05, "loss": 1.4436, "step": 27824 }, { "epoch": 2.19, "learning_rate": 5.087472085708842e-05, "loss": 1.4709, "step": 27825 }, { "epoch": 2.19, "learning_rate": 5.08654448429452e-05, "loss": 1.4499, "step": 27826 }, { "epoch": 2.19, "learning_rate": 5.085616950187098e-05, "loss": 1.4325, "step": 27827 }, { "epoch": 2.19, "learning_rate": 5.08468948339286e-05, "loss": 1.4007, "step": 27828 }, { "epoch": 2.19, "learning_rate": 5.083762083918114e-05, "loss": 1.4655, "step": 27829 }, { "epoch": 2.19, "learning_rate": 5.0828347517691505e-05, "loss": 1.4389, "step": 27830 }, { "epoch": 2.19, "learning_rate": 5.081907486952265e-05, "loss": 1.4688, "step": 27831 }, { "epoch": 2.19, "learning_rate": 5.080980289473752e-05, "loss": 1.4344, "step": 27832 }, { "epoch": 2.19, "learning_rate": 5.080053159339911e-05, "loss": 1.446, "step": 27833 }, { "epoch": 2.19, "learning_rate": 5.079126096557038e-05, "loss": 1.4709, "step": 27834 }, { "epoch": 2.19, "learning_rate": 5.078199101131416e-05, "loss": 1.4605, "step": 27835 }, { "epoch": 2.19, "learning_rate": 5.0772721730693555e-05, "loss": 1.4707, "step": 27836 }, { "epoch": 2.19, "learning_rate": 5.0763453123771376e-05, "loss": 1.5137, "step": 27837 }, { "epoch": 2.19, "learning_rate": 5.075418519061056e-05, "loss": 1.458, "step": 27838 }, { "epoch": 2.19, "learning_rate": 5.07449179312741e-05, "loss": 1.479, "step": 27839 }, { "epoch": 2.19, "learning_rate": 5.073565134582488e-05, "loss": 1.4208, "step": 27840 }, { "epoch": 2.19, "learning_rate": 5.072638543432575e-05, "loss": 1.4854, "step": 27841 }, { "epoch": 2.19, "learning_rate": 5.071712019683969e-05, "loss": 1.4285, "step": 27842 }, { "epoch": 2.19, "learning_rate": 5.070785563342963e-05, "loss": 1.435, "step": 27843 }, { "epoch": 2.19, "learning_rate": 5.0698591744158436e-05, "loss": 1.4455, "step": 27844 }, { "epoch": 2.19, "learning_rate": 5.0689328529088965e-05, "loss": 1.4568, "step": 27845 }, { "epoch": 2.19, "learning_rate": 5.0680065988284196e-05, "loss": 1.4387, "step": 27846 }, { "epoch": 2.19, "learning_rate": 5.067080412180697e-05, "loss": 1.4497, "step": 27847 }, { "epoch": 2.19, "learning_rate": 5.0661542929720166e-05, "loss": 1.4513, "step": 27848 }, { "epoch": 2.19, "learning_rate": 5.0652282412086625e-05, "loss": 1.4392, "step": 27849 }, { "epoch": 2.19, "learning_rate": 5.064302256896929e-05, "loss": 1.5183, "step": 27850 }, { "epoch": 2.19, "learning_rate": 5.063376340043102e-05, "loss": 1.3761, "step": 27851 }, { "epoch": 2.19, "learning_rate": 5.062450490653463e-05, "loss": 1.4755, "step": 27852 }, { "epoch": 2.19, "learning_rate": 5.0615247087343034e-05, "loss": 1.4388, "step": 27853 }, { "epoch": 2.19, "learning_rate": 5.0605989942919075e-05, "loss": 1.443, "step": 27854 }, { "epoch": 2.19, "learning_rate": 5.0596733473325534e-05, "loss": 1.4785, "step": 27855 }, { "epoch": 2.19, "learning_rate": 5.058747767862537e-05, "loss": 1.4355, "step": 27856 }, { "epoch": 2.19, "learning_rate": 5.0578222558881334e-05, "loss": 1.4392, "step": 27857 }, { "epoch": 2.19, "learning_rate": 5.056896811415635e-05, "loss": 1.4313, "step": 27858 }, { "epoch": 2.19, "learning_rate": 5.055971434451314e-05, "loss": 1.3836, "step": 27859 }, { "epoch": 2.19, "learning_rate": 5.055046125001466e-05, "loss": 1.4552, "step": 27860 }, { "epoch": 2.19, "learning_rate": 5.0541208830723645e-05, "loss": 1.4141, "step": 27861 }, { "epoch": 2.19, "learning_rate": 5.053195708670291e-05, "loss": 1.4257, "step": 27862 }, { "epoch": 2.19, "learning_rate": 5.0522706018015327e-05, "loss": 1.4328, "step": 27863 }, { "epoch": 2.19, "learning_rate": 5.051345562472368e-05, "loss": 1.3691, "step": 27864 }, { "epoch": 2.19, "learning_rate": 5.050420590689078e-05, "loss": 1.5239, "step": 27865 }, { "epoch": 2.19, "learning_rate": 5.0494956864579346e-05, "loss": 1.4071, "step": 27866 }, { "epoch": 2.19, "learning_rate": 5.04857084978523e-05, "loss": 1.4928, "step": 27867 }, { "epoch": 2.19, "learning_rate": 5.0476460806772395e-05, "loss": 1.4379, "step": 27868 }, { "epoch": 2.19, "learning_rate": 5.046721379140233e-05, "loss": 1.4247, "step": 27869 }, { "epoch": 2.19, "learning_rate": 5.0457967451805016e-05, "loss": 1.4525, "step": 27870 }, { "epoch": 2.19, "learning_rate": 5.0448721788043155e-05, "loss": 1.4298, "step": 27871 }, { "epoch": 2.19, "learning_rate": 5.04394768001795e-05, "loss": 1.4565, "step": 27872 }, { "epoch": 2.19, "learning_rate": 5.043023248827685e-05, "loss": 1.4714, "step": 27873 }, { "epoch": 2.19, "learning_rate": 5.042098885239804e-05, "loss": 1.4496, "step": 27874 }, { "epoch": 2.19, "learning_rate": 5.0411745892605746e-05, "loss": 1.4032, "step": 27875 }, { "epoch": 2.19, "learning_rate": 5.040250360896269e-05, "loss": 1.4723, "step": 27876 }, { "epoch": 2.19, "learning_rate": 5.0393262001531734e-05, "loss": 1.4765, "step": 27877 }, { "epoch": 2.19, "learning_rate": 5.0384021070375544e-05, "loss": 1.4756, "step": 27878 }, { "epoch": 2.19, "learning_rate": 5.037478081555683e-05, "loss": 1.4415, "step": 27879 }, { "epoch": 2.19, "learning_rate": 5.036554123713844e-05, "loss": 1.3896, "step": 27880 }, { "epoch": 2.19, "learning_rate": 5.035630233518304e-05, "loss": 1.4712, "step": 27881 }, { "epoch": 2.19, "learning_rate": 5.03470641097533e-05, "loss": 1.4, "step": 27882 }, { "epoch": 2.19, "learning_rate": 5.033782656091206e-05, "loss": 1.5031, "step": 27883 }, { "epoch": 2.19, "learning_rate": 5.032858968872199e-05, "loss": 1.4282, "step": 27884 }, { "epoch": 2.19, "learning_rate": 5.031935349324577e-05, "loss": 1.4457, "step": 27885 }, { "epoch": 2.19, "learning_rate": 5.03101179745461e-05, "loss": 1.4613, "step": 27886 }, { "epoch": 2.19, "learning_rate": 5.030088313268575e-05, "loss": 1.4634, "step": 27887 }, { "epoch": 2.19, "learning_rate": 5.029164896772738e-05, "loss": 1.4419, "step": 27888 }, { "epoch": 2.19, "learning_rate": 5.028241547973367e-05, "loss": 1.4775, "step": 27889 }, { "epoch": 2.19, "learning_rate": 5.0273182668767304e-05, "loss": 1.4336, "step": 27890 }, { "epoch": 2.19, "learning_rate": 5.0263950534891055e-05, "loss": 1.4292, "step": 27891 }, { "epoch": 2.19, "learning_rate": 5.0254719078167545e-05, "loss": 1.4602, "step": 27892 }, { "epoch": 2.19, "learning_rate": 5.024548829865938e-05, "loss": 1.373, "step": 27893 }, { "epoch": 2.19, "learning_rate": 5.023625819642937e-05, "loss": 1.4195, "step": 27894 }, { "epoch": 2.19, "learning_rate": 5.022702877154011e-05, "loss": 1.4833, "step": 27895 }, { "epoch": 2.19, "learning_rate": 5.021780002405421e-05, "loss": 1.4985, "step": 27896 }, { "epoch": 2.19, "learning_rate": 5.020857195403443e-05, "loss": 1.458, "step": 27897 }, { "epoch": 2.2, "learning_rate": 5.0199344561543385e-05, "loss": 1.4595, "step": 27898 }, { "epoch": 2.2, "learning_rate": 5.019011784664366e-05, "loss": 1.4585, "step": 27899 }, { "epoch": 2.2, "learning_rate": 5.018089180939801e-05, "loss": 1.4827, "step": 27900 }, { "epoch": 2.2, "learning_rate": 5.017166644986902e-05, "loss": 1.4556, "step": 27901 }, { "epoch": 2.2, "learning_rate": 5.016244176811932e-05, "loss": 1.4789, "step": 27902 }, { "epoch": 2.2, "learning_rate": 5.01532177642115e-05, "loss": 1.3989, "step": 27903 }, { "epoch": 2.2, "learning_rate": 5.0143994438208236e-05, "loss": 1.4385, "step": 27904 }, { "epoch": 2.2, "learning_rate": 5.013477179017218e-05, "loss": 1.4706, "step": 27905 }, { "epoch": 2.2, "learning_rate": 5.0125549820165916e-05, "loss": 1.4706, "step": 27906 }, { "epoch": 2.2, "learning_rate": 5.011632852825201e-05, "loss": 1.4772, "step": 27907 }, { "epoch": 2.2, "learning_rate": 5.010710791449318e-05, "loss": 1.4653, "step": 27908 }, { "epoch": 2.2, "learning_rate": 5.009788797895194e-05, "loss": 1.4883, "step": 27909 }, { "epoch": 2.2, "learning_rate": 5.008866872169087e-05, "loss": 1.4753, "step": 27910 }, { "epoch": 2.2, "learning_rate": 5.0079450142772645e-05, "loss": 1.4263, "step": 27911 }, { "epoch": 2.2, "learning_rate": 5.00702322422598e-05, "loss": 1.3759, "step": 27912 }, { "epoch": 2.2, "learning_rate": 5.0061015020214904e-05, "loss": 1.5047, "step": 27913 }, { "epoch": 2.2, "learning_rate": 5.005179847670061e-05, "loss": 1.4721, "step": 27914 }, { "epoch": 2.2, "learning_rate": 5.0042582611779445e-05, "loss": 1.477, "step": 27915 }, { "epoch": 2.2, "learning_rate": 5.003336742551393e-05, "loss": 1.457, "step": 27916 }, { "epoch": 2.2, "learning_rate": 5.002415291796675e-05, "loss": 1.4027, "step": 27917 }, { "epoch": 2.2, "learning_rate": 5.00149390892004e-05, "loss": 1.4846, "step": 27918 }, { "epoch": 2.2, "learning_rate": 5.0005725939277407e-05, "loss": 1.5141, "step": 27919 }, { "epoch": 2.2, "learning_rate": 4.999651346826029e-05, "loss": 1.4485, "step": 27920 }, { "epoch": 2.2, "learning_rate": 4.998730167621173e-05, "loss": 1.5029, "step": 27921 }, { "epoch": 2.2, "learning_rate": 4.997809056319422e-05, "loss": 1.4695, "step": 27922 }, { "epoch": 2.2, "learning_rate": 4.9968880129270225e-05, "loss": 1.4936, "step": 27923 }, { "epoch": 2.2, "learning_rate": 4.995967037450238e-05, "loss": 1.416, "step": 27924 }, { "epoch": 2.2, "learning_rate": 4.995046129895316e-05, "loss": 1.4916, "step": 27925 }, { "epoch": 2.2, "learning_rate": 4.994125290268511e-05, "loss": 1.515, "step": 27926 }, { "epoch": 2.2, "learning_rate": 4.9932045185760673e-05, "loss": 1.4071, "step": 27927 }, { "epoch": 2.2, "learning_rate": 4.992283814824248e-05, "loss": 1.4286, "step": 27928 }, { "epoch": 2.2, "learning_rate": 4.991363179019299e-05, "loss": 1.4352, "step": 27929 }, { "epoch": 2.2, "learning_rate": 4.990442611167465e-05, "loss": 1.5264, "step": 27930 }, { "epoch": 2.2, "learning_rate": 4.989522111275009e-05, "loss": 1.4908, "step": 27931 }, { "epoch": 2.2, "learning_rate": 4.988601679348173e-05, "loss": 1.4235, "step": 27932 }, { "epoch": 2.2, "learning_rate": 4.9876813153931994e-05, "loss": 1.4379, "step": 27933 }, { "epoch": 2.2, "learning_rate": 4.9867610194163524e-05, "loss": 1.5151, "step": 27934 }, { "epoch": 2.2, "learning_rate": 4.9858407914238706e-05, "loss": 1.4836, "step": 27935 }, { "epoch": 2.2, "learning_rate": 4.9849206314219984e-05, "loss": 1.4528, "step": 27936 }, { "epoch": 2.2, "learning_rate": 4.9840005394169897e-05, "loss": 1.461, "step": 27937 }, { "epoch": 2.2, "learning_rate": 4.9830805154150955e-05, "loss": 1.4215, "step": 27938 }, { "epoch": 2.2, "learning_rate": 4.982160559422555e-05, "loss": 1.47, "step": 27939 }, { "epoch": 2.2, "learning_rate": 4.981240671445612e-05, "loss": 1.4645, "step": 27940 }, { "epoch": 2.2, "learning_rate": 4.98032085149052e-05, "loss": 1.4642, "step": 27941 }, { "epoch": 2.2, "learning_rate": 4.979401099563522e-05, "loss": 1.4667, "step": 27942 }, { "epoch": 2.2, "learning_rate": 4.9784814156708586e-05, "loss": 1.4493, "step": 27943 }, { "epoch": 2.2, "learning_rate": 4.9775617998187716e-05, "loss": 1.4741, "step": 27944 }, { "epoch": 2.2, "learning_rate": 4.976642252013515e-05, "loss": 1.4536, "step": 27945 }, { "epoch": 2.2, "learning_rate": 4.975722772261326e-05, "loss": 1.4898, "step": 27946 }, { "epoch": 2.2, "learning_rate": 4.9748033605684416e-05, "loss": 1.3754, "step": 27947 }, { "epoch": 2.2, "learning_rate": 4.973884016941116e-05, "loss": 1.4409, "step": 27948 }, { "epoch": 2.2, "learning_rate": 4.972964741385585e-05, "loss": 1.4417, "step": 27949 }, { "epoch": 2.2, "learning_rate": 4.972045533908086e-05, "loss": 1.4638, "step": 27950 }, { "epoch": 2.2, "learning_rate": 4.971126394514861e-05, "loss": 1.4803, "step": 27951 }, { "epoch": 2.2, "learning_rate": 4.970207323212161e-05, "loss": 1.4429, "step": 27952 }, { "epoch": 2.2, "learning_rate": 4.969288320006217e-05, "loss": 1.5004, "step": 27953 }, { "epoch": 2.2, "learning_rate": 4.968369384903265e-05, "loss": 1.4608, "step": 27954 }, { "epoch": 2.2, "learning_rate": 4.9674505179095556e-05, "loss": 1.45, "step": 27955 }, { "epoch": 2.2, "learning_rate": 4.9665317190313186e-05, "loss": 1.4734, "step": 27956 }, { "epoch": 2.2, "learning_rate": 4.96561298827479e-05, "loss": 1.4909, "step": 27957 }, { "epoch": 2.2, "learning_rate": 4.964694325646217e-05, "loss": 1.4622, "step": 27958 }, { "epoch": 2.2, "learning_rate": 4.963775731151832e-05, "loss": 1.4851, "step": 27959 }, { "epoch": 2.2, "learning_rate": 4.9628572047978715e-05, "loss": 1.4281, "step": 27960 }, { "epoch": 2.2, "learning_rate": 4.961938746590565e-05, "loss": 1.4883, "step": 27961 }, { "epoch": 2.2, "learning_rate": 4.961020356536161e-05, "loss": 1.4298, "step": 27962 }, { "epoch": 2.2, "learning_rate": 4.960102034640889e-05, "loss": 1.4756, "step": 27963 }, { "epoch": 2.2, "learning_rate": 4.9591837809109794e-05, "loss": 1.5244, "step": 27964 }, { "epoch": 2.2, "learning_rate": 4.958265595352674e-05, "loss": 1.4688, "step": 27965 }, { "epoch": 2.2, "learning_rate": 4.9573474779722056e-05, "loss": 1.4641, "step": 27966 }, { "epoch": 2.2, "learning_rate": 4.956429428775799e-05, "loss": 1.4226, "step": 27967 }, { "epoch": 2.2, "learning_rate": 4.955511447769696e-05, "loss": 1.4619, "step": 27968 }, { "epoch": 2.2, "learning_rate": 4.954593534960131e-05, "loss": 1.4902, "step": 27969 }, { "epoch": 2.2, "learning_rate": 4.953675690353333e-05, "loss": 1.4607, "step": 27970 }, { "epoch": 2.2, "learning_rate": 4.952757913955528e-05, "loss": 1.4146, "step": 27971 }, { "epoch": 2.2, "learning_rate": 4.951840205772957e-05, "loss": 1.4271, "step": 27972 }, { "epoch": 2.2, "learning_rate": 4.9509225658118456e-05, "loss": 1.4947, "step": 27973 }, { "epoch": 2.2, "learning_rate": 4.95000499407842e-05, "loss": 1.4699, "step": 27974 }, { "epoch": 2.2, "learning_rate": 4.949087490578919e-05, "loss": 1.4431, "step": 27975 }, { "epoch": 2.2, "learning_rate": 4.948170055319567e-05, "loss": 1.4664, "step": 27976 }, { "epoch": 2.2, "learning_rate": 4.947252688306595e-05, "loss": 1.474, "step": 27977 }, { "epoch": 2.2, "learning_rate": 4.9463353895462235e-05, "loss": 1.4223, "step": 27978 }, { "epoch": 2.2, "learning_rate": 4.9454181590446914e-05, "loss": 1.5026, "step": 27979 }, { "epoch": 2.2, "learning_rate": 4.944500996808222e-05, "loss": 1.4591, "step": 27980 }, { "epoch": 2.2, "learning_rate": 4.943583902843036e-05, "loss": 1.4784, "step": 27981 }, { "epoch": 2.2, "learning_rate": 4.9426668771553704e-05, "loss": 1.4172, "step": 27982 }, { "epoch": 2.2, "learning_rate": 4.941749919751444e-05, "loss": 1.4211, "step": 27983 }, { "epoch": 2.2, "learning_rate": 4.9408330306374874e-05, "loss": 1.4409, "step": 27984 }, { "epoch": 2.2, "learning_rate": 4.939916209819719e-05, "loss": 1.4276, "step": 27985 }, { "epoch": 2.2, "learning_rate": 4.938999457304375e-05, "loss": 1.3878, "step": 27986 }, { "epoch": 2.2, "learning_rate": 4.9380827730976695e-05, "loss": 1.4321, "step": 27987 }, { "epoch": 2.2, "learning_rate": 4.9371661572058263e-05, "loss": 1.4748, "step": 27988 }, { "epoch": 2.2, "learning_rate": 4.9362496096350766e-05, "loss": 1.4177, "step": 27989 }, { "epoch": 2.2, "learning_rate": 4.9353331303916376e-05, "loss": 1.4492, "step": 27990 }, { "epoch": 2.2, "learning_rate": 4.934416719481729e-05, "loss": 1.4296, "step": 27991 }, { "epoch": 2.2, "learning_rate": 4.933500376911579e-05, "loss": 1.455, "step": 27992 }, { "epoch": 2.2, "learning_rate": 4.9325841026874085e-05, "loss": 1.4902, "step": 27993 }, { "epoch": 2.2, "learning_rate": 4.9316678968154296e-05, "loss": 1.4936, "step": 27994 }, { "epoch": 2.2, "learning_rate": 4.930751759301875e-05, "loss": 1.4709, "step": 27995 }, { "epoch": 2.2, "learning_rate": 4.929835690152959e-05, "loss": 1.4598, "step": 27996 }, { "epoch": 2.2, "learning_rate": 4.928919689374903e-05, "loss": 1.5004, "step": 27997 }, { "epoch": 2.2, "learning_rate": 4.9280037569739186e-05, "loss": 1.4492, "step": 27998 }, { "epoch": 2.2, "learning_rate": 4.927087892956231e-05, "loss": 1.4401, "step": 27999 }, { "epoch": 2.2, "learning_rate": 4.926172097328062e-05, "loss": 1.4432, "step": 28000 }, { "epoch": 2.2, "learning_rate": 4.925256370095626e-05, "loss": 1.4244, "step": 28001 }, { "epoch": 2.2, "learning_rate": 4.9243407112651346e-05, "loss": 1.4528, "step": 28002 }, { "epoch": 2.2, "learning_rate": 4.923425120842814e-05, "loss": 1.4602, "step": 28003 }, { "epoch": 2.2, "learning_rate": 4.922509598834876e-05, "loss": 1.4916, "step": 28004 }, { "epoch": 2.2, "learning_rate": 4.9215941452475313e-05, "loss": 1.4671, "step": 28005 }, { "epoch": 2.2, "learning_rate": 4.920678760087007e-05, "loss": 1.465, "step": 28006 }, { "epoch": 2.2, "learning_rate": 4.919763443359511e-05, "loss": 1.4664, "step": 28007 }, { "epoch": 2.2, "learning_rate": 4.918848195071253e-05, "loss": 1.482, "step": 28008 }, { "epoch": 2.2, "learning_rate": 4.917933015228458e-05, "loss": 1.4122, "step": 28009 }, { "epoch": 2.2, "learning_rate": 4.917017903837334e-05, "loss": 1.4794, "step": 28010 }, { "epoch": 2.2, "learning_rate": 4.916102860904089e-05, "loss": 1.4807, "step": 28011 }, { "epoch": 2.2, "learning_rate": 4.9151878864349464e-05, "loss": 1.4032, "step": 28012 }, { "epoch": 2.2, "learning_rate": 4.914272980436112e-05, "loss": 1.4704, "step": 28013 }, { "epoch": 2.2, "learning_rate": 4.9133581429137935e-05, "loss": 1.4318, "step": 28014 }, { "epoch": 2.2, "learning_rate": 4.912443373874208e-05, "loss": 1.4459, "step": 28015 }, { "epoch": 2.2, "learning_rate": 4.9115286733235686e-05, "loss": 1.5126, "step": 28016 }, { "epoch": 2.2, "learning_rate": 4.910614041268084e-05, "loss": 1.461, "step": 28017 }, { "epoch": 2.2, "learning_rate": 4.90969947771396e-05, "loss": 1.4801, "step": 28018 }, { "epoch": 2.2, "learning_rate": 4.9087849826674045e-05, "loss": 1.4356, "step": 28019 }, { "epoch": 2.2, "learning_rate": 4.9078705561346354e-05, "loss": 1.453, "step": 28020 }, { "epoch": 2.2, "learning_rate": 4.906956198121856e-05, "loss": 1.4619, "step": 28021 }, { "epoch": 2.2, "learning_rate": 4.906041908635269e-05, "loss": 1.4329, "step": 28022 }, { "epoch": 2.2, "learning_rate": 4.905127687681092e-05, "loss": 1.4675, "step": 28023 }, { "epoch": 2.2, "learning_rate": 4.904213535265527e-05, "loss": 1.5015, "step": 28024 }, { "epoch": 2.21, "learning_rate": 4.9032994513947764e-05, "loss": 1.4516, "step": 28025 }, { "epoch": 2.21, "learning_rate": 4.902385436075056e-05, "loss": 1.472, "step": 28026 }, { "epoch": 2.21, "learning_rate": 4.901471489312565e-05, "loss": 1.4907, "step": 28027 }, { "epoch": 2.21, "learning_rate": 4.900557611113506e-05, "loss": 1.4626, "step": 28028 }, { "epoch": 2.21, "learning_rate": 4.899643801484091e-05, "loss": 1.4465, "step": 28029 }, { "epoch": 2.21, "learning_rate": 4.898730060430517e-05, "loss": 1.4587, "step": 28030 }, { "epoch": 2.21, "learning_rate": 4.897816387958995e-05, "loss": 1.4285, "step": 28031 }, { "epoch": 2.21, "learning_rate": 4.8969027840757225e-05, "loss": 1.4247, "step": 28032 }, { "epoch": 2.21, "learning_rate": 4.895989248786907e-05, "loss": 1.4778, "step": 28033 }, { "epoch": 2.21, "learning_rate": 4.89507578209875e-05, "loss": 1.4282, "step": 28034 }, { "epoch": 2.21, "learning_rate": 4.8941623840174476e-05, "loss": 1.4524, "step": 28035 }, { "epoch": 2.21, "learning_rate": 4.893249054549209e-05, "loss": 1.4589, "step": 28036 }, { "epoch": 2.21, "learning_rate": 4.892335793700233e-05, "loss": 1.4198, "step": 28037 }, { "epoch": 2.21, "learning_rate": 4.89142260147672e-05, "loss": 1.5035, "step": 28038 }, { "epoch": 2.21, "learning_rate": 4.890509477884862e-05, "loss": 1.47, "step": 28039 }, { "epoch": 2.21, "learning_rate": 4.8895964229308735e-05, "loss": 1.4139, "step": 28040 }, { "epoch": 2.21, "learning_rate": 4.888683436620944e-05, "loss": 1.4564, "step": 28041 }, { "epoch": 2.21, "learning_rate": 4.887770518961269e-05, "loss": 1.4377, "step": 28042 }, { "epoch": 2.21, "learning_rate": 4.886857669958057e-05, "loss": 1.4134, "step": 28043 }, { "epoch": 2.21, "learning_rate": 4.885944889617502e-05, "loss": 1.4132, "step": 28044 }, { "epoch": 2.21, "learning_rate": 4.8850321779457925e-05, "loss": 1.4254, "step": 28045 }, { "epoch": 2.21, "learning_rate": 4.884119534949135e-05, "loss": 1.4565, "step": 28046 }, { "epoch": 2.21, "learning_rate": 4.883206960633727e-05, "loss": 1.4466, "step": 28047 }, { "epoch": 2.21, "learning_rate": 4.8822944550057616e-05, "loss": 1.4788, "step": 28048 }, { "epoch": 2.21, "learning_rate": 4.881382018071426e-05, "loss": 1.4722, "step": 28049 }, { "epoch": 2.21, "learning_rate": 4.88046964983693e-05, "loss": 1.4285, "step": 28050 }, { "epoch": 2.21, "learning_rate": 4.8795573503084604e-05, "loss": 1.4704, "step": 28051 }, { "epoch": 2.21, "learning_rate": 4.8786451194922065e-05, "loss": 1.4401, "step": 28052 }, { "epoch": 2.21, "learning_rate": 4.877732957394372e-05, "loss": 1.4305, "step": 28053 }, { "epoch": 2.21, "learning_rate": 4.876820864021143e-05, "loss": 1.4731, "step": 28054 }, { "epoch": 2.21, "learning_rate": 4.8759088393787155e-05, "loss": 1.439, "step": 28055 }, { "epoch": 2.21, "learning_rate": 4.874996883473275e-05, "loss": 1.4705, "step": 28056 }, { "epoch": 2.21, "learning_rate": 4.8740849963110234e-05, "loss": 1.4623, "step": 28057 }, { "epoch": 2.21, "learning_rate": 4.873173177898146e-05, "loss": 1.4883, "step": 28058 }, { "epoch": 2.21, "learning_rate": 4.87226142824083e-05, "loss": 1.4432, "step": 28059 }, { "epoch": 2.21, "learning_rate": 4.8713497473452744e-05, "loss": 1.4416, "step": 28060 }, { "epoch": 2.21, "learning_rate": 4.870438135217659e-05, "loss": 1.427, "step": 28061 }, { "epoch": 2.21, "learning_rate": 4.869526591864185e-05, "loss": 1.4412, "step": 28062 }, { "epoch": 2.21, "learning_rate": 4.868615117291029e-05, "loss": 1.459, "step": 28063 }, { "epoch": 2.21, "learning_rate": 4.8677037115043916e-05, "loss": 1.4599, "step": 28064 }, { "epoch": 2.21, "learning_rate": 4.866792374510452e-05, "loss": 1.475, "step": 28065 }, { "epoch": 2.21, "learning_rate": 4.8658811063153976e-05, "loss": 1.4477, "step": 28066 }, { "epoch": 2.21, "learning_rate": 4.864969906925423e-05, "loss": 1.4513, "step": 28067 }, { "epoch": 2.21, "learning_rate": 4.864058776346708e-05, "loss": 1.4903, "step": 28068 }, { "epoch": 2.21, "learning_rate": 4.863147714585437e-05, "loss": 1.5022, "step": 28069 }, { "epoch": 2.21, "learning_rate": 4.862236721647804e-05, "loss": 1.4449, "step": 28070 }, { "epoch": 2.21, "learning_rate": 4.861325797539988e-05, "loss": 1.4877, "step": 28071 }, { "epoch": 2.21, "learning_rate": 4.860414942268176e-05, "loss": 1.4994, "step": 28072 }, { "epoch": 2.21, "learning_rate": 4.8595041558385454e-05, "loss": 1.4703, "step": 28073 }, { "epoch": 2.21, "learning_rate": 4.8585934382572905e-05, "loss": 1.5322, "step": 28074 }, { "epoch": 2.21, "learning_rate": 4.857682789530591e-05, "loss": 1.4338, "step": 28075 }, { "epoch": 2.21, "learning_rate": 4.8567722096646215e-05, "loss": 1.4745, "step": 28076 }, { "epoch": 2.21, "learning_rate": 4.855861698665573e-05, "loss": 1.4234, "step": 28077 }, { "epoch": 2.21, "learning_rate": 4.85495125653963e-05, "loss": 1.4131, "step": 28078 }, { "epoch": 2.21, "learning_rate": 4.854040883292969e-05, "loss": 1.4713, "step": 28079 }, { "epoch": 2.21, "learning_rate": 4.8531305789317655e-05, "loss": 1.4615, "step": 28080 }, { "epoch": 2.21, "learning_rate": 4.852220343462213e-05, "loss": 1.4626, "step": 28081 }, { "epoch": 2.21, "learning_rate": 4.851310176890482e-05, "loss": 1.4903, "step": 28082 }, { "epoch": 2.21, "learning_rate": 4.850400079222751e-05, "loss": 1.4207, "step": 28083 }, { "epoch": 2.21, "learning_rate": 4.8494900504652075e-05, "loss": 1.4972, "step": 28084 }, { "epoch": 2.21, "learning_rate": 4.848580090624025e-05, "loss": 1.4636, "step": 28085 }, { "epoch": 2.21, "learning_rate": 4.8476701997053764e-05, "loss": 1.4347, "step": 28086 }, { "epoch": 2.21, "learning_rate": 4.846760377715449e-05, "loss": 1.449, "step": 28087 }, { "epoch": 2.21, "learning_rate": 4.845850624660416e-05, "loss": 1.4396, "step": 28088 }, { "epoch": 2.21, "learning_rate": 4.8449409405464476e-05, "loss": 1.4563, "step": 28089 }, { "epoch": 2.21, "learning_rate": 4.844031325379734e-05, "loss": 1.4345, "step": 28090 }, { "epoch": 2.21, "learning_rate": 4.8431217791664414e-05, "loss": 1.4713, "step": 28091 }, { "epoch": 2.21, "learning_rate": 4.8422123019127476e-05, "loss": 1.458, "step": 28092 }, { "epoch": 2.21, "learning_rate": 4.841302893624816e-05, "loss": 1.3999, "step": 28093 }, { "epoch": 2.21, "learning_rate": 4.840393554308841e-05, "loss": 1.471, "step": 28094 }, { "epoch": 2.21, "learning_rate": 4.839484283970988e-05, "loss": 1.459, "step": 28095 }, { "epoch": 2.21, "learning_rate": 4.83857508261743e-05, "loss": 1.4403, "step": 28096 }, { "epoch": 2.21, "learning_rate": 4.837665950254335e-05, "loss": 1.4374, "step": 28097 }, { "epoch": 2.21, "learning_rate": 4.836756886887885e-05, "loss": 1.5062, "step": 28098 }, { "epoch": 2.21, "learning_rate": 4.835847892524247e-05, "loss": 1.5252, "step": 28099 }, { "epoch": 2.21, "learning_rate": 4.834938967169587e-05, "loss": 1.4594, "step": 28100 }, { "epoch": 2.21, "learning_rate": 4.834030110830088e-05, "loss": 1.4875, "step": 28101 }, { "epoch": 2.21, "learning_rate": 4.833121323511914e-05, "loss": 1.4216, "step": 28102 }, { "epoch": 2.21, "learning_rate": 4.8322126052212304e-05, "loss": 1.4079, "step": 28103 }, { "epoch": 2.21, "learning_rate": 4.8313039559642166e-05, "loss": 1.4874, "step": 28104 }, { "epoch": 2.21, "learning_rate": 4.8303953757470396e-05, "loss": 1.4428, "step": 28105 }, { "epoch": 2.21, "learning_rate": 4.829486864575859e-05, "loss": 1.5167, "step": 28106 }, { "epoch": 2.21, "learning_rate": 4.828578422456856e-05, "loss": 1.4307, "step": 28107 }, { "epoch": 2.21, "learning_rate": 4.827670049396192e-05, "loss": 1.4553, "step": 28108 }, { "epoch": 2.21, "learning_rate": 4.82676174540003e-05, "loss": 1.4967, "step": 28109 }, { "epoch": 2.21, "learning_rate": 4.825853510474541e-05, "loss": 1.4575, "step": 28110 }, { "epoch": 2.21, "learning_rate": 4.824945344625898e-05, "loss": 1.4381, "step": 28111 }, { "epoch": 2.21, "learning_rate": 4.824037247860261e-05, "loss": 1.4504, "step": 28112 }, { "epoch": 2.21, "learning_rate": 4.823129220183795e-05, "loss": 1.4499, "step": 28113 }, { "epoch": 2.21, "learning_rate": 4.822221261602661e-05, "loss": 1.4823, "step": 28114 }, { "epoch": 2.21, "learning_rate": 4.8213133721230324e-05, "loss": 1.3937, "step": 28115 }, { "epoch": 2.21, "learning_rate": 4.8204055517510695e-05, "loss": 1.4539, "step": 28116 }, { "epoch": 2.21, "learning_rate": 4.81949780049293e-05, "loss": 1.4807, "step": 28117 }, { "epoch": 2.21, "learning_rate": 4.8185901183547884e-05, "loss": 1.4447, "step": 28118 }, { "epoch": 2.21, "learning_rate": 4.8176825053428003e-05, "loss": 1.4403, "step": 28119 }, { "epoch": 2.21, "learning_rate": 4.8167749614631234e-05, "loss": 1.4744, "step": 28120 }, { "epoch": 2.21, "learning_rate": 4.8158674867219314e-05, "loss": 1.4279, "step": 28121 }, { "epoch": 2.21, "learning_rate": 4.814960081125378e-05, "loss": 1.4417, "step": 28122 }, { "epoch": 2.21, "learning_rate": 4.814052744679621e-05, "loss": 1.4512, "step": 28123 }, { "epoch": 2.21, "learning_rate": 4.8131454773908246e-05, "loss": 1.4625, "step": 28124 }, { "epoch": 2.21, "learning_rate": 4.812238279265153e-05, "loss": 1.4908, "step": 28125 }, { "epoch": 2.21, "learning_rate": 4.811331150308762e-05, "loss": 1.4366, "step": 28126 }, { "epoch": 2.21, "learning_rate": 4.8104240905278045e-05, "loss": 1.4236, "step": 28127 }, { "epoch": 2.21, "learning_rate": 4.8095170999284495e-05, "loss": 1.4085, "step": 28128 }, { "epoch": 2.21, "learning_rate": 4.808610178516851e-05, "loss": 1.4572, "step": 28129 }, { "epoch": 2.21, "learning_rate": 4.807703326299164e-05, "loss": 1.4642, "step": 28130 }, { "epoch": 2.21, "learning_rate": 4.806796543281542e-05, "loss": 1.3985, "step": 28131 }, { "epoch": 2.21, "learning_rate": 4.805889829470151e-05, "loss": 1.4802, "step": 28132 }, { "epoch": 2.21, "learning_rate": 4.804983184871144e-05, "loss": 1.4869, "step": 28133 }, { "epoch": 2.21, "learning_rate": 4.804076609490668e-05, "loss": 1.5123, "step": 28134 }, { "epoch": 2.21, "learning_rate": 4.803170103334891e-05, "loss": 1.4677, "step": 28135 }, { "epoch": 2.21, "learning_rate": 4.8022636664099636e-05, "loss": 1.4601, "step": 28136 }, { "epoch": 2.21, "learning_rate": 4.801357298722031e-05, "loss": 1.4122, "step": 28137 }, { "epoch": 2.21, "learning_rate": 4.800451000277261e-05, "loss": 1.472, "step": 28138 }, { "epoch": 2.21, "learning_rate": 4.7995447710817994e-05, "loss": 1.5081, "step": 28139 }, { "epoch": 2.21, "learning_rate": 4.798638611141795e-05, "loss": 1.3878, "step": 28140 }, { "epoch": 2.21, "learning_rate": 4.797732520463404e-05, "loss": 1.4752, "step": 28141 }, { "epoch": 2.21, "learning_rate": 4.796826499052785e-05, "loss": 1.486, "step": 28142 }, { "epoch": 2.21, "learning_rate": 4.7959205469160836e-05, "loss": 1.4218, "step": 28143 }, { "epoch": 2.21, "learning_rate": 4.795014664059444e-05, "loss": 1.4388, "step": 28144 }, { "epoch": 2.21, "learning_rate": 4.79410885048903e-05, "loss": 1.4829, "step": 28145 }, { "epoch": 2.21, "learning_rate": 4.793203106210984e-05, "loss": 1.472, "step": 28146 }, { "epoch": 2.21, "learning_rate": 4.792297431231452e-05, "loss": 1.4028, "step": 28147 }, { "epoch": 2.21, "learning_rate": 4.791391825556592e-05, "loss": 1.4391, "step": 28148 }, { "epoch": 2.21, "learning_rate": 4.790486289192549e-05, "loss": 1.4302, "step": 28149 }, { "epoch": 2.21, "learning_rate": 4.789580822145468e-05, "loss": 1.4044, "step": 28150 }, { "epoch": 2.21, "learning_rate": 4.788675424421496e-05, "loss": 1.4639, "step": 28151 }, { "epoch": 2.22, "learning_rate": 4.787770096026786e-05, "loss": 1.4737, "step": 28152 }, { "epoch": 2.22, "learning_rate": 4.7868648369674806e-05, "loss": 1.478, "step": 28153 }, { "epoch": 2.22, "learning_rate": 4.785959647249724e-05, "loss": 1.5162, "step": 28154 }, { "epoch": 2.22, "learning_rate": 4.7850545268796685e-05, "loss": 1.4496, "step": 28155 }, { "epoch": 2.22, "learning_rate": 4.7841494758634525e-05, "loss": 1.4787, "step": 28156 }, { "epoch": 2.22, "learning_rate": 4.783244494207227e-05, "loss": 1.4657, "step": 28157 }, { "epoch": 2.22, "learning_rate": 4.782339581917128e-05, "loss": 1.4623, "step": 28158 }, { "epoch": 2.22, "learning_rate": 4.781434738999311e-05, "loss": 1.4421, "step": 28159 }, { "epoch": 2.22, "learning_rate": 4.780529965459913e-05, "loss": 1.4427, "step": 28160 }, { "epoch": 2.22, "learning_rate": 4.779625261305071e-05, "loss": 1.417, "step": 28161 }, { "epoch": 2.22, "learning_rate": 4.77872062654094e-05, "loss": 1.4254, "step": 28162 }, { "epoch": 2.22, "learning_rate": 4.7778160611736546e-05, "loss": 1.458, "step": 28163 }, { "epoch": 2.22, "learning_rate": 4.776911565209351e-05, "loss": 1.4348, "step": 28164 }, { "epoch": 2.22, "learning_rate": 4.776007138654182e-05, "loss": 1.4733, "step": 28165 }, { "epoch": 2.22, "learning_rate": 4.7751027815142826e-05, "loss": 1.4758, "step": 28166 }, { "epoch": 2.22, "learning_rate": 4.774198493795793e-05, "loss": 1.4679, "step": 28167 }, { "epoch": 2.22, "learning_rate": 4.7732942755048476e-05, "loss": 1.4292, "step": 28168 }, { "epoch": 2.22, "learning_rate": 4.772390126647596e-05, "loss": 1.4575, "step": 28169 }, { "epoch": 2.22, "learning_rate": 4.7714860472301706e-05, "loss": 1.4406, "step": 28170 }, { "epoch": 2.22, "learning_rate": 4.7705820372587054e-05, "loss": 1.4618, "step": 28171 }, { "epoch": 2.22, "learning_rate": 4.7696780967393435e-05, "loss": 1.4435, "step": 28172 }, { "epoch": 2.22, "learning_rate": 4.7687742256782255e-05, "loss": 1.4592, "step": 28173 }, { "epoch": 2.22, "learning_rate": 4.767870424081486e-05, "loss": 1.4858, "step": 28174 }, { "epoch": 2.22, "learning_rate": 4.7669666919552536e-05, "loss": 1.4763, "step": 28175 }, { "epoch": 2.22, "learning_rate": 4.7660630293056755e-05, "loss": 1.4314, "step": 28176 }, { "epoch": 2.22, "learning_rate": 4.765159436138882e-05, "loss": 1.4703, "step": 28177 }, { "epoch": 2.22, "learning_rate": 4.764255912461004e-05, "loss": 1.4412, "step": 28178 }, { "epoch": 2.22, "learning_rate": 4.7633524582781845e-05, "loss": 1.4124, "step": 28179 }, { "epoch": 2.22, "learning_rate": 4.762449073596552e-05, "loss": 1.4718, "step": 28180 }, { "epoch": 2.22, "learning_rate": 4.761545758422236e-05, "loss": 1.4103, "step": 28181 }, { "epoch": 2.22, "learning_rate": 4.760642512761378e-05, "loss": 1.5032, "step": 28182 }, { "epoch": 2.22, "learning_rate": 4.7597393366201095e-05, "loss": 1.4771, "step": 28183 }, { "epoch": 2.22, "learning_rate": 4.758836230004557e-05, "loss": 1.4684, "step": 28184 }, { "epoch": 2.22, "learning_rate": 4.757933192920851e-05, "loss": 1.4223, "step": 28185 }, { "epoch": 2.22, "learning_rate": 4.757030225375133e-05, "loss": 1.4694, "step": 28186 }, { "epoch": 2.22, "learning_rate": 4.75612732737352e-05, "loss": 1.4579, "step": 28187 }, { "epoch": 2.22, "learning_rate": 4.755224498922151e-05, "loss": 1.4281, "step": 28188 }, { "epoch": 2.22, "learning_rate": 4.7543217400271595e-05, "loss": 1.4439, "step": 28189 }, { "epoch": 2.22, "learning_rate": 4.753419050694669e-05, "loss": 1.4374, "step": 28190 }, { "epoch": 2.22, "learning_rate": 4.7525164309308065e-05, "loss": 1.4814, "step": 28191 }, { "epoch": 2.22, "learning_rate": 4.7516138807416994e-05, "loss": 1.4291, "step": 28192 }, { "epoch": 2.22, "learning_rate": 4.7507114001334825e-05, "loss": 1.4364, "step": 28193 }, { "epoch": 2.22, "learning_rate": 4.749808989112281e-05, "loss": 1.4392, "step": 28194 }, { "epoch": 2.22, "learning_rate": 4.748906647684214e-05, "loss": 1.4071, "step": 28195 }, { "epoch": 2.22, "learning_rate": 4.748004375855417e-05, "loss": 1.4755, "step": 28196 }, { "epoch": 2.22, "learning_rate": 4.747102173632015e-05, "loss": 1.4271, "step": 28197 }, { "epoch": 2.22, "learning_rate": 4.746200041020125e-05, "loss": 1.4094, "step": 28198 }, { "epoch": 2.22, "learning_rate": 4.7452979780258837e-05, "loss": 1.4892, "step": 28199 }, { "epoch": 2.22, "learning_rate": 4.7443959846554106e-05, "loss": 1.4553, "step": 28200 }, { "epoch": 2.22, "learning_rate": 4.743494060914823e-05, "loss": 1.4356, "step": 28201 }, { "epoch": 2.22, "learning_rate": 4.742592206810257e-05, "loss": 1.4639, "step": 28202 }, { "epoch": 2.22, "learning_rate": 4.741690422347825e-05, "loss": 1.4185, "step": 28203 }, { "epoch": 2.22, "learning_rate": 4.740788707533657e-05, "loss": 1.4367, "step": 28204 }, { "epoch": 2.22, "learning_rate": 4.739887062373869e-05, "loss": 1.4269, "step": 28205 }, { "epoch": 2.22, "learning_rate": 4.738985486874589e-05, "loss": 1.4804, "step": 28206 }, { "epoch": 2.22, "learning_rate": 4.7380839810419364e-05, "loss": 1.41, "step": 28207 }, { "epoch": 2.22, "learning_rate": 4.737182544882031e-05, "loss": 1.4949, "step": 28208 }, { "epoch": 2.22, "learning_rate": 4.736281178400987e-05, "loss": 1.4799, "step": 28209 }, { "epoch": 2.22, "learning_rate": 4.735379881604934e-05, "loss": 1.4951, "step": 28210 }, { "epoch": 2.22, "learning_rate": 4.7344786544999887e-05, "loss": 1.4699, "step": 28211 }, { "epoch": 2.22, "learning_rate": 4.733577497092261e-05, "loss": 1.4533, "step": 28212 }, { "epoch": 2.22, "learning_rate": 4.732676409387884e-05, "loss": 1.4946, "step": 28213 }, { "epoch": 2.22, "learning_rate": 4.7317753913929666e-05, "loss": 1.4598, "step": 28214 }, { "epoch": 2.22, "learning_rate": 4.7308744431136237e-05, "loss": 1.4549, "step": 28215 }, { "epoch": 2.22, "learning_rate": 4.729973564555981e-05, "loss": 1.4559, "step": 28216 }, { "epoch": 2.22, "learning_rate": 4.7290727557261504e-05, "loss": 1.4482, "step": 28217 }, { "epoch": 2.22, "learning_rate": 4.728172016630244e-05, "loss": 1.432, "step": 28218 }, { "epoch": 2.22, "learning_rate": 4.727271347274379e-05, "loss": 1.4569, "step": 28219 }, { "epoch": 2.22, "learning_rate": 4.726370747664679e-05, "loss": 1.4333, "step": 28220 }, { "epoch": 2.22, "learning_rate": 4.7254702178072515e-05, "loss": 1.4125, "step": 28221 }, { "epoch": 2.22, "learning_rate": 4.724569757708207e-05, "loss": 1.4014, "step": 28222 }, { "epoch": 2.22, "learning_rate": 4.723669367373668e-05, "loss": 1.449, "step": 28223 }, { "epoch": 2.22, "learning_rate": 4.722769046809742e-05, "loss": 1.4677, "step": 28224 }, { "epoch": 2.22, "learning_rate": 4.721868796022545e-05, "loss": 1.4633, "step": 28225 }, { "epoch": 2.22, "learning_rate": 4.720968615018179e-05, "loss": 1.4879, "step": 28226 }, { "epoch": 2.22, "learning_rate": 4.7200685038027716e-05, "loss": 1.4206, "step": 28227 }, { "epoch": 2.22, "learning_rate": 4.719168462382425e-05, "loss": 1.431, "step": 28228 }, { "epoch": 2.22, "learning_rate": 4.718268490763245e-05, "loss": 1.4964, "step": 28229 }, { "epoch": 2.22, "learning_rate": 4.717368588951355e-05, "loss": 1.3807, "step": 28230 }, { "epoch": 2.22, "learning_rate": 4.716468756952857e-05, "loss": 1.4299, "step": 28231 }, { "epoch": 2.22, "learning_rate": 4.7155689947738554e-05, "loss": 1.4689, "step": 28232 }, { "epoch": 2.22, "learning_rate": 4.714669302420469e-05, "loss": 1.5141, "step": 28233 }, { "epoch": 2.22, "learning_rate": 4.713769679898801e-05, "loss": 1.4765, "step": 28234 }, { "epoch": 2.22, "learning_rate": 4.7128701272149624e-05, "loss": 1.4767, "step": 28235 }, { "epoch": 2.22, "learning_rate": 4.7119706443750544e-05, "loss": 1.4782, "step": 28236 }, { "epoch": 2.22, "learning_rate": 4.711071231385194e-05, "loss": 1.4379, "step": 28237 }, { "epoch": 2.22, "learning_rate": 4.710171888251481e-05, "loss": 1.4801, "step": 28238 }, { "epoch": 2.22, "learning_rate": 4.709272614980018e-05, "loss": 1.4589, "step": 28239 }, { "epoch": 2.22, "learning_rate": 4.70837341157692e-05, "loss": 1.441, "step": 28240 }, { "epoch": 2.22, "learning_rate": 4.707474278048287e-05, "loss": 1.4694, "step": 28241 }, { "epoch": 2.22, "learning_rate": 4.7065752144002236e-05, "loss": 1.4902, "step": 28242 }, { "epoch": 2.22, "learning_rate": 4.705676220638829e-05, "loss": 1.4383, "step": 28243 }, { "epoch": 2.22, "learning_rate": 4.7047772967702186e-05, "loss": 1.4334, "step": 28244 }, { "epoch": 2.22, "learning_rate": 4.7038784428004865e-05, "loss": 1.4177, "step": 28245 }, { "epoch": 2.22, "learning_rate": 4.702979658735735e-05, "loss": 1.4819, "step": 28246 }, { "epoch": 2.22, "learning_rate": 4.7020809445820735e-05, "loss": 1.4113, "step": 28247 }, { "epoch": 2.22, "learning_rate": 4.701182300345599e-05, "loss": 1.4572, "step": 28248 }, { "epoch": 2.22, "learning_rate": 4.700283726032408e-05, "loss": 1.4888, "step": 28249 }, { "epoch": 2.22, "learning_rate": 4.699385221648608e-05, "loss": 1.4686, "step": 28250 }, { "epoch": 2.22, "learning_rate": 4.6984867872003026e-05, "loss": 1.4863, "step": 28251 }, { "epoch": 2.22, "learning_rate": 4.697588422693587e-05, "loss": 1.468, "step": 28252 }, { "epoch": 2.22, "learning_rate": 4.6966901281345546e-05, "loss": 1.4052, "step": 28253 }, { "epoch": 2.22, "learning_rate": 4.695791903529317e-05, "loss": 1.4812, "step": 28254 }, { "epoch": 2.22, "learning_rate": 4.694893748883965e-05, "loss": 1.4609, "step": 28255 }, { "epoch": 2.22, "learning_rate": 4.6939956642045927e-05, "loss": 1.4462, "step": 28256 }, { "epoch": 2.22, "learning_rate": 4.693097649497309e-05, "loss": 1.4539, "step": 28257 }, { "epoch": 2.22, "learning_rate": 4.692199704768203e-05, "loss": 1.4686, "step": 28258 }, { "epoch": 2.22, "learning_rate": 4.691301830023367e-05, "loss": 1.4878, "step": 28259 }, { "epoch": 2.22, "learning_rate": 4.6904040252689105e-05, "loss": 1.4441, "step": 28260 }, { "epoch": 2.22, "learning_rate": 4.689506290510918e-05, "loss": 1.5174, "step": 28261 }, { "epoch": 2.22, "learning_rate": 4.68860862575549e-05, "loss": 1.455, "step": 28262 }, { "epoch": 2.22, "learning_rate": 4.687711031008714e-05, "loss": 1.4162, "step": 28263 }, { "epoch": 2.22, "learning_rate": 4.686813506276694e-05, "loss": 1.5034, "step": 28264 }, { "epoch": 2.22, "learning_rate": 4.685916051565519e-05, "loss": 1.4631, "step": 28265 }, { "epoch": 2.22, "learning_rate": 4.685018666881277e-05, "loss": 1.4475, "step": 28266 }, { "epoch": 2.22, "learning_rate": 4.6841213522300665e-05, "loss": 1.4708, "step": 28267 }, { "epoch": 2.22, "learning_rate": 4.683224107617983e-05, "loss": 1.4307, "step": 28268 }, { "epoch": 2.22, "learning_rate": 4.682326933051116e-05, "loss": 1.4597, "step": 28269 }, { "epoch": 2.22, "learning_rate": 4.68142982853555e-05, "loss": 1.4647, "step": 28270 }, { "epoch": 2.22, "learning_rate": 4.680532794077386e-05, "loss": 1.4595, "step": 28271 }, { "epoch": 2.22, "learning_rate": 4.67963582968271e-05, "loss": 1.4496, "step": 28272 }, { "epoch": 2.22, "learning_rate": 4.678738935357605e-05, "loss": 1.4665, "step": 28273 }, { "epoch": 2.22, "learning_rate": 4.6778421111081734e-05, "loss": 1.4632, "step": 28274 }, { "epoch": 2.22, "learning_rate": 4.676945356940497e-05, "loss": 1.4272, "step": 28275 }, { "epoch": 2.22, "learning_rate": 4.676048672860661e-05, "loss": 1.476, "step": 28276 }, { "epoch": 2.22, "learning_rate": 4.675152058874761e-05, "loss": 1.4271, "step": 28277 }, { "epoch": 2.22, "learning_rate": 4.6742555149888815e-05, "loss": 1.4552, "step": 28278 }, { "epoch": 2.23, "learning_rate": 4.6733590412091085e-05, "loss": 1.4878, "step": 28279 }, { "epoch": 2.23, "learning_rate": 4.672462637541524e-05, "loss": 1.4773, "step": 28280 }, { "epoch": 2.23, "learning_rate": 4.671566303992218e-05, "loss": 1.4462, "step": 28281 }, { "epoch": 2.23, "learning_rate": 4.670670040567283e-05, "loss": 1.4342, "step": 28282 }, { "epoch": 2.23, "learning_rate": 4.669773847272798e-05, "loss": 1.4536, "step": 28283 }, { "epoch": 2.23, "learning_rate": 4.668877724114845e-05, "loss": 1.4631, "step": 28284 }, { "epoch": 2.23, "learning_rate": 4.667981671099513e-05, "loss": 1.46, "step": 28285 }, { "epoch": 2.23, "learning_rate": 4.6670856882328844e-05, "loss": 1.5063, "step": 28286 }, { "epoch": 2.23, "learning_rate": 4.666189775521038e-05, "loss": 1.47, "step": 28287 }, { "epoch": 2.23, "learning_rate": 4.665293932970064e-05, "loss": 1.486, "step": 28288 }, { "epoch": 2.23, "learning_rate": 4.664398160586042e-05, "loss": 1.4992, "step": 28289 }, { "epoch": 2.23, "learning_rate": 4.663502458375047e-05, "loss": 1.4631, "step": 28290 }, { "epoch": 2.23, "learning_rate": 4.662606826343172e-05, "loss": 1.4022, "step": 28291 }, { "epoch": 2.23, "learning_rate": 4.661711264496493e-05, "loss": 1.4407, "step": 28292 }, { "epoch": 2.23, "learning_rate": 4.660815772841083e-05, "loss": 1.4629, "step": 28293 }, { "epoch": 2.23, "learning_rate": 4.6599203513830326e-05, "loss": 1.49, "step": 28294 }, { "epoch": 2.23, "learning_rate": 4.659025000128419e-05, "loss": 1.4136, "step": 28295 }, { "epoch": 2.23, "learning_rate": 4.658129719083316e-05, "loss": 1.3973, "step": 28296 }, { "epoch": 2.23, "learning_rate": 4.657234508253797e-05, "loss": 1.379, "step": 28297 }, { "epoch": 2.23, "learning_rate": 4.656339367645958e-05, "loss": 1.4862, "step": 28298 }, { "epoch": 2.23, "learning_rate": 4.6554442972658664e-05, "loss": 1.4878, "step": 28299 }, { "epoch": 2.23, "learning_rate": 4.6545492971195944e-05, "loss": 1.4845, "step": 28300 }, { "epoch": 2.23, "learning_rate": 4.653654367213229e-05, "loss": 1.458, "step": 28301 }, { "epoch": 2.23, "learning_rate": 4.65275950755284e-05, "loss": 1.43, "step": 28302 }, { "epoch": 2.23, "learning_rate": 4.6518647181445056e-05, "loss": 1.4786, "step": 28303 }, { "epoch": 2.23, "learning_rate": 4.650969998994292e-05, "loss": 1.4723, "step": 28304 }, { "epoch": 2.23, "learning_rate": 4.6500753501082884e-05, "loss": 1.4525, "step": 28305 }, { "epoch": 2.23, "learning_rate": 4.649180771492559e-05, "loss": 1.4663, "step": 28306 }, { "epoch": 2.23, "learning_rate": 4.648286263153178e-05, "loss": 1.4229, "step": 28307 }, { "epoch": 2.23, "learning_rate": 4.647391825096223e-05, "loss": 1.4322, "step": 28308 }, { "epoch": 2.23, "learning_rate": 4.6464974573277644e-05, "loss": 1.4298, "step": 28309 }, { "epoch": 2.23, "learning_rate": 4.645603159853872e-05, "loss": 1.3811, "step": 28310 }, { "epoch": 2.23, "learning_rate": 4.6447089326806244e-05, "loss": 1.4798, "step": 28311 }, { "epoch": 2.23, "learning_rate": 4.643814775814087e-05, "loss": 1.4636, "step": 28312 }, { "epoch": 2.23, "learning_rate": 4.642920689260329e-05, "loss": 1.4672, "step": 28313 }, { "epoch": 2.23, "learning_rate": 4.642026673025423e-05, "loss": 1.4152, "step": 28314 }, { "epoch": 2.23, "learning_rate": 4.6411327271154445e-05, "loss": 1.4533, "step": 28315 }, { "epoch": 2.23, "learning_rate": 4.640238851536459e-05, "loss": 1.4946, "step": 28316 }, { "epoch": 2.23, "learning_rate": 4.63934504629453e-05, "loss": 1.4672, "step": 28317 }, { "epoch": 2.23, "learning_rate": 4.638451311395735e-05, "loss": 1.4656, "step": 28318 }, { "epoch": 2.23, "learning_rate": 4.637557646846138e-05, "loss": 1.4495, "step": 28319 }, { "epoch": 2.23, "learning_rate": 4.6366640526518066e-05, "loss": 1.4533, "step": 28320 }, { "epoch": 2.23, "learning_rate": 4.635770528818802e-05, "loss": 1.4737, "step": 28321 }, { "epoch": 2.23, "learning_rate": 4.6348770753532006e-05, "loss": 1.4532, "step": 28322 }, { "epoch": 2.23, "learning_rate": 4.633983692261063e-05, "loss": 1.4668, "step": 28323 }, { "epoch": 2.23, "learning_rate": 4.633090379548452e-05, "loss": 1.4581, "step": 28324 }, { "epoch": 2.23, "learning_rate": 4.6321971372214414e-05, "loss": 1.5157, "step": 28325 }, { "epoch": 2.23, "learning_rate": 4.6313039652860905e-05, "loss": 1.4561, "step": 28326 }, { "epoch": 2.23, "learning_rate": 4.63041086374846e-05, "loss": 1.4858, "step": 28327 }, { "epoch": 2.23, "learning_rate": 4.629517832614621e-05, "loss": 1.423, "step": 28328 }, { "epoch": 2.23, "learning_rate": 4.6286248718906273e-05, "loss": 1.4253, "step": 28329 }, { "epoch": 2.23, "learning_rate": 4.627731981582553e-05, "loss": 1.4553, "step": 28330 }, { "epoch": 2.23, "learning_rate": 4.626839161696451e-05, "loss": 1.451, "step": 28331 }, { "epoch": 2.23, "learning_rate": 4.62594641223839e-05, "loss": 1.4713, "step": 28332 }, { "epoch": 2.23, "learning_rate": 4.6250537332144294e-05, "loss": 1.4523, "step": 28333 }, { "epoch": 2.23, "learning_rate": 4.624161124630623e-05, "loss": 1.4012, "step": 28334 }, { "epoch": 2.23, "learning_rate": 4.6232685864930416e-05, "loss": 1.4932, "step": 28335 }, { "epoch": 2.23, "learning_rate": 4.6223761188077394e-05, "loss": 1.4987, "step": 28336 }, { "epoch": 2.23, "learning_rate": 4.621483721580776e-05, "loss": 1.427, "step": 28337 }, { "epoch": 2.23, "learning_rate": 4.620591394818207e-05, "loss": 1.5141, "step": 28338 }, { "epoch": 2.23, "learning_rate": 4.6196991385261e-05, "loss": 1.4289, "step": 28339 }, { "epoch": 2.23, "learning_rate": 4.618806952710507e-05, "loss": 1.4444, "step": 28340 }, { "epoch": 2.23, "learning_rate": 4.6179148373774814e-05, "loss": 1.419, "step": 28341 }, { "epoch": 2.23, "learning_rate": 4.6170227925330885e-05, "loss": 1.4368, "step": 28342 }, { "epoch": 2.23, "learning_rate": 4.616130818183382e-05, "loss": 1.4341, "step": 28343 }, { "epoch": 2.23, "learning_rate": 4.615238914334412e-05, "loss": 1.3862, "step": 28344 }, { "epoch": 2.23, "learning_rate": 4.6143470809922395e-05, "loss": 1.4791, "step": 28345 }, { "epoch": 2.23, "learning_rate": 4.613455318162922e-05, "loss": 1.46, "step": 28346 }, { "epoch": 2.23, "learning_rate": 4.612563625852513e-05, "loss": 1.4532, "step": 28347 }, { "epoch": 2.23, "learning_rate": 4.611672004067059e-05, "loss": 1.4082, "step": 28348 }, { "epoch": 2.23, "learning_rate": 4.6107804528126246e-05, "loss": 1.3987, "step": 28349 }, { "epoch": 2.23, "learning_rate": 4.6098889720952584e-05, "loss": 1.4466, "step": 28350 }, { "epoch": 2.23, "learning_rate": 4.608997561921006e-05, "loss": 1.4863, "step": 28351 }, { "epoch": 2.23, "learning_rate": 4.6081062222959324e-05, "loss": 1.4636, "step": 28352 }, { "epoch": 2.23, "learning_rate": 4.607214953226082e-05, "loss": 1.4973, "step": 28353 }, { "epoch": 2.23, "learning_rate": 4.6063237547175055e-05, "loss": 1.513, "step": 28354 }, { "epoch": 2.23, "learning_rate": 4.605432626776252e-05, "loss": 1.4668, "step": 28355 }, { "epoch": 2.23, "learning_rate": 4.6045415694083794e-05, "loss": 1.4563, "step": 28356 }, { "epoch": 2.23, "learning_rate": 4.6036505826199324e-05, "loss": 1.469, "step": 28357 }, { "epoch": 2.23, "learning_rate": 4.602759666416956e-05, "loss": 1.427, "step": 28358 }, { "epoch": 2.23, "learning_rate": 4.601868820805509e-05, "loss": 1.4696, "step": 28359 }, { "epoch": 2.23, "learning_rate": 4.600978045791628e-05, "loss": 1.4011, "step": 28360 }, { "epoch": 2.23, "learning_rate": 4.600087341381373e-05, "loss": 1.4544, "step": 28361 }, { "epoch": 2.23, "learning_rate": 4.5991967075807835e-05, "loss": 1.4352, "step": 28362 }, { "epoch": 2.23, "learning_rate": 4.59830614439591e-05, "loss": 1.4338, "step": 28363 }, { "epoch": 2.23, "learning_rate": 4.5974156518328006e-05, "loss": 1.4379, "step": 28364 }, { "epoch": 2.23, "learning_rate": 4.596525229897491e-05, "loss": 1.5218, "step": 28365 }, { "epoch": 2.23, "learning_rate": 4.59563487859604e-05, "loss": 1.5033, "step": 28366 }, { "epoch": 2.23, "learning_rate": 4.5947445979344863e-05, "loss": 1.4384, "step": 28367 }, { "epoch": 2.23, "learning_rate": 4.593854387918871e-05, "loss": 1.43, "step": 28368 }, { "epoch": 2.23, "learning_rate": 4.592964248555245e-05, "loss": 1.4761, "step": 28369 }, { "epoch": 2.23, "learning_rate": 4.59207417984965e-05, "loss": 1.4417, "step": 28370 }, { "epoch": 2.23, "learning_rate": 4.591184181808122e-05, "loss": 1.4783, "step": 28371 }, { "epoch": 2.23, "learning_rate": 4.5902942544367135e-05, "loss": 1.4676, "step": 28372 }, { "epoch": 2.23, "learning_rate": 4.589404397741464e-05, "loss": 1.4781, "step": 28373 }, { "epoch": 2.23, "learning_rate": 4.588514611728413e-05, "loss": 1.442, "step": 28374 }, { "epoch": 2.23, "learning_rate": 4.5876248964035984e-05, "loss": 1.4797, "step": 28375 }, { "epoch": 2.23, "learning_rate": 4.586735251773063e-05, "loss": 1.4057, "step": 28376 }, { "epoch": 2.23, "learning_rate": 4.5858456778428545e-05, "loss": 1.4842, "step": 28377 }, { "epoch": 2.23, "learning_rate": 4.5849561746190065e-05, "loss": 1.4569, "step": 28378 }, { "epoch": 2.23, "learning_rate": 4.5840667421075534e-05, "loss": 1.5276, "step": 28379 }, { "epoch": 2.23, "learning_rate": 4.583177380314544e-05, "loss": 1.4282, "step": 28380 }, { "epoch": 2.23, "learning_rate": 4.5822880892460134e-05, "loss": 1.4225, "step": 28381 }, { "epoch": 2.23, "learning_rate": 4.581398868907992e-05, "loss": 1.4316, "step": 28382 }, { "epoch": 2.23, "learning_rate": 4.580509719306526e-05, "loss": 1.4483, "step": 28383 }, { "epoch": 2.23, "learning_rate": 4.579620640447652e-05, "loss": 1.4515, "step": 28384 }, { "epoch": 2.23, "learning_rate": 4.5787316323373955e-05, "loss": 1.4474, "step": 28385 }, { "epoch": 2.23, "learning_rate": 4.577842694981807e-05, "loss": 1.4144, "step": 28386 }, { "epoch": 2.23, "learning_rate": 4.5769538283869154e-05, "loss": 1.4844, "step": 28387 }, { "epoch": 2.23, "learning_rate": 4.57606503255875e-05, "loss": 1.47, "step": 28388 }, { "epoch": 2.23, "learning_rate": 4.5751763075033556e-05, "loss": 1.38, "step": 28389 }, { "epoch": 2.23, "learning_rate": 4.57428765322676e-05, "loss": 1.4261, "step": 28390 }, { "epoch": 2.23, "learning_rate": 4.5733990697349946e-05, "loss": 1.4499, "step": 28391 }, { "epoch": 2.23, "learning_rate": 4.572510557034094e-05, "loss": 1.4635, "step": 28392 }, { "epoch": 2.23, "learning_rate": 4.571622115130099e-05, "loss": 1.41, "step": 28393 }, { "epoch": 2.23, "learning_rate": 4.570733744029033e-05, "loss": 1.4718, "step": 28394 }, { "epoch": 2.23, "learning_rate": 4.5698454437369315e-05, "loss": 1.437, "step": 28395 }, { "epoch": 2.23, "learning_rate": 4.568957214259819e-05, "loss": 1.4255, "step": 28396 }, { "epoch": 2.23, "learning_rate": 4.568069055603733e-05, "loss": 1.4297, "step": 28397 }, { "epoch": 2.23, "learning_rate": 4.567180967774703e-05, "loss": 1.4479, "step": 28398 }, { "epoch": 2.23, "learning_rate": 4.5662929507787516e-05, "loss": 1.4227, "step": 28399 }, { "epoch": 2.23, "learning_rate": 4.565405004621919e-05, "loss": 1.4289, "step": 28400 }, { "epoch": 2.23, "learning_rate": 4.564517129310227e-05, "loss": 1.4928, "step": 28401 }, { "epoch": 2.23, "learning_rate": 4.5636293248497006e-05, "loss": 1.4635, "step": 28402 }, { "epoch": 2.23, "learning_rate": 4.5627415912463766e-05, "loss": 1.4112, "step": 28403 }, { "epoch": 2.23, "learning_rate": 4.5618539285062776e-05, "loss": 1.4366, "step": 28404 }, { "epoch": 2.23, "learning_rate": 4.560966336635426e-05, "loss": 1.4367, "step": 28405 }, { "epoch": 2.24, "learning_rate": 4.560078815639857e-05, "loss": 1.4493, "step": 28406 }, { "epoch": 2.24, "learning_rate": 4.559191365525585e-05, "loss": 1.4677, "step": 28407 }, { "epoch": 2.24, "learning_rate": 4.558303986298649e-05, "loss": 1.4204, "step": 28408 }, { "epoch": 2.24, "learning_rate": 4.5574166779650604e-05, "loss": 1.4062, "step": 28409 }, { "epoch": 2.24, "learning_rate": 4.556529440530854e-05, "loss": 1.5089, "step": 28410 }, { "epoch": 2.24, "learning_rate": 4.55564227400205e-05, "loss": 1.4318, "step": 28411 }, { "epoch": 2.24, "learning_rate": 4.5547551783846685e-05, "loss": 1.3867, "step": 28412 }, { "epoch": 2.24, "learning_rate": 4.553868153684739e-05, "loss": 1.4398, "step": 28413 }, { "epoch": 2.24, "learning_rate": 4.552981199908279e-05, "loss": 1.46, "step": 28414 }, { "epoch": 2.24, "learning_rate": 4.552094317061312e-05, "loss": 1.5307, "step": 28415 }, { "epoch": 2.24, "learning_rate": 4.5512075051498545e-05, "loss": 1.4397, "step": 28416 }, { "epoch": 2.24, "learning_rate": 4.550320764179935e-05, "loss": 1.5078, "step": 28417 }, { "epoch": 2.24, "learning_rate": 4.549434094157573e-05, "loss": 1.4171, "step": 28418 }, { "epoch": 2.24, "learning_rate": 4.548547495088782e-05, "loss": 1.4541, "step": 28419 }, { "epoch": 2.24, "learning_rate": 4.5476609669795886e-05, "loss": 1.4681, "step": 28420 }, { "epoch": 2.24, "learning_rate": 4.546774509836011e-05, "loss": 1.4508, "step": 28421 }, { "epoch": 2.24, "learning_rate": 4.5458881236640596e-05, "loss": 1.3954, "step": 28422 }, { "epoch": 2.24, "learning_rate": 4.545001808469759e-05, "loss": 1.4582, "step": 28423 }, { "epoch": 2.24, "learning_rate": 4.5441155642591325e-05, "loss": 1.4295, "step": 28424 }, { "epoch": 2.24, "learning_rate": 4.5432293910381914e-05, "loss": 1.4496, "step": 28425 }, { "epoch": 2.24, "learning_rate": 4.542343288812947e-05, "loss": 1.4906, "step": 28426 }, { "epoch": 2.24, "learning_rate": 4.5414572575894246e-05, "loss": 1.4724, "step": 28427 }, { "epoch": 2.24, "learning_rate": 4.5405712973736355e-05, "loss": 1.4485, "step": 28428 }, { "epoch": 2.24, "learning_rate": 4.539685408171592e-05, "loss": 1.421, "step": 28429 }, { "epoch": 2.24, "learning_rate": 4.5387995899893176e-05, "loss": 1.4545, "step": 28430 }, { "epoch": 2.24, "learning_rate": 4.537913842832819e-05, "loss": 1.4834, "step": 28431 }, { "epoch": 2.24, "learning_rate": 4.537028166708112e-05, "loss": 1.4404, "step": 28432 }, { "epoch": 2.24, "learning_rate": 4.536142561621206e-05, "loss": 1.5158, "step": 28433 }, { "epoch": 2.24, "learning_rate": 4.5352570275781224e-05, "loss": 1.4012, "step": 28434 }, { "epoch": 2.24, "learning_rate": 4.534371564584868e-05, "loss": 1.4352, "step": 28435 }, { "epoch": 2.24, "learning_rate": 4.533486172647452e-05, "loss": 1.4213, "step": 28436 }, { "epoch": 2.24, "learning_rate": 4.532600851771892e-05, "loss": 1.4416, "step": 28437 }, { "epoch": 2.24, "learning_rate": 4.531715601964197e-05, "loss": 1.5285, "step": 28438 }, { "epoch": 2.24, "learning_rate": 4.5308304232303704e-05, "loss": 1.4668, "step": 28439 }, { "epoch": 2.24, "learning_rate": 4.529945315576429e-05, "loss": 1.4692, "step": 28440 }, { "epoch": 2.24, "learning_rate": 4.5290602790083854e-05, "loss": 1.5, "step": 28441 }, { "epoch": 2.24, "learning_rate": 4.528175313532243e-05, "loss": 1.4146, "step": 28442 }, { "epoch": 2.24, "learning_rate": 4.527290419154008e-05, "loss": 1.467, "step": 28443 }, { "epoch": 2.24, "learning_rate": 4.526405595879696e-05, "loss": 1.4488, "step": 28444 }, { "epoch": 2.24, "learning_rate": 4.5255208437153096e-05, "loss": 1.4344, "step": 28445 }, { "epoch": 2.24, "learning_rate": 4.5246361626668525e-05, "loss": 1.4442, "step": 28446 }, { "epoch": 2.24, "learning_rate": 4.523751552740341e-05, "loss": 1.4411, "step": 28447 }, { "epoch": 2.24, "learning_rate": 4.522867013941772e-05, "loss": 1.4355, "step": 28448 }, { "epoch": 2.24, "learning_rate": 4.521982546277156e-05, "loss": 1.5204, "step": 28449 }, { "epoch": 2.24, "learning_rate": 4.521098149752492e-05, "loss": 1.4609, "step": 28450 }, { "epoch": 2.24, "learning_rate": 4.5202138243737935e-05, "loss": 1.4562, "step": 28451 }, { "epoch": 2.24, "learning_rate": 4.519329570147059e-05, "loss": 1.4943, "step": 28452 }, { "epoch": 2.24, "learning_rate": 4.518445387078288e-05, "loss": 1.4869, "step": 28453 }, { "epoch": 2.24, "learning_rate": 4.5175612751734905e-05, "loss": 1.408, "step": 28454 }, { "epoch": 2.24, "learning_rate": 4.51667723443867e-05, "loss": 1.4806, "step": 28455 }, { "epoch": 2.24, "learning_rate": 4.5157932648798273e-05, "loss": 1.4237, "step": 28456 }, { "epoch": 2.24, "learning_rate": 4.514909366502958e-05, "loss": 1.4469, "step": 28457 }, { "epoch": 2.24, "learning_rate": 4.514025539314072e-05, "loss": 1.4576, "step": 28458 }, { "epoch": 2.24, "learning_rate": 4.5131417833191656e-05, "loss": 1.4918, "step": 28459 }, { "epoch": 2.24, "learning_rate": 4.512258098524235e-05, "loss": 1.4161, "step": 28460 }, { "epoch": 2.24, "learning_rate": 4.511374484935289e-05, "loss": 1.4483, "step": 28461 }, { "epoch": 2.24, "learning_rate": 4.510490942558323e-05, "loss": 1.4597, "step": 28462 }, { "epoch": 2.24, "learning_rate": 4.509607471399329e-05, "loss": 1.4645, "step": 28463 }, { "epoch": 2.24, "learning_rate": 4.5087240714643155e-05, "loss": 1.4786, "step": 28464 }, { "epoch": 2.24, "learning_rate": 4.507840742759278e-05, "loss": 1.4345, "step": 28465 }, { "epoch": 2.24, "learning_rate": 4.5069574852902054e-05, "loss": 1.4427, "step": 28466 }, { "epoch": 2.24, "learning_rate": 4.506074299063107e-05, "loss": 1.4398, "step": 28467 }, { "epoch": 2.24, "learning_rate": 4.5051911840839725e-05, "loss": 1.5267, "step": 28468 }, { "epoch": 2.24, "learning_rate": 4.5043081403587974e-05, "loss": 1.4556, "step": 28469 }, { "epoch": 2.24, "learning_rate": 4.5034251678935684e-05, "loss": 1.4238, "step": 28470 }, { "epoch": 2.24, "learning_rate": 4.5025422666943014e-05, "loss": 1.4825, "step": 28471 }, { "epoch": 2.24, "learning_rate": 4.501659436766977e-05, "loss": 1.4288, "step": 28472 }, { "epoch": 2.24, "learning_rate": 4.500776678117594e-05, "loss": 1.4337, "step": 28473 }, { "epoch": 2.24, "learning_rate": 4.499893990752137e-05, "loss": 1.4374, "step": 28474 }, { "epoch": 2.24, "learning_rate": 4.499011374676611e-05, "loss": 1.4374, "step": 28475 }, { "epoch": 2.24, "learning_rate": 4.4981288298970026e-05, "loss": 1.4415, "step": 28476 }, { "epoch": 2.24, "learning_rate": 4.4972463564193e-05, "loss": 1.4477, "step": 28477 }, { "epoch": 2.24, "learning_rate": 4.496363954249502e-05, "loss": 1.4076, "step": 28478 }, { "epoch": 2.24, "learning_rate": 4.4954816233935974e-05, "loss": 1.4573, "step": 28479 }, { "epoch": 2.24, "learning_rate": 4.4945993638575714e-05, "loss": 1.4691, "step": 28480 }, { "epoch": 2.24, "learning_rate": 4.493717175647422e-05, "loss": 1.4502, "step": 28481 }, { "epoch": 2.24, "learning_rate": 4.492835058769134e-05, "loss": 1.5082, "step": 28482 }, { "epoch": 2.24, "learning_rate": 4.4919530132286954e-05, "loss": 1.4402, "step": 28483 }, { "epoch": 2.24, "learning_rate": 4.491071039032101e-05, "loss": 1.4255, "step": 28484 }, { "epoch": 2.24, "learning_rate": 4.490189136185335e-05, "loss": 1.5001, "step": 28485 }, { "epoch": 2.24, "learning_rate": 4.48930730469438e-05, "loss": 1.424, "step": 28486 }, { "epoch": 2.24, "learning_rate": 4.4884255445652274e-05, "loss": 1.5139, "step": 28487 }, { "epoch": 2.24, "learning_rate": 4.48754385580387e-05, "loss": 1.4758, "step": 28488 }, { "epoch": 2.24, "learning_rate": 4.4866622384162884e-05, "loss": 1.4511, "step": 28489 }, { "epoch": 2.24, "learning_rate": 4.485780692408468e-05, "loss": 1.4652, "step": 28490 }, { "epoch": 2.24, "learning_rate": 4.484899217786391e-05, "loss": 1.4513, "step": 28491 }, { "epoch": 2.24, "learning_rate": 4.484017814556049e-05, "loss": 1.4187, "step": 28492 }, { "epoch": 2.24, "learning_rate": 4.483136482723424e-05, "loss": 1.402, "step": 28493 }, { "epoch": 2.24, "learning_rate": 4.482255222294494e-05, "loss": 1.4142, "step": 28494 }, { "epoch": 2.24, "learning_rate": 4.481374033275249e-05, "loss": 1.4221, "step": 28495 }, { "epoch": 2.24, "learning_rate": 4.4804929156716736e-05, "loss": 1.4689, "step": 28496 }, { "epoch": 2.24, "learning_rate": 4.479611869489739e-05, "loss": 1.443, "step": 28497 }, { "epoch": 2.24, "learning_rate": 4.478730894735439e-05, "loss": 1.4371, "step": 28498 }, { "epoch": 2.24, "learning_rate": 4.477849991414751e-05, "loss": 1.4445, "step": 28499 }, { "epoch": 2.24, "learning_rate": 4.4769691595336485e-05, "loss": 1.4652, "step": 28500 }, { "epoch": 2.24, "learning_rate": 4.4760883990981196e-05, "loss": 1.4546, "step": 28501 }, { "epoch": 2.24, "learning_rate": 4.475207710114148e-05, "loss": 1.3867, "step": 28502 }, { "epoch": 2.24, "learning_rate": 4.4743270925877085e-05, "loss": 1.4357, "step": 28503 }, { "epoch": 2.24, "learning_rate": 4.473446546524772e-05, "loss": 1.4606, "step": 28504 }, { "epoch": 2.24, "learning_rate": 4.472566071931331e-05, "loss": 1.4876, "step": 28505 }, { "epoch": 2.24, "learning_rate": 4.4716856688133576e-05, "loss": 1.4386, "step": 28506 }, { "epoch": 2.24, "learning_rate": 4.4708053371768274e-05, "loss": 1.4568, "step": 28507 }, { "epoch": 2.24, "learning_rate": 4.4699250770277136e-05, "loss": 1.4598, "step": 28508 }, { "epoch": 2.24, "learning_rate": 4.469044888372003e-05, "loss": 1.4602, "step": 28509 }, { "epoch": 2.24, "learning_rate": 4.4681647712156657e-05, "loss": 1.4554, "step": 28510 }, { "epoch": 2.24, "learning_rate": 4.4672847255646746e-05, "loss": 1.3991, "step": 28511 }, { "epoch": 2.24, "learning_rate": 4.46640475142501e-05, "loss": 1.4266, "step": 28512 }, { "epoch": 2.24, "learning_rate": 4.4655248488026446e-05, "loss": 1.4371, "step": 28513 }, { "epoch": 2.24, "learning_rate": 4.464645017703548e-05, "loss": 1.4741, "step": 28514 }, { "epoch": 2.24, "learning_rate": 4.4637652581337024e-05, "loss": 1.433, "step": 28515 }, { "epoch": 2.24, "learning_rate": 4.4628855700990765e-05, "loss": 1.4857, "step": 28516 }, { "epoch": 2.24, "learning_rate": 4.462005953605638e-05, "loss": 1.4137, "step": 28517 }, { "epoch": 2.24, "learning_rate": 4.461126408659365e-05, "loss": 1.4699, "step": 28518 }, { "epoch": 2.24, "learning_rate": 4.46024693526623e-05, "loss": 1.5006, "step": 28519 }, { "epoch": 2.24, "learning_rate": 4.459367533432203e-05, "loss": 1.4462, "step": 28520 }, { "epoch": 2.24, "learning_rate": 4.458488203163249e-05, "loss": 1.5194, "step": 28521 }, { "epoch": 2.24, "learning_rate": 4.457608944465349e-05, "loss": 1.4625, "step": 28522 }, { "epoch": 2.24, "learning_rate": 4.456729757344465e-05, "loss": 1.4502, "step": 28523 }, { "epoch": 2.24, "learning_rate": 4.455850641806562e-05, "loss": 1.4689, "step": 28524 }, { "epoch": 2.24, "learning_rate": 4.454971597857621e-05, "loss": 1.4075, "step": 28525 }, { "epoch": 2.24, "learning_rate": 4.454092625503603e-05, "loss": 1.4822, "step": 28526 }, { "epoch": 2.24, "learning_rate": 4.453213724750476e-05, "loss": 1.4483, "step": 28527 }, { "epoch": 2.24, "learning_rate": 4.4523348956042034e-05, "loss": 1.4274, "step": 28528 }, { "epoch": 2.24, "learning_rate": 4.45145613807076e-05, "loss": 1.4746, "step": 28529 }, { "epoch": 2.24, "learning_rate": 4.450577452156109e-05, "loss": 1.462, "step": 28530 }, { "epoch": 2.24, "learning_rate": 4.449698837866211e-05, "loss": 1.4588, "step": 28531 }, { "epoch": 2.24, "learning_rate": 4.44882029520704e-05, "loss": 1.4696, "step": 28532 }, { "epoch": 2.25, "learning_rate": 4.447941824184553e-05, "loss": 1.4863, "step": 28533 }, { "epoch": 2.25, "learning_rate": 4.447063424804721e-05, "loss": 1.4783, "step": 28534 }, { "epoch": 2.25, "learning_rate": 4.4461850970735e-05, "loss": 1.4743, "step": 28535 }, { "epoch": 2.25, "learning_rate": 4.445306840996864e-05, "loss": 1.4006, "step": 28536 }, { "epoch": 2.25, "learning_rate": 4.444428656580769e-05, "loss": 1.4944, "step": 28537 }, { "epoch": 2.25, "learning_rate": 4.443550543831174e-05, "loss": 1.4806, "step": 28538 }, { "epoch": 2.25, "learning_rate": 4.442672502754051e-05, "loss": 1.4818, "step": 28539 }, { "epoch": 2.25, "learning_rate": 4.4417945333553535e-05, "loss": 1.4433, "step": 28540 }, { "epoch": 2.25, "learning_rate": 4.4409166356410426e-05, "loss": 1.4757, "step": 28541 }, { "epoch": 2.25, "learning_rate": 4.4400388096170837e-05, "loss": 1.4301, "step": 28542 }, { "epoch": 2.25, "learning_rate": 4.439161055289434e-05, "loss": 1.4114, "step": 28543 }, { "epoch": 2.25, "learning_rate": 4.4382833726640524e-05, "loss": 1.4688, "step": 28544 }, { "epoch": 2.25, "learning_rate": 4.437405761746894e-05, "loss": 1.4308, "step": 28545 }, { "epoch": 2.25, "learning_rate": 4.4365282225439273e-05, "loss": 1.429, "step": 28546 }, { "epoch": 2.25, "learning_rate": 4.435650755061104e-05, "loss": 1.4461, "step": 28547 }, { "epoch": 2.25, "learning_rate": 4.434773359304377e-05, "loss": 1.5199, "step": 28548 }, { "epoch": 2.25, "learning_rate": 4.4338960352797084e-05, "loss": 1.4821, "step": 28549 }, { "epoch": 2.25, "learning_rate": 4.433018782993059e-05, "loss": 1.492, "step": 28550 }, { "epoch": 2.25, "learning_rate": 4.432141602450381e-05, "loss": 1.4527, "step": 28551 }, { "epoch": 2.25, "learning_rate": 4.431264493657627e-05, "loss": 1.4182, "step": 28552 }, { "epoch": 2.25, "learning_rate": 4.430387456620757e-05, "loss": 1.4218, "step": 28553 }, { "epoch": 2.25, "learning_rate": 4.429510491345725e-05, "loss": 1.4231, "step": 28554 }, { "epoch": 2.25, "learning_rate": 4.428633597838477e-05, "loss": 1.5022, "step": 28555 }, { "epoch": 2.25, "learning_rate": 4.427756776104981e-05, "loss": 1.4118, "step": 28556 }, { "epoch": 2.25, "learning_rate": 4.426880026151179e-05, "loss": 1.4121, "step": 28557 }, { "epoch": 2.25, "learning_rate": 4.426003347983022e-05, "loss": 1.4841, "step": 28558 }, { "epoch": 2.25, "learning_rate": 4.425126741606475e-05, "loss": 1.4661, "step": 28559 }, { "epoch": 2.25, "learning_rate": 4.424250207027479e-05, "loss": 1.4765, "step": 28560 }, { "epoch": 2.25, "learning_rate": 4.423373744251989e-05, "loss": 1.4469, "step": 28561 }, { "epoch": 2.25, "learning_rate": 4.422497353285949e-05, "loss": 1.4572, "step": 28562 }, { "epoch": 2.25, "learning_rate": 4.421621034135321e-05, "loss": 1.439, "step": 28563 }, { "epoch": 2.25, "learning_rate": 4.4207447868060427e-05, "loss": 1.4443, "step": 28564 }, { "epoch": 2.25, "learning_rate": 4.4198686113040696e-05, "loss": 1.4489, "step": 28565 }, { "epoch": 2.25, "learning_rate": 4.418992507635355e-05, "loss": 1.4153, "step": 28566 }, { "epoch": 2.25, "learning_rate": 4.4181164758058416e-05, "loss": 1.3983, "step": 28567 }, { "epoch": 2.25, "learning_rate": 4.417240515821479e-05, "loss": 1.4916, "step": 28568 }, { "epoch": 2.25, "learning_rate": 4.416364627688206e-05, "loss": 1.4732, "step": 28569 }, { "epoch": 2.25, "learning_rate": 4.4154888114119834e-05, "loss": 1.4626, "step": 28570 }, { "epoch": 2.25, "learning_rate": 4.41461306699875e-05, "loss": 1.4288, "step": 28571 }, { "epoch": 2.25, "learning_rate": 4.413737394454449e-05, "loss": 1.478, "step": 28572 }, { "epoch": 2.25, "learning_rate": 4.4128617937850325e-05, "loss": 1.4738, "step": 28573 }, { "epoch": 2.25, "learning_rate": 4.4119862649964424e-05, "loss": 1.4748, "step": 28574 }, { "epoch": 2.25, "learning_rate": 4.411110808094617e-05, "loss": 1.4436, "step": 28575 }, { "epoch": 2.25, "learning_rate": 4.410235423085512e-05, "loss": 1.4667, "step": 28576 }, { "epoch": 2.25, "learning_rate": 4.409360109975063e-05, "loss": 1.4678, "step": 28577 }, { "epoch": 2.25, "learning_rate": 4.4084848687692104e-05, "loss": 1.4732, "step": 28578 }, { "epoch": 2.25, "learning_rate": 4.407609699473905e-05, "loss": 1.4678, "step": 28579 }, { "epoch": 2.25, "learning_rate": 4.4067346020950814e-05, "loss": 1.4729, "step": 28580 }, { "epoch": 2.25, "learning_rate": 4.4058595766386864e-05, "loss": 1.4694, "step": 28581 }, { "epoch": 2.25, "learning_rate": 4.4049846231106555e-05, "loss": 1.4563, "step": 28582 }, { "epoch": 2.25, "learning_rate": 4.404109741516936e-05, "loss": 1.4296, "step": 28583 }, { "epoch": 2.25, "learning_rate": 4.403234931863464e-05, "loss": 1.5036, "step": 28584 }, { "epoch": 2.25, "learning_rate": 4.402360194156179e-05, "loss": 1.4671, "step": 28585 }, { "epoch": 2.25, "learning_rate": 4.401485528401017e-05, "loss": 1.4636, "step": 28586 }, { "epoch": 2.25, "learning_rate": 4.400610934603923e-05, "loss": 1.4846, "step": 28587 }, { "epoch": 2.25, "learning_rate": 4.399736412770831e-05, "loss": 1.4734, "step": 28588 }, { "epoch": 2.25, "learning_rate": 4.3988619629076746e-05, "loss": 1.4287, "step": 28589 }, { "epoch": 2.25, "learning_rate": 4.3979875850204e-05, "loss": 1.4489, "step": 28590 }, { "epoch": 2.25, "learning_rate": 4.39711327911494e-05, "loss": 1.4508, "step": 28591 }, { "epoch": 2.25, "learning_rate": 4.396239045197224e-05, "loss": 1.4602, "step": 28592 }, { "epoch": 2.25, "learning_rate": 4.395364883273198e-05, "loss": 1.4415, "step": 28593 }, { "epoch": 2.25, "learning_rate": 4.394490793348792e-05, "loss": 1.5127, "step": 28594 }, { "epoch": 2.25, "learning_rate": 4.393616775429938e-05, "loss": 1.4478, "step": 28595 }, { "epoch": 2.25, "learning_rate": 4.39274282952257e-05, "loss": 1.4065, "step": 28596 }, { "epoch": 2.25, "learning_rate": 4.3918689556326313e-05, "loss": 1.4858, "step": 28597 }, { "epoch": 2.25, "learning_rate": 4.390995153766048e-05, "loss": 1.4991, "step": 28598 }, { "epoch": 2.25, "learning_rate": 4.390121423928749e-05, "loss": 1.4251, "step": 28599 }, { "epoch": 2.25, "learning_rate": 4.389247766126675e-05, "loss": 1.3911, "step": 28600 }, { "epoch": 2.25, "learning_rate": 4.388374180365753e-05, "loss": 1.4777, "step": 28601 }, { "epoch": 2.25, "learning_rate": 4.387500666651913e-05, "loss": 1.5011, "step": 28602 }, { "epoch": 2.25, "learning_rate": 4.386627224991083e-05, "loss": 1.435, "step": 28603 }, { "epoch": 2.25, "learning_rate": 4.3857538553892024e-05, "loss": 1.4651, "step": 28604 }, { "epoch": 2.25, "learning_rate": 4.384880557852196e-05, "loss": 1.463, "step": 28605 }, { "epoch": 2.25, "learning_rate": 4.384007332385988e-05, "loss": 1.494, "step": 28606 }, { "epoch": 2.25, "learning_rate": 4.383134178996517e-05, "loss": 1.4852, "step": 28607 }, { "epoch": 2.25, "learning_rate": 4.382261097689704e-05, "loss": 1.438, "step": 28608 }, { "epoch": 2.25, "learning_rate": 4.3813880884714756e-05, "loss": 1.4736, "step": 28609 }, { "epoch": 2.25, "learning_rate": 4.3805151513477666e-05, "loss": 1.4553, "step": 28610 }, { "epoch": 2.25, "learning_rate": 4.379642286324495e-05, "loss": 1.4519, "step": 28611 }, { "epoch": 2.25, "learning_rate": 4.378769493407595e-05, "loss": 1.4503, "step": 28612 }, { "epoch": 2.25, "learning_rate": 4.377896772602985e-05, "loss": 1.4669, "step": 28613 }, { "epoch": 2.25, "learning_rate": 4.3770241239165996e-05, "loss": 1.429, "step": 28614 }, { "epoch": 2.25, "learning_rate": 4.376151547354358e-05, "loss": 1.4193, "step": 28615 }, { "epoch": 2.25, "learning_rate": 4.3752790429221794e-05, "loss": 1.4426, "step": 28616 }, { "epoch": 2.25, "learning_rate": 4.3744066106259965e-05, "loss": 1.4631, "step": 28617 }, { "epoch": 2.25, "learning_rate": 4.373534250471731e-05, "loss": 1.45, "step": 28618 }, { "epoch": 2.25, "learning_rate": 4.3726619624653034e-05, "loss": 1.5317, "step": 28619 }, { "epoch": 2.25, "learning_rate": 4.3717897466126306e-05, "loss": 1.4457, "step": 28620 }, { "epoch": 2.25, "learning_rate": 4.370917602919646e-05, "loss": 1.4582, "step": 28621 }, { "epoch": 2.25, "learning_rate": 4.3700455313922644e-05, "loss": 1.4589, "step": 28622 }, { "epoch": 2.25, "learning_rate": 4.369173532036404e-05, "loss": 1.4644, "step": 28623 }, { "epoch": 2.25, "learning_rate": 4.3683016048579934e-05, "loss": 1.4575, "step": 28624 }, { "epoch": 2.25, "learning_rate": 4.367429749862947e-05, "loss": 1.424, "step": 28625 }, { "epoch": 2.25, "learning_rate": 4.366557967057181e-05, "loss": 1.4411, "step": 28626 }, { "epoch": 2.25, "learning_rate": 4.365686256446618e-05, "loss": 1.4268, "step": 28627 }, { "epoch": 2.25, "learning_rate": 4.364814618037181e-05, "loss": 1.4415, "step": 28628 }, { "epoch": 2.25, "learning_rate": 4.363943051834785e-05, "loss": 1.4372, "step": 28629 }, { "epoch": 2.25, "learning_rate": 4.36307155784534e-05, "loss": 1.4728, "step": 28630 }, { "epoch": 2.25, "learning_rate": 4.362200136074775e-05, "loss": 1.4236, "step": 28631 }, { "epoch": 2.25, "learning_rate": 4.361328786529e-05, "loss": 1.4548, "step": 28632 }, { "epoch": 2.25, "learning_rate": 4.360457509213928e-05, "loss": 1.4114, "step": 28633 }, { "epoch": 2.25, "learning_rate": 4.3595863041354824e-05, "loss": 1.4615, "step": 28634 }, { "epoch": 2.25, "learning_rate": 4.3587151712995724e-05, "loss": 1.4048, "step": 28635 }, { "epoch": 2.25, "learning_rate": 4.357844110712111e-05, "loss": 1.4113, "step": 28636 }, { "epoch": 2.25, "learning_rate": 4.3569731223790186e-05, "loss": 1.485, "step": 28637 }, { "epoch": 2.25, "learning_rate": 4.3561022063062076e-05, "loss": 1.4513, "step": 28638 }, { "epoch": 2.25, "learning_rate": 4.3552313624995866e-05, "loss": 1.4277, "step": 28639 }, { "epoch": 2.25, "learning_rate": 4.354360590965067e-05, "loss": 1.4951, "step": 28640 }, { "epoch": 2.25, "learning_rate": 4.353489891708569e-05, "loss": 1.4499, "step": 28641 }, { "epoch": 2.25, "learning_rate": 4.352619264735999e-05, "loss": 1.4058, "step": 28642 }, { "epoch": 2.25, "learning_rate": 4.3517487100532635e-05, "loss": 1.482, "step": 28643 }, { "epoch": 2.25, "learning_rate": 4.3508782276662784e-05, "loss": 1.4801, "step": 28644 }, { "epoch": 2.25, "learning_rate": 4.3500078175809576e-05, "loss": 1.4593, "step": 28645 }, { "epoch": 2.25, "learning_rate": 4.349137479803207e-05, "loss": 1.4485, "step": 28646 }, { "epoch": 2.25, "learning_rate": 4.3482672143389315e-05, "loss": 1.4241, "step": 28647 }, { "epoch": 2.25, "learning_rate": 4.347397021194048e-05, "loss": 1.4908, "step": 28648 }, { "epoch": 2.25, "learning_rate": 4.3465269003744584e-05, "loss": 1.4179, "step": 28649 }, { "epoch": 2.25, "learning_rate": 4.345656851886068e-05, "loss": 1.4824, "step": 28650 }, { "epoch": 2.25, "learning_rate": 4.344786875734795e-05, "loss": 1.3816, "step": 28651 }, { "epoch": 2.25, "learning_rate": 4.343916971926536e-05, "loss": 1.4961, "step": 28652 }, { "epoch": 2.25, "learning_rate": 4.3430471404671974e-05, "loss": 1.509, "step": 28653 }, { "epoch": 2.25, "learning_rate": 4.342177381362691e-05, "loss": 1.4366, "step": 28654 }, { "epoch": 2.25, "learning_rate": 4.34130769461892e-05, "loss": 1.4673, "step": 28655 }, { "epoch": 2.25, "learning_rate": 4.340438080241787e-05, "loss": 1.4188, "step": 28656 }, { "epoch": 2.25, "learning_rate": 4.339568538237194e-05, "loss": 1.4526, "step": 28657 }, { "epoch": 2.25, "learning_rate": 4.33869906861105e-05, "loss": 1.5003, "step": 28658 }, { "epoch": 2.25, "learning_rate": 4.337829671369252e-05, "loss": 1.4273, "step": 28659 }, { "epoch": 2.26, "learning_rate": 4.336960346517712e-05, "loss": 1.3953, "step": 28660 }, { "epoch": 2.26, "learning_rate": 4.336091094062322e-05, "loss": 1.4172, "step": 28661 }, { "epoch": 2.26, "learning_rate": 4.335221914008994e-05, "loss": 1.4352, "step": 28662 }, { "epoch": 2.26, "learning_rate": 4.334352806363622e-05, "loss": 1.4738, "step": 28663 }, { "epoch": 2.26, "learning_rate": 4.3334837711321056e-05, "loss": 1.4071, "step": 28664 }, { "epoch": 2.26, "learning_rate": 4.332614808320353e-05, "loss": 1.4781, "step": 28665 }, { "epoch": 2.26, "learning_rate": 4.3317459179342565e-05, "loss": 1.4725, "step": 28666 }, { "epoch": 2.26, "learning_rate": 4.330877099979717e-05, "loss": 1.4513, "step": 28667 }, { "epoch": 2.26, "learning_rate": 4.330008354462636e-05, "loss": 1.4043, "step": 28668 }, { "epoch": 2.26, "learning_rate": 4.329139681388911e-05, "loss": 1.4435, "step": 28669 }, { "epoch": 2.26, "learning_rate": 4.328271080764435e-05, "loss": 1.4616, "step": 28670 }, { "epoch": 2.26, "learning_rate": 4.3274025525951124e-05, "loss": 1.4431, "step": 28671 }, { "epoch": 2.26, "learning_rate": 4.326534096886838e-05, "loss": 1.4366, "step": 28672 }, { "epoch": 2.26, "learning_rate": 4.325665713645507e-05, "loss": 1.4997, "step": 28673 }, { "epoch": 2.26, "learning_rate": 4.324797402877005e-05, "loss": 1.4523, "step": 28674 }, { "epoch": 2.26, "learning_rate": 4.3239291645872475e-05, "loss": 1.4331, "step": 28675 }, { "epoch": 2.26, "learning_rate": 4.3230609987821204e-05, "loss": 1.4735, "step": 28676 }, { "epoch": 2.26, "learning_rate": 4.3221929054675116e-05, "loss": 1.4207, "step": 28677 }, { "epoch": 2.26, "learning_rate": 4.321324884649325e-05, "loss": 1.5048, "step": 28678 }, { "epoch": 2.26, "learning_rate": 4.320456936333449e-05, "loss": 1.461, "step": 28679 }, { "epoch": 2.26, "learning_rate": 4.319589060525778e-05, "loss": 1.4681, "step": 28680 }, { "epoch": 2.26, "learning_rate": 4.318721257232198e-05, "loss": 1.4263, "step": 28681 }, { "epoch": 2.26, "learning_rate": 4.317853526458611e-05, "loss": 1.3856, "step": 28682 }, { "epoch": 2.26, "learning_rate": 4.316985868210903e-05, "loss": 1.423, "step": 28683 }, { "epoch": 2.26, "learning_rate": 4.3161182824949626e-05, "loss": 1.4764, "step": 28684 }, { "epoch": 2.26, "learning_rate": 4.315250769316686e-05, "loss": 1.4807, "step": 28685 }, { "epoch": 2.26, "learning_rate": 4.314383328681961e-05, "loss": 1.4266, "step": 28686 }, { "epoch": 2.26, "learning_rate": 4.313515960596672e-05, "loss": 1.4361, "step": 28687 }, { "epoch": 2.26, "learning_rate": 4.3126486650667166e-05, "loss": 1.4678, "step": 28688 }, { "epoch": 2.26, "learning_rate": 4.3117814420979794e-05, "loss": 1.4269, "step": 28689 }, { "epoch": 2.26, "learning_rate": 4.310914291696344e-05, "loss": 1.4314, "step": 28690 }, { "epoch": 2.26, "learning_rate": 4.3100472138677e-05, "loss": 1.4473, "step": 28691 }, { "epoch": 2.26, "learning_rate": 4.309180208617943e-05, "loss": 1.4964, "step": 28692 }, { "epoch": 2.26, "learning_rate": 4.308313275952952e-05, "loss": 1.4577, "step": 28693 }, { "epoch": 2.26, "learning_rate": 4.307446415878608e-05, "loss": 1.4525, "step": 28694 }, { "epoch": 2.26, "learning_rate": 4.306579628400808e-05, "loss": 1.4229, "step": 28695 }, { "epoch": 2.26, "learning_rate": 4.3057129135254307e-05, "loss": 1.4127, "step": 28696 }, { "epoch": 2.26, "learning_rate": 4.3048462712583606e-05, "loss": 1.4211, "step": 28697 }, { "epoch": 2.26, "learning_rate": 4.3039797016054784e-05, "loss": 1.3967, "step": 28698 }, { "epoch": 2.26, "learning_rate": 4.3031132045726765e-05, "loss": 1.4588, "step": 28699 }, { "epoch": 2.26, "learning_rate": 4.3022467801658314e-05, "loss": 1.4497, "step": 28700 }, { "epoch": 2.26, "learning_rate": 4.3013804283908235e-05, "loss": 1.479, "step": 28701 }, { "epoch": 2.26, "learning_rate": 4.300514149253543e-05, "loss": 1.4408, "step": 28702 }, { "epoch": 2.26, "learning_rate": 4.299647942759867e-05, "loss": 1.4354, "step": 28703 }, { "epoch": 2.26, "learning_rate": 4.298781808915672e-05, "loss": 1.4438, "step": 28704 }, { "epoch": 2.26, "learning_rate": 4.297915747726848e-05, "loss": 1.469, "step": 28705 }, { "epoch": 2.26, "learning_rate": 4.297049759199265e-05, "loss": 1.4073, "step": 28706 }, { "epoch": 2.26, "learning_rate": 4.296183843338812e-05, "loss": 1.4703, "step": 28707 }, { "epoch": 2.26, "learning_rate": 4.295318000151359e-05, "loss": 1.4952, "step": 28708 }, { "epoch": 2.26, "learning_rate": 4.2944522296427964e-05, "loss": 1.4241, "step": 28709 }, { "epoch": 2.26, "learning_rate": 4.293586531818993e-05, "loss": 1.5281, "step": 28710 }, { "epoch": 2.26, "learning_rate": 4.292720906685825e-05, "loss": 1.4347, "step": 28711 }, { "epoch": 2.26, "learning_rate": 4.2918553542491776e-05, "loss": 1.4917, "step": 28712 }, { "epoch": 2.26, "learning_rate": 4.290989874514923e-05, "loss": 1.4647, "step": 28713 }, { "epoch": 2.26, "learning_rate": 4.290124467488939e-05, "loss": 1.3839, "step": 28714 }, { "epoch": 2.26, "learning_rate": 4.289259133177093e-05, "loss": 1.4515, "step": 28715 }, { "epoch": 2.26, "learning_rate": 4.288393871585272e-05, "loss": 1.4461, "step": 28716 }, { "epoch": 2.26, "learning_rate": 4.2875286827193465e-05, "loss": 1.4652, "step": 28717 }, { "epoch": 2.26, "learning_rate": 4.286663566585184e-05, "loss": 1.4607, "step": 28718 }, { "epoch": 2.26, "learning_rate": 4.2857985231886675e-05, "loss": 1.4744, "step": 28719 }, { "epoch": 2.26, "learning_rate": 4.284933552535668e-05, "loss": 1.4487, "step": 28720 }, { "epoch": 2.26, "learning_rate": 4.2840686546320516e-05, "loss": 1.5305, "step": 28721 }, { "epoch": 2.26, "learning_rate": 4.283203829483696e-05, "loss": 1.4187, "step": 28722 }, { "epoch": 2.26, "learning_rate": 4.282339077096477e-05, "loss": 1.505, "step": 28723 }, { "epoch": 2.26, "learning_rate": 4.28147439747626e-05, "loss": 1.4275, "step": 28724 }, { "epoch": 2.26, "learning_rate": 4.2806097906289124e-05, "loss": 1.4316, "step": 28725 }, { "epoch": 2.26, "learning_rate": 4.2797452565603134e-05, "loss": 1.4751, "step": 28726 }, { "epoch": 2.26, "learning_rate": 4.278880795276329e-05, "loss": 1.4567, "step": 28727 }, { "epoch": 2.26, "learning_rate": 4.278016406782824e-05, "loss": 1.475, "step": 28728 }, { "epoch": 2.26, "learning_rate": 4.277152091085674e-05, "loss": 1.462, "step": 28729 }, { "epoch": 2.26, "learning_rate": 4.276287848190743e-05, "loss": 1.4791, "step": 28730 }, { "epoch": 2.26, "learning_rate": 4.2754236781039e-05, "loss": 1.5469, "step": 28731 }, { "epoch": 2.26, "learning_rate": 4.274559580831009e-05, "loss": 1.4485, "step": 28732 }, { "epoch": 2.26, "learning_rate": 4.273695556377943e-05, "loss": 1.4676, "step": 28733 }, { "epoch": 2.26, "learning_rate": 4.272831604750566e-05, "loss": 1.455, "step": 28734 }, { "epoch": 2.26, "learning_rate": 4.2719677259547355e-05, "loss": 1.4961, "step": 28735 }, { "epoch": 2.26, "learning_rate": 4.27110391999633e-05, "loss": 1.4606, "step": 28736 }, { "epoch": 2.26, "learning_rate": 4.270240186881205e-05, "loss": 1.4145, "step": 28737 }, { "epoch": 2.26, "learning_rate": 4.2693765266152306e-05, "loss": 1.4003, "step": 28738 }, { "epoch": 2.26, "learning_rate": 4.2685129392042635e-05, "loss": 1.4354, "step": 28739 }, { "epoch": 2.26, "learning_rate": 4.2676494246541774e-05, "loss": 1.4487, "step": 28740 }, { "epoch": 2.26, "learning_rate": 4.266785982970829e-05, "loss": 1.5597, "step": 28741 }, { "epoch": 2.26, "learning_rate": 4.265922614160075e-05, "loss": 1.4667, "step": 28742 }, { "epoch": 2.26, "learning_rate": 4.2650593182277874e-05, "loss": 1.4148, "step": 28743 }, { "epoch": 2.26, "learning_rate": 4.264196095179824e-05, "loss": 1.4333, "step": 28744 }, { "epoch": 2.26, "learning_rate": 4.263332945022039e-05, "loss": 1.4897, "step": 28745 }, { "epoch": 2.26, "learning_rate": 4.262469867760305e-05, "loss": 1.4005, "step": 28746 }, { "epoch": 2.26, "learning_rate": 4.2616068634004716e-05, "loss": 1.4483, "step": 28747 }, { "epoch": 2.26, "learning_rate": 4.2607439319484004e-05, "loss": 1.463, "step": 28748 }, { "epoch": 2.26, "learning_rate": 4.2598810734099546e-05, "loss": 1.4132, "step": 28749 }, { "epoch": 2.26, "learning_rate": 4.25901828779099e-05, "loss": 1.4595, "step": 28750 }, { "epoch": 2.26, "learning_rate": 4.2581555750973634e-05, "loss": 1.4209, "step": 28751 }, { "epoch": 2.26, "learning_rate": 4.257292935334928e-05, "loss": 1.4529, "step": 28752 }, { "epoch": 2.26, "learning_rate": 4.256430368509545e-05, "loss": 1.4487, "step": 28753 }, { "epoch": 2.26, "learning_rate": 4.255567874627076e-05, "loss": 1.4851, "step": 28754 }, { "epoch": 2.26, "learning_rate": 4.25470545369337e-05, "loss": 1.4593, "step": 28755 }, { "epoch": 2.26, "learning_rate": 4.2538431057142825e-05, "loss": 1.4231, "step": 28756 }, { "epoch": 2.26, "learning_rate": 4.252980830695673e-05, "loss": 1.4851, "step": 28757 }, { "epoch": 2.26, "learning_rate": 4.2521186286433946e-05, "loss": 1.431, "step": 28758 }, { "epoch": 2.26, "learning_rate": 4.2512564995632936e-05, "loss": 1.4669, "step": 28759 }, { "epoch": 2.26, "learning_rate": 4.2503944434612346e-05, "loss": 1.4163, "step": 28760 }, { "epoch": 2.26, "learning_rate": 4.249532460343065e-05, "loss": 1.4253, "step": 28761 }, { "epoch": 2.26, "learning_rate": 4.248670550214632e-05, "loss": 1.4721, "step": 28762 }, { "epoch": 2.26, "learning_rate": 4.247808713081798e-05, "loss": 1.4173, "step": 28763 }, { "epoch": 2.26, "learning_rate": 4.24694694895041e-05, "loss": 1.4506, "step": 28764 }, { "epoch": 2.26, "learning_rate": 4.246085257826312e-05, "loss": 1.4902, "step": 28765 }, { "epoch": 2.26, "learning_rate": 4.245223639715367e-05, "loss": 1.4327, "step": 28766 }, { "epoch": 2.26, "learning_rate": 4.244362094623417e-05, "loss": 1.4241, "step": 28767 }, { "epoch": 2.26, "learning_rate": 4.243500622556313e-05, "loss": 1.4711, "step": 28768 }, { "epoch": 2.26, "learning_rate": 4.242639223519896e-05, "loss": 1.4535, "step": 28769 }, { "epoch": 2.26, "learning_rate": 4.2417778975200313e-05, "loss": 1.4861, "step": 28770 }, { "epoch": 2.26, "learning_rate": 4.2409166445625566e-05, "loss": 1.4491, "step": 28771 }, { "epoch": 2.26, "learning_rate": 4.240055464653321e-05, "loss": 1.4707, "step": 28772 }, { "epoch": 2.26, "learning_rate": 4.239194357798166e-05, "loss": 1.5211, "step": 28773 }, { "epoch": 2.26, "learning_rate": 4.238333324002948e-05, "loss": 1.4257, "step": 28774 }, { "epoch": 2.26, "learning_rate": 4.2374723632735084e-05, "loss": 1.3984, "step": 28775 }, { "epoch": 2.26, "learning_rate": 4.2366114756156875e-05, "loss": 1.4554, "step": 28776 }, { "epoch": 2.26, "learning_rate": 4.2357506610353394e-05, "loss": 1.4237, "step": 28777 }, { "epoch": 2.26, "learning_rate": 4.234889919538304e-05, "loss": 1.4474, "step": 28778 }, { "epoch": 2.26, "learning_rate": 4.2340292511304205e-05, "loss": 1.4363, "step": 28779 }, { "epoch": 2.26, "learning_rate": 4.233168655817543e-05, "loss": 1.4228, "step": 28780 }, { "epoch": 2.26, "learning_rate": 4.232308133605507e-05, "loss": 1.4685, "step": 28781 }, { "epoch": 2.26, "learning_rate": 4.231447684500153e-05, "loss": 1.4523, "step": 28782 }, { "epoch": 2.26, "learning_rate": 4.230587308507332e-05, "loss": 1.4896, "step": 28783 }, { "epoch": 2.26, "learning_rate": 4.2297270056328745e-05, "loss": 1.4696, "step": 28784 }, { "epoch": 2.26, "learning_rate": 4.228866775882632e-05, "loss": 1.4638, "step": 28785 }, { "epoch": 2.26, "learning_rate": 4.2280066192624354e-05, "loss": 1.4592, "step": 28786 }, { "epoch": 2.26, "learning_rate": 4.227146535778134e-05, "loss": 1.4684, "step": 28787 }, { "epoch": 2.27, "learning_rate": 4.2262865254355614e-05, "loss": 1.4483, "step": 28788 }, { "epoch": 2.27, "learning_rate": 4.2254265882405555e-05, "loss": 1.3859, "step": 28789 }, { "epoch": 2.27, "learning_rate": 4.22456672419896e-05, "loss": 1.4704, "step": 28790 }, { "epoch": 2.27, "learning_rate": 4.223706933316611e-05, "loss": 1.4611, "step": 28791 }, { "epoch": 2.27, "learning_rate": 4.222847215599345e-05, "loss": 1.4627, "step": 28792 }, { "epoch": 2.27, "learning_rate": 4.2219875710529946e-05, "loss": 1.5062, "step": 28793 }, { "epoch": 2.27, "learning_rate": 4.2211279996834054e-05, "loss": 1.4355, "step": 28794 }, { "epoch": 2.27, "learning_rate": 4.220268501496408e-05, "loss": 1.4735, "step": 28795 }, { "epoch": 2.27, "learning_rate": 4.219409076497834e-05, "loss": 1.409, "step": 28796 }, { "epoch": 2.27, "learning_rate": 4.218549724693529e-05, "loss": 1.4447, "step": 28797 }, { "epoch": 2.27, "learning_rate": 4.2176904460893216e-05, "loss": 1.4423, "step": 28798 }, { "epoch": 2.27, "learning_rate": 4.2168312406910407e-05, "loss": 1.4431, "step": 28799 }, { "epoch": 2.27, "learning_rate": 4.215972108504525e-05, "loss": 1.4445, "step": 28800 }, { "epoch": 2.27, "learning_rate": 4.215113049535613e-05, "loss": 1.4831, "step": 28801 }, { "epoch": 2.27, "learning_rate": 4.214254063790129e-05, "loss": 1.429, "step": 28802 }, { "epoch": 2.27, "learning_rate": 4.2133951512739075e-05, "loss": 1.4776, "step": 28803 }, { "epoch": 2.27, "learning_rate": 4.212536311992781e-05, "loss": 1.4705, "step": 28804 }, { "epoch": 2.27, "learning_rate": 4.211677545952582e-05, "loss": 1.4795, "step": 28805 }, { "epoch": 2.27, "learning_rate": 4.2108188531591344e-05, "loss": 1.4544, "step": 28806 }, { "epoch": 2.27, "learning_rate": 4.209960233618278e-05, "loss": 1.5021, "step": 28807 }, { "epoch": 2.27, "learning_rate": 4.2091016873358356e-05, "loss": 1.4879, "step": 28808 }, { "epoch": 2.27, "learning_rate": 4.208243214317638e-05, "loss": 1.4596, "step": 28809 }, { "epoch": 2.27, "learning_rate": 4.20738481456951e-05, "loss": 1.4542, "step": 28810 }, { "epoch": 2.27, "learning_rate": 4.206526488097288e-05, "loss": 1.4741, "step": 28811 }, { "epoch": 2.27, "learning_rate": 4.205668234906793e-05, "loss": 1.4833, "step": 28812 }, { "epoch": 2.27, "learning_rate": 4.204810055003851e-05, "loss": 1.4434, "step": 28813 }, { "epoch": 2.27, "learning_rate": 4.203951948394295e-05, "loss": 1.4628, "step": 28814 }, { "epoch": 2.27, "learning_rate": 4.2030939150839496e-05, "loss": 1.4633, "step": 28815 }, { "epoch": 2.27, "learning_rate": 4.202235955078632e-05, "loss": 1.4395, "step": 28816 }, { "epoch": 2.27, "learning_rate": 4.201378068384172e-05, "loss": 1.4292, "step": 28817 }, { "epoch": 2.27, "learning_rate": 4.200520255006404e-05, "loss": 1.4307, "step": 28818 }, { "epoch": 2.27, "learning_rate": 4.199662514951142e-05, "loss": 1.4151, "step": 28819 }, { "epoch": 2.27, "learning_rate": 4.198804848224206e-05, "loss": 1.4563, "step": 28820 }, { "epoch": 2.27, "learning_rate": 4.197947254831429e-05, "loss": 1.411, "step": 28821 }, { "epoch": 2.27, "learning_rate": 4.19708973477863e-05, "loss": 1.4872, "step": 28822 }, { "epoch": 2.27, "learning_rate": 4.1962322880716266e-05, "loss": 1.4564, "step": 28823 }, { "epoch": 2.27, "learning_rate": 4.1953749147162466e-05, "loss": 1.467, "step": 28824 }, { "epoch": 2.27, "learning_rate": 4.1945176147183095e-05, "loss": 1.4616, "step": 28825 }, { "epoch": 2.27, "learning_rate": 4.193660388083635e-05, "loss": 1.3998, "step": 28826 }, { "epoch": 2.27, "learning_rate": 4.192803234818038e-05, "loss": 1.4157, "step": 28827 }, { "epoch": 2.27, "learning_rate": 4.191946154927347e-05, "loss": 1.4284, "step": 28828 }, { "epoch": 2.27, "learning_rate": 4.191089148417378e-05, "loss": 1.4168, "step": 28829 }, { "epoch": 2.27, "learning_rate": 4.1902322152939436e-05, "loss": 1.4693, "step": 28830 }, { "epoch": 2.27, "learning_rate": 4.189375355562868e-05, "loss": 1.4954, "step": 28831 }, { "epoch": 2.27, "learning_rate": 4.1885185692299715e-05, "loss": 1.4314, "step": 28832 }, { "epoch": 2.27, "learning_rate": 4.18766185630107e-05, "loss": 1.5111, "step": 28833 }, { "epoch": 2.27, "learning_rate": 4.186805216781971e-05, "loss": 1.4134, "step": 28834 }, { "epoch": 2.27, "learning_rate": 4.185948650678502e-05, "loss": 1.4335, "step": 28835 }, { "epoch": 2.27, "learning_rate": 4.185092157996474e-05, "loss": 1.422, "step": 28836 }, { "epoch": 2.27, "learning_rate": 4.1842357387416993e-05, "loss": 1.4467, "step": 28837 }, { "epoch": 2.27, "learning_rate": 4.183379392919999e-05, "loss": 1.4391, "step": 28838 }, { "epoch": 2.27, "learning_rate": 4.182523120537182e-05, "loss": 1.4627, "step": 28839 }, { "epoch": 2.27, "learning_rate": 4.18166692159906e-05, "loss": 1.4923, "step": 28840 }, { "epoch": 2.27, "learning_rate": 4.180810796111454e-05, "loss": 1.4632, "step": 28841 }, { "epoch": 2.27, "learning_rate": 4.179954744080172e-05, "loss": 1.4403, "step": 28842 }, { "epoch": 2.27, "learning_rate": 4.179098765511022e-05, "loss": 1.4178, "step": 28843 }, { "epoch": 2.27, "learning_rate": 4.178242860409825e-05, "loss": 1.4494, "step": 28844 }, { "epoch": 2.27, "learning_rate": 4.177387028782387e-05, "loss": 1.4916, "step": 28845 }, { "epoch": 2.27, "learning_rate": 4.176531270634518e-05, "loss": 1.435, "step": 28846 }, { "epoch": 2.27, "learning_rate": 4.1756755859720196e-05, "loss": 1.5, "step": 28847 }, { "epoch": 2.27, "learning_rate": 4.17481997480072e-05, "loss": 1.3983, "step": 28848 }, { "epoch": 2.27, "learning_rate": 4.1739644371264186e-05, "loss": 1.4458, "step": 28849 }, { "epoch": 2.27, "learning_rate": 4.173108972954924e-05, "loss": 1.4152, "step": 28850 }, { "epoch": 2.27, "learning_rate": 4.172253582292041e-05, "loss": 1.4418, "step": 28851 }, { "epoch": 2.27, "learning_rate": 4.171398265143585e-05, "loss": 1.5067, "step": 28852 }, { "epoch": 2.27, "learning_rate": 4.17054302151536e-05, "loss": 1.4252, "step": 28853 }, { "epoch": 2.27, "learning_rate": 4.169687851413166e-05, "loss": 1.4671, "step": 28854 }, { "epoch": 2.27, "learning_rate": 4.1688327548428205e-05, "loss": 1.4622, "step": 28855 }, { "epoch": 2.27, "learning_rate": 4.167977731810123e-05, "loss": 1.4368, "step": 28856 }, { "epoch": 2.27, "learning_rate": 4.167122782320874e-05, "loss": 1.4291, "step": 28857 }, { "epoch": 2.27, "learning_rate": 4.166267906380888e-05, "loss": 1.4942, "step": 28858 }, { "epoch": 2.27, "learning_rate": 4.165413103995965e-05, "loss": 1.4353, "step": 28859 }, { "epoch": 2.27, "learning_rate": 4.1645583751719033e-05, "loss": 1.4161, "step": 28860 }, { "epoch": 2.27, "learning_rate": 4.163703719914515e-05, "loss": 1.4748, "step": 28861 }, { "epoch": 2.27, "learning_rate": 4.162849138229598e-05, "loss": 1.4196, "step": 28862 }, { "epoch": 2.27, "learning_rate": 4.161994630122951e-05, "loss": 1.4834, "step": 28863 }, { "epoch": 2.27, "learning_rate": 4.16114019560038e-05, "loss": 1.4187, "step": 28864 }, { "epoch": 2.27, "learning_rate": 4.160285834667689e-05, "loss": 1.464, "step": 28865 }, { "epoch": 2.27, "learning_rate": 4.159431547330677e-05, "loss": 1.4562, "step": 28866 }, { "epoch": 2.27, "learning_rate": 4.1585773335951404e-05, "loss": 1.4431, "step": 28867 }, { "epoch": 2.27, "learning_rate": 4.157723193466876e-05, "loss": 1.4857, "step": 28868 }, { "epoch": 2.27, "learning_rate": 4.156869126951695e-05, "loss": 1.4712, "step": 28869 }, { "epoch": 2.27, "learning_rate": 4.1560151340553874e-05, "loss": 1.4514, "step": 28870 }, { "epoch": 2.27, "learning_rate": 4.1551612147837495e-05, "loss": 1.4353, "step": 28871 }, { "epoch": 2.27, "learning_rate": 4.154307369142585e-05, "loss": 1.45, "step": 28872 }, { "epoch": 2.27, "learning_rate": 4.153453597137689e-05, "loss": 1.5114, "step": 28873 }, { "epoch": 2.27, "learning_rate": 4.152599898774854e-05, "loss": 1.4672, "step": 28874 }, { "epoch": 2.27, "learning_rate": 4.1517462740598825e-05, "loss": 1.4686, "step": 28875 }, { "epoch": 2.27, "learning_rate": 4.150892722998569e-05, "loss": 1.488, "step": 28876 }, { "epoch": 2.27, "learning_rate": 4.1500392455967015e-05, "loss": 1.4678, "step": 28877 }, { "epoch": 2.27, "learning_rate": 4.149185841860083e-05, "loss": 1.4681, "step": 28878 }, { "epoch": 2.27, "learning_rate": 4.1483325117945026e-05, "loss": 1.4466, "step": 28879 }, { "epoch": 2.27, "learning_rate": 4.147479255405758e-05, "loss": 1.4344, "step": 28880 }, { "epoch": 2.27, "learning_rate": 4.1466260726996395e-05, "loss": 1.4241, "step": 28881 }, { "epoch": 2.27, "learning_rate": 4.145772963681942e-05, "loss": 1.4823, "step": 28882 }, { "epoch": 2.27, "learning_rate": 4.144919928358457e-05, "loss": 1.4372, "step": 28883 }, { "epoch": 2.27, "learning_rate": 4.1440669667349754e-05, "loss": 1.451, "step": 28884 }, { "epoch": 2.27, "learning_rate": 4.1432140788172826e-05, "loss": 1.4778, "step": 28885 }, { "epoch": 2.27, "learning_rate": 4.1423612646111827e-05, "loss": 1.4374, "step": 28886 }, { "epoch": 2.27, "learning_rate": 4.141508524122456e-05, "loss": 1.4728, "step": 28887 }, { "epoch": 2.27, "learning_rate": 4.1406558573568885e-05, "loss": 1.4427, "step": 28888 }, { "epoch": 2.27, "learning_rate": 4.139803264320281e-05, "loss": 1.5097, "step": 28889 }, { "epoch": 2.27, "learning_rate": 4.138950745018417e-05, "loss": 1.4653, "step": 28890 }, { "epoch": 2.27, "learning_rate": 4.138098299457078e-05, "loss": 1.4761, "step": 28891 }, { "epoch": 2.27, "learning_rate": 4.137245927642061e-05, "loss": 1.4791, "step": 28892 }, { "epoch": 2.27, "learning_rate": 4.136393629579152e-05, "loss": 1.4454, "step": 28893 }, { "epoch": 2.27, "learning_rate": 4.13554140527413e-05, "loss": 1.4768, "step": 28894 }, { "epoch": 2.27, "learning_rate": 4.1346892547327856e-05, "loss": 1.466, "step": 28895 }, { "epoch": 2.27, "learning_rate": 4.133837177960909e-05, "loss": 1.4356, "step": 28896 }, { "epoch": 2.27, "learning_rate": 4.132985174964283e-05, "loss": 1.4412, "step": 28897 }, { "epoch": 2.27, "learning_rate": 4.132133245748685e-05, "loss": 1.437, "step": 28898 }, { "epoch": 2.27, "learning_rate": 4.131281390319911e-05, "loss": 1.4627, "step": 28899 }, { "epoch": 2.27, "learning_rate": 4.130429608683738e-05, "loss": 1.3812, "step": 28900 }, { "epoch": 2.27, "learning_rate": 4.129577900845945e-05, "loss": 1.4578, "step": 28901 }, { "epoch": 2.27, "learning_rate": 4.128726266812323e-05, "loss": 1.4562, "step": 28902 }, { "epoch": 2.27, "learning_rate": 4.12787470658865e-05, "loss": 1.4698, "step": 28903 }, { "epoch": 2.27, "learning_rate": 4.1270232201807095e-05, "loss": 1.5205, "step": 28904 }, { "epoch": 2.27, "learning_rate": 4.126171807594276e-05, "loss": 1.4346, "step": 28905 }, { "epoch": 2.27, "learning_rate": 4.1253204688351405e-05, "loss": 1.4203, "step": 28906 }, { "epoch": 2.27, "learning_rate": 4.1244692039090774e-05, "loss": 1.3855, "step": 28907 }, { "epoch": 2.27, "learning_rate": 4.123618012821862e-05, "loss": 1.4248, "step": 28908 }, { "epoch": 2.27, "learning_rate": 4.122766895579282e-05, "loss": 1.4602, "step": 28909 }, { "epoch": 2.27, "learning_rate": 4.121915852187109e-05, "loss": 1.428, "step": 28910 }, { "epoch": 2.27, "learning_rate": 4.121064882651129e-05, "loss": 1.4371, "step": 28911 }, { "epoch": 2.27, "learning_rate": 4.12021398697711e-05, "loss": 1.4662, "step": 28912 }, { "epoch": 2.27, "learning_rate": 4.119363165170838e-05, "loss": 1.4317, "step": 28913 }, { "epoch": 2.27, "learning_rate": 4.118512417238085e-05, "loss": 1.4676, "step": 28914 }, { "epoch": 2.28, "learning_rate": 4.117661743184625e-05, "loss": 1.4197, "step": 28915 }, { "epoch": 2.28, "learning_rate": 4.116811143016241e-05, "loss": 1.4743, "step": 28916 }, { "epoch": 2.28, "learning_rate": 4.115960616738702e-05, "loss": 1.4927, "step": 28917 }, { "epoch": 2.28, "learning_rate": 4.1151101643577804e-05, "loss": 1.4674, "step": 28918 }, { "epoch": 2.28, "learning_rate": 4.114259785879258e-05, "loss": 1.5218, "step": 28919 }, { "epoch": 2.28, "learning_rate": 4.113409481308905e-05, "loss": 1.4769, "step": 28920 }, { "epoch": 2.28, "learning_rate": 4.112559250652494e-05, "loss": 1.4963, "step": 28921 }, { "epoch": 2.28, "learning_rate": 4.111709093915793e-05, "loss": 1.4383, "step": 28922 }, { "epoch": 2.28, "learning_rate": 4.110859011104583e-05, "loss": 1.4513, "step": 28923 }, { "epoch": 2.28, "learning_rate": 4.1100090022246306e-05, "loss": 1.4835, "step": 28924 }, { "epoch": 2.28, "learning_rate": 4.109159067281703e-05, "loss": 1.4519, "step": 28925 }, { "epoch": 2.28, "learning_rate": 4.108309206281576e-05, "loss": 1.444, "step": 28926 }, { "epoch": 2.28, "learning_rate": 4.107459419230023e-05, "loss": 1.4399, "step": 28927 }, { "epoch": 2.28, "learning_rate": 4.10660970613281e-05, "loss": 1.465, "step": 28928 }, { "epoch": 2.28, "learning_rate": 4.105760066995701e-05, "loss": 1.4425, "step": 28929 }, { "epoch": 2.28, "learning_rate": 4.104910501824473e-05, "loss": 1.4544, "step": 28930 }, { "epoch": 2.28, "learning_rate": 4.104061010624891e-05, "loss": 1.4256, "step": 28931 }, { "epoch": 2.28, "learning_rate": 4.1032115934027165e-05, "loss": 1.4036, "step": 28932 }, { "epoch": 2.28, "learning_rate": 4.1023622501637284e-05, "loss": 1.4065, "step": 28933 }, { "epoch": 2.28, "learning_rate": 4.101512980913685e-05, "loss": 1.4456, "step": 28934 }, { "epoch": 2.28, "learning_rate": 4.1006637856583504e-05, "loss": 1.4669, "step": 28935 }, { "epoch": 2.28, "learning_rate": 4.099814664403498e-05, "loss": 1.4665, "step": 28936 }, { "epoch": 2.28, "learning_rate": 4.098965617154888e-05, "loss": 1.4174, "step": 28937 }, { "epoch": 2.28, "learning_rate": 4.098116643918287e-05, "loss": 1.4664, "step": 28938 }, { "epoch": 2.28, "learning_rate": 4.0972677446994545e-05, "loss": 1.4523, "step": 28939 }, { "epoch": 2.28, "learning_rate": 4.096418919504161e-05, "loss": 1.4606, "step": 28940 }, { "epoch": 2.28, "learning_rate": 4.095570168338165e-05, "loss": 1.4181, "step": 28941 }, { "epoch": 2.28, "learning_rate": 4.094721491207222e-05, "loss": 1.4235, "step": 28942 }, { "epoch": 2.28, "learning_rate": 4.093872888117109e-05, "loss": 1.4926, "step": 28943 }, { "epoch": 2.28, "learning_rate": 4.0930243590735835e-05, "loss": 1.4039, "step": 28944 }, { "epoch": 2.28, "learning_rate": 4.092175904082402e-05, "loss": 1.4511, "step": 28945 }, { "epoch": 2.28, "learning_rate": 4.091327523149322e-05, "loss": 1.4585, "step": 28946 }, { "epoch": 2.28, "learning_rate": 4.0904792162801135e-05, "loss": 1.4277, "step": 28947 }, { "epoch": 2.28, "learning_rate": 4.089630983480531e-05, "loss": 1.4739, "step": 28948 }, { "epoch": 2.28, "learning_rate": 4.088782824756327e-05, "loss": 1.4348, "step": 28949 }, { "epoch": 2.28, "learning_rate": 4.087934740113273e-05, "loss": 1.4863, "step": 28950 }, { "epoch": 2.28, "learning_rate": 4.087086729557118e-05, "loss": 1.4488, "step": 28951 }, { "epoch": 2.28, "learning_rate": 4.08623879309362e-05, "loss": 1.4321, "step": 28952 }, { "epoch": 2.28, "learning_rate": 4.0853909307285396e-05, "loss": 1.4278, "step": 28953 }, { "epoch": 2.28, "learning_rate": 4.0845431424676345e-05, "loss": 1.4783, "step": 28954 }, { "epoch": 2.28, "learning_rate": 4.0836954283166505e-05, "loss": 1.4423, "step": 28955 }, { "epoch": 2.28, "learning_rate": 4.082847788281357e-05, "loss": 1.4938, "step": 28956 }, { "epoch": 2.28, "learning_rate": 4.082000222367497e-05, "loss": 1.3963, "step": 28957 }, { "epoch": 2.28, "learning_rate": 4.081152730580836e-05, "loss": 1.441, "step": 28958 }, { "epoch": 2.28, "learning_rate": 4.080305312927117e-05, "loss": 1.4678, "step": 28959 }, { "epoch": 2.28, "learning_rate": 4.079457969412103e-05, "loss": 1.5053, "step": 28960 }, { "epoch": 2.28, "learning_rate": 4.078610700041544e-05, "loss": 1.4779, "step": 28961 }, { "epoch": 2.28, "learning_rate": 4.07776350482119e-05, "loss": 1.4644, "step": 28962 }, { "epoch": 2.28, "learning_rate": 4.076916383756791e-05, "loss": 1.4509, "step": 28963 }, { "epoch": 2.28, "learning_rate": 4.076069336854107e-05, "loss": 1.4447, "step": 28964 }, { "epoch": 2.28, "learning_rate": 4.075222364118882e-05, "loss": 1.4552, "step": 28965 }, { "epoch": 2.28, "learning_rate": 4.074375465556866e-05, "loss": 1.435, "step": 28966 }, { "epoch": 2.28, "learning_rate": 4.0735286411738146e-05, "loss": 1.4386, "step": 28967 }, { "epoch": 2.28, "learning_rate": 4.072681890975474e-05, "loss": 1.3981, "step": 28968 }, { "epoch": 2.28, "learning_rate": 4.071835214967588e-05, "loss": 1.4185, "step": 28969 }, { "epoch": 2.28, "learning_rate": 4.070988613155917e-05, "loss": 1.5176, "step": 28970 }, { "epoch": 2.28, "learning_rate": 4.0701420855462e-05, "loss": 1.4417, "step": 28971 }, { "epoch": 2.28, "learning_rate": 4.0692956321441825e-05, "loss": 1.4476, "step": 28972 }, { "epoch": 2.28, "learning_rate": 4.068449252955616e-05, "loss": 1.4482, "step": 28973 }, { "epoch": 2.28, "learning_rate": 4.067602947986252e-05, "loss": 1.4565, "step": 28974 }, { "epoch": 2.28, "learning_rate": 4.066756717241829e-05, "loss": 1.479, "step": 28975 }, { "epoch": 2.28, "learning_rate": 4.0659105607280914e-05, "loss": 1.4453, "step": 28976 }, { "epoch": 2.28, "learning_rate": 4.0650644784507916e-05, "loss": 1.4607, "step": 28977 }, { "epoch": 2.28, "learning_rate": 4.06421847041567e-05, "loss": 1.4623, "step": 28978 }, { "epoch": 2.28, "learning_rate": 4.063372536628469e-05, "loss": 1.432, "step": 28979 }, { "epoch": 2.28, "learning_rate": 4.062526677094928e-05, "loss": 1.4726, "step": 28980 }, { "epoch": 2.28, "learning_rate": 4.061680891820801e-05, "loss": 1.4621, "step": 28981 }, { "epoch": 2.28, "learning_rate": 4.060835180811824e-05, "loss": 1.4398, "step": 28982 }, { "epoch": 2.28, "learning_rate": 4.0599895440737355e-05, "loss": 1.4473, "step": 28983 }, { "epoch": 2.28, "learning_rate": 4.059143981612285e-05, "loss": 1.4747, "step": 28984 }, { "epoch": 2.28, "learning_rate": 4.058298493433208e-05, "loss": 1.4714, "step": 28985 }, { "epoch": 2.28, "learning_rate": 4.0574530795422435e-05, "loss": 1.4629, "step": 28986 }, { "epoch": 2.28, "learning_rate": 4.056607739945136e-05, "loss": 1.4503, "step": 28987 }, { "epoch": 2.28, "learning_rate": 4.055762474647626e-05, "loss": 1.4475, "step": 28988 }, { "epoch": 2.28, "learning_rate": 4.054917283655442e-05, "loss": 1.4833, "step": 28989 }, { "epoch": 2.28, "learning_rate": 4.054072166974331e-05, "loss": 1.4833, "step": 28990 }, { "epoch": 2.28, "learning_rate": 4.053227124610034e-05, "loss": 1.4577, "step": 28991 }, { "epoch": 2.28, "learning_rate": 4.052382156568283e-05, "loss": 1.4481, "step": 28992 }, { "epoch": 2.28, "learning_rate": 4.051537262854813e-05, "loss": 1.4392, "step": 28993 }, { "epoch": 2.28, "learning_rate": 4.050692443475367e-05, "loss": 1.4589, "step": 28994 }, { "epoch": 2.28, "learning_rate": 4.049847698435677e-05, "loss": 1.4398, "step": 28995 }, { "epoch": 2.28, "learning_rate": 4.049003027741478e-05, "loss": 1.486, "step": 28996 }, { "epoch": 2.28, "learning_rate": 4.0481584313985e-05, "loss": 1.4609, "step": 28997 }, { "epoch": 2.28, "learning_rate": 4.047313909412487e-05, "loss": 1.4078, "step": 28998 }, { "epoch": 2.28, "learning_rate": 4.04646946178917e-05, "loss": 1.4385, "step": 28999 }, { "epoch": 2.28, "learning_rate": 4.045625088534275e-05, "loss": 1.4178, "step": 29000 }, { "epoch": 2.28, "learning_rate": 4.044780789653546e-05, "loss": 1.508, "step": 29001 }, { "epoch": 2.28, "learning_rate": 4.0439365651527086e-05, "loss": 1.4269, "step": 29002 }, { "epoch": 2.28, "learning_rate": 4.0430924150374916e-05, "loss": 1.4442, "step": 29003 }, { "epoch": 2.28, "learning_rate": 4.0422483393136304e-05, "loss": 1.4924, "step": 29004 }, { "epoch": 2.28, "learning_rate": 4.0414043379868616e-05, "loss": 1.3891, "step": 29005 }, { "epoch": 2.28, "learning_rate": 4.04056041106291e-05, "loss": 1.4711, "step": 29006 }, { "epoch": 2.28, "learning_rate": 4.039716558547499e-05, "loss": 1.4707, "step": 29007 }, { "epoch": 2.28, "learning_rate": 4.0388727804463696e-05, "loss": 1.4461, "step": 29008 }, { "epoch": 2.28, "learning_rate": 4.038029076765245e-05, "loss": 1.4378, "step": 29009 }, { "epoch": 2.28, "learning_rate": 4.0371854475098496e-05, "loss": 1.4682, "step": 29010 }, { "epoch": 2.28, "learning_rate": 4.0363418926859206e-05, "loss": 1.4411, "step": 29011 }, { "epoch": 2.28, "learning_rate": 4.035498412299179e-05, "loss": 1.4896, "step": 29012 }, { "epoch": 2.28, "learning_rate": 4.034655006355348e-05, "loss": 1.4715, "step": 29013 }, { "epoch": 2.28, "learning_rate": 4.033811674860162e-05, "loss": 1.4392, "step": 29014 }, { "epoch": 2.28, "learning_rate": 4.032968417819343e-05, "loss": 1.4255, "step": 29015 }, { "epoch": 2.28, "learning_rate": 4.032125235238618e-05, "loss": 1.4839, "step": 29016 }, { "epoch": 2.28, "learning_rate": 4.031282127123705e-05, "loss": 1.4482, "step": 29017 }, { "epoch": 2.28, "learning_rate": 4.030439093480336e-05, "loss": 1.3805, "step": 29018 }, { "epoch": 2.28, "learning_rate": 4.0295961343142346e-05, "loss": 1.4369, "step": 29019 }, { "epoch": 2.28, "learning_rate": 4.028753249631115e-05, "loss": 1.4072, "step": 29020 }, { "epoch": 2.28, "learning_rate": 4.0279104394367085e-05, "loss": 1.4168, "step": 29021 }, { "epoch": 2.28, "learning_rate": 4.027067703736738e-05, "loss": 1.4761, "step": 29022 }, { "epoch": 2.28, "learning_rate": 4.026225042536923e-05, "loss": 1.4057, "step": 29023 }, { "epoch": 2.28, "learning_rate": 4.02538245584298e-05, "loss": 1.4313, "step": 29024 }, { "epoch": 2.28, "learning_rate": 4.024539943660637e-05, "loss": 1.4718, "step": 29025 }, { "epoch": 2.28, "learning_rate": 4.023697505995613e-05, "loss": 1.4391, "step": 29026 }, { "epoch": 2.28, "learning_rate": 4.0228551428536197e-05, "loss": 1.4742, "step": 29027 }, { "epoch": 2.28, "learning_rate": 4.0220128542403865e-05, "loss": 1.3864, "step": 29028 }, { "epoch": 2.28, "learning_rate": 4.021170640161629e-05, "loss": 1.4949, "step": 29029 }, { "epoch": 2.28, "learning_rate": 4.02032850062306e-05, "loss": 1.3927, "step": 29030 }, { "epoch": 2.28, "learning_rate": 4.019486435630404e-05, "loss": 1.4784, "step": 29031 }, { "epoch": 2.28, "learning_rate": 4.018644445189378e-05, "loss": 1.4386, "step": 29032 }, { "epoch": 2.28, "learning_rate": 4.0178025293056936e-05, "loss": 1.3978, "step": 29033 }, { "epoch": 2.28, "learning_rate": 4.016960687985067e-05, "loss": 1.5011, "step": 29034 }, { "epoch": 2.28, "learning_rate": 4.0161189212332214e-05, "loss": 1.4901, "step": 29035 }, { "epoch": 2.28, "learning_rate": 4.01527722905586e-05, "loss": 1.4806, "step": 29036 }, { "epoch": 2.28, "learning_rate": 4.01443561145871e-05, "loss": 1.4299, "step": 29037 }, { "epoch": 2.28, "learning_rate": 4.0135940684474754e-05, "loss": 1.4225, "step": 29038 }, { "epoch": 2.28, "learning_rate": 4.0127526000278805e-05, "loss": 1.4552, "step": 29039 }, { "epoch": 2.28, "learning_rate": 4.01191120620563e-05, "loss": 1.4474, "step": 29040 }, { "epoch": 2.28, "learning_rate": 4.011069886986434e-05, "loss": 1.4984, "step": 29041 }, { "epoch": 2.29, "learning_rate": 4.010228642376015e-05, "loss": 1.4574, "step": 29042 }, { "epoch": 2.29, "learning_rate": 4.009387472380079e-05, "loss": 1.4475, "step": 29043 }, { "epoch": 2.29, "learning_rate": 4.008546377004331e-05, "loss": 1.4513, "step": 29044 }, { "epoch": 2.29, "learning_rate": 4.007705356254494e-05, "loss": 1.4653, "step": 29045 }, { "epoch": 2.29, "learning_rate": 4.0068644101362696e-05, "loss": 1.4137, "step": 29046 }, { "epoch": 2.29, "learning_rate": 4.0060235386553666e-05, "loss": 1.4425, "step": 29047 }, { "epoch": 2.29, "learning_rate": 4.0051827418175e-05, "loss": 1.4615, "step": 29048 }, { "epoch": 2.29, "learning_rate": 4.0043420196283756e-05, "loss": 1.3843, "step": 29049 }, { "epoch": 2.29, "learning_rate": 4.0035013720937e-05, "loss": 1.4487, "step": 29050 }, { "epoch": 2.29, "learning_rate": 4.002660799219178e-05, "loss": 1.4454, "step": 29051 }, { "epoch": 2.29, "learning_rate": 4.0018203010105216e-05, "loss": 1.4106, "step": 29052 }, { "epoch": 2.29, "learning_rate": 4.000979877473439e-05, "loss": 1.4369, "step": 29053 }, { "epoch": 2.29, "learning_rate": 4.000139528613629e-05, "loss": 1.3957, "step": 29054 }, { "epoch": 2.29, "learning_rate": 3.9992992544368064e-05, "loss": 1.4634, "step": 29055 }, { "epoch": 2.29, "learning_rate": 3.998459054948671e-05, "loss": 1.46, "step": 29056 }, { "epoch": 2.29, "learning_rate": 3.997618930154927e-05, "loss": 1.4536, "step": 29057 }, { "epoch": 2.29, "learning_rate": 3.996778880061275e-05, "loss": 1.4905, "step": 29058 }, { "epoch": 2.29, "learning_rate": 3.995938904673426e-05, "loss": 1.4339, "step": 29059 }, { "epoch": 2.29, "learning_rate": 3.99509900399708e-05, "loss": 1.4672, "step": 29060 }, { "epoch": 2.29, "learning_rate": 3.994259178037934e-05, "loss": 1.4671, "step": 29061 }, { "epoch": 2.29, "learning_rate": 3.9934194268017e-05, "loss": 1.5185, "step": 29062 }, { "epoch": 2.29, "learning_rate": 3.992579750294073e-05, "loss": 1.4867, "step": 29063 }, { "epoch": 2.29, "learning_rate": 3.9917401485207504e-05, "loss": 1.5055, "step": 29064 }, { "epoch": 2.29, "learning_rate": 3.990900621487442e-05, "loss": 1.4928, "step": 29065 }, { "epoch": 2.29, "learning_rate": 3.990061169199843e-05, "loss": 1.4286, "step": 29066 }, { "epoch": 2.29, "learning_rate": 3.98922179166365e-05, "loss": 1.4408, "step": 29067 }, { "epoch": 2.29, "learning_rate": 3.9883824888845636e-05, "loss": 1.4854, "step": 29068 }, { "epoch": 2.29, "learning_rate": 3.987543260868288e-05, "loss": 1.4638, "step": 29069 }, { "epoch": 2.29, "learning_rate": 3.986704107620517e-05, "loss": 1.4651, "step": 29070 }, { "epoch": 2.29, "learning_rate": 3.985865029146941e-05, "loss": 1.4701, "step": 29071 }, { "epoch": 2.29, "learning_rate": 3.9850260254532693e-05, "loss": 1.3882, "step": 29072 }, { "epoch": 2.29, "learning_rate": 3.984187096545194e-05, "loss": 1.4642, "step": 29073 }, { "epoch": 2.29, "learning_rate": 3.983348242428406e-05, "loss": 1.4734, "step": 29074 }, { "epoch": 2.29, "learning_rate": 3.982509463108603e-05, "loss": 1.469, "step": 29075 }, { "epoch": 2.29, "learning_rate": 3.981670758591483e-05, "loss": 1.4329, "step": 29076 }, { "epoch": 2.29, "learning_rate": 3.980832128882737e-05, "loss": 1.3651, "step": 29077 }, { "epoch": 2.29, "learning_rate": 3.979993573988057e-05, "loss": 1.4356, "step": 29078 }, { "epoch": 2.29, "learning_rate": 3.979155093913143e-05, "loss": 1.4469, "step": 29079 }, { "epoch": 2.29, "learning_rate": 3.9783166886636856e-05, "loss": 1.4742, "step": 29080 }, { "epoch": 2.29, "learning_rate": 3.977478358245371e-05, "loss": 1.4282, "step": 29081 }, { "epoch": 2.29, "learning_rate": 3.9766401026638985e-05, "loss": 1.3853, "step": 29082 }, { "epoch": 2.29, "learning_rate": 3.9758019219249525e-05, "loss": 1.4385, "step": 29083 }, { "epoch": 2.29, "learning_rate": 3.974963816034233e-05, "loss": 1.4735, "step": 29084 }, { "epoch": 2.29, "learning_rate": 3.974125784997421e-05, "loss": 1.4895, "step": 29085 }, { "epoch": 2.29, "learning_rate": 3.973287828820215e-05, "loss": 1.4661, "step": 29086 }, { "epoch": 2.29, "learning_rate": 3.972449947508297e-05, "loss": 1.4679, "step": 29087 }, { "epoch": 2.29, "learning_rate": 3.971612141067356e-05, "loss": 1.4238, "step": 29088 }, { "epoch": 2.29, "learning_rate": 3.9707744095030876e-05, "loss": 1.4437, "step": 29089 }, { "epoch": 2.29, "learning_rate": 3.969936752821173e-05, "loss": 1.4299, "step": 29090 }, { "epoch": 2.29, "learning_rate": 3.9690991710273005e-05, "loss": 1.448, "step": 29091 }, { "epoch": 2.29, "learning_rate": 3.968261664127155e-05, "loss": 1.4406, "step": 29092 }, { "epoch": 2.29, "learning_rate": 3.967424232126429e-05, "loss": 1.424, "step": 29093 }, { "epoch": 2.29, "learning_rate": 3.9665868750308034e-05, "loss": 1.4647, "step": 29094 }, { "epoch": 2.29, "learning_rate": 3.965749592845959e-05, "loss": 1.4468, "step": 29095 }, { "epoch": 2.29, "learning_rate": 3.96491238557759e-05, "loss": 1.4554, "step": 29096 }, { "epoch": 2.29, "learning_rate": 3.964075253231377e-05, "loss": 1.4582, "step": 29097 }, { "epoch": 2.29, "learning_rate": 3.963238195813e-05, "loss": 1.5159, "step": 29098 }, { "epoch": 2.29, "learning_rate": 3.962401213328143e-05, "loss": 1.5163, "step": 29099 }, { "epoch": 2.29, "learning_rate": 3.961564305782497e-05, "loss": 1.4885, "step": 29100 }, { "epoch": 2.29, "learning_rate": 3.9607274731817356e-05, "loss": 1.4777, "step": 29101 }, { "epoch": 2.29, "learning_rate": 3.95989071553154e-05, "loss": 1.4083, "step": 29102 }, { "epoch": 2.29, "learning_rate": 3.9590540328375974e-05, "loss": 1.4443, "step": 29103 }, { "epoch": 2.29, "learning_rate": 3.958217425105585e-05, "loss": 1.4138, "step": 29104 }, { "epoch": 2.29, "learning_rate": 3.957380892341179e-05, "loss": 1.4415, "step": 29105 }, { "epoch": 2.29, "learning_rate": 3.956544434550068e-05, "loss": 1.4658, "step": 29106 }, { "epoch": 2.29, "learning_rate": 3.955708051737925e-05, "loss": 1.4623, "step": 29107 }, { "epoch": 2.29, "learning_rate": 3.95487174391043e-05, "loss": 1.4244, "step": 29108 }, { "epoch": 2.29, "learning_rate": 3.954035511073256e-05, "loss": 1.507, "step": 29109 }, { "epoch": 2.29, "learning_rate": 3.953199353232089e-05, "loss": 1.4602, "step": 29110 }, { "epoch": 2.29, "learning_rate": 3.952363270392603e-05, "loss": 1.4832, "step": 29111 }, { "epoch": 2.29, "learning_rate": 3.95152726256047e-05, "loss": 1.4334, "step": 29112 }, { "epoch": 2.29, "learning_rate": 3.950691329741373e-05, "loss": 1.4376, "step": 29113 }, { "epoch": 2.29, "learning_rate": 3.9498554719409804e-05, "loss": 1.4725, "step": 29114 }, { "epoch": 2.29, "learning_rate": 3.949019689164976e-05, "loss": 1.4173, "step": 29115 }, { "epoch": 2.29, "learning_rate": 3.948183981419024e-05, "loss": 1.5424, "step": 29116 }, { "epoch": 2.29, "learning_rate": 3.94734834870881e-05, "loss": 1.4163, "step": 29117 }, { "epoch": 2.29, "learning_rate": 3.94651279104e-05, "loss": 1.4488, "step": 29118 }, { "epoch": 2.29, "learning_rate": 3.945677308418264e-05, "loss": 1.4704, "step": 29119 }, { "epoch": 2.29, "learning_rate": 3.944841900849284e-05, "loss": 1.3841, "step": 29120 }, { "epoch": 2.29, "learning_rate": 3.944006568338726e-05, "loss": 1.3952, "step": 29121 }, { "epoch": 2.29, "learning_rate": 3.943171310892259e-05, "loss": 1.4607, "step": 29122 }, { "epoch": 2.29, "learning_rate": 3.94233612851556e-05, "loss": 1.4157, "step": 29123 }, { "epoch": 2.29, "learning_rate": 3.941501021214297e-05, "loss": 1.467, "step": 29124 }, { "epoch": 2.29, "learning_rate": 3.940665988994135e-05, "loss": 1.5205, "step": 29125 }, { "epoch": 2.29, "learning_rate": 3.939831031860753e-05, "loss": 1.4923, "step": 29126 }, { "epoch": 2.29, "learning_rate": 3.938996149819814e-05, "loss": 1.4288, "step": 29127 }, { "epoch": 2.29, "learning_rate": 3.938161342876988e-05, "loss": 1.4451, "step": 29128 }, { "epoch": 2.29, "learning_rate": 3.9373266110379376e-05, "loss": 1.4109, "step": 29129 }, { "epoch": 2.29, "learning_rate": 3.9364919543083345e-05, "loss": 1.4187, "step": 29130 }, { "epoch": 2.29, "learning_rate": 3.935657372693849e-05, "loss": 1.4303, "step": 29131 }, { "epoch": 2.29, "learning_rate": 3.9348228662001446e-05, "loss": 1.4454, "step": 29132 }, { "epoch": 2.29, "learning_rate": 3.933988434832884e-05, "loss": 1.4836, "step": 29133 }, { "epoch": 2.29, "learning_rate": 3.9331540785977366e-05, "loss": 1.4726, "step": 29134 }, { "epoch": 2.29, "learning_rate": 3.9323197975003676e-05, "loss": 1.4911, "step": 29135 }, { "epoch": 2.29, "learning_rate": 3.931485591546436e-05, "loss": 1.4518, "step": 29136 }, { "epoch": 2.29, "learning_rate": 3.930651460741612e-05, "loss": 1.4056, "step": 29137 }, { "epoch": 2.29, "learning_rate": 3.929817405091556e-05, "loss": 1.4267, "step": 29138 }, { "epoch": 2.29, "learning_rate": 3.9289834246019274e-05, "loss": 1.4806, "step": 29139 }, { "epoch": 2.29, "learning_rate": 3.928149519278395e-05, "loss": 1.4424, "step": 29140 }, { "epoch": 2.29, "learning_rate": 3.927315689126618e-05, "loss": 1.4503, "step": 29141 }, { "epoch": 2.29, "learning_rate": 3.926481934152252e-05, "loss": 1.4753, "step": 29142 }, { "epoch": 2.29, "learning_rate": 3.9256482543609696e-05, "loss": 1.4403, "step": 29143 }, { "epoch": 2.29, "learning_rate": 3.924814649758422e-05, "loss": 1.494, "step": 29144 }, { "epoch": 2.29, "learning_rate": 3.923981120350272e-05, "loss": 1.41, "step": 29145 }, { "epoch": 2.29, "learning_rate": 3.923147666142168e-05, "loss": 1.4351, "step": 29146 }, { "epoch": 2.29, "learning_rate": 3.9223142871397886e-05, "loss": 1.4439, "step": 29147 }, { "epoch": 2.29, "learning_rate": 3.921480983348782e-05, "loss": 1.4228, "step": 29148 }, { "epoch": 2.29, "learning_rate": 3.920647754774806e-05, "loss": 1.4479, "step": 29149 }, { "epoch": 2.29, "learning_rate": 3.919814601423513e-05, "loss": 1.3798, "step": 29150 }, { "epoch": 2.29, "learning_rate": 3.918981523300569e-05, "loss": 1.4501, "step": 29151 }, { "epoch": 2.29, "learning_rate": 3.9181485204116234e-05, "loss": 1.4349, "step": 29152 }, { "epoch": 2.29, "learning_rate": 3.917315592762331e-05, "loss": 1.5113, "step": 29153 }, { "epoch": 2.29, "learning_rate": 3.9164827403583554e-05, "loss": 1.4266, "step": 29154 }, { "epoch": 2.29, "learning_rate": 3.915649963205343e-05, "loss": 1.4297, "step": 29155 }, { "epoch": 2.29, "learning_rate": 3.914817261308949e-05, "loss": 1.468, "step": 29156 }, { "epoch": 2.29, "learning_rate": 3.913984634674831e-05, "loss": 1.4588, "step": 29157 }, { "epoch": 2.29, "learning_rate": 3.91315208330864e-05, "loss": 1.4432, "step": 29158 }, { "epoch": 2.29, "learning_rate": 3.912319607216025e-05, "loss": 1.4648, "step": 29159 }, { "epoch": 2.29, "learning_rate": 3.911487206402644e-05, "loss": 1.4972, "step": 29160 }, { "epoch": 2.29, "learning_rate": 3.910654880874146e-05, "loss": 1.4472, "step": 29161 }, { "epoch": 2.29, "learning_rate": 3.909822630636178e-05, "loss": 1.4858, "step": 29162 }, { "epoch": 2.29, "learning_rate": 3.908990455694393e-05, "loss": 1.4874, "step": 29163 }, { "epoch": 2.29, "learning_rate": 3.9081583560544465e-05, "loss": 1.4007, "step": 29164 }, { "epoch": 2.29, "learning_rate": 3.907326331721985e-05, "loss": 1.4624, "step": 29165 }, { "epoch": 2.29, "learning_rate": 3.906494382702652e-05, "loss": 1.4506, "step": 29166 }, { "epoch": 2.29, "learning_rate": 3.9056625090021045e-05, "loss": 1.5162, "step": 29167 }, { "epoch": 2.29, "learning_rate": 3.904830710625985e-05, "loss": 1.4952, "step": 29168 }, { "epoch": 2.3, "learning_rate": 3.9039989875799435e-05, "loss": 1.4452, "step": 29169 }, { "epoch": 2.3, "learning_rate": 3.9031673398696206e-05, "loss": 1.4378, "step": 29170 }, { "epoch": 2.3, "learning_rate": 3.9023357675006714e-05, "loss": 1.446, "step": 29171 }, { "epoch": 2.3, "learning_rate": 3.9015042704787384e-05, "loss": 1.4401, "step": 29172 }, { "epoch": 2.3, "learning_rate": 3.9006728488094635e-05, "loss": 1.4639, "step": 29173 }, { "epoch": 2.3, "learning_rate": 3.899841502498498e-05, "loss": 1.3643, "step": 29174 }, { "epoch": 2.3, "learning_rate": 3.899010231551484e-05, "loss": 1.4457, "step": 29175 }, { "epoch": 2.3, "learning_rate": 3.898179035974061e-05, "loss": 1.4471, "step": 29176 }, { "epoch": 2.3, "learning_rate": 3.897347915771874e-05, "loss": 1.5455, "step": 29177 }, { "epoch": 2.3, "learning_rate": 3.8965168709505734e-05, "loss": 1.4399, "step": 29178 }, { "epoch": 2.3, "learning_rate": 3.895685901515795e-05, "loss": 1.4036, "step": 29179 }, { "epoch": 2.3, "learning_rate": 3.894855007473177e-05, "loss": 1.4168, "step": 29180 }, { "epoch": 2.3, "learning_rate": 3.8940241888283705e-05, "loss": 1.4331, "step": 29181 }, { "epoch": 2.3, "learning_rate": 3.8931934455870095e-05, "loss": 1.4398, "step": 29182 }, { "epoch": 2.3, "learning_rate": 3.892362777754732e-05, "loss": 1.4159, "step": 29183 }, { "epoch": 2.3, "learning_rate": 3.8915321853371865e-05, "loss": 1.448, "step": 29184 }, { "epoch": 2.3, "learning_rate": 3.890701668340007e-05, "loss": 1.4748, "step": 29185 }, { "epoch": 2.3, "learning_rate": 3.8898712267688324e-05, "loss": 1.4411, "step": 29186 }, { "epoch": 2.3, "learning_rate": 3.8890408606292975e-05, "loss": 1.4562, "step": 29187 }, { "epoch": 2.3, "learning_rate": 3.8882105699270474e-05, "loss": 1.4841, "step": 29188 }, { "epoch": 2.3, "learning_rate": 3.8873803546677146e-05, "loss": 1.4653, "step": 29189 }, { "epoch": 2.3, "learning_rate": 3.8865502148569336e-05, "loss": 1.4139, "step": 29190 }, { "epoch": 2.3, "learning_rate": 3.8857201505003476e-05, "loss": 1.4505, "step": 29191 }, { "epoch": 2.3, "learning_rate": 3.8848901616035884e-05, "loss": 1.4577, "step": 29192 }, { "epoch": 2.3, "learning_rate": 3.884060248172288e-05, "loss": 1.5082, "step": 29193 }, { "epoch": 2.3, "learning_rate": 3.883230410212083e-05, "loss": 1.457, "step": 29194 }, { "epoch": 2.3, "learning_rate": 3.8824006477286135e-05, "loss": 1.5146, "step": 29195 }, { "epoch": 2.3, "learning_rate": 3.8815709607275074e-05, "loss": 1.4308, "step": 29196 }, { "epoch": 2.3, "learning_rate": 3.8807413492143957e-05, "loss": 1.4849, "step": 29197 }, { "epoch": 2.3, "learning_rate": 3.879911813194917e-05, "loss": 1.3727, "step": 29198 }, { "epoch": 2.3, "learning_rate": 3.879082352674702e-05, "loss": 1.4926, "step": 29199 }, { "epoch": 2.3, "learning_rate": 3.878252967659377e-05, "loss": 1.4577, "step": 29200 }, { "epoch": 2.3, "learning_rate": 3.87742365815458e-05, "loss": 1.4549, "step": 29201 }, { "epoch": 2.3, "learning_rate": 3.876594424165939e-05, "loss": 1.4128, "step": 29202 }, { "epoch": 2.3, "learning_rate": 3.8757652656990825e-05, "loss": 1.4569, "step": 29203 }, { "epoch": 2.3, "learning_rate": 3.874936182759637e-05, "loss": 1.4482, "step": 29204 }, { "epoch": 2.3, "learning_rate": 3.87410717535324e-05, "loss": 1.4152, "step": 29205 }, { "epoch": 2.3, "learning_rate": 3.873278243485516e-05, "loss": 1.4384, "step": 29206 }, { "epoch": 2.3, "learning_rate": 3.872449387162087e-05, "loss": 1.4431, "step": 29207 }, { "epoch": 2.3, "learning_rate": 3.8716206063885925e-05, "loss": 1.4497, "step": 29208 }, { "epoch": 2.3, "learning_rate": 3.8707919011706464e-05, "loss": 1.4029, "step": 29209 }, { "epoch": 2.3, "learning_rate": 3.869963271513887e-05, "loss": 1.4599, "step": 29210 }, { "epoch": 2.3, "learning_rate": 3.8691347174239294e-05, "loss": 1.4265, "step": 29211 }, { "epoch": 2.3, "learning_rate": 3.86830623890641e-05, "loss": 1.4655, "step": 29212 }, { "epoch": 2.3, "learning_rate": 3.867477835966949e-05, "loss": 1.4639, "step": 29213 }, { "epoch": 2.3, "learning_rate": 3.8666495086111646e-05, "loss": 1.4713, "step": 29214 }, { "epoch": 2.3, "learning_rate": 3.86582125684469e-05, "loss": 1.4996, "step": 29215 }, { "epoch": 2.3, "learning_rate": 3.864993080673146e-05, "loss": 1.4718, "step": 29216 }, { "epoch": 2.3, "learning_rate": 3.86416498010215e-05, "loss": 1.4766, "step": 29217 }, { "epoch": 2.3, "learning_rate": 3.863336955137331e-05, "loss": 1.4871, "step": 29218 }, { "epoch": 2.3, "learning_rate": 3.8625090057843104e-05, "loss": 1.4315, "step": 29219 }, { "epoch": 2.3, "learning_rate": 3.861681132048702e-05, "loss": 1.4491, "step": 29220 }, { "epoch": 2.3, "learning_rate": 3.860853333936137e-05, "loss": 1.4495, "step": 29221 }, { "epoch": 2.3, "learning_rate": 3.86002561145223e-05, "loss": 1.4574, "step": 29222 }, { "epoch": 2.3, "learning_rate": 3.859197964602601e-05, "loss": 1.4116, "step": 29223 }, { "epoch": 2.3, "learning_rate": 3.858370393392863e-05, "loss": 1.4873, "step": 29224 }, { "epoch": 2.3, "learning_rate": 3.857542897828649e-05, "loss": 1.4544, "step": 29225 }, { "epoch": 2.3, "learning_rate": 3.8567154779155704e-05, "loss": 1.4747, "step": 29226 }, { "epoch": 2.3, "learning_rate": 3.855888133659244e-05, "loss": 1.414, "step": 29227 }, { "epoch": 2.3, "learning_rate": 3.855060865065284e-05, "loss": 1.4424, "step": 29228 }, { "epoch": 2.3, "learning_rate": 3.854233672139313e-05, "loss": 1.4861, "step": 29229 }, { "epoch": 2.3, "learning_rate": 3.853406554886946e-05, "loss": 1.4756, "step": 29230 }, { "epoch": 2.3, "learning_rate": 3.8525795133137915e-05, "loss": 1.4621, "step": 29231 }, { "epoch": 2.3, "learning_rate": 3.851752547425477e-05, "loss": 1.4394, "step": 29232 }, { "epoch": 2.3, "learning_rate": 3.8509256572276087e-05, "loss": 1.4317, "step": 29233 }, { "epoch": 2.3, "learning_rate": 3.8500988427258e-05, "loss": 1.4409, "step": 29234 }, { "epoch": 2.3, "learning_rate": 3.84927210392567e-05, "loss": 1.4757, "step": 29235 }, { "epoch": 2.3, "learning_rate": 3.84844544083283e-05, "loss": 1.4709, "step": 29236 }, { "epoch": 2.3, "learning_rate": 3.847618853452885e-05, "loss": 1.4187, "step": 29237 }, { "epoch": 2.3, "learning_rate": 3.8467923417914605e-05, "loss": 1.4785, "step": 29238 }, { "epoch": 2.3, "learning_rate": 3.845965905854159e-05, "loss": 1.4557, "step": 29239 }, { "epoch": 2.3, "learning_rate": 3.845139545646591e-05, "loss": 1.4761, "step": 29240 }, { "epoch": 2.3, "learning_rate": 3.844313261174368e-05, "loss": 1.4112, "step": 29241 }, { "epoch": 2.3, "learning_rate": 3.8434870524431076e-05, "loss": 1.4333, "step": 29242 }, { "epoch": 2.3, "learning_rate": 3.842660919458414e-05, "loss": 1.4744, "step": 29243 }, { "epoch": 2.3, "learning_rate": 3.841834862225894e-05, "loss": 1.4635, "step": 29244 }, { "epoch": 2.3, "learning_rate": 3.841008880751154e-05, "loss": 1.4605, "step": 29245 }, { "epoch": 2.3, "learning_rate": 3.840182975039811e-05, "loss": 1.4506, "step": 29246 }, { "epoch": 2.3, "learning_rate": 3.839357145097466e-05, "loss": 1.4209, "step": 29247 }, { "epoch": 2.3, "learning_rate": 3.838531390929722e-05, "loss": 1.4333, "step": 29248 }, { "epoch": 2.3, "learning_rate": 3.8377057125421976e-05, "loss": 1.4642, "step": 29249 }, { "epoch": 2.3, "learning_rate": 3.836880109940488e-05, "loss": 1.4562, "step": 29250 }, { "epoch": 2.3, "learning_rate": 3.836054583130199e-05, "loss": 1.4789, "step": 29251 }, { "epoch": 2.3, "learning_rate": 3.835229132116944e-05, "loss": 1.4386, "step": 29252 }, { "epoch": 2.3, "learning_rate": 3.834403756906322e-05, "loss": 1.4968, "step": 29253 }, { "epoch": 2.3, "learning_rate": 3.833578457503931e-05, "loss": 1.4535, "step": 29254 }, { "epoch": 2.3, "learning_rate": 3.832753233915386e-05, "loss": 1.4828, "step": 29255 }, { "epoch": 2.3, "learning_rate": 3.8319280861462787e-05, "loss": 1.4823, "step": 29256 }, { "epoch": 2.3, "learning_rate": 3.8311030142022206e-05, "loss": 1.4291, "step": 29257 }, { "epoch": 2.3, "learning_rate": 3.830278018088807e-05, "loss": 1.4353, "step": 29258 }, { "epoch": 2.3, "learning_rate": 3.8294530978116445e-05, "loss": 1.4761, "step": 29259 }, { "epoch": 2.3, "learning_rate": 3.8286282533763304e-05, "loss": 1.4417, "step": 29260 }, { "epoch": 2.3, "learning_rate": 3.827803484788468e-05, "loss": 1.4394, "step": 29261 }, { "epoch": 2.3, "learning_rate": 3.826978792053647e-05, "loss": 1.4149, "step": 29262 }, { "epoch": 2.3, "learning_rate": 3.826154175177481e-05, "loss": 1.396, "step": 29263 }, { "epoch": 2.3, "learning_rate": 3.8253296341655616e-05, "loss": 1.4726, "step": 29264 }, { "epoch": 2.3, "learning_rate": 3.8245051690234826e-05, "loss": 1.4653, "step": 29265 }, { "epoch": 2.3, "learning_rate": 3.8236807797568505e-05, "loss": 1.4706, "step": 29266 }, { "epoch": 2.3, "learning_rate": 3.822856466371259e-05, "loss": 1.4986, "step": 29267 }, { "epoch": 2.3, "learning_rate": 3.8220322288722995e-05, "loss": 1.4219, "step": 29268 }, { "epoch": 2.3, "learning_rate": 3.8212080672655757e-05, "loss": 1.4892, "step": 29269 }, { "epoch": 2.3, "learning_rate": 3.8203839815566813e-05, "loss": 1.4393, "step": 29270 }, { "epoch": 2.3, "learning_rate": 3.8195599717512056e-05, "loss": 1.4755, "step": 29271 }, { "epoch": 2.3, "learning_rate": 3.818736037854747e-05, "loss": 1.452, "step": 29272 }, { "epoch": 2.3, "learning_rate": 3.817912179872907e-05, "loss": 1.459, "step": 29273 }, { "epoch": 2.3, "learning_rate": 3.8170883978112716e-05, "loss": 1.4454, "step": 29274 }, { "epoch": 2.3, "learning_rate": 3.816264691675429e-05, "loss": 1.466, "step": 29275 }, { "epoch": 2.3, "learning_rate": 3.815441061470984e-05, "loss": 1.4261, "step": 29276 }, { "epoch": 2.3, "learning_rate": 3.81461750720352e-05, "loss": 1.4352, "step": 29277 }, { "epoch": 2.3, "learning_rate": 3.813794028878627e-05, "loss": 1.4418, "step": 29278 }, { "epoch": 2.3, "learning_rate": 3.8129706265019037e-05, "loss": 1.5267, "step": 29279 }, { "epoch": 2.3, "learning_rate": 3.812147300078937e-05, "loss": 1.4576, "step": 29280 }, { "epoch": 2.3, "learning_rate": 3.8113240496153156e-05, "loss": 1.4537, "step": 29281 }, { "epoch": 2.3, "learning_rate": 3.8105008751166236e-05, "loss": 1.4725, "step": 29282 }, { "epoch": 2.3, "learning_rate": 3.809677776588463e-05, "loss": 1.48, "step": 29283 }, { "epoch": 2.3, "learning_rate": 3.8088547540364135e-05, "loss": 1.5164, "step": 29284 }, { "epoch": 2.3, "learning_rate": 3.808031807466059e-05, "loss": 1.4198, "step": 29285 }, { "epoch": 2.3, "learning_rate": 3.807208936882998e-05, "loss": 1.479, "step": 29286 }, { "epoch": 2.3, "learning_rate": 3.806386142292808e-05, "loss": 1.422, "step": 29287 }, { "epoch": 2.3, "learning_rate": 3.805563423701083e-05, "loss": 1.4492, "step": 29288 }, { "epoch": 2.3, "learning_rate": 3.8047407811133994e-05, "loss": 1.4481, "step": 29289 }, { "epoch": 2.3, "learning_rate": 3.803918214535353e-05, "loss": 1.4631, "step": 29290 }, { "epoch": 2.3, "learning_rate": 3.803095723972522e-05, "loss": 1.4727, "step": 29291 }, { "epoch": 2.3, "learning_rate": 3.8022733094304896e-05, "loss": 1.482, "step": 29292 }, { "epoch": 2.3, "learning_rate": 3.8014509709148456e-05, "loss": 1.4606, "step": 29293 }, { "epoch": 2.3, "learning_rate": 3.800628708431169e-05, "loss": 1.4697, "step": 29294 }, { "epoch": 2.3, "learning_rate": 3.79980652198504e-05, "loss": 1.4436, "step": 29295 }, { "epoch": 2.31, "learning_rate": 3.798984411582048e-05, "loss": 1.4183, "step": 29296 }, { "epoch": 2.31, "learning_rate": 3.7981623772277694e-05, "loss": 1.4689, "step": 29297 }, { "epoch": 2.31, "learning_rate": 3.7973404189277876e-05, "loss": 1.449, "step": 29298 }, { "epoch": 2.31, "learning_rate": 3.7965185366876776e-05, "loss": 1.4967, "step": 29299 }, { "epoch": 2.31, "learning_rate": 3.795696730513028e-05, "loss": 1.4489, "step": 29300 }, { "epoch": 2.31, "learning_rate": 3.7948750004094166e-05, "loss": 1.4893, "step": 29301 }, { "epoch": 2.31, "learning_rate": 3.7940533463824146e-05, "loss": 1.4111, "step": 29302 }, { "epoch": 2.31, "learning_rate": 3.7932317684376054e-05, "loss": 1.4896, "step": 29303 }, { "epoch": 2.31, "learning_rate": 3.792410266580573e-05, "loss": 1.3941, "step": 29304 }, { "epoch": 2.31, "learning_rate": 3.7915888408168915e-05, "loss": 1.5065, "step": 29305 }, { "epoch": 2.31, "learning_rate": 3.790767491152132e-05, "loss": 1.5066, "step": 29306 }, { "epoch": 2.31, "learning_rate": 3.789946217591878e-05, "loss": 1.4628, "step": 29307 }, { "epoch": 2.31, "learning_rate": 3.7891250201417046e-05, "loss": 1.4539, "step": 29308 }, { "epoch": 2.31, "learning_rate": 3.7883038988071794e-05, "loss": 1.4321, "step": 29309 }, { "epoch": 2.31, "learning_rate": 3.78748285359389e-05, "loss": 1.5047, "step": 29310 }, { "epoch": 2.31, "learning_rate": 3.7866618845074035e-05, "loss": 1.4136, "step": 29311 }, { "epoch": 2.31, "learning_rate": 3.785840991553291e-05, "loss": 1.4721, "step": 29312 }, { "epoch": 2.31, "learning_rate": 3.785020174737134e-05, "loss": 1.4683, "step": 29313 }, { "epoch": 2.31, "learning_rate": 3.7841994340645004e-05, "loss": 1.4475, "step": 29314 }, { "epoch": 2.31, "learning_rate": 3.7833787695409626e-05, "loss": 1.4551, "step": 29315 }, { "epoch": 2.31, "learning_rate": 3.7825581811720896e-05, "loss": 1.4198, "step": 29316 }, { "epoch": 2.31, "learning_rate": 3.781737668963461e-05, "loss": 1.382, "step": 29317 }, { "epoch": 2.31, "learning_rate": 3.780917232920643e-05, "loss": 1.4766, "step": 29318 }, { "epoch": 2.31, "learning_rate": 3.780096873049197e-05, "loss": 1.4431, "step": 29319 }, { "epoch": 2.31, "learning_rate": 3.77927658935471e-05, "loss": 1.4297, "step": 29320 }, { "epoch": 2.31, "learning_rate": 3.778456381842742e-05, "loss": 1.4697, "step": 29321 }, { "epoch": 2.31, "learning_rate": 3.777636250518864e-05, "loss": 1.4609, "step": 29322 }, { "epoch": 2.31, "learning_rate": 3.776816195388637e-05, "loss": 1.443, "step": 29323 }, { "epoch": 2.31, "learning_rate": 3.775996216457641e-05, "loss": 1.406, "step": 29324 }, { "epoch": 2.31, "learning_rate": 3.775176313731435e-05, "loss": 1.4703, "step": 29325 }, { "epoch": 2.31, "learning_rate": 3.774356487215584e-05, "loss": 1.4694, "step": 29326 }, { "epoch": 2.31, "learning_rate": 3.773536736915662e-05, "loss": 1.4571, "step": 29327 }, { "epoch": 2.31, "learning_rate": 3.7727170628372285e-05, "loss": 1.4434, "step": 29328 }, { "epoch": 2.31, "learning_rate": 3.771897464985848e-05, "loss": 1.4165, "step": 29329 }, { "epoch": 2.31, "learning_rate": 3.7710779433670915e-05, "loss": 1.4714, "step": 29330 }, { "epoch": 2.31, "learning_rate": 3.7702584979865186e-05, "loss": 1.4516, "step": 29331 }, { "epoch": 2.31, "learning_rate": 3.7694391288496886e-05, "loss": 1.4045, "step": 29332 }, { "epoch": 2.31, "learning_rate": 3.768619835962176e-05, "loss": 1.4503, "step": 29333 }, { "epoch": 2.31, "learning_rate": 3.767800619329531e-05, "loss": 1.4004, "step": 29334 }, { "epoch": 2.31, "learning_rate": 3.766981478957325e-05, "loss": 1.4606, "step": 29335 }, { "epoch": 2.31, "learning_rate": 3.7661624148511125e-05, "loss": 1.4509, "step": 29336 }, { "epoch": 2.31, "learning_rate": 3.765343427016463e-05, "loss": 1.4751, "step": 29337 }, { "epoch": 2.31, "learning_rate": 3.764524515458929e-05, "loss": 1.4606, "step": 29338 }, { "epoch": 2.31, "learning_rate": 3.763705680184076e-05, "loss": 1.4599, "step": 29339 }, { "epoch": 2.31, "learning_rate": 3.762886921197455e-05, "loss": 1.469, "step": 29340 }, { "epoch": 2.31, "learning_rate": 3.762068238504635e-05, "loss": 1.4395, "step": 29341 }, { "epoch": 2.31, "learning_rate": 3.761249632111171e-05, "loss": 1.4756, "step": 29342 }, { "epoch": 2.31, "learning_rate": 3.760431102022615e-05, "loss": 1.4128, "step": 29343 }, { "epoch": 2.31, "learning_rate": 3.7596126482445344e-05, "loss": 1.4827, "step": 29344 }, { "epoch": 2.31, "learning_rate": 3.7587942707824805e-05, "loss": 1.4052, "step": 29345 }, { "epoch": 2.31, "learning_rate": 3.757975969642005e-05, "loss": 1.4302, "step": 29346 }, { "epoch": 2.31, "learning_rate": 3.7571577448286734e-05, "loss": 1.4885, "step": 29347 }, { "epoch": 2.31, "learning_rate": 3.756339596348037e-05, "loss": 1.4639, "step": 29348 }, { "epoch": 2.31, "learning_rate": 3.755521524205645e-05, "loss": 1.4423, "step": 29349 }, { "epoch": 2.31, "learning_rate": 3.754703528407057e-05, "loss": 1.4398, "step": 29350 }, { "epoch": 2.31, "learning_rate": 3.753885608957831e-05, "loss": 1.4528, "step": 29351 }, { "epoch": 2.31, "learning_rate": 3.753067765863515e-05, "loss": 1.4308, "step": 29352 }, { "epoch": 2.31, "learning_rate": 3.752249999129659e-05, "loss": 1.4171, "step": 29353 }, { "epoch": 2.31, "learning_rate": 3.751432308761822e-05, "loss": 1.4542, "step": 29354 }, { "epoch": 2.31, "learning_rate": 3.750614694765551e-05, "loss": 1.4119, "step": 29355 }, { "epoch": 2.31, "learning_rate": 3.749797157146401e-05, "loss": 1.4455, "step": 29356 }, { "epoch": 2.31, "learning_rate": 3.748979695909914e-05, "loss": 1.4964, "step": 29357 }, { "epoch": 2.31, "learning_rate": 3.748162311061649e-05, "loss": 1.4755, "step": 29358 }, { "epoch": 2.31, "learning_rate": 3.747345002607154e-05, "loss": 1.4633, "step": 29359 }, { "epoch": 2.31, "learning_rate": 3.746527770551973e-05, "loss": 1.4535, "step": 29360 }, { "epoch": 2.31, "learning_rate": 3.745710614901662e-05, "loss": 1.4545, "step": 29361 }, { "epoch": 2.31, "learning_rate": 3.7448935356617665e-05, "loss": 1.4228, "step": 29362 }, { "epoch": 2.31, "learning_rate": 3.744076532837826e-05, "loss": 1.4707, "step": 29363 }, { "epoch": 2.31, "learning_rate": 3.7432596064354006e-05, "loss": 1.4606, "step": 29364 }, { "epoch": 2.31, "learning_rate": 3.742442756460031e-05, "loss": 1.4737, "step": 29365 }, { "epoch": 2.31, "learning_rate": 3.741625982917256e-05, "loss": 1.4945, "step": 29366 }, { "epoch": 2.31, "learning_rate": 3.7408092858126284e-05, "loss": 1.5138, "step": 29367 }, { "epoch": 2.31, "learning_rate": 3.739992665151697e-05, "loss": 1.5043, "step": 29368 }, { "epoch": 2.31, "learning_rate": 3.7391761209400026e-05, "loss": 1.4003, "step": 29369 }, { "epoch": 2.31, "learning_rate": 3.738359653183083e-05, "loss": 1.4852, "step": 29370 }, { "epoch": 2.31, "learning_rate": 3.7375432618864906e-05, "loss": 1.4485, "step": 29371 }, { "epoch": 2.31, "learning_rate": 3.736726947055766e-05, "loss": 1.4427, "step": 29372 }, { "epoch": 2.31, "learning_rate": 3.7359107086964485e-05, "loss": 1.4558, "step": 29373 }, { "epoch": 2.31, "learning_rate": 3.7350945468140756e-05, "loss": 1.4155, "step": 29374 }, { "epoch": 2.31, "learning_rate": 3.7342784614142005e-05, "loss": 1.4734, "step": 29375 }, { "epoch": 2.31, "learning_rate": 3.733462452502357e-05, "loss": 1.4844, "step": 29376 }, { "epoch": 2.31, "learning_rate": 3.732646520084082e-05, "loss": 1.4578, "step": 29377 }, { "epoch": 2.31, "learning_rate": 3.7318306641649244e-05, "loss": 1.4597, "step": 29378 }, { "epoch": 2.31, "learning_rate": 3.7310148847504174e-05, "loss": 1.4679, "step": 29379 }, { "epoch": 2.31, "learning_rate": 3.730199181846095e-05, "loss": 1.4044, "step": 29380 }, { "epoch": 2.31, "learning_rate": 3.729383555457507e-05, "loss": 1.4484, "step": 29381 }, { "epoch": 2.31, "learning_rate": 3.7285680055901796e-05, "loss": 1.5134, "step": 29382 }, { "epoch": 2.31, "learning_rate": 3.7277525322496606e-05, "loss": 1.4419, "step": 29383 }, { "epoch": 2.31, "learning_rate": 3.726937135441477e-05, "loss": 1.4613, "step": 29384 }, { "epoch": 2.31, "learning_rate": 3.7261218151711743e-05, "loss": 1.4299, "step": 29385 }, { "epoch": 2.31, "learning_rate": 3.7253065714442816e-05, "loss": 1.4348, "step": 29386 }, { "epoch": 2.31, "learning_rate": 3.724491404266331e-05, "loss": 1.4482, "step": 29387 }, { "epoch": 2.31, "learning_rate": 3.7236763136428664e-05, "loss": 1.4274, "step": 29388 }, { "epoch": 2.31, "learning_rate": 3.722861299579417e-05, "loss": 1.3954, "step": 29389 }, { "epoch": 2.31, "learning_rate": 3.722046362081512e-05, "loss": 1.4167, "step": 29390 }, { "epoch": 2.31, "learning_rate": 3.721231501154692e-05, "loss": 1.4611, "step": 29391 }, { "epoch": 2.31, "learning_rate": 3.720416716804486e-05, "loss": 1.471, "step": 29392 }, { "epoch": 2.31, "learning_rate": 3.719602009036426e-05, "loss": 1.483, "step": 29393 }, { "epoch": 2.31, "learning_rate": 3.71878737785604e-05, "loss": 1.493, "step": 29394 }, { "epoch": 2.31, "learning_rate": 3.717972823268866e-05, "loss": 1.4662, "step": 29395 }, { "epoch": 2.31, "learning_rate": 3.717158345280429e-05, "loss": 1.4375, "step": 29396 }, { "epoch": 2.31, "learning_rate": 3.716343943896259e-05, "loss": 1.4667, "step": 29397 }, { "epoch": 2.31, "learning_rate": 3.7155296191218856e-05, "loss": 1.4571, "step": 29398 }, { "epoch": 2.31, "learning_rate": 3.714715370962842e-05, "loss": 1.4021, "step": 29399 }, { "epoch": 2.31, "learning_rate": 3.713901199424654e-05, "loss": 1.45, "step": 29400 }, { "epoch": 2.31, "learning_rate": 3.7130871045128446e-05, "loss": 1.4126, "step": 29401 }, { "epoch": 2.31, "learning_rate": 3.712273086232949e-05, "loss": 1.4802, "step": 29402 }, { "epoch": 2.31, "learning_rate": 3.7114591445904904e-05, "loss": 1.468, "step": 29403 }, { "epoch": 2.31, "learning_rate": 3.710645279590991e-05, "loss": 1.4325, "step": 29404 }, { "epoch": 2.31, "learning_rate": 3.709831491239984e-05, "loss": 1.4655, "step": 29405 }, { "epoch": 2.31, "learning_rate": 3.70901777954299e-05, "loss": 1.4946, "step": 29406 }, { "epoch": 2.31, "learning_rate": 3.708204144505531e-05, "loss": 1.4598, "step": 29407 }, { "epoch": 2.31, "learning_rate": 3.7073905861331376e-05, "loss": 1.4602, "step": 29408 }, { "epoch": 2.31, "learning_rate": 3.706577104431332e-05, "loss": 1.5245, "step": 29409 }, { "epoch": 2.31, "learning_rate": 3.7057636994056346e-05, "loss": 1.5176, "step": 29410 }, { "epoch": 2.31, "learning_rate": 3.7049503710615655e-05, "loss": 1.432, "step": 29411 }, { "epoch": 2.31, "learning_rate": 3.7041371194046535e-05, "loss": 1.4908, "step": 29412 }, { "epoch": 2.31, "learning_rate": 3.703323944440414e-05, "loss": 1.3729, "step": 29413 }, { "epoch": 2.31, "learning_rate": 3.7025108461743735e-05, "loss": 1.4907, "step": 29414 }, { "epoch": 2.31, "learning_rate": 3.701697824612047e-05, "loss": 1.4879, "step": 29415 }, { "epoch": 2.31, "learning_rate": 3.70088487975896e-05, "loss": 1.4523, "step": 29416 }, { "epoch": 2.31, "learning_rate": 3.7000720116206315e-05, "loss": 1.4667, "step": 29417 }, { "epoch": 2.31, "learning_rate": 3.699259220202572e-05, "loss": 1.4241, "step": 29418 }, { "epoch": 2.31, "learning_rate": 3.698446505510311e-05, "loss": 1.446, "step": 29419 }, { "epoch": 2.31, "learning_rate": 3.697633867549363e-05, "loss": 1.4413, "step": 29420 }, { "epoch": 2.31, "learning_rate": 3.696821306325237e-05, "loss": 1.4923, "step": 29421 }, { "epoch": 2.31, "learning_rate": 3.696008821843463e-05, "loss": 1.4189, "step": 29422 }, { "epoch": 2.32, "learning_rate": 3.6951964141095505e-05, "loss": 1.5031, "step": 29423 }, { "epoch": 2.32, "learning_rate": 3.694384083129011e-05, "loss": 1.4192, "step": 29424 }, { "epoch": 2.32, "learning_rate": 3.69357182890737e-05, "loss": 1.4826, "step": 29425 }, { "epoch": 2.32, "learning_rate": 3.692759651450135e-05, "loss": 1.4479, "step": 29426 }, { "epoch": 2.32, "learning_rate": 3.6919475507628244e-05, "loss": 1.403, "step": 29427 }, { "epoch": 2.32, "learning_rate": 3.691135526850945e-05, "loss": 1.4402, "step": 29428 }, { "epoch": 2.32, "learning_rate": 3.6903235797200134e-05, "loss": 1.4696, "step": 29429 }, { "epoch": 2.32, "learning_rate": 3.689511709375547e-05, "loss": 1.4421, "step": 29430 }, { "epoch": 2.32, "learning_rate": 3.688699915823052e-05, "loss": 1.4535, "step": 29431 }, { "epoch": 2.32, "learning_rate": 3.687888199068046e-05, "loss": 1.447, "step": 29432 }, { "epoch": 2.32, "learning_rate": 3.6870765591160364e-05, "loss": 1.423, "step": 29433 }, { "epoch": 2.32, "learning_rate": 3.686264995972536e-05, "loss": 1.4435, "step": 29434 }, { "epoch": 2.32, "learning_rate": 3.685453509643046e-05, "loss": 1.468, "step": 29435 }, { "epoch": 2.32, "learning_rate": 3.684642100133087e-05, "loss": 1.4783, "step": 29436 }, { "epoch": 2.32, "learning_rate": 3.6838307674481665e-05, "loss": 1.4141, "step": 29437 }, { "epoch": 2.32, "learning_rate": 3.683019511593783e-05, "loss": 1.4706, "step": 29438 }, { "epoch": 2.32, "learning_rate": 3.682208332575458e-05, "loss": 1.4198, "step": 29439 }, { "epoch": 2.32, "learning_rate": 3.681397230398692e-05, "loss": 1.4831, "step": 29440 }, { "epoch": 2.32, "learning_rate": 3.680586205068989e-05, "loss": 1.4581, "step": 29441 }, { "epoch": 2.32, "learning_rate": 3.679775256591862e-05, "loss": 1.4404, "step": 29442 }, { "epoch": 2.32, "learning_rate": 3.6789643849728154e-05, "loss": 1.3945, "step": 29443 }, { "epoch": 2.32, "learning_rate": 3.678153590217349e-05, "loss": 1.496, "step": 29444 }, { "epoch": 2.32, "learning_rate": 3.6773428723309703e-05, "loss": 1.4423, "step": 29445 }, { "epoch": 2.32, "learning_rate": 3.6765322313191915e-05, "loss": 1.4896, "step": 29446 }, { "epoch": 2.32, "learning_rate": 3.6757216671875084e-05, "loss": 1.4676, "step": 29447 }, { "epoch": 2.32, "learning_rate": 3.674911179941422e-05, "loss": 1.3923, "step": 29448 }, { "epoch": 2.32, "learning_rate": 3.674100769586443e-05, "loss": 1.4795, "step": 29449 }, { "epoch": 2.32, "learning_rate": 3.673290436128071e-05, "loss": 1.4584, "step": 29450 }, { "epoch": 2.32, "learning_rate": 3.6724801795718045e-05, "loss": 1.4312, "step": 29451 }, { "epoch": 2.32, "learning_rate": 3.6716699999231437e-05, "loss": 1.4365, "step": 29452 }, { "epoch": 2.32, "learning_rate": 3.670859897187595e-05, "loss": 1.5086, "step": 29453 }, { "epoch": 2.32, "learning_rate": 3.6700498713706566e-05, "loss": 1.4219, "step": 29454 }, { "epoch": 2.32, "learning_rate": 3.6692399224778236e-05, "loss": 1.4381, "step": 29455 }, { "epoch": 2.32, "learning_rate": 3.668430050514601e-05, "loss": 1.4333, "step": 29456 }, { "epoch": 2.32, "learning_rate": 3.6676202554864875e-05, "loss": 1.4789, "step": 29457 }, { "epoch": 2.32, "learning_rate": 3.666810537398973e-05, "loss": 1.4875, "step": 29458 }, { "epoch": 2.32, "learning_rate": 3.6660008962575654e-05, "loss": 1.4475, "step": 29459 }, { "epoch": 2.32, "learning_rate": 3.6651913320677515e-05, "loss": 1.4516, "step": 29460 }, { "epoch": 2.32, "learning_rate": 3.664381844835039e-05, "loss": 1.4708, "step": 29461 }, { "epoch": 2.32, "learning_rate": 3.663572434564914e-05, "loss": 1.4586, "step": 29462 }, { "epoch": 2.32, "learning_rate": 3.662763101262881e-05, "loss": 1.4537, "step": 29463 }, { "epoch": 2.32, "learning_rate": 3.66195384493443e-05, "loss": 1.4655, "step": 29464 }, { "epoch": 2.32, "learning_rate": 3.661144665585049e-05, "loss": 1.4166, "step": 29465 }, { "epoch": 2.32, "learning_rate": 3.6603355632202454e-05, "loss": 1.4314, "step": 29466 }, { "epoch": 2.32, "learning_rate": 3.659526537845504e-05, "loss": 1.4587, "step": 29467 }, { "epoch": 2.32, "learning_rate": 3.6587175894663195e-05, "loss": 1.4454, "step": 29468 }, { "epoch": 2.32, "learning_rate": 3.657908718088181e-05, "loss": 1.48, "step": 29469 }, { "epoch": 2.32, "learning_rate": 3.657099923716586e-05, "loss": 1.4615, "step": 29470 }, { "epoch": 2.32, "learning_rate": 3.656291206357023e-05, "loss": 1.4557, "step": 29471 }, { "epoch": 2.32, "learning_rate": 3.65548256601498e-05, "loss": 1.4084, "step": 29472 }, { "epoch": 2.32, "learning_rate": 3.654674002695952e-05, "loss": 1.432, "step": 29473 }, { "epoch": 2.32, "learning_rate": 3.653865516405428e-05, "loss": 1.4635, "step": 29474 }, { "epoch": 2.32, "learning_rate": 3.6530571071488916e-05, "loss": 1.4509, "step": 29475 }, { "epoch": 2.32, "learning_rate": 3.652248774931835e-05, "loss": 1.4635, "step": 29476 }, { "epoch": 2.32, "learning_rate": 3.6514405197597524e-05, "loss": 1.4867, "step": 29477 }, { "epoch": 2.32, "learning_rate": 3.6506323416381254e-05, "loss": 1.4545, "step": 29478 }, { "epoch": 2.32, "learning_rate": 3.649824240572437e-05, "loss": 1.4023, "step": 29479 }, { "epoch": 2.32, "learning_rate": 3.649016216568184e-05, "loss": 1.424, "step": 29480 }, { "epoch": 2.32, "learning_rate": 3.6482082696308454e-05, "loss": 1.4796, "step": 29481 }, { "epoch": 2.32, "learning_rate": 3.647400399765904e-05, "loss": 1.4677, "step": 29482 }, { "epoch": 2.32, "learning_rate": 3.6465926069788546e-05, "loss": 1.5069, "step": 29483 }, { "epoch": 2.32, "learning_rate": 3.645784891275175e-05, "loss": 1.4712, "step": 29484 }, { "epoch": 2.32, "learning_rate": 3.644977252660351e-05, "loss": 1.4364, "step": 29485 }, { "epoch": 2.32, "learning_rate": 3.644169691139859e-05, "loss": 1.4634, "step": 29486 }, { "epoch": 2.32, "learning_rate": 3.643362206719194e-05, "loss": 1.4357, "step": 29487 }, { "epoch": 2.32, "learning_rate": 3.642554799403833e-05, "loss": 1.403, "step": 29488 }, { "epoch": 2.32, "learning_rate": 3.641747469199253e-05, "loss": 1.4376, "step": 29489 }, { "epoch": 2.32, "learning_rate": 3.6409402161109424e-05, "loss": 1.4666, "step": 29490 }, { "epoch": 2.32, "learning_rate": 3.6401330401443813e-05, "loss": 1.5101, "step": 29491 }, { "epoch": 2.32, "learning_rate": 3.639325941305043e-05, "loss": 1.4246, "step": 29492 }, { "epoch": 2.32, "learning_rate": 3.6385189195984113e-05, "loss": 1.433, "step": 29493 }, { "epoch": 2.32, "learning_rate": 3.637711975029971e-05, "loss": 1.3702, "step": 29494 }, { "epoch": 2.32, "learning_rate": 3.636905107605197e-05, "loss": 1.4364, "step": 29495 }, { "epoch": 2.32, "learning_rate": 3.6360983173295616e-05, "loss": 1.479, "step": 29496 }, { "epoch": 2.32, "learning_rate": 3.635291604208552e-05, "loss": 1.4488, "step": 29497 }, { "epoch": 2.32, "learning_rate": 3.634484968247641e-05, "loss": 1.4499, "step": 29498 }, { "epoch": 2.32, "learning_rate": 3.6336784094523006e-05, "loss": 1.4428, "step": 29499 }, { "epoch": 2.32, "learning_rate": 3.632871927828015e-05, "loss": 1.432, "step": 29500 }, { "epoch": 2.32, "learning_rate": 3.632065523380258e-05, "loss": 1.443, "step": 29501 }, { "epoch": 2.32, "learning_rate": 3.631259196114496e-05, "loss": 1.4933, "step": 29502 }, { "epoch": 2.32, "learning_rate": 3.630452946036216e-05, "loss": 1.4219, "step": 29503 }, { "epoch": 2.32, "learning_rate": 3.629646773150886e-05, "loss": 1.4389, "step": 29504 }, { "epoch": 2.32, "learning_rate": 3.628840677463979e-05, "loss": 1.4124, "step": 29505 }, { "epoch": 2.32, "learning_rate": 3.628034658980965e-05, "loss": 1.467, "step": 29506 }, { "epoch": 2.32, "learning_rate": 3.62722871770732e-05, "loss": 1.5224, "step": 29507 }, { "epoch": 2.32, "learning_rate": 3.626422853648521e-05, "loss": 1.4278, "step": 29508 }, { "epoch": 2.32, "learning_rate": 3.6256170668100346e-05, "loss": 1.4651, "step": 29509 }, { "epoch": 2.32, "learning_rate": 3.624811357197327e-05, "loss": 1.3846, "step": 29510 }, { "epoch": 2.32, "learning_rate": 3.624005724815875e-05, "loss": 1.4665, "step": 29511 }, { "epoch": 2.32, "learning_rate": 3.6232001696711485e-05, "loss": 1.4301, "step": 29512 }, { "epoch": 2.32, "learning_rate": 3.62239469176861e-05, "loss": 1.4631, "step": 29513 }, { "epoch": 2.32, "learning_rate": 3.621589291113737e-05, "loss": 1.4405, "step": 29514 }, { "epoch": 2.32, "learning_rate": 3.6207839677119936e-05, "loss": 1.4491, "step": 29515 }, { "epoch": 2.32, "learning_rate": 3.619978721568842e-05, "loss": 1.4038, "step": 29516 }, { "epoch": 2.32, "learning_rate": 3.61917355268976e-05, "loss": 1.5074, "step": 29517 }, { "epoch": 2.32, "learning_rate": 3.618368461080209e-05, "loss": 1.489, "step": 29518 }, { "epoch": 2.32, "learning_rate": 3.617563446745653e-05, "loss": 1.447, "step": 29519 }, { "epoch": 2.32, "learning_rate": 3.616758509691563e-05, "loss": 1.4783, "step": 29520 }, { "epoch": 2.32, "learning_rate": 3.615953649923399e-05, "loss": 1.459, "step": 29521 }, { "epoch": 2.32, "learning_rate": 3.6151488674466296e-05, "loss": 1.4389, "step": 29522 }, { "epoch": 2.32, "learning_rate": 3.614344162266707e-05, "loss": 1.4781, "step": 29523 }, { "epoch": 2.32, "learning_rate": 3.613539534389114e-05, "loss": 1.4951, "step": 29524 }, { "epoch": 2.32, "learning_rate": 3.612734983819302e-05, "loss": 1.4523, "step": 29525 }, { "epoch": 2.32, "learning_rate": 3.611930510562737e-05, "loss": 1.3941, "step": 29526 }, { "epoch": 2.32, "learning_rate": 3.611126114624875e-05, "loss": 1.4907, "step": 29527 }, { "epoch": 2.32, "learning_rate": 3.610321796011186e-05, "loss": 1.4334, "step": 29528 }, { "epoch": 2.32, "learning_rate": 3.609517554727127e-05, "loss": 1.5313, "step": 29529 }, { "epoch": 2.32, "learning_rate": 3.6087133907781526e-05, "loss": 1.4385, "step": 29530 }, { "epoch": 2.32, "learning_rate": 3.6079093041697344e-05, "loss": 1.4553, "step": 29531 }, { "epoch": 2.32, "learning_rate": 3.6071052949073234e-05, "loss": 1.3935, "step": 29532 }, { "epoch": 2.32, "learning_rate": 3.6063013629963765e-05, "loss": 1.4913, "step": 29533 }, { "epoch": 2.32, "learning_rate": 3.60549750844236e-05, "loss": 1.4681, "step": 29534 }, { "epoch": 2.32, "learning_rate": 3.604693731250729e-05, "loss": 1.4885, "step": 29535 }, { "epoch": 2.32, "learning_rate": 3.6038900314269333e-05, "loss": 1.4289, "step": 29536 }, { "epoch": 2.32, "learning_rate": 3.60308640897644e-05, "loss": 1.4705, "step": 29537 }, { "epoch": 2.32, "learning_rate": 3.6022828639047e-05, "loss": 1.4327, "step": 29538 }, { "epoch": 2.32, "learning_rate": 3.601479396217166e-05, "loss": 1.4516, "step": 29539 }, { "epoch": 2.32, "learning_rate": 3.6006760059192966e-05, "loss": 1.4595, "step": 29540 }, { "epoch": 2.32, "learning_rate": 3.5998726930165513e-05, "loss": 1.4595, "step": 29541 }, { "epoch": 2.32, "learning_rate": 3.599069457514378e-05, "loss": 1.4192, "step": 29542 }, { "epoch": 2.32, "learning_rate": 3.598266299418228e-05, "loss": 1.4274, "step": 29543 }, { "epoch": 2.32, "learning_rate": 3.597463218733562e-05, "loss": 1.5064, "step": 29544 }, { "epoch": 2.32, "learning_rate": 3.5966602154658276e-05, "loss": 1.4181, "step": 29545 }, { "epoch": 2.32, "learning_rate": 3.595857289620478e-05, "loss": 1.4238, "step": 29546 }, { "epoch": 2.32, "learning_rate": 3.595054441202961e-05, "loss": 1.5065, "step": 29547 }, { "epoch": 2.32, "learning_rate": 3.594251670218733e-05, "loss": 1.4675, "step": 29548 }, { "epoch": 2.32, "learning_rate": 3.593448976673243e-05, "loss": 1.4663, "step": 29549 }, { "epoch": 2.33, "learning_rate": 3.592646360571936e-05, "loss": 1.4716, "step": 29550 }, { "epoch": 2.33, "learning_rate": 3.591843821920268e-05, "loss": 1.4568, "step": 29551 }, { "epoch": 2.33, "learning_rate": 3.5910413607236846e-05, "loss": 1.4712, "step": 29552 }, { "epoch": 2.33, "learning_rate": 3.590238976987631e-05, "loss": 1.4777, "step": 29553 }, { "epoch": 2.33, "learning_rate": 3.589436670717559e-05, "loss": 1.454, "step": 29554 }, { "epoch": 2.33, "learning_rate": 3.588634441918918e-05, "loss": 1.4624, "step": 29555 }, { "epoch": 2.33, "learning_rate": 3.587832290597154e-05, "loss": 1.4559, "step": 29556 }, { "epoch": 2.33, "learning_rate": 3.587030216757705e-05, "loss": 1.4479, "step": 29557 }, { "epoch": 2.33, "learning_rate": 3.586228220406028e-05, "loss": 1.4379, "step": 29558 }, { "epoch": 2.33, "learning_rate": 3.585426301547562e-05, "loss": 1.454, "step": 29559 }, { "epoch": 2.33, "learning_rate": 3.584624460187747e-05, "loss": 1.531, "step": 29560 }, { "epoch": 2.33, "learning_rate": 3.583822696332039e-05, "loss": 1.4301, "step": 29561 }, { "epoch": 2.33, "learning_rate": 3.583021009985872e-05, "loss": 1.4726, "step": 29562 }, { "epoch": 2.33, "learning_rate": 3.582219401154694e-05, "loss": 1.489, "step": 29563 }, { "epoch": 2.33, "learning_rate": 3.581417869843941e-05, "loss": 1.4338, "step": 29564 }, { "epoch": 2.33, "learning_rate": 3.580616416059063e-05, "loss": 1.4657, "step": 29565 }, { "epoch": 2.33, "learning_rate": 3.5798150398054984e-05, "loss": 1.4517, "step": 29566 }, { "epoch": 2.33, "learning_rate": 3.5790137410886836e-05, "loss": 1.4792, "step": 29567 }, { "epoch": 2.33, "learning_rate": 3.578212519914066e-05, "loss": 1.4874, "step": 29568 }, { "epoch": 2.33, "learning_rate": 3.577411376287082e-05, "loss": 1.5343, "step": 29569 }, { "epoch": 2.33, "learning_rate": 3.5766103102131693e-05, "loss": 1.444, "step": 29570 }, { "epoch": 2.33, "learning_rate": 3.575809321697766e-05, "loss": 1.4222, "step": 29571 }, { "epoch": 2.33, "learning_rate": 3.575008410746318e-05, "loss": 1.464, "step": 29572 }, { "epoch": 2.33, "learning_rate": 3.57420757736426e-05, "loss": 1.4307, "step": 29573 }, { "epoch": 2.33, "learning_rate": 3.573406821557021e-05, "loss": 1.4463, "step": 29574 }, { "epoch": 2.33, "learning_rate": 3.5726061433300494e-05, "loss": 1.4624, "step": 29575 }, { "epoch": 2.33, "learning_rate": 3.571805542688774e-05, "loss": 1.4635, "step": 29576 }, { "epoch": 2.33, "learning_rate": 3.571005019638631e-05, "loss": 1.4115, "step": 29577 }, { "epoch": 2.33, "learning_rate": 3.570204574185058e-05, "loss": 1.4472, "step": 29578 }, { "epoch": 2.33, "learning_rate": 3.5694042063334906e-05, "loss": 1.4264, "step": 29579 }, { "epoch": 2.33, "learning_rate": 3.56860391608936e-05, "loss": 1.4432, "step": 29580 }, { "epoch": 2.33, "learning_rate": 3.567803703458097e-05, "loss": 1.3925, "step": 29581 }, { "epoch": 2.33, "learning_rate": 3.567003568445141e-05, "loss": 1.4766, "step": 29582 }, { "epoch": 2.33, "learning_rate": 3.566203511055922e-05, "loss": 1.4544, "step": 29583 }, { "epoch": 2.33, "learning_rate": 3.565403531295867e-05, "loss": 1.4366, "step": 29584 }, { "epoch": 2.33, "learning_rate": 3.564603629170416e-05, "loss": 1.4256, "step": 29585 }, { "epoch": 2.33, "learning_rate": 3.5638038046849925e-05, "loss": 1.408, "step": 29586 }, { "epoch": 2.33, "learning_rate": 3.563004057845034e-05, "loss": 1.4617, "step": 29587 }, { "epoch": 2.33, "learning_rate": 3.562204388655962e-05, "loss": 1.4611, "step": 29588 }, { "epoch": 2.33, "learning_rate": 3.561404797123215e-05, "loss": 1.4919, "step": 29589 }, { "epoch": 2.33, "learning_rate": 3.560605283252217e-05, "loss": 1.4122, "step": 29590 }, { "epoch": 2.33, "learning_rate": 3.5598058470483914e-05, "loss": 1.4594, "step": 29591 }, { "epoch": 2.33, "learning_rate": 3.559006488517176e-05, "loss": 1.4706, "step": 29592 }, { "epoch": 2.33, "learning_rate": 3.558207207663993e-05, "loss": 1.4812, "step": 29593 }, { "epoch": 2.33, "learning_rate": 3.557408004494264e-05, "loss": 1.499, "step": 29594 }, { "epoch": 2.33, "learning_rate": 3.5566088790134246e-05, "loss": 1.4414, "step": 29595 }, { "epoch": 2.33, "learning_rate": 3.555809831226896e-05, "loss": 1.4927, "step": 29596 }, { "epoch": 2.33, "learning_rate": 3.5550108611400984e-05, "loss": 1.4578, "step": 29597 }, { "epoch": 2.33, "learning_rate": 3.554211968758465e-05, "loss": 1.4296, "step": 29598 }, { "epoch": 2.33, "learning_rate": 3.553413154087418e-05, "loss": 1.4729, "step": 29599 }, { "epoch": 2.33, "learning_rate": 3.552614417132378e-05, "loss": 1.4442, "step": 29600 }, { "epoch": 2.33, "learning_rate": 3.551815757898765e-05, "loss": 1.4548, "step": 29601 }, { "epoch": 2.33, "learning_rate": 3.551017176392004e-05, "loss": 1.4555, "step": 29602 }, { "epoch": 2.33, "learning_rate": 3.550218672617524e-05, "loss": 1.4646, "step": 29603 }, { "epoch": 2.33, "learning_rate": 3.54942024658074e-05, "loss": 1.4541, "step": 29604 }, { "epoch": 2.33, "learning_rate": 3.5486218982870694e-05, "loss": 1.461, "step": 29605 }, { "epoch": 2.33, "learning_rate": 3.5478236277419405e-05, "loss": 1.4468, "step": 29606 }, { "epoch": 2.33, "learning_rate": 3.5470254349507694e-05, "loss": 1.4808, "step": 29607 }, { "epoch": 2.33, "learning_rate": 3.5462273199189725e-05, "loss": 1.4288, "step": 29608 }, { "epoch": 2.33, "learning_rate": 3.545429282651975e-05, "loss": 1.4555, "step": 29609 }, { "epoch": 2.33, "learning_rate": 3.544631323155191e-05, "loss": 1.4589, "step": 29610 }, { "epoch": 2.33, "learning_rate": 3.5438334414340344e-05, "loss": 1.5048, "step": 29611 }, { "epoch": 2.33, "learning_rate": 3.5430356374939315e-05, "loss": 1.4504, "step": 29612 }, { "epoch": 2.33, "learning_rate": 3.542237911340293e-05, "loss": 1.4869, "step": 29613 }, { "epoch": 2.33, "learning_rate": 3.541440262978533e-05, "loss": 1.4665, "step": 29614 }, { "epoch": 2.33, "learning_rate": 3.540642692414074e-05, "loss": 1.4656, "step": 29615 }, { "epoch": 2.33, "learning_rate": 3.5398451996523274e-05, "loss": 1.3916, "step": 29616 }, { "epoch": 2.33, "learning_rate": 3.539047784698704e-05, "loss": 1.4829, "step": 29617 }, { "epoch": 2.33, "learning_rate": 3.538250447558622e-05, "loss": 1.5455, "step": 29618 }, { "epoch": 2.33, "learning_rate": 3.5374531882374966e-05, "loss": 1.4134, "step": 29619 }, { "epoch": 2.33, "learning_rate": 3.536656006740741e-05, "loss": 1.4495, "step": 29620 }, { "epoch": 2.33, "learning_rate": 3.535858903073762e-05, "loss": 1.4789, "step": 29621 }, { "epoch": 2.33, "learning_rate": 3.535061877241972e-05, "loss": 1.4761, "step": 29622 }, { "epoch": 2.33, "learning_rate": 3.534264929250791e-05, "loss": 1.4609, "step": 29623 }, { "epoch": 2.33, "learning_rate": 3.533468059105621e-05, "loss": 1.4217, "step": 29624 }, { "epoch": 2.33, "learning_rate": 3.532671266811871e-05, "loss": 1.4289, "step": 29625 }, { "epoch": 2.33, "learning_rate": 3.531874552374961e-05, "loss": 1.4431, "step": 29626 }, { "epoch": 2.33, "learning_rate": 3.531077915800294e-05, "loss": 1.496, "step": 29627 }, { "epoch": 2.33, "learning_rate": 3.5302813570932725e-05, "loss": 1.4204, "step": 29628 }, { "epoch": 2.33, "learning_rate": 3.529484876259317e-05, "loss": 1.4972, "step": 29629 }, { "epoch": 2.33, "learning_rate": 3.5286884733038297e-05, "loss": 1.449, "step": 29630 }, { "epoch": 2.33, "learning_rate": 3.5278921482322125e-05, "loss": 1.4871, "step": 29631 }, { "epoch": 2.33, "learning_rate": 3.527095901049881e-05, "loss": 1.4786, "step": 29632 }, { "epoch": 2.33, "learning_rate": 3.526299731762233e-05, "loss": 1.421, "step": 29633 }, { "epoch": 2.33, "learning_rate": 3.525503640374681e-05, "loss": 1.4878, "step": 29634 }, { "epoch": 2.33, "learning_rate": 3.5247076268926236e-05, "loss": 1.4713, "step": 29635 }, { "epoch": 2.33, "learning_rate": 3.523911691321473e-05, "loss": 1.4545, "step": 29636 }, { "epoch": 2.33, "learning_rate": 3.52311583366663e-05, "loss": 1.3995, "step": 29637 }, { "epoch": 2.33, "learning_rate": 3.522320053933495e-05, "loss": 1.4813, "step": 29638 }, { "epoch": 2.33, "learning_rate": 3.521524352127471e-05, "loss": 1.4713, "step": 29639 }, { "epoch": 2.33, "learning_rate": 3.520728728253965e-05, "loss": 1.4417, "step": 29640 }, { "epoch": 2.33, "learning_rate": 3.519933182318377e-05, "loss": 1.463, "step": 29641 }, { "epoch": 2.33, "learning_rate": 3.519137714326103e-05, "loss": 1.4434, "step": 29642 }, { "epoch": 2.33, "learning_rate": 3.5183423242825524e-05, "loss": 1.5056, "step": 29643 }, { "epoch": 2.33, "learning_rate": 3.517547012193122e-05, "loss": 1.4312, "step": 29644 }, { "epoch": 2.33, "learning_rate": 3.5167517780632054e-05, "loss": 1.4398, "step": 29645 }, { "epoch": 2.33, "learning_rate": 3.5159566218982115e-05, "loss": 1.4363, "step": 29646 }, { "epoch": 2.33, "learning_rate": 3.515161543703536e-05, "loss": 1.452, "step": 29647 }, { "epoch": 2.33, "learning_rate": 3.51436654348457e-05, "loss": 1.4242, "step": 29648 }, { "epoch": 2.33, "learning_rate": 3.513571621246719e-05, "loss": 1.4005, "step": 29649 }, { "epoch": 2.33, "learning_rate": 3.51277677699538e-05, "loss": 1.4196, "step": 29650 }, { "epoch": 2.33, "learning_rate": 3.511982010735949e-05, "loss": 1.4581, "step": 29651 }, { "epoch": 2.33, "learning_rate": 3.5111873224738154e-05, "loss": 1.4531, "step": 29652 }, { "epoch": 2.33, "learning_rate": 3.510392712214384e-05, "loss": 1.4129, "step": 29653 }, { "epoch": 2.33, "learning_rate": 3.5095981799630455e-05, "loss": 1.4571, "step": 29654 }, { "epoch": 2.33, "learning_rate": 3.508803725725192e-05, "loss": 1.4592, "step": 29655 }, { "epoch": 2.33, "learning_rate": 3.508009349506222e-05, "loss": 1.3963, "step": 29656 }, { "epoch": 2.33, "learning_rate": 3.507215051311528e-05, "loss": 1.4715, "step": 29657 }, { "epoch": 2.33, "learning_rate": 3.5064208311465e-05, "loss": 1.5005, "step": 29658 }, { "epoch": 2.33, "learning_rate": 3.5056266890165293e-05, "loss": 1.4334, "step": 29659 }, { "epoch": 2.33, "learning_rate": 3.504832624927013e-05, "loss": 1.443, "step": 29660 }, { "epoch": 2.33, "learning_rate": 3.5040386388833414e-05, "loss": 1.3982, "step": 29661 }, { "epoch": 2.33, "learning_rate": 3.503244730890898e-05, "loss": 1.4995, "step": 29662 }, { "epoch": 2.33, "learning_rate": 3.502450900955082e-05, "loss": 1.5131, "step": 29663 }, { "epoch": 2.33, "learning_rate": 3.501657149081277e-05, "loss": 1.4724, "step": 29664 }, { "epoch": 2.33, "learning_rate": 3.500863475274877e-05, "loss": 1.4594, "step": 29665 }, { "epoch": 2.33, "learning_rate": 3.500069879541266e-05, "loss": 1.4193, "step": 29666 }, { "epoch": 2.33, "learning_rate": 3.4992763618858385e-05, "loss": 1.491, "step": 29667 }, { "epoch": 2.33, "learning_rate": 3.4984829223139754e-05, "loss": 1.4821, "step": 29668 }, { "epoch": 2.33, "learning_rate": 3.497689560831064e-05, "loss": 1.4713, "step": 29669 }, { "epoch": 2.33, "learning_rate": 3.4968962774424964e-05, "loss": 1.4549, "step": 29670 }, { "epoch": 2.33, "learning_rate": 3.496103072153657e-05, "loss": 1.4074, "step": 29671 }, { "epoch": 2.33, "learning_rate": 3.4953099449699224e-05, "loss": 1.5109, "step": 29672 }, { "epoch": 2.33, "learning_rate": 3.49451689589669e-05, "loss": 1.403, "step": 29673 }, { "epoch": 2.33, "learning_rate": 3.493723924939339e-05, "loss": 1.4242, "step": 29674 }, { "epoch": 2.33, "learning_rate": 3.4929310321032526e-05, "loss": 1.4424, "step": 29675 }, { "epoch": 2.33, "learning_rate": 3.49213821739381e-05, "loss": 1.4288, "step": 29676 }, { "epoch": 2.34, "learning_rate": 3.491345480816403e-05, "loss": 1.4424, "step": 29677 }, { "epoch": 2.34, "learning_rate": 3.490552822376408e-05, "loss": 1.4373, "step": 29678 }, { "epoch": 2.34, "learning_rate": 3.4897602420792045e-05, "loss": 1.464, "step": 29679 }, { "epoch": 2.34, "learning_rate": 3.488967739930176e-05, "loss": 1.4398, "step": 29680 }, { "epoch": 2.34, "learning_rate": 3.48817531593471e-05, "loss": 1.4675, "step": 29681 }, { "epoch": 2.34, "learning_rate": 3.487382970098181e-05, "loss": 1.4637, "step": 29682 }, { "epoch": 2.34, "learning_rate": 3.486590702425964e-05, "loss": 1.4222, "step": 29683 }, { "epoch": 2.34, "learning_rate": 3.4857985129234456e-05, "loss": 1.456, "step": 29684 }, { "epoch": 2.34, "learning_rate": 3.485006401596002e-05, "loss": 1.4367, "step": 29685 }, { "epoch": 2.34, "learning_rate": 3.4842143684490056e-05, "loss": 1.3734, "step": 29686 }, { "epoch": 2.34, "learning_rate": 3.483422413487844e-05, "loss": 1.423, "step": 29687 }, { "epoch": 2.34, "learning_rate": 3.482630536717887e-05, "loss": 1.4814, "step": 29688 }, { "epoch": 2.34, "learning_rate": 3.48183873814451e-05, "loss": 1.4212, "step": 29689 }, { "epoch": 2.34, "learning_rate": 3.481047017773096e-05, "loss": 1.4796, "step": 29690 }, { "epoch": 2.34, "learning_rate": 3.480255375609017e-05, "loss": 1.5108, "step": 29691 }, { "epoch": 2.34, "learning_rate": 3.479463811657645e-05, "loss": 1.4182, "step": 29692 }, { "epoch": 2.34, "learning_rate": 3.4786723259243534e-05, "loss": 1.4203, "step": 29693 }, { "epoch": 2.34, "learning_rate": 3.4778809184145225e-05, "loss": 1.4516, "step": 29694 }, { "epoch": 2.34, "learning_rate": 3.477089589133521e-05, "loss": 1.5071, "step": 29695 }, { "epoch": 2.34, "learning_rate": 3.476298338086715e-05, "loss": 1.4385, "step": 29696 }, { "epoch": 2.34, "learning_rate": 3.475507165279491e-05, "loss": 1.4786, "step": 29697 }, { "epoch": 2.34, "learning_rate": 3.474716070717215e-05, "loss": 1.3884, "step": 29698 }, { "epoch": 2.34, "learning_rate": 3.4739250544052546e-05, "loss": 1.4688, "step": 29699 }, { "epoch": 2.34, "learning_rate": 3.47313411634898e-05, "loss": 1.4475, "step": 29700 }, { "epoch": 2.34, "learning_rate": 3.4723432565537676e-05, "loss": 1.4395, "step": 29701 }, { "epoch": 2.34, "learning_rate": 3.471552475024984e-05, "loss": 1.5443, "step": 29702 }, { "epoch": 2.34, "learning_rate": 3.470761771767992e-05, "loss": 1.4227, "step": 29703 }, { "epoch": 2.34, "learning_rate": 3.4699711467881694e-05, "loss": 1.4416, "step": 29704 }, { "epoch": 2.34, "learning_rate": 3.4691806000908794e-05, "loss": 1.4049, "step": 29705 }, { "epoch": 2.34, "learning_rate": 3.4683901316814864e-05, "loss": 1.4156, "step": 29706 }, { "epoch": 2.34, "learning_rate": 3.4675997415653646e-05, "loss": 1.4211, "step": 29707 }, { "epoch": 2.34, "learning_rate": 3.466809429747877e-05, "loss": 1.4797, "step": 29708 }, { "epoch": 2.34, "learning_rate": 3.4660191962343845e-05, "loss": 1.4944, "step": 29709 }, { "epoch": 2.34, "learning_rate": 3.465229041030261e-05, "loss": 1.4388, "step": 29710 }, { "epoch": 2.34, "learning_rate": 3.464438964140866e-05, "loss": 1.4269, "step": 29711 }, { "epoch": 2.34, "learning_rate": 3.463648965571561e-05, "loss": 1.4703, "step": 29712 }, { "epoch": 2.34, "learning_rate": 3.462859045327714e-05, "loss": 1.4249, "step": 29713 }, { "epoch": 2.34, "learning_rate": 3.4620692034146904e-05, "loss": 1.4091, "step": 29714 }, { "epoch": 2.34, "learning_rate": 3.461279439837849e-05, "loss": 1.4814, "step": 29715 }, { "epoch": 2.34, "learning_rate": 3.460489754602554e-05, "loss": 1.4713, "step": 29716 }, { "epoch": 2.34, "learning_rate": 3.4597001477141605e-05, "loss": 1.4032, "step": 29717 }, { "epoch": 2.34, "learning_rate": 3.4589106191780396e-05, "loss": 1.4644, "step": 29718 }, { "epoch": 2.34, "learning_rate": 3.4581211689995475e-05, "loss": 1.4113, "step": 29719 }, { "epoch": 2.34, "learning_rate": 3.457331797184038e-05, "loss": 1.4579, "step": 29720 }, { "epoch": 2.34, "learning_rate": 3.456542503736879e-05, "loss": 1.4775, "step": 29721 }, { "epoch": 2.34, "learning_rate": 3.455753288663427e-05, "loss": 1.4479, "step": 29722 }, { "epoch": 2.34, "learning_rate": 3.454964151969037e-05, "loss": 1.4576, "step": 29723 }, { "epoch": 2.34, "learning_rate": 3.454175093659071e-05, "loss": 1.4159, "step": 29724 }, { "epoch": 2.34, "learning_rate": 3.453386113738886e-05, "loss": 1.4876, "step": 29725 }, { "epoch": 2.34, "learning_rate": 3.452597212213833e-05, "loss": 1.4548, "step": 29726 }, { "epoch": 2.34, "learning_rate": 3.451808389089271e-05, "loss": 1.4977, "step": 29727 }, { "epoch": 2.34, "learning_rate": 3.451019644370563e-05, "loss": 1.43, "step": 29728 }, { "epoch": 2.34, "learning_rate": 3.450230978063059e-05, "loss": 1.4554, "step": 29729 }, { "epoch": 2.34, "learning_rate": 3.449442390172108e-05, "loss": 1.4805, "step": 29730 }, { "epoch": 2.34, "learning_rate": 3.4486538807030725e-05, "loss": 1.4061, "step": 29731 }, { "epoch": 2.34, "learning_rate": 3.447865449661304e-05, "loss": 1.5178, "step": 29732 }, { "epoch": 2.34, "learning_rate": 3.447077097052152e-05, "loss": 1.4181, "step": 29733 }, { "epoch": 2.34, "learning_rate": 3.44628882288097e-05, "loss": 1.4646, "step": 29734 }, { "epoch": 2.34, "learning_rate": 3.445500627153113e-05, "loss": 1.4547, "step": 29735 }, { "epoch": 2.34, "learning_rate": 3.44471250987393e-05, "loss": 1.4209, "step": 29736 }, { "epoch": 2.34, "learning_rate": 3.44392447104877e-05, "loss": 1.4063, "step": 29737 }, { "epoch": 2.34, "learning_rate": 3.443136510682988e-05, "loss": 1.4589, "step": 29738 }, { "epoch": 2.34, "learning_rate": 3.442348628781934e-05, "loss": 1.4704, "step": 29739 }, { "epoch": 2.34, "learning_rate": 3.441560825350948e-05, "loss": 1.4716, "step": 29740 }, { "epoch": 2.34, "learning_rate": 3.4407731003953906e-05, "loss": 1.5079, "step": 29741 }, { "epoch": 2.34, "learning_rate": 3.4399854539206046e-05, "loss": 1.4379, "step": 29742 }, { "epoch": 2.34, "learning_rate": 3.439197885931935e-05, "loss": 1.4546, "step": 29743 }, { "epoch": 2.34, "learning_rate": 3.43841039643473e-05, "loss": 1.4211, "step": 29744 }, { "epoch": 2.34, "learning_rate": 3.437622985434344e-05, "loss": 1.4027, "step": 29745 }, { "epoch": 2.34, "learning_rate": 3.436835652936116e-05, "loss": 1.471, "step": 29746 }, { "epoch": 2.34, "learning_rate": 3.4360483989453905e-05, "loss": 1.5049, "step": 29747 }, { "epoch": 2.34, "learning_rate": 3.435261223467518e-05, "loss": 1.4883, "step": 29748 }, { "epoch": 2.34, "learning_rate": 3.434474126507841e-05, "loss": 1.5152, "step": 29749 }, { "epoch": 2.34, "learning_rate": 3.433687108071701e-05, "loss": 1.4324, "step": 29750 }, { "epoch": 2.34, "learning_rate": 3.432900168164438e-05, "loss": 1.4703, "step": 29751 }, { "epoch": 2.34, "learning_rate": 3.432113306791404e-05, "loss": 1.4594, "step": 29752 }, { "epoch": 2.34, "learning_rate": 3.4313265239579386e-05, "loss": 1.438, "step": 29753 }, { "epoch": 2.34, "learning_rate": 3.430539819669377e-05, "loss": 1.469, "step": 29754 }, { "epoch": 2.34, "learning_rate": 3.429753193931068e-05, "loss": 1.4318, "step": 29755 }, { "epoch": 2.34, "learning_rate": 3.428966646748351e-05, "loss": 1.4832, "step": 29756 }, { "epoch": 2.34, "learning_rate": 3.428180178126562e-05, "loss": 1.4182, "step": 29757 }, { "epoch": 2.34, "learning_rate": 3.427393788071047e-05, "loss": 1.4552, "step": 29758 }, { "epoch": 2.34, "learning_rate": 3.426607476587137e-05, "loss": 1.4946, "step": 29759 }, { "epoch": 2.34, "learning_rate": 3.425821243680181e-05, "loss": 1.4513, "step": 29760 }, { "epoch": 2.34, "learning_rate": 3.425035089355507e-05, "loss": 1.4439, "step": 29761 }, { "epoch": 2.34, "learning_rate": 3.424249013618461e-05, "loss": 1.4622, "step": 29762 }, { "epoch": 2.34, "learning_rate": 3.4234630164743756e-05, "loss": 1.4539, "step": 29763 }, { "epoch": 2.34, "learning_rate": 3.4226770979285846e-05, "loss": 1.3995, "step": 29764 }, { "epoch": 2.34, "learning_rate": 3.421891257986431e-05, "loss": 1.4373, "step": 29765 }, { "epoch": 2.34, "learning_rate": 3.421105496653246e-05, "loss": 1.4935, "step": 29766 }, { "epoch": 2.34, "learning_rate": 3.4203198139343614e-05, "loss": 1.4552, "step": 29767 }, { "epoch": 2.34, "learning_rate": 3.4195342098351194e-05, "loss": 1.459, "step": 29768 }, { "epoch": 2.34, "learning_rate": 3.418748684360849e-05, "loss": 1.4261, "step": 29769 }, { "epoch": 2.34, "learning_rate": 3.417963237516884e-05, "loss": 1.4644, "step": 29770 }, { "epoch": 2.34, "learning_rate": 3.417177869308553e-05, "loss": 1.4791, "step": 29771 }, { "epoch": 2.34, "learning_rate": 3.416392579741197e-05, "loss": 1.4668, "step": 29772 }, { "epoch": 2.34, "learning_rate": 3.415607368820143e-05, "loss": 1.4569, "step": 29773 }, { "epoch": 2.34, "learning_rate": 3.414822236550718e-05, "loss": 1.4651, "step": 29774 }, { "epoch": 2.34, "learning_rate": 3.414037182938255e-05, "loss": 1.4398, "step": 29775 }, { "epoch": 2.34, "learning_rate": 3.4132522079880925e-05, "loss": 1.4328, "step": 29776 }, { "epoch": 2.34, "learning_rate": 3.412467311705552e-05, "loss": 1.4051, "step": 29777 }, { "epoch": 2.34, "learning_rate": 3.41168249409596e-05, "loss": 1.3877, "step": 29778 }, { "epoch": 2.34, "learning_rate": 3.4108977551646536e-05, "loss": 1.4924, "step": 29779 }, { "epoch": 2.34, "learning_rate": 3.4101130949169556e-05, "loss": 1.4936, "step": 29780 }, { "epoch": 2.34, "learning_rate": 3.4093285133581887e-05, "loss": 1.4438, "step": 29781 }, { "epoch": 2.34, "learning_rate": 3.408544010493692e-05, "loss": 1.4648, "step": 29782 }, { "epoch": 2.34, "learning_rate": 3.4077595863287815e-05, "loss": 1.4347, "step": 29783 }, { "epoch": 2.34, "learning_rate": 3.406975240868784e-05, "loss": 1.4427, "step": 29784 }, { "epoch": 2.34, "learning_rate": 3.406190974119031e-05, "loss": 1.4551, "step": 29785 }, { "epoch": 2.34, "learning_rate": 3.405406786084843e-05, "loss": 1.4499, "step": 29786 }, { "epoch": 2.34, "learning_rate": 3.404622676771544e-05, "loss": 1.4745, "step": 29787 }, { "epoch": 2.34, "learning_rate": 3.403838646184454e-05, "loss": 1.4705, "step": 29788 }, { "epoch": 2.34, "learning_rate": 3.403054694328906e-05, "loss": 1.46, "step": 29789 }, { "epoch": 2.34, "learning_rate": 3.402270821210212e-05, "loss": 1.483, "step": 29790 }, { "epoch": 2.34, "learning_rate": 3.401487026833702e-05, "loss": 1.4815, "step": 29791 }, { "epoch": 2.34, "learning_rate": 3.400703311204692e-05, "loss": 1.4527, "step": 29792 }, { "epoch": 2.34, "learning_rate": 3.399919674328509e-05, "loss": 1.4409, "step": 29793 }, { "epoch": 2.34, "learning_rate": 3.39913611621047e-05, "loss": 1.4208, "step": 29794 }, { "epoch": 2.34, "learning_rate": 3.39835263685589e-05, "loss": 1.3996, "step": 29795 }, { "epoch": 2.34, "learning_rate": 3.397569236270097e-05, "loss": 1.4749, "step": 29796 }, { "epoch": 2.34, "learning_rate": 3.396785914458408e-05, "loss": 1.4938, "step": 29797 }, { "epoch": 2.34, "learning_rate": 3.396002671426134e-05, "loss": 1.4517, "step": 29798 }, { "epoch": 2.34, "learning_rate": 3.3952195071786025e-05, "loss": 1.4637, "step": 29799 }, { "epoch": 2.34, "learning_rate": 3.3944364217211274e-05, "loss": 1.4086, "step": 29800 }, { "epoch": 2.34, "learning_rate": 3.39365341505902e-05, "loss": 1.449, "step": 29801 }, { "epoch": 2.34, "learning_rate": 3.3928704871976045e-05, "loss": 1.4683, "step": 29802 }, { "epoch": 2.34, "learning_rate": 3.392087638142194e-05, "loss": 1.459, "step": 29803 }, { "epoch": 2.35, "learning_rate": 3.3913048678981024e-05, "loss": 1.4471, "step": 29804 }, { "epoch": 2.35, "learning_rate": 3.390522176470639e-05, "loss": 1.4511, "step": 29805 }, { "epoch": 2.35, "learning_rate": 3.3897395638651246e-05, "loss": 1.4212, "step": 29806 }, { "epoch": 2.35, "learning_rate": 3.3889570300868765e-05, "loss": 1.4681, "step": 29807 }, { "epoch": 2.35, "learning_rate": 3.3881745751411975e-05, "loss": 1.4381, "step": 29808 }, { "epoch": 2.35, "learning_rate": 3.3873921990334095e-05, "loss": 1.4719, "step": 29809 }, { "epoch": 2.35, "learning_rate": 3.3866099017688204e-05, "loss": 1.4543, "step": 29810 }, { "epoch": 2.35, "learning_rate": 3.38582768335274e-05, "loss": 1.4983, "step": 29811 }, { "epoch": 2.35, "learning_rate": 3.385045543790477e-05, "loss": 1.4836, "step": 29812 }, { "epoch": 2.35, "learning_rate": 3.3842634830873496e-05, "loss": 1.4598, "step": 29813 }, { "epoch": 2.35, "learning_rate": 3.3834815012486625e-05, "loss": 1.4043, "step": 29814 }, { "epoch": 2.35, "learning_rate": 3.382699598279723e-05, "loss": 1.4236, "step": 29815 }, { "epoch": 2.35, "learning_rate": 3.3819177741858445e-05, "loss": 1.4534, "step": 29816 }, { "epoch": 2.35, "learning_rate": 3.3811360289723334e-05, "loss": 1.419, "step": 29817 }, { "epoch": 2.35, "learning_rate": 3.3803543626444934e-05, "loss": 1.4444, "step": 29818 }, { "epoch": 2.35, "learning_rate": 3.379572775207637e-05, "loss": 1.477, "step": 29819 }, { "epoch": 2.35, "learning_rate": 3.378791266667071e-05, "loss": 1.5221, "step": 29820 }, { "epoch": 2.35, "learning_rate": 3.378009837028095e-05, "loss": 1.4329, "step": 29821 }, { "epoch": 2.35, "learning_rate": 3.3772284862960173e-05, "loss": 1.5175, "step": 29822 }, { "epoch": 2.35, "learning_rate": 3.376447214476149e-05, "loss": 1.4436, "step": 29823 }, { "epoch": 2.35, "learning_rate": 3.3756660215737915e-05, "loss": 1.4901, "step": 29824 }, { "epoch": 2.35, "learning_rate": 3.3748849075942404e-05, "loss": 1.4539, "step": 29825 }, { "epoch": 2.35, "learning_rate": 3.37410387254281e-05, "loss": 1.4524, "step": 29826 }, { "epoch": 2.35, "learning_rate": 3.373322916424799e-05, "loss": 1.3772, "step": 29827 }, { "epoch": 2.35, "learning_rate": 3.372542039245509e-05, "loss": 1.4833, "step": 29828 }, { "epoch": 2.35, "learning_rate": 3.3717612410102375e-05, "loss": 1.4376, "step": 29829 }, { "epoch": 2.35, "learning_rate": 3.370980521724296e-05, "loss": 1.433, "step": 29830 }, { "epoch": 2.35, "learning_rate": 3.370199881392977e-05, "loss": 1.4381, "step": 29831 }, { "epoch": 2.35, "learning_rate": 3.36941932002158e-05, "loss": 1.4541, "step": 29832 }, { "epoch": 2.35, "learning_rate": 3.368638837615413e-05, "loss": 1.4253, "step": 29833 }, { "epoch": 2.35, "learning_rate": 3.367858434179767e-05, "loss": 1.4469, "step": 29834 }, { "epoch": 2.35, "learning_rate": 3.367078109719941e-05, "loss": 1.4766, "step": 29835 }, { "epoch": 2.35, "learning_rate": 3.366297864241237e-05, "loss": 1.3989, "step": 29836 }, { "epoch": 2.35, "learning_rate": 3.365517697748948e-05, "loss": 1.4306, "step": 29837 }, { "epoch": 2.35, "learning_rate": 3.364737610248378e-05, "loss": 1.4414, "step": 29838 }, { "epoch": 2.35, "learning_rate": 3.363957601744814e-05, "loss": 1.4451, "step": 29839 }, { "epoch": 2.35, "learning_rate": 3.36317767224356e-05, "loss": 1.4382, "step": 29840 }, { "epoch": 2.35, "learning_rate": 3.3623978217499096e-05, "loss": 1.435, "step": 29841 }, { "epoch": 2.35, "learning_rate": 3.3616180502691507e-05, "loss": 1.4235, "step": 29842 }, { "epoch": 2.35, "learning_rate": 3.3608383578065856e-05, "loss": 1.4615, "step": 29843 }, { "epoch": 2.35, "learning_rate": 3.360058744367507e-05, "loss": 1.4365, "step": 29844 }, { "epoch": 2.35, "learning_rate": 3.359279209957204e-05, "loss": 1.5141, "step": 29845 }, { "epoch": 2.35, "learning_rate": 3.35849975458097e-05, "loss": 1.4068, "step": 29846 }, { "epoch": 2.35, "learning_rate": 3.3577203782440996e-05, "loss": 1.4147, "step": 29847 }, { "epoch": 2.35, "learning_rate": 3.3569410809518846e-05, "loss": 1.4577, "step": 29848 }, { "epoch": 2.35, "learning_rate": 3.35616186270961e-05, "loss": 1.503, "step": 29849 }, { "epoch": 2.35, "learning_rate": 3.355382723522576e-05, "loss": 1.5186, "step": 29850 }, { "epoch": 2.35, "learning_rate": 3.3546036633960656e-05, "loss": 1.4588, "step": 29851 }, { "epoch": 2.35, "learning_rate": 3.3538246823353656e-05, "loss": 1.4237, "step": 29852 }, { "epoch": 2.35, "learning_rate": 3.353045780345771e-05, "loss": 1.5027, "step": 29853 }, { "epoch": 2.35, "learning_rate": 3.35226695743257e-05, "loss": 1.4356, "step": 29854 }, { "epoch": 2.35, "learning_rate": 3.3514882136010504e-05, "loss": 1.483, "step": 29855 }, { "epoch": 2.35, "learning_rate": 3.350709548856492e-05, "loss": 1.4397, "step": 29856 }, { "epoch": 2.35, "learning_rate": 3.3499309632041936e-05, "loss": 1.4828, "step": 29857 }, { "epoch": 2.35, "learning_rate": 3.3491524566494336e-05, "loss": 1.4846, "step": 29858 }, { "epoch": 2.35, "learning_rate": 3.348374029197495e-05, "loss": 1.4592, "step": 29859 }, { "epoch": 2.35, "learning_rate": 3.3475956808536705e-05, "loss": 1.4177, "step": 29860 }, { "epoch": 2.35, "learning_rate": 3.346817411623241e-05, "loss": 1.5111, "step": 29861 }, { "epoch": 2.35, "learning_rate": 3.346039221511486e-05, "loss": 1.4677, "step": 29862 }, { "epoch": 2.35, "learning_rate": 3.345261110523699e-05, "loss": 1.4193, "step": 29863 }, { "epoch": 2.35, "learning_rate": 3.3444830786651564e-05, "loss": 1.4848, "step": 29864 }, { "epoch": 2.35, "learning_rate": 3.343705125941142e-05, "loss": 1.4514, "step": 29865 }, { "epoch": 2.35, "learning_rate": 3.342927252356933e-05, "loss": 1.3814, "step": 29866 }, { "epoch": 2.35, "learning_rate": 3.34214945791782e-05, "loss": 1.4355, "step": 29867 }, { "epoch": 2.35, "learning_rate": 3.341371742629078e-05, "loss": 1.4065, "step": 29868 }, { "epoch": 2.35, "learning_rate": 3.340594106495984e-05, "loss": 1.4719, "step": 29869 }, { "epoch": 2.35, "learning_rate": 3.3398165495238215e-05, "loss": 1.44, "step": 29870 }, { "epoch": 2.35, "learning_rate": 3.339039071717874e-05, "loss": 1.4763, "step": 29871 }, { "epoch": 2.35, "learning_rate": 3.338261673083418e-05, "loss": 1.4673, "step": 29872 }, { "epoch": 2.35, "learning_rate": 3.337484353625724e-05, "loss": 1.436, "step": 29873 }, { "epoch": 2.35, "learning_rate": 3.3367071133500804e-05, "loss": 1.457, "step": 29874 }, { "epoch": 2.35, "learning_rate": 3.335929952261759e-05, "loss": 1.4429, "step": 29875 }, { "epoch": 2.35, "learning_rate": 3.335152870366031e-05, "loss": 1.4514, "step": 29876 }, { "epoch": 2.35, "learning_rate": 3.334375867668184e-05, "loss": 1.4323, "step": 29877 }, { "epoch": 2.35, "learning_rate": 3.333598944173485e-05, "loss": 1.4833, "step": 29878 }, { "epoch": 2.35, "learning_rate": 3.332822099887208e-05, "loss": 1.4592, "step": 29879 }, { "epoch": 2.35, "learning_rate": 3.332045334814635e-05, "loss": 1.459, "step": 29880 }, { "epoch": 2.35, "learning_rate": 3.3312686489610345e-05, "loss": 1.3942, "step": 29881 }, { "epoch": 2.35, "learning_rate": 3.330492042331682e-05, "loss": 1.4833, "step": 29882 }, { "epoch": 2.35, "learning_rate": 3.329715514931843e-05, "loss": 1.4496, "step": 29883 }, { "epoch": 2.35, "learning_rate": 3.328939066766797e-05, "loss": 1.4466, "step": 29884 }, { "epoch": 2.35, "learning_rate": 3.328162697841817e-05, "loss": 1.5132, "step": 29885 }, { "epoch": 2.35, "learning_rate": 3.327386408162172e-05, "loss": 1.4621, "step": 29886 }, { "epoch": 2.35, "learning_rate": 3.3266101977331266e-05, "loss": 1.4492, "step": 29887 }, { "epoch": 2.35, "learning_rate": 3.325834066559962e-05, "loss": 1.4242, "step": 29888 }, { "epoch": 2.35, "learning_rate": 3.325058014647939e-05, "loss": 1.4312, "step": 29889 }, { "epoch": 2.35, "learning_rate": 3.3242820420023284e-05, "loss": 1.4861, "step": 29890 }, { "epoch": 2.35, "learning_rate": 3.323506148628402e-05, "loss": 1.4496, "step": 29891 }, { "epoch": 2.35, "learning_rate": 3.3227303345314246e-05, "loss": 1.4147, "step": 29892 }, { "epoch": 2.35, "learning_rate": 3.321954599716661e-05, "loss": 1.518, "step": 29893 }, { "epoch": 2.35, "learning_rate": 3.321178944189385e-05, "loss": 1.4477, "step": 29894 }, { "epoch": 2.35, "learning_rate": 3.320403367954858e-05, "loss": 1.4972, "step": 29895 }, { "epoch": 2.35, "learning_rate": 3.3196278710183444e-05, "loss": 1.4733, "step": 29896 }, { "epoch": 2.35, "learning_rate": 3.318852453385115e-05, "loss": 1.4587, "step": 29897 }, { "epoch": 2.35, "learning_rate": 3.3180771150604315e-05, "loss": 1.4572, "step": 29898 }, { "epoch": 2.35, "learning_rate": 3.3173018560495584e-05, "loss": 1.5104, "step": 29899 }, { "epoch": 2.35, "learning_rate": 3.316526676357749e-05, "loss": 1.476, "step": 29900 }, { "epoch": 2.35, "learning_rate": 3.315751575990286e-05, "loss": 1.4175, "step": 29901 }, { "epoch": 2.35, "learning_rate": 3.314976554952421e-05, "loss": 1.3771, "step": 29902 }, { "epoch": 2.35, "learning_rate": 3.314201613249417e-05, "loss": 1.4905, "step": 29903 }, { "epoch": 2.35, "learning_rate": 3.31342675088653e-05, "loss": 1.4709, "step": 29904 }, { "epoch": 2.35, "learning_rate": 3.312651967869031e-05, "loss": 1.4662, "step": 29905 }, { "epoch": 2.35, "learning_rate": 3.3118772642021764e-05, "loss": 1.441, "step": 29906 }, { "epoch": 2.35, "learning_rate": 3.311102639891221e-05, "loss": 1.4592, "step": 29907 }, { "epoch": 2.35, "learning_rate": 3.310328094941432e-05, "loss": 1.4859, "step": 29908 }, { "epoch": 2.35, "learning_rate": 3.3095536293580624e-05, "loss": 1.4449, "step": 29909 }, { "epoch": 2.35, "learning_rate": 3.308779243146371e-05, "loss": 1.4377, "step": 29910 }, { "epoch": 2.35, "learning_rate": 3.3080049363116196e-05, "loss": 1.4453, "step": 29911 }, { "epoch": 2.35, "learning_rate": 3.3072307088590625e-05, "loss": 1.4071, "step": 29912 }, { "epoch": 2.35, "learning_rate": 3.3064565607939534e-05, "loss": 1.4186, "step": 29913 }, { "epoch": 2.35, "learning_rate": 3.305682492121553e-05, "loss": 1.449, "step": 29914 }, { "epoch": 2.35, "learning_rate": 3.304908502847116e-05, "loss": 1.4551, "step": 29915 }, { "epoch": 2.35, "learning_rate": 3.3041345929758936e-05, "loss": 1.4282, "step": 29916 }, { "epoch": 2.35, "learning_rate": 3.303360762513142e-05, "loss": 1.4197, "step": 29917 }, { "epoch": 2.35, "learning_rate": 3.3025870114641196e-05, "loss": 1.4799, "step": 29918 }, { "epoch": 2.35, "learning_rate": 3.301813339834077e-05, "loss": 1.4444, "step": 29919 }, { "epoch": 2.35, "learning_rate": 3.301039747628263e-05, "loss": 1.4656, "step": 29920 }, { "epoch": 2.35, "learning_rate": 3.3002662348519354e-05, "loss": 1.468, "step": 29921 }, { "epoch": 2.35, "learning_rate": 3.299492801510345e-05, "loss": 1.4391, "step": 29922 }, { "epoch": 2.35, "learning_rate": 3.298719447608741e-05, "loss": 1.4149, "step": 29923 }, { "epoch": 2.35, "learning_rate": 3.2979461731523706e-05, "loss": 1.4149, "step": 29924 }, { "epoch": 2.35, "learning_rate": 3.2971729781464914e-05, "loss": 1.4447, "step": 29925 }, { "epoch": 2.35, "learning_rate": 3.296399862596351e-05, "loss": 1.4861, "step": 29926 }, { "epoch": 2.35, "learning_rate": 3.2956268265071914e-05, "loss": 1.4497, "step": 29927 }, { "epoch": 2.35, "learning_rate": 3.2948538698842706e-05, "loss": 1.4539, "step": 29928 }, { "epoch": 2.35, "learning_rate": 3.2940809927328336e-05, "loss": 1.4752, "step": 29929 }, { "epoch": 2.35, "learning_rate": 3.293308195058123e-05, "loss": 1.4805, "step": 29930 }, { "epoch": 2.36, "learning_rate": 3.292535476865392e-05, "loss": 1.4354, "step": 29931 }, { "epoch": 2.36, "learning_rate": 3.291762838159882e-05, "loss": 1.4199, "step": 29932 }, { "epoch": 2.36, "learning_rate": 3.2909902789468446e-05, "loss": 1.439, "step": 29933 }, { "epoch": 2.36, "learning_rate": 3.290217799231517e-05, "loss": 1.4728, "step": 29934 }, { "epoch": 2.36, "learning_rate": 3.289445399019154e-05, "loss": 1.4729, "step": 29935 }, { "epoch": 2.36, "learning_rate": 3.2886730783149926e-05, "loss": 1.4502, "step": 29936 }, { "epoch": 2.36, "learning_rate": 3.287900837124275e-05, "loss": 1.4924, "step": 29937 }, { "epoch": 2.36, "learning_rate": 3.287128675452251e-05, "loss": 1.4457, "step": 29938 }, { "epoch": 2.36, "learning_rate": 3.286356593304161e-05, "loss": 1.481, "step": 29939 }, { "epoch": 2.36, "learning_rate": 3.285584590685244e-05, "loss": 1.5002, "step": 29940 }, { "epoch": 2.36, "learning_rate": 3.28481266760074e-05, "loss": 1.4355, "step": 29941 }, { "epoch": 2.36, "learning_rate": 3.284040824055897e-05, "loss": 1.5042, "step": 29942 }, { "epoch": 2.36, "learning_rate": 3.283269060055951e-05, "loss": 1.4211, "step": 29943 }, { "epoch": 2.36, "learning_rate": 3.2824973756061376e-05, "loss": 1.5006, "step": 29944 }, { "epoch": 2.36, "learning_rate": 3.2817257707117054e-05, "loss": 1.5371, "step": 29945 }, { "epoch": 2.36, "learning_rate": 3.280954245377889e-05, "loss": 1.413, "step": 29946 }, { "epoch": 2.36, "learning_rate": 3.280182799609922e-05, "loss": 1.4641, "step": 29947 }, { "epoch": 2.36, "learning_rate": 3.279411433413046e-05, "loss": 1.4268, "step": 29948 }, { "epoch": 2.36, "learning_rate": 3.2786401467925026e-05, "loss": 1.4964, "step": 29949 }, { "epoch": 2.36, "learning_rate": 3.2778689397535244e-05, "loss": 1.4732, "step": 29950 }, { "epoch": 2.36, "learning_rate": 3.277097812301344e-05, "loss": 1.4689, "step": 29951 }, { "epoch": 2.36, "learning_rate": 3.276326764441202e-05, "loss": 1.4448, "step": 29952 }, { "epoch": 2.36, "learning_rate": 3.275555796178333e-05, "loss": 1.458, "step": 29953 }, { "epoch": 2.36, "learning_rate": 3.274784907517967e-05, "loss": 1.4522, "step": 29954 }, { "epoch": 2.36, "learning_rate": 3.2740140984653424e-05, "loss": 1.4897, "step": 29955 }, { "epoch": 2.36, "learning_rate": 3.273243369025693e-05, "loss": 1.4824, "step": 29956 }, { "epoch": 2.36, "learning_rate": 3.27247271920425e-05, "loss": 1.444, "step": 29957 }, { "epoch": 2.36, "learning_rate": 3.27170214900624e-05, "loss": 1.4687, "step": 29958 }, { "epoch": 2.36, "learning_rate": 3.270931658436905e-05, "loss": 1.4343, "step": 29959 }, { "epoch": 2.36, "learning_rate": 3.270161247501472e-05, "loss": 1.4648, "step": 29960 }, { "epoch": 2.36, "learning_rate": 3.2693909162051674e-05, "loss": 1.4401, "step": 29961 }, { "epoch": 2.36, "learning_rate": 3.268620664553227e-05, "loss": 1.4096, "step": 29962 }, { "epoch": 2.36, "learning_rate": 3.2678504925508754e-05, "loss": 1.4585, "step": 29963 }, { "epoch": 2.36, "learning_rate": 3.26708040020335e-05, "loss": 1.4765, "step": 29964 }, { "epoch": 2.36, "learning_rate": 3.2663103875158673e-05, "loss": 1.4345, "step": 29965 }, { "epoch": 2.36, "learning_rate": 3.265540454493668e-05, "loss": 1.4648, "step": 29966 }, { "epoch": 2.36, "learning_rate": 3.2647706011419724e-05, "loss": 1.4396, "step": 29967 }, { "epoch": 2.36, "learning_rate": 3.264000827466004e-05, "loss": 1.4588, "step": 29968 }, { "epoch": 2.36, "learning_rate": 3.2632311334709995e-05, "loss": 1.4464, "step": 29969 }, { "epoch": 2.36, "learning_rate": 3.262461519162177e-05, "loss": 1.4282, "step": 29970 }, { "epoch": 2.36, "learning_rate": 3.261691984544759e-05, "loss": 1.4746, "step": 29971 }, { "epoch": 2.36, "learning_rate": 3.260922529623979e-05, "loss": 1.451, "step": 29972 }, { "epoch": 2.36, "learning_rate": 3.2601531544050584e-05, "loss": 1.5088, "step": 29973 }, { "epoch": 2.36, "learning_rate": 3.259383858893214e-05, "loss": 1.4357, "step": 29974 }, { "epoch": 2.36, "learning_rate": 3.258614643093679e-05, "loss": 1.449, "step": 29975 }, { "epoch": 2.36, "learning_rate": 3.25784550701167e-05, "loss": 1.4608, "step": 29976 }, { "epoch": 2.36, "learning_rate": 3.257076450652411e-05, "loss": 1.4821, "step": 29977 }, { "epoch": 2.36, "learning_rate": 3.256307474021118e-05, "loss": 1.4131, "step": 29978 }, { "epoch": 2.36, "learning_rate": 3.255538577123017e-05, "loss": 1.4273, "step": 29979 }, { "epoch": 2.36, "learning_rate": 3.254769759963332e-05, "loss": 1.4321, "step": 29980 }, { "epoch": 2.36, "learning_rate": 3.2540010225472795e-05, "loss": 1.4039, "step": 29981 }, { "epoch": 2.36, "learning_rate": 3.253232364880072e-05, "loss": 1.4308, "step": 29982 }, { "epoch": 2.36, "learning_rate": 3.2524637869669406e-05, "loss": 1.398, "step": 29983 }, { "epoch": 2.36, "learning_rate": 3.2516952888130955e-05, "loss": 1.4389, "step": 29984 }, { "epoch": 2.36, "learning_rate": 3.2509268704237534e-05, "loss": 1.4459, "step": 29985 }, { "epoch": 2.36, "learning_rate": 3.2501585318041376e-05, "loss": 1.4441, "step": 29986 }, { "epoch": 2.36, "learning_rate": 3.249390272959461e-05, "loss": 1.4671, "step": 29987 }, { "epoch": 2.36, "learning_rate": 3.248622093894936e-05, "loss": 1.4294, "step": 29988 }, { "epoch": 2.36, "learning_rate": 3.247853994615787e-05, "loss": 1.4503, "step": 29989 }, { "epoch": 2.36, "learning_rate": 3.247085975127223e-05, "loss": 1.4523, "step": 29990 }, { "epoch": 2.36, "learning_rate": 3.246318035434455e-05, "loss": 1.4455, "step": 29991 }, { "epoch": 2.36, "learning_rate": 3.245550175542706e-05, "loss": 1.4227, "step": 29992 }, { "epoch": 2.36, "learning_rate": 3.244782395457186e-05, "loss": 1.4413, "step": 29993 }, { "epoch": 2.36, "learning_rate": 3.244014695183101e-05, "loss": 1.4403, "step": 29994 }, { "epoch": 2.36, "learning_rate": 3.243247074725668e-05, "loss": 1.4698, "step": 29995 }, { "epoch": 2.36, "learning_rate": 3.242479534090104e-05, "loss": 1.5069, "step": 29996 }, { "epoch": 2.36, "learning_rate": 3.2417120732816165e-05, "loss": 1.4667, "step": 29997 }, { "epoch": 2.36, "learning_rate": 3.240944692305415e-05, "loss": 1.4484, "step": 29998 }, { "epoch": 2.36, "learning_rate": 3.240177391166705e-05, "loss": 1.4136, "step": 29999 }, { "epoch": 2.36, "learning_rate": 3.239410169870706e-05, "loss": 1.4584, "step": 30000 }, { "epoch": 2.36, "learning_rate": 3.2386430284226216e-05, "loss": 1.4815, "step": 30001 }, { "epoch": 2.36, "learning_rate": 3.237875966827657e-05, "loss": 1.4452, "step": 30002 }, { "epoch": 2.36, "learning_rate": 3.237108985091027e-05, "loss": 1.4112, "step": 30003 }, { "epoch": 2.36, "learning_rate": 3.2363420832179354e-05, "loss": 1.4124, "step": 30004 }, { "epoch": 2.36, "learning_rate": 3.235575261213586e-05, "loss": 1.4207, "step": 30005 }, { "epoch": 2.36, "learning_rate": 3.2348085190831924e-05, "loss": 1.4611, "step": 30006 }, { "epoch": 2.36, "learning_rate": 3.234041856831956e-05, "loss": 1.4553, "step": 30007 }, { "epoch": 2.36, "learning_rate": 3.233275274465077e-05, "loss": 1.4295, "step": 30008 }, { "epoch": 2.36, "learning_rate": 3.2325087719877714e-05, "loss": 1.51, "step": 30009 }, { "epoch": 2.36, "learning_rate": 3.231742349405234e-05, "loss": 1.4647, "step": 30010 }, { "epoch": 2.36, "learning_rate": 3.230976006722674e-05, "loss": 1.3984, "step": 30011 }, { "epoch": 2.36, "learning_rate": 3.230209743945289e-05, "loss": 1.4478, "step": 30012 }, { "epoch": 2.36, "learning_rate": 3.229443561078289e-05, "loss": 1.4273, "step": 30013 }, { "epoch": 2.36, "learning_rate": 3.228677458126872e-05, "loss": 1.4559, "step": 30014 }, { "epoch": 2.36, "learning_rate": 3.227911435096238e-05, "loss": 1.4974, "step": 30015 }, { "epoch": 2.36, "learning_rate": 3.227145491991585e-05, "loss": 1.4402, "step": 30016 }, { "epoch": 2.36, "learning_rate": 3.226379628818122e-05, "loss": 1.3773, "step": 30017 }, { "epoch": 2.36, "learning_rate": 3.225613845581045e-05, "loss": 1.4488, "step": 30018 }, { "epoch": 2.36, "learning_rate": 3.224848142285546e-05, "loss": 1.477, "step": 30019 }, { "epoch": 2.36, "learning_rate": 3.2240825189368364e-05, "loss": 1.4125, "step": 30020 }, { "epoch": 2.36, "learning_rate": 3.223316975540107e-05, "loss": 1.4531, "step": 30021 }, { "epoch": 2.36, "learning_rate": 3.2225515121005513e-05, "loss": 1.4329, "step": 30022 }, { "epoch": 2.36, "learning_rate": 3.221786128623377e-05, "loss": 1.4469, "step": 30023 }, { "epoch": 2.36, "learning_rate": 3.221020825113775e-05, "loss": 1.4896, "step": 30024 }, { "epoch": 2.36, "learning_rate": 3.220255601576937e-05, "loss": 1.4631, "step": 30025 }, { "epoch": 2.36, "learning_rate": 3.2194904580180635e-05, "loss": 1.4539, "step": 30026 }, { "epoch": 2.36, "learning_rate": 3.2187253944423516e-05, "loss": 1.5287, "step": 30027 }, { "epoch": 2.36, "learning_rate": 3.2179604108549946e-05, "loss": 1.4871, "step": 30028 }, { "epoch": 2.36, "learning_rate": 3.217195507261179e-05, "loss": 1.38, "step": 30029 }, { "epoch": 2.36, "learning_rate": 3.216430683666107e-05, "loss": 1.404, "step": 30030 }, { "epoch": 2.36, "learning_rate": 3.2156659400749696e-05, "loss": 1.4302, "step": 30031 }, { "epoch": 2.36, "learning_rate": 3.214901276492953e-05, "loss": 1.4526, "step": 30032 }, { "epoch": 2.36, "learning_rate": 3.214136692925256e-05, "loss": 1.4653, "step": 30033 }, { "epoch": 2.36, "learning_rate": 3.2133721893770685e-05, "loss": 1.4076, "step": 30034 }, { "epoch": 2.36, "learning_rate": 3.212607765853578e-05, "loss": 1.4454, "step": 30035 }, { "epoch": 2.36, "learning_rate": 3.211843422359974e-05, "loss": 1.4278, "step": 30036 }, { "epoch": 2.36, "learning_rate": 3.2110791589014494e-05, "loss": 1.4557, "step": 30037 }, { "epoch": 2.36, "learning_rate": 3.210314975483193e-05, "loss": 1.3849, "step": 30038 }, { "epoch": 2.36, "learning_rate": 3.209550872110389e-05, "loss": 1.4434, "step": 30039 }, { "epoch": 2.36, "learning_rate": 3.20878684878823e-05, "loss": 1.4686, "step": 30040 }, { "epoch": 2.36, "learning_rate": 3.208022905521902e-05, "loss": 1.4426, "step": 30041 }, { "epoch": 2.36, "learning_rate": 3.2072590423165864e-05, "loss": 1.4768, "step": 30042 }, { "epoch": 2.36, "learning_rate": 3.206495259177475e-05, "loss": 1.4569, "step": 30043 }, { "epoch": 2.36, "learning_rate": 3.205731556109758e-05, "loss": 1.5233, "step": 30044 }, { "epoch": 2.36, "learning_rate": 3.204967933118613e-05, "loss": 1.4277, "step": 30045 }, { "epoch": 2.36, "learning_rate": 3.2042043902092223e-05, "loss": 1.4101, "step": 30046 }, { "epoch": 2.36, "learning_rate": 3.2034409273867806e-05, "loss": 1.4801, "step": 30047 }, { "epoch": 2.36, "learning_rate": 3.2026775446564635e-05, "loss": 1.4438, "step": 30048 }, { "epoch": 2.36, "learning_rate": 3.2019142420234514e-05, "loss": 1.4578, "step": 30049 }, { "epoch": 2.36, "learning_rate": 3.201151019492936e-05, "loss": 1.4916, "step": 30050 }, { "epoch": 2.36, "learning_rate": 3.2003878770700934e-05, "loss": 1.4645, "step": 30051 }, { "epoch": 2.36, "learning_rate": 3.199624814760106e-05, "loss": 1.4221, "step": 30052 }, { "epoch": 2.36, "learning_rate": 3.1988618325681495e-05, "loss": 1.451, "step": 30053 }, { "epoch": 2.36, "learning_rate": 3.198098930499413e-05, "loss": 1.4466, "step": 30054 }, { "epoch": 2.36, "learning_rate": 3.197336108559072e-05, "loss": 1.3912, "step": 30055 }, { "epoch": 2.36, "learning_rate": 3.1965733667523025e-05, "loss": 1.4483, "step": 30056 }, { "epoch": 2.36, "learning_rate": 3.1958107050842835e-05, "loss": 1.4384, "step": 30057 }, { "epoch": 2.37, "learning_rate": 3.1950481235602024e-05, "loss": 1.4217, "step": 30058 }, { "epoch": 2.37, "learning_rate": 3.194285622185229e-05, "loss": 1.4148, "step": 30059 }, { "epoch": 2.37, "learning_rate": 3.1935232009645374e-05, "loss": 1.4301, "step": 30060 }, { "epoch": 2.37, "learning_rate": 3.192760859903311e-05, "loss": 1.4196, "step": 30061 }, { "epoch": 2.37, "learning_rate": 3.1919985990067245e-05, "loss": 1.3839, "step": 30062 }, { "epoch": 2.37, "learning_rate": 3.191236418279946e-05, "loss": 1.5227, "step": 30063 }, { "epoch": 2.37, "learning_rate": 3.190474317728161e-05, "loss": 1.4187, "step": 30064 }, { "epoch": 2.37, "learning_rate": 3.189712297356536e-05, "loss": 1.4032, "step": 30065 }, { "epoch": 2.37, "learning_rate": 3.188950357170244e-05, "loss": 1.444, "step": 30066 }, { "epoch": 2.37, "learning_rate": 3.188188497174466e-05, "loss": 1.465, "step": 30067 }, { "epoch": 2.37, "learning_rate": 3.1874267173743687e-05, "loss": 1.4527, "step": 30068 }, { "epoch": 2.37, "learning_rate": 3.186665017775126e-05, "loss": 1.4452, "step": 30069 }, { "epoch": 2.37, "learning_rate": 3.1859033983819056e-05, "loss": 1.4762, "step": 30070 }, { "epoch": 2.37, "learning_rate": 3.185141859199884e-05, "loss": 1.4907, "step": 30071 }, { "epoch": 2.37, "learning_rate": 3.1843804002342296e-05, "loss": 1.412, "step": 30072 }, { "epoch": 2.37, "learning_rate": 3.183619021490104e-05, "loss": 1.4581, "step": 30073 }, { "epoch": 2.37, "learning_rate": 3.182857722972693e-05, "loss": 1.4782, "step": 30074 }, { "epoch": 2.37, "learning_rate": 3.1820965046871554e-05, "loss": 1.4398, "step": 30075 }, { "epoch": 2.37, "learning_rate": 3.181335366638662e-05, "loss": 1.4169, "step": 30076 }, { "epoch": 2.37, "learning_rate": 3.180574308832375e-05, "loss": 1.4382, "step": 30077 }, { "epoch": 2.37, "learning_rate": 3.1798133312734695e-05, "loss": 1.4485, "step": 30078 }, { "epoch": 2.37, "learning_rate": 3.1790524339671093e-05, "loss": 1.4886, "step": 30079 }, { "epoch": 2.37, "learning_rate": 3.178291616918456e-05, "loss": 1.4439, "step": 30080 }, { "epoch": 2.37, "learning_rate": 3.177530880132682e-05, "loss": 1.4703, "step": 30081 }, { "epoch": 2.37, "learning_rate": 3.176770223614949e-05, "loss": 1.4405, "step": 30082 }, { "epoch": 2.37, "learning_rate": 3.176009647370419e-05, "loss": 1.4365, "step": 30083 }, { "epoch": 2.37, "learning_rate": 3.175249151404261e-05, "loss": 1.4405, "step": 30084 }, { "epoch": 2.37, "learning_rate": 3.1744887357216365e-05, "loss": 1.435, "step": 30085 }, { "epoch": 2.37, "learning_rate": 3.173728400327704e-05, "loss": 1.4877, "step": 30086 }, { "epoch": 2.37, "learning_rate": 3.1729681452276336e-05, "loss": 1.4938, "step": 30087 }, { "epoch": 2.37, "learning_rate": 3.172207970426582e-05, "loss": 1.4546, "step": 30088 }, { "epoch": 2.37, "learning_rate": 3.171447875929707e-05, "loss": 1.4938, "step": 30089 }, { "epoch": 2.37, "learning_rate": 3.170687861742173e-05, "loss": 1.4522, "step": 30090 }, { "epoch": 2.37, "learning_rate": 3.169927927869145e-05, "loss": 1.4736, "step": 30091 }, { "epoch": 2.37, "learning_rate": 3.1691680743157786e-05, "loss": 1.4446, "step": 30092 }, { "epoch": 2.37, "learning_rate": 3.168408301087232e-05, "loss": 1.4296, "step": 30093 }, { "epoch": 2.37, "learning_rate": 3.167648608188659e-05, "loss": 1.4417, "step": 30094 }, { "epoch": 2.37, "learning_rate": 3.166888995625227e-05, "loss": 1.4744, "step": 30095 }, { "epoch": 2.37, "learning_rate": 3.1661294634020876e-05, "loss": 1.4007, "step": 30096 }, { "epoch": 2.37, "learning_rate": 3.165370011524396e-05, "loss": 1.4252, "step": 30097 }, { "epoch": 2.37, "learning_rate": 3.164610639997315e-05, "loss": 1.465, "step": 30098 }, { "epoch": 2.37, "learning_rate": 3.163851348825996e-05, "loss": 1.4426, "step": 30099 }, { "epoch": 2.37, "learning_rate": 3.1630921380155915e-05, "loss": 1.4414, "step": 30100 }, { "epoch": 2.37, "learning_rate": 3.1623330075712624e-05, "loss": 1.4189, "step": 30101 }, { "epoch": 2.37, "learning_rate": 3.16157395749816e-05, "loss": 1.522, "step": 30102 }, { "epoch": 2.37, "learning_rate": 3.160814987801433e-05, "loss": 1.4792, "step": 30103 }, { "epoch": 2.37, "learning_rate": 3.160056098486239e-05, "loss": 1.4939, "step": 30104 }, { "epoch": 2.37, "learning_rate": 3.1592972895577345e-05, "loss": 1.4356, "step": 30105 }, { "epoch": 2.37, "learning_rate": 3.158538561021066e-05, "loss": 1.4809, "step": 30106 }, { "epoch": 2.37, "learning_rate": 3.1577799128813835e-05, "loss": 1.442, "step": 30107 }, { "epoch": 2.37, "learning_rate": 3.157021345143844e-05, "loss": 1.4407, "step": 30108 }, { "epoch": 2.37, "learning_rate": 3.156262857813594e-05, "loss": 1.4633, "step": 30109 }, { "epoch": 2.37, "learning_rate": 3.155504450895784e-05, "loss": 1.4213, "step": 30110 }, { "epoch": 2.37, "learning_rate": 3.154746124395556e-05, "loss": 1.4718, "step": 30111 }, { "epoch": 2.37, "learning_rate": 3.15398787831807e-05, "loss": 1.4336, "step": 30112 }, { "epoch": 2.37, "learning_rate": 3.153229712668471e-05, "loss": 1.3993, "step": 30113 }, { "epoch": 2.37, "learning_rate": 3.1524716274519e-05, "loss": 1.4291, "step": 30114 }, { "epoch": 2.37, "learning_rate": 3.151713622673511e-05, "loss": 1.4359, "step": 30115 }, { "epoch": 2.37, "learning_rate": 3.1509556983384496e-05, "loss": 1.4625, "step": 30116 }, { "epoch": 2.37, "learning_rate": 3.150197854451856e-05, "loss": 1.4669, "step": 30117 }, { "epoch": 2.37, "learning_rate": 3.149440091018883e-05, "loss": 1.4418, "step": 30118 }, { "epoch": 2.37, "learning_rate": 3.1486824080446734e-05, "loss": 1.4941, "step": 30119 }, { "epoch": 2.37, "learning_rate": 3.1479248055343655e-05, "loss": 1.425, "step": 30120 }, { "epoch": 2.37, "learning_rate": 3.147167283493107e-05, "loss": 1.4341, "step": 30121 }, { "epoch": 2.37, "learning_rate": 3.146409841926046e-05, "loss": 1.468, "step": 30122 }, { "epoch": 2.37, "learning_rate": 3.1456524808383205e-05, "loss": 1.4392, "step": 30123 }, { "epoch": 2.37, "learning_rate": 3.1448952002350705e-05, "loss": 1.4508, "step": 30124 }, { "epoch": 2.37, "learning_rate": 3.1441380001214414e-05, "loss": 1.452, "step": 30125 }, { "epoch": 2.37, "learning_rate": 3.1433808805025736e-05, "loss": 1.4334, "step": 30126 }, { "epoch": 2.37, "learning_rate": 3.142623841383608e-05, "loss": 1.4616, "step": 30127 }, { "epoch": 2.37, "learning_rate": 3.141866882769678e-05, "loss": 1.4203, "step": 30128 }, { "epoch": 2.37, "learning_rate": 3.141110004665933e-05, "loss": 1.4581, "step": 30129 }, { "epoch": 2.37, "learning_rate": 3.1403532070775064e-05, "loss": 1.477, "step": 30130 }, { "epoch": 2.37, "learning_rate": 3.139596490009531e-05, "loss": 1.4836, "step": 30131 }, { "epoch": 2.37, "learning_rate": 3.138839853467156e-05, "loss": 1.4636, "step": 30132 }, { "epoch": 2.37, "learning_rate": 3.138083297455512e-05, "loss": 1.4412, "step": 30133 }, { "epoch": 2.37, "learning_rate": 3.137326821979733e-05, "loss": 1.4536, "step": 30134 }, { "epoch": 2.37, "learning_rate": 3.136570427044963e-05, "loss": 1.485, "step": 30135 }, { "epoch": 2.37, "learning_rate": 3.135814112656328e-05, "loss": 1.4007, "step": 30136 }, { "epoch": 2.37, "learning_rate": 3.1350578788189735e-05, "loss": 1.3946, "step": 30137 }, { "epoch": 2.37, "learning_rate": 3.134301725538024e-05, "loss": 1.4404, "step": 30138 }, { "epoch": 2.37, "learning_rate": 3.1335456528186196e-05, "loss": 1.4095, "step": 30139 }, { "epoch": 2.37, "learning_rate": 3.132789660665894e-05, "loss": 1.4704, "step": 30140 }, { "epoch": 2.37, "learning_rate": 3.132033749084973e-05, "loss": 1.4551, "step": 30141 }, { "epoch": 2.37, "learning_rate": 3.131277918080998e-05, "loss": 1.4318, "step": 30142 }, { "epoch": 2.37, "learning_rate": 3.130522167659095e-05, "loss": 1.4937, "step": 30143 }, { "epoch": 2.37, "learning_rate": 3.129766497824393e-05, "loss": 1.4593, "step": 30144 }, { "epoch": 2.37, "learning_rate": 3.1290109085820306e-05, "loss": 1.4738, "step": 30145 }, { "epoch": 2.37, "learning_rate": 3.1282553999371324e-05, "loss": 1.4438, "step": 30146 }, { "epoch": 2.37, "learning_rate": 3.12749997189483e-05, "loss": 1.4292, "step": 30147 }, { "epoch": 2.37, "learning_rate": 3.126744624460245e-05, "loss": 1.4872, "step": 30148 }, { "epoch": 2.37, "learning_rate": 3.125989357638516e-05, "loss": 1.425, "step": 30149 }, { "epoch": 2.37, "learning_rate": 3.125234171434769e-05, "loss": 1.4495, "step": 30150 }, { "epoch": 2.37, "learning_rate": 3.124479065854124e-05, "loss": 1.3968, "step": 30151 }, { "epoch": 2.37, "learning_rate": 3.123724040901711e-05, "loss": 1.4513, "step": 30152 }, { "epoch": 2.37, "learning_rate": 3.122969096582664e-05, "loss": 1.4944, "step": 30153 }, { "epoch": 2.37, "learning_rate": 3.1222142329021006e-05, "loss": 1.4609, "step": 30154 }, { "epoch": 2.37, "learning_rate": 3.121459449865144e-05, "loss": 1.4837, "step": 30155 }, { "epoch": 2.37, "learning_rate": 3.120704747476929e-05, "loss": 1.4343, "step": 30156 }, { "epoch": 2.37, "learning_rate": 3.11995012574257e-05, "loss": 1.4582, "step": 30157 }, { "epoch": 2.37, "learning_rate": 3.1191955846671914e-05, "loss": 1.4338, "step": 30158 }, { "epoch": 2.37, "learning_rate": 3.1184411242559224e-05, "loss": 1.4332, "step": 30159 }, { "epoch": 2.37, "learning_rate": 3.117686744513882e-05, "loss": 1.4568, "step": 30160 }, { "epoch": 2.37, "learning_rate": 3.116932445446187e-05, "loss": 1.5005, "step": 30161 }, { "epoch": 2.37, "learning_rate": 3.116178227057967e-05, "loss": 1.4095, "step": 30162 }, { "epoch": 2.37, "learning_rate": 3.115424089354337e-05, "loss": 1.499, "step": 30163 }, { "epoch": 2.37, "learning_rate": 3.1146700323404204e-05, "loss": 1.4346, "step": 30164 }, { "epoch": 2.37, "learning_rate": 3.113916056021332e-05, "loss": 1.4576, "step": 30165 }, { "epoch": 2.37, "learning_rate": 3.1131621604021976e-05, "loss": 1.4585, "step": 30166 }, { "epoch": 2.37, "learning_rate": 3.11240834548813e-05, "loss": 1.4523, "step": 30167 }, { "epoch": 2.37, "learning_rate": 3.111654611284252e-05, "loss": 1.3779, "step": 30168 }, { "epoch": 2.37, "learning_rate": 3.110900957795674e-05, "loss": 1.4553, "step": 30169 }, { "epoch": 2.37, "learning_rate": 3.1101473850275227e-05, "loss": 1.4228, "step": 30170 }, { "epoch": 2.37, "learning_rate": 3.1093938929849094e-05, "loss": 1.416, "step": 30171 }, { "epoch": 2.37, "learning_rate": 3.108640481672945e-05, "loss": 1.4394, "step": 30172 }, { "epoch": 2.37, "learning_rate": 3.107887151096755e-05, "loss": 1.5123, "step": 30173 }, { "epoch": 2.37, "learning_rate": 3.107133901261448e-05, "loss": 1.444, "step": 30174 }, { "epoch": 2.37, "learning_rate": 3.106380732172133e-05, "loss": 1.5257, "step": 30175 }, { "epoch": 2.37, "learning_rate": 3.105627643833935e-05, "loss": 1.3851, "step": 30176 }, { "epoch": 2.37, "learning_rate": 3.104874636251962e-05, "loss": 1.45, "step": 30177 }, { "epoch": 2.37, "learning_rate": 3.1041217094313205e-05, "loss": 1.4447, "step": 30178 }, { "epoch": 2.37, "learning_rate": 3.1033688633771337e-05, "loss": 1.4623, "step": 30179 }, { "epoch": 2.37, "learning_rate": 3.1026160980945057e-05, "loss": 1.4921, "step": 30180 }, { "epoch": 2.37, "learning_rate": 3.1018634135885485e-05, "loss": 1.4403, "step": 30181 }, { "epoch": 2.37, "learning_rate": 3.10111080986437e-05, "loss": 1.4217, "step": 30182 }, { "epoch": 2.37, "learning_rate": 3.1003582869270835e-05, "loss": 1.4345, "step": 30183 }, { "epoch": 2.37, "learning_rate": 3.099605844781799e-05, "loss": 1.481, "step": 30184 }, { "epoch": 2.37, "learning_rate": 3.0988534834336204e-05, "loss": 1.4455, "step": 30185 }, { "epoch": 2.38, "learning_rate": 3.098101202887665e-05, "loss": 1.4388, "step": 30186 }, { "epoch": 2.38, "learning_rate": 3.0973490031490324e-05, "loss": 1.4912, "step": 30187 }, { "epoch": 2.38, "learning_rate": 3.0965968842228326e-05, "loss": 1.3943, "step": 30188 }, { "epoch": 2.38, "learning_rate": 3.095844846114166e-05, "loss": 1.4519, "step": 30189 }, { "epoch": 2.38, "learning_rate": 3.095092888828149e-05, "loss": 1.422, "step": 30190 }, { "epoch": 2.38, "learning_rate": 3.094341012369881e-05, "loss": 1.4948, "step": 30191 }, { "epoch": 2.38, "learning_rate": 3.0935892167444625e-05, "loss": 1.4586, "step": 30192 }, { "epoch": 2.38, "learning_rate": 3.092837501957009e-05, "loss": 1.4363, "step": 30193 }, { "epoch": 2.38, "learning_rate": 3.092085868012616e-05, "loss": 1.4525, "step": 30194 }, { "epoch": 2.38, "learning_rate": 3.091334314916386e-05, "loss": 1.4861, "step": 30195 }, { "epoch": 2.38, "learning_rate": 3.090582842673427e-05, "loss": 1.4428, "step": 30196 }, { "epoch": 2.38, "learning_rate": 3.08983145128884e-05, "loss": 1.4173, "step": 30197 }, { "epoch": 2.38, "learning_rate": 3.0890801407677176e-05, "loss": 1.4776, "step": 30198 }, { "epoch": 2.38, "learning_rate": 3.0883289111151715e-05, "loss": 1.4453, "step": 30199 }, { "epoch": 2.38, "learning_rate": 3.087577762336301e-05, "loss": 1.4115, "step": 30200 }, { "epoch": 2.38, "learning_rate": 3.0868266944362045e-05, "loss": 1.4322, "step": 30201 }, { "epoch": 2.38, "learning_rate": 3.086075707419976e-05, "loss": 1.4403, "step": 30202 }, { "epoch": 2.38, "learning_rate": 3.085324801292723e-05, "loss": 1.4329, "step": 30203 }, { "epoch": 2.38, "learning_rate": 3.084573976059539e-05, "loss": 1.4667, "step": 30204 }, { "epoch": 2.38, "learning_rate": 3.083823231725522e-05, "loss": 1.4693, "step": 30205 }, { "epoch": 2.38, "learning_rate": 3.0830725682957656e-05, "loss": 1.4855, "step": 30206 }, { "epoch": 2.38, "learning_rate": 3.0823219857753754e-05, "loss": 1.4749, "step": 30207 }, { "epoch": 2.38, "learning_rate": 3.0815714841694406e-05, "loss": 1.4065, "step": 30208 }, { "epoch": 2.38, "learning_rate": 3.080821063483055e-05, "loss": 1.5156, "step": 30209 }, { "epoch": 2.38, "learning_rate": 3.0800707237213214e-05, "loss": 1.455, "step": 30210 }, { "epoch": 2.38, "learning_rate": 3.0793204648893285e-05, "loss": 1.4469, "step": 30211 }, { "epoch": 2.38, "learning_rate": 3.0785702869921686e-05, "loss": 1.4636, "step": 30212 }, { "epoch": 2.38, "learning_rate": 3.0778201900349415e-05, "loss": 1.4472, "step": 30213 }, { "epoch": 2.38, "learning_rate": 3.077070174022731e-05, "loss": 1.4168, "step": 30214 }, { "epoch": 2.38, "learning_rate": 3.0763202389606386e-05, "loss": 1.4327, "step": 30215 }, { "epoch": 2.38, "learning_rate": 3.075570384853748e-05, "loss": 1.4954, "step": 30216 }, { "epoch": 2.38, "learning_rate": 3.074820611707159e-05, "loss": 1.4992, "step": 30217 }, { "epoch": 2.38, "learning_rate": 3.074070919525956e-05, "loss": 1.4401, "step": 30218 }, { "epoch": 2.38, "learning_rate": 3.073321308315227e-05, "loss": 1.4419, "step": 30219 }, { "epoch": 2.38, "learning_rate": 3.072571778080067e-05, "loss": 1.4638, "step": 30220 }, { "epoch": 2.38, "learning_rate": 3.0718223288255635e-05, "loss": 1.4105, "step": 30221 }, { "epoch": 2.38, "learning_rate": 3.071072960556804e-05, "loss": 1.4225, "step": 30222 }, { "epoch": 2.38, "learning_rate": 3.070323673278872e-05, "loss": 1.4439, "step": 30223 }, { "epoch": 2.38, "learning_rate": 3.0695744669968636e-05, "loss": 1.4658, "step": 30224 }, { "epoch": 2.38, "learning_rate": 3.068825341715861e-05, "loss": 1.4463, "step": 30225 }, { "epoch": 2.38, "learning_rate": 3.068076297440945e-05, "loss": 1.41, "step": 30226 }, { "epoch": 2.38, "learning_rate": 3.0673273341772105e-05, "loss": 1.417, "step": 30227 }, { "epoch": 2.38, "learning_rate": 3.066578451929739e-05, "loss": 1.4746, "step": 30228 }, { "epoch": 2.38, "learning_rate": 3.06582965070361e-05, "loss": 1.4222, "step": 30229 }, { "epoch": 2.38, "learning_rate": 3.065080930503912e-05, "loss": 1.4422, "step": 30230 }, { "epoch": 2.38, "learning_rate": 3.0643322913357327e-05, "loss": 1.4936, "step": 30231 }, { "epoch": 2.38, "learning_rate": 3.063583733204149e-05, "loss": 1.4262, "step": 30232 }, { "epoch": 2.38, "learning_rate": 3.062835256114242e-05, "loss": 1.4622, "step": 30233 }, { "epoch": 2.38, "learning_rate": 3.062086860071101e-05, "loss": 1.4039, "step": 30234 }, { "epoch": 2.38, "learning_rate": 3.061338545079801e-05, "loss": 1.4578, "step": 30235 }, { "epoch": 2.38, "learning_rate": 3.0605903111454194e-05, "loss": 1.5228, "step": 30236 }, { "epoch": 2.38, "learning_rate": 3.059842158273047e-05, "loss": 1.4634, "step": 30237 }, { "epoch": 2.38, "learning_rate": 3.0590940864677546e-05, "loss": 1.485, "step": 30238 }, { "epoch": 2.38, "learning_rate": 3.058346095734622e-05, "loss": 1.4553, "step": 30239 }, { "epoch": 2.38, "learning_rate": 3.057598186078732e-05, "loss": 1.3955, "step": 30240 }, { "epoch": 2.38, "learning_rate": 3.056850357505161e-05, "loss": 1.3858, "step": 30241 }, { "epoch": 2.38, "learning_rate": 3.056102610018985e-05, "loss": 1.4939, "step": 30242 }, { "epoch": 2.38, "learning_rate": 3.055354943625276e-05, "loss": 1.4576, "step": 30243 }, { "epoch": 2.38, "learning_rate": 3.0546073583291216e-05, "loss": 1.4392, "step": 30244 }, { "epoch": 2.38, "learning_rate": 3.0538598541355894e-05, "loss": 1.4624, "step": 30245 }, { "epoch": 2.38, "learning_rate": 3.053112431049752e-05, "loss": 1.4493, "step": 30246 }, { "epoch": 2.38, "learning_rate": 3.05236508907669e-05, "loss": 1.4132, "step": 30247 }, { "epoch": 2.38, "learning_rate": 3.051617828221478e-05, "loss": 1.4583, "step": 30248 }, { "epoch": 2.38, "learning_rate": 3.0508706484891893e-05, "loss": 1.4189, "step": 30249 }, { "epoch": 2.38, "learning_rate": 3.0501235498848898e-05, "loss": 1.4466, "step": 30250 }, { "epoch": 2.38, "learning_rate": 3.0493765324136605e-05, "loss": 1.4313, "step": 30251 }, { "epoch": 2.38, "learning_rate": 3.0486295960805707e-05, "loss": 1.4079, "step": 30252 }, { "epoch": 2.38, "learning_rate": 3.0478827408906847e-05, "loss": 1.3629, "step": 30253 }, { "epoch": 2.38, "learning_rate": 3.0471359668490852e-05, "loss": 1.4312, "step": 30254 }, { "epoch": 2.38, "learning_rate": 3.046389273960835e-05, "loss": 1.4627, "step": 30255 }, { "epoch": 2.38, "learning_rate": 3.0456426622310027e-05, "loss": 1.4084, "step": 30256 }, { "epoch": 2.38, "learning_rate": 3.044896131664663e-05, "loss": 1.4497, "step": 30257 }, { "epoch": 2.38, "learning_rate": 3.0441496822668802e-05, "loss": 1.4871, "step": 30258 }, { "epoch": 2.38, "learning_rate": 3.0434033140427238e-05, "loss": 1.4195, "step": 30259 }, { "epoch": 2.38, "learning_rate": 3.0426570269972577e-05, "loss": 1.4159, "step": 30260 }, { "epoch": 2.38, "learning_rate": 3.0419108211355547e-05, "loss": 1.4809, "step": 30261 }, { "epoch": 2.38, "learning_rate": 3.041164696462674e-05, "loss": 1.4558, "step": 30262 }, { "epoch": 2.38, "learning_rate": 3.04041865298369e-05, "loss": 1.45, "step": 30263 }, { "epoch": 2.38, "learning_rate": 3.03967269070366e-05, "loss": 1.4377, "step": 30264 }, { "epoch": 2.38, "learning_rate": 3.0389268096276553e-05, "loss": 1.4573, "step": 30265 }, { "epoch": 2.38, "learning_rate": 3.0381810097607383e-05, "loss": 1.437, "step": 30266 }, { "epoch": 2.38, "learning_rate": 3.0374352911079653e-05, "loss": 1.4494, "step": 30267 }, { "epoch": 2.38, "learning_rate": 3.0366896536744102e-05, "loss": 1.3863, "step": 30268 }, { "epoch": 2.38, "learning_rate": 3.0359440974651304e-05, "loss": 1.4882, "step": 30269 }, { "epoch": 2.38, "learning_rate": 3.0351986224851843e-05, "loss": 1.4129, "step": 30270 }, { "epoch": 2.38, "learning_rate": 3.0344532287396407e-05, "loss": 1.4676, "step": 30271 }, { "epoch": 2.38, "learning_rate": 3.0337079162335552e-05, "loss": 1.4913, "step": 30272 }, { "epoch": 2.38, "learning_rate": 3.0329626849719864e-05, "loss": 1.3802, "step": 30273 }, { "epoch": 2.38, "learning_rate": 3.032217534960001e-05, "loss": 1.4182, "step": 30274 }, { "epoch": 2.38, "learning_rate": 3.031472466202655e-05, "loss": 1.4951, "step": 30275 }, { "epoch": 2.38, "learning_rate": 3.030727478705005e-05, "loss": 1.4778, "step": 30276 }, { "epoch": 2.38, "learning_rate": 3.0299825724721033e-05, "loss": 1.4363, "step": 30277 }, { "epoch": 2.38, "learning_rate": 3.0292377475090208e-05, "loss": 1.4555, "step": 30278 }, { "epoch": 2.38, "learning_rate": 3.028493003820808e-05, "loss": 1.4448, "step": 30279 }, { "epoch": 2.38, "learning_rate": 3.0277483414125236e-05, "loss": 1.4791, "step": 30280 }, { "epoch": 2.38, "learning_rate": 3.0270037602892144e-05, "loss": 1.4504, "step": 30281 }, { "epoch": 2.38, "learning_rate": 3.0262592604559482e-05, "loss": 1.474, "step": 30282 }, { "epoch": 2.38, "learning_rate": 3.0255148419177726e-05, "loss": 1.4662, "step": 30283 }, { "epoch": 2.38, "learning_rate": 3.0247705046797404e-05, "loss": 1.5009, "step": 30284 }, { "epoch": 2.38, "learning_rate": 3.0240262487469123e-05, "loss": 1.4718, "step": 30285 }, { "epoch": 2.38, "learning_rate": 3.0232820741243365e-05, "loss": 1.4593, "step": 30286 }, { "epoch": 2.38, "learning_rate": 3.0225379808170614e-05, "loss": 1.451, "step": 30287 }, { "epoch": 2.38, "learning_rate": 3.0217939688301484e-05, "loss": 1.4914, "step": 30288 }, { "epoch": 2.38, "learning_rate": 3.0210500381686437e-05, "loss": 1.5017, "step": 30289 }, { "epoch": 2.38, "learning_rate": 3.0203061888375947e-05, "loss": 1.4566, "step": 30290 }, { "epoch": 2.38, "learning_rate": 3.0195624208420603e-05, "loss": 1.4902, "step": 30291 }, { "epoch": 2.38, "learning_rate": 3.0188187341870857e-05, "loss": 1.4375, "step": 30292 }, { "epoch": 2.38, "learning_rate": 3.018075128877716e-05, "loss": 1.4194, "step": 30293 }, { "epoch": 2.38, "learning_rate": 3.0173316049190044e-05, "loss": 1.4392, "step": 30294 }, { "epoch": 2.38, "learning_rate": 3.0165881623160015e-05, "loss": 1.4657, "step": 30295 }, { "epoch": 2.38, "learning_rate": 3.0158448010737536e-05, "loss": 1.4202, "step": 30296 }, { "epoch": 2.38, "learning_rate": 3.015101521197301e-05, "loss": 1.4731, "step": 30297 }, { "epoch": 2.38, "learning_rate": 3.014358322691699e-05, "loss": 1.4498, "step": 30298 }, { "epoch": 2.38, "learning_rate": 3.0136152055619893e-05, "loss": 1.4217, "step": 30299 }, { "epoch": 2.38, "learning_rate": 3.01287216981322e-05, "loss": 1.456, "step": 30300 }, { "epoch": 2.38, "learning_rate": 3.0121292154504272e-05, "loss": 1.4692, "step": 30301 }, { "epoch": 2.38, "learning_rate": 3.0113863424786666e-05, "loss": 1.4788, "step": 30302 }, { "epoch": 2.38, "learning_rate": 3.0106435509029775e-05, "loss": 1.4352, "step": 30303 }, { "epoch": 2.38, "learning_rate": 3.0099008407283974e-05, "loss": 1.4876, "step": 30304 }, { "epoch": 2.38, "learning_rate": 3.0091582119599794e-05, "loss": 1.4741, "step": 30305 }, { "epoch": 2.38, "learning_rate": 3.0084156646027576e-05, "loss": 1.4598, "step": 30306 }, { "epoch": 2.38, "learning_rate": 3.007673198661774e-05, "loss": 1.4078, "step": 30307 }, { "epoch": 2.38, "learning_rate": 3.0069308141420738e-05, "loss": 1.484, "step": 30308 }, { "epoch": 2.38, "learning_rate": 3.0061885110486927e-05, "loss": 1.4521, "step": 30309 }, { "epoch": 2.38, "learning_rate": 3.0054462893866765e-05, "loss": 1.4681, "step": 30310 }, { "epoch": 2.38, "learning_rate": 3.004704149161056e-05, "loss": 1.4473, "step": 30311 }, { "epoch": 2.38, "learning_rate": 3.0039620903768797e-05, "loss": 1.4719, "step": 30312 }, { "epoch": 2.39, "learning_rate": 3.0032201130391808e-05, "loss": 1.4486, "step": 30313 }, { "epoch": 2.39, "learning_rate": 3.0024782171529927e-05, "loss": 1.5076, "step": 30314 }, { "epoch": 2.39, "learning_rate": 3.0017364027233593e-05, "loss": 1.465, "step": 30315 }, { "epoch": 2.39, "learning_rate": 3.0009946697553165e-05, "loss": 1.4656, "step": 30316 }, { "epoch": 2.39, "learning_rate": 3.0002530182538976e-05, "loss": 1.5076, "step": 30317 }, { "epoch": 2.39, "learning_rate": 2.9995114482241344e-05, "loss": 1.462, "step": 30318 }, { "epoch": 2.39, "learning_rate": 2.99876995967107e-05, "loss": 1.471, "step": 30319 }, { "epoch": 2.39, "learning_rate": 2.9980285525997354e-05, "loss": 1.5038, "step": 30320 }, { "epoch": 2.39, "learning_rate": 2.99728722701516e-05, "loss": 1.4427, "step": 30321 }, { "epoch": 2.39, "learning_rate": 2.9965459829223843e-05, "loss": 1.4357, "step": 30322 }, { "epoch": 2.39, "learning_rate": 2.9958048203264378e-05, "loss": 1.4744, "step": 30323 }, { "epoch": 2.39, "learning_rate": 2.9950637392323468e-05, "loss": 1.4726, "step": 30324 }, { "epoch": 2.39, "learning_rate": 2.9943227396451486e-05, "loss": 1.4229, "step": 30325 }, { "epoch": 2.39, "learning_rate": 2.9935818215698775e-05, "loss": 1.417, "step": 30326 }, { "epoch": 2.39, "learning_rate": 2.9928409850115613e-05, "loss": 1.4996, "step": 30327 }, { "epoch": 2.39, "learning_rate": 2.9921002299752243e-05, "loss": 1.4962, "step": 30328 }, { "epoch": 2.39, "learning_rate": 2.991359556465904e-05, "loss": 1.4539, "step": 30329 }, { "epoch": 2.39, "learning_rate": 2.9906189644886252e-05, "loss": 1.4527, "step": 30330 }, { "epoch": 2.39, "learning_rate": 2.9898784540484116e-05, "loss": 1.4056, "step": 30331 }, { "epoch": 2.39, "learning_rate": 2.989138025150301e-05, "loss": 1.4887, "step": 30332 }, { "epoch": 2.39, "learning_rate": 2.9883976777993147e-05, "loss": 1.4742, "step": 30333 }, { "epoch": 2.39, "learning_rate": 2.9876574120004782e-05, "loss": 1.4879, "step": 30334 }, { "epoch": 2.39, "learning_rate": 2.986917227758816e-05, "loss": 1.4542, "step": 30335 }, { "epoch": 2.39, "learning_rate": 2.9861771250793608e-05, "loss": 1.4774, "step": 30336 }, { "epoch": 2.39, "learning_rate": 2.9854371039671338e-05, "loss": 1.4016, "step": 30337 }, { "epoch": 2.39, "learning_rate": 2.984697164427154e-05, "loss": 1.4235, "step": 30338 }, { "epoch": 2.39, "learning_rate": 2.9839573064644522e-05, "loss": 1.465, "step": 30339 }, { "epoch": 2.39, "learning_rate": 2.9832175300840482e-05, "loss": 1.4616, "step": 30340 }, { "epoch": 2.39, "learning_rate": 2.982477835290968e-05, "loss": 1.5043, "step": 30341 }, { "epoch": 2.39, "learning_rate": 2.981738222090227e-05, "loss": 1.4862, "step": 30342 }, { "epoch": 2.39, "learning_rate": 2.9809986904868566e-05, "loss": 1.4828, "step": 30343 }, { "epoch": 2.39, "learning_rate": 2.980259240485871e-05, "loss": 1.4205, "step": 30344 }, { "epoch": 2.39, "learning_rate": 2.9795198720922898e-05, "loss": 1.4295, "step": 30345 }, { "epoch": 2.39, "learning_rate": 2.9787805853111384e-05, "loss": 1.5057, "step": 30346 }, { "epoch": 2.39, "learning_rate": 2.9780413801474334e-05, "loss": 1.4594, "step": 30347 }, { "epoch": 2.39, "learning_rate": 2.977302256606187e-05, "loss": 1.4487, "step": 30348 }, { "epoch": 2.39, "learning_rate": 2.9765632146924305e-05, "loss": 1.4079, "step": 30349 }, { "epoch": 2.39, "learning_rate": 2.9758242544111733e-05, "loss": 1.4711, "step": 30350 }, { "epoch": 2.39, "learning_rate": 2.975085375767431e-05, "loss": 1.4449, "step": 30351 }, { "epoch": 2.39, "learning_rate": 2.9743465787662245e-05, "loss": 1.4578, "step": 30352 }, { "epoch": 2.39, "learning_rate": 2.9736078634125705e-05, "loss": 1.442, "step": 30353 }, { "epoch": 2.39, "learning_rate": 2.9728692297114825e-05, "loss": 1.4858, "step": 30354 }, { "epoch": 2.39, "learning_rate": 2.9721306776679705e-05, "loss": 1.5023, "step": 30355 }, { "epoch": 2.39, "learning_rate": 2.971392207287055e-05, "loss": 1.4644, "step": 30356 }, { "epoch": 2.39, "learning_rate": 2.9706538185737505e-05, "loss": 1.415, "step": 30357 }, { "epoch": 2.39, "learning_rate": 2.9699155115330697e-05, "loss": 1.4656, "step": 30358 }, { "epoch": 2.39, "learning_rate": 2.9691772861700203e-05, "loss": 1.4601, "step": 30359 }, { "epoch": 2.39, "learning_rate": 2.9684391424896197e-05, "loss": 1.4508, "step": 30360 }, { "epoch": 2.39, "learning_rate": 2.9677010804968794e-05, "loss": 1.4218, "step": 30361 }, { "epoch": 2.39, "learning_rate": 2.9669631001968047e-05, "loss": 1.5003, "step": 30362 }, { "epoch": 2.39, "learning_rate": 2.966225201594414e-05, "loss": 1.4119, "step": 30363 }, { "epoch": 2.39, "learning_rate": 2.9654873846947142e-05, "loss": 1.4726, "step": 30364 }, { "epoch": 2.39, "learning_rate": 2.9647496495027084e-05, "loss": 1.4519, "step": 30365 }, { "epoch": 2.39, "learning_rate": 2.964011996023416e-05, "loss": 1.4684, "step": 30366 }, { "epoch": 2.39, "learning_rate": 2.9632744242618394e-05, "loss": 1.4803, "step": 30367 }, { "epoch": 2.39, "learning_rate": 2.9625369342229833e-05, "loss": 1.4258, "step": 30368 }, { "epoch": 2.39, "learning_rate": 2.9617995259118617e-05, "loss": 1.499, "step": 30369 }, { "epoch": 2.39, "learning_rate": 2.9610621993334787e-05, "loss": 1.4105, "step": 30370 }, { "epoch": 2.39, "learning_rate": 2.960324954492841e-05, "loss": 1.4532, "step": 30371 }, { "epoch": 2.39, "learning_rate": 2.959587791394944e-05, "loss": 1.4305, "step": 30372 }, { "epoch": 2.39, "learning_rate": 2.9588507100448088e-05, "loss": 1.4619, "step": 30373 }, { "epoch": 2.39, "learning_rate": 2.9581137104474333e-05, "loss": 1.4742, "step": 30374 }, { "epoch": 2.39, "learning_rate": 2.9573767926078202e-05, "loss": 1.4655, "step": 30375 }, { "epoch": 2.39, "learning_rate": 2.9566399565309683e-05, "loss": 1.4397, "step": 30376 }, { "epoch": 2.39, "learning_rate": 2.9559032022218894e-05, "loss": 1.4046, "step": 30377 }, { "epoch": 2.39, "learning_rate": 2.955166529685582e-05, "loss": 1.4366, "step": 30378 }, { "epoch": 2.39, "learning_rate": 2.9544299389270425e-05, "loss": 1.4539, "step": 30379 }, { "epoch": 2.39, "learning_rate": 2.9536934299512803e-05, "loss": 1.4591, "step": 30380 }, { "epoch": 2.39, "learning_rate": 2.9529570027632916e-05, "loss": 1.4394, "step": 30381 }, { "epoch": 2.39, "learning_rate": 2.9522206573680734e-05, "loss": 1.4477, "step": 30382 }, { "epoch": 2.39, "learning_rate": 2.951484393770632e-05, "loss": 1.4166, "step": 30383 }, { "epoch": 2.39, "learning_rate": 2.9507482119759623e-05, "loss": 1.4958, "step": 30384 }, { "epoch": 2.39, "learning_rate": 2.9500121119890595e-05, "loss": 1.4515, "step": 30385 }, { "epoch": 2.39, "learning_rate": 2.9492760938149285e-05, "loss": 1.4773, "step": 30386 }, { "epoch": 2.39, "learning_rate": 2.94854015745856e-05, "loss": 1.5034, "step": 30387 }, { "epoch": 2.39, "learning_rate": 2.9478043029249564e-05, "loss": 1.4508, "step": 30388 }, { "epoch": 2.39, "learning_rate": 2.947068530219106e-05, "loss": 1.4869, "step": 30389 }, { "epoch": 2.39, "learning_rate": 2.946332839346013e-05, "loss": 1.4703, "step": 30390 }, { "epoch": 2.39, "learning_rate": 2.9455972303106695e-05, "loss": 1.457, "step": 30391 }, { "epoch": 2.39, "learning_rate": 2.944861703118067e-05, "loss": 1.4807, "step": 30392 }, { "epoch": 2.39, "learning_rate": 2.9441262577731983e-05, "loss": 1.4944, "step": 30393 }, { "epoch": 2.39, "learning_rate": 2.9433908942810623e-05, "loss": 1.3712, "step": 30394 }, { "epoch": 2.39, "learning_rate": 2.9426556126466488e-05, "loss": 1.4736, "step": 30395 }, { "epoch": 2.39, "learning_rate": 2.9419204128749468e-05, "loss": 1.4167, "step": 30396 }, { "epoch": 2.39, "learning_rate": 2.941185294970954e-05, "loss": 1.4488, "step": 30397 }, { "epoch": 2.39, "learning_rate": 2.9404502589396582e-05, "loss": 1.3992, "step": 30398 }, { "epoch": 2.39, "learning_rate": 2.9397153047860474e-05, "loss": 1.4851, "step": 30399 }, { "epoch": 2.39, "learning_rate": 2.9389804325151183e-05, "loss": 1.4448, "step": 30400 }, { "epoch": 2.39, "learning_rate": 2.9382456421318547e-05, "loss": 1.4898, "step": 30401 }, { "epoch": 2.39, "learning_rate": 2.937510933641245e-05, "loss": 1.4665, "step": 30402 }, { "epoch": 2.39, "learning_rate": 2.9367763070482776e-05, "loss": 1.4315, "step": 30403 }, { "epoch": 2.39, "learning_rate": 2.9360417623579463e-05, "loss": 1.4354, "step": 30404 }, { "epoch": 2.39, "learning_rate": 2.935307299575234e-05, "loss": 1.4252, "step": 30405 }, { "epoch": 2.39, "learning_rate": 2.9345729187051253e-05, "loss": 1.4477, "step": 30406 }, { "epoch": 2.39, "learning_rate": 2.9338386197526093e-05, "loss": 1.4618, "step": 30407 }, { "epoch": 2.39, "learning_rate": 2.933104402722672e-05, "loss": 1.4468, "step": 30408 }, { "epoch": 2.39, "learning_rate": 2.9323702676202926e-05, "loss": 1.4602, "step": 30409 }, { "epoch": 2.39, "learning_rate": 2.931636214450464e-05, "loss": 1.403, "step": 30410 }, { "epoch": 2.39, "learning_rate": 2.9309022432181655e-05, "loss": 1.4758, "step": 30411 }, { "epoch": 2.39, "learning_rate": 2.9301683539283798e-05, "loss": 1.5021, "step": 30412 }, { "epoch": 2.39, "learning_rate": 2.9294345465860862e-05, "loss": 1.394, "step": 30413 }, { "epoch": 2.39, "learning_rate": 2.928700821196276e-05, "loss": 1.4836, "step": 30414 }, { "epoch": 2.39, "learning_rate": 2.9279671777639245e-05, "loss": 1.4266, "step": 30415 }, { "epoch": 2.39, "learning_rate": 2.9272336162940102e-05, "loss": 1.472, "step": 30416 }, { "epoch": 2.39, "learning_rate": 2.926500136791522e-05, "loss": 1.4872, "step": 30417 }, { "epoch": 2.39, "learning_rate": 2.925766739261436e-05, "loss": 1.4317, "step": 30418 }, { "epoch": 2.39, "learning_rate": 2.9250334237087246e-05, "loss": 1.4295, "step": 30419 }, { "epoch": 2.39, "learning_rate": 2.9243001901383745e-05, "loss": 1.4646, "step": 30420 }, { "epoch": 2.39, "learning_rate": 2.9235670385553646e-05, "loss": 1.4878, "step": 30421 }, { "epoch": 2.39, "learning_rate": 2.9228339689646707e-05, "loss": 1.4529, "step": 30422 }, { "epoch": 2.39, "learning_rate": 2.9221009813712658e-05, "loss": 1.4278, "step": 30423 }, { "epoch": 2.39, "learning_rate": 2.9213680757801343e-05, "loss": 1.407, "step": 30424 }, { "epoch": 2.39, "learning_rate": 2.920635252196249e-05, "loss": 1.4624, "step": 30425 }, { "epoch": 2.39, "learning_rate": 2.9199025106245787e-05, "loss": 1.5043, "step": 30426 }, { "epoch": 2.39, "learning_rate": 2.9191698510701085e-05, "loss": 1.4696, "step": 30427 }, { "epoch": 2.39, "learning_rate": 2.918437273537807e-05, "loss": 1.452, "step": 30428 }, { "epoch": 2.39, "learning_rate": 2.9177047780326508e-05, "loss": 1.444, "step": 30429 }, { "epoch": 2.39, "learning_rate": 2.916972364559607e-05, "loss": 1.4765, "step": 30430 }, { "epoch": 2.39, "learning_rate": 2.9162400331236575e-05, "loss": 1.4924, "step": 30431 }, { "epoch": 2.39, "learning_rate": 2.915507783729769e-05, "loss": 1.4272, "step": 30432 }, { "epoch": 2.39, "learning_rate": 2.9147756163829117e-05, "loss": 1.4844, "step": 30433 }, { "epoch": 2.39, "learning_rate": 2.914043531088061e-05, "loss": 1.4766, "step": 30434 }, { "epoch": 2.39, "learning_rate": 2.9133115278501816e-05, "loss": 1.445, "step": 30435 }, { "epoch": 2.39, "learning_rate": 2.9125796066742514e-05, "loss": 1.4372, "step": 30436 }, { "epoch": 2.39, "learning_rate": 2.9118477675652306e-05, "loss": 1.468, "step": 30437 }, { "epoch": 2.39, "learning_rate": 2.911116010528096e-05, "loss": 1.4169, "step": 30438 }, { "epoch": 2.39, "learning_rate": 2.9103843355678135e-05, "loss": 1.4857, "step": 30439 }, { "epoch": 2.4, "learning_rate": 2.9096527426893457e-05, "loss": 1.42, "step": 30440 }, { "epoch": 2.4, "learning_rate": 2.9089212318976686e-05, "loss": 1.432, "step": 30441 }, { "epoch": 2.4, "learning_rate": 2.9081898031977413e-05, "loss": 1.4483, "step": 30442 }, { "epoch": 2.4, "learning_rate": 2.90745845659453e-05, "loss": 1.4399, "step": 30443 }, { "epoch": 2.4, "learning_rate": 2.906727192093008e-05, "loss": 1.4255, "step": 30444 }, { "epoch": 2.4, "learning_rate": 2.9059960096981322e-05, "loss": 1.4511, "step": 30445 }, { "epoch": 2.4, "learning_rate": 2.9052649094148706e-05, "loss": 1.4347, "step": 30446 }, { "epoch": 2.4, "learning_rate": 2.9045338912481826e-05, "loss": 1.4778, "step": 30447 }, { "epoch": 2.4, "learning_rate": 2.9038029552030374e-05, "loss": 1.4277, "step": 30448 }, { "epoch": 2.4, "learning_rate": 2.903072101284396e-05, "loss": 1.4676, "step": 30449 }, { "epoch": 2.4, "learning_rate": 2.9023413294972115e-05, "loss": 1.4551, "step": 30450 }, { "epoch": 2.4, "learning_rate": 2.9016106398464595e-05, "loss": 1.4734, "step": 30451 }, { "epoch": 2.4, "learning_rate": 2.900880032337096e-05, "loss": 1.4808, "step": 30452 }, { "epoch": 2.4, "learning_rate": 2.900149506974081e-05, "loss": 1.4703, "step": 30453 }, { "epoch": 2.4, "learning_rate": 2.8994190637623682e-05, "loss": 1.4732, "step": 30454 }, { "epoch": 2.4, "learning_rate": 2.8986887027069272e-05, "loss": 1.4564, "step": 30455 }, { "epoch": 2.4, "learning_rate": 2.8979584238127124e-05, "loss": 1.419, "step": 30456 }, { "epoch": 2.4, "learning_rate": 2.8972282270846765e-05, "loss": 1.4336, "step": 30457 }, { "epoch": 2.4, "learning_rate": 2.8964981125277853e-05, "loss": 1.5459, "step": 30458 }, { "epoch": 2.4, "learning_rate": 2.8957680801469935e-05, "loss": 1.4307, "step": 30459 }, { "epoch": 2.4, "learning_rate": 2.8950381299472535e-05, "loss": 1.4369, "step": 30460 }, { "epoch": 2.4, "learning_rate": 2.8943082619335283e-05, "loss": 1.4691, "step": 30461 }, { "epoch": 2.4, "learning_rate": 2.893578476110769e-05, "loss": 1.4393, "step": 30462 }, { "epoch": 2.4, "learning_rate": 2.892848772483926e-05, "loss": 1.4364, "step": 30463 }, { "epoch": 2.4, "learning_rate": 2.8921191510579645e-05, "loss": 1.4459, "step": 30464 }, { "epoch": 2.4, "learning_rate": 2.8913896118378316e-05, "loss": 1.4608, "step": 30465 }, { "epoch": 2.4, "learning_rate": 2.890660154828477e-05, "loss": 1.4085, "step": 30466 }, { "epoch": 2.4, "learning_rate": 2.8899307800348566e-05, "loss": 1.4375, "step": 30467 }, { "epoch": 2.4, "learning_rate": 2.8892014874619295e-05, "loss": 1.4838, "step": 30468 }, { "epoch": 2.4, "learning_rate": 2.888472277114639e-05, "loss": 1.4423, "step": 30469 }, { "epoch": 2.4, "learning_rate": 2.8877431489979392e-05, "loss": 1.4215, "step": 30470 }, { "epoch": 2.4, "learning_rate": 2.887014103116774e-05, "loss": 1.4981, "step": 30471 }, { "epoch": 2.4, "learning_rate": 2.8862851394761037e-05, "loss": 1.4463, "step": 30472 }, { "epoch": 2.4, "learning_rate": 2.885556258080872e-05, "loss": 1.4208, "step": 30473 }, { "epoch": 2.4, "learning_rate": 2.8848274589360238e-05, "loss": 1.3823, "step": 30474 }, { "epoch": 2.4, "learning_rate": 2.884098742046516e-05, "loss": 1.4379, "step": 30475 }, { "epoch": 2.4, "learning_rate": 2.8833701074172904e-05, "loss": 1.4511, "step": 30476 }, { "epoch": 2.4, "learning_rate": 2.8826415550532927e-05, "loss": 1.4458, "step": 30477 }, { "epoch": 2.4, "learning_rate": 2.8819130849594756e-05, "loss": 1.442, "step": 30478 }, { "epoch": 2.4, "learning_rate": 2.881184697140782e-05, "loss": 1.4266, "step": 30479 }, { "epoch": 2.4, "learning_rate": 2.880456391602151e-05, "loss": 1.4637, "step": 30480 }, { "epoch": 2.4, "learning_rate": 2.8797281683485374e-05, "loss": 1.4477, "step": 30481 }, { "epoch": 2.4, "learning_rate": 2.8790000273848785e-05, "loss": 1.4572, "step": 30482 }, { "epoch": 2.4, "learning_rate": 2.878271968716122e-05, "loss": 1.5263, "step": 30483 }, { "epoch": 2.4, "learning_rate": 2.8775439923472076e-05, "loss": 1.4583, "step": 30484 }, { "epoch": 2.4, "learning_rate": 2.876816098283083e-05, "loss": 1.479, "step": 30485 }, { "epoch": 2.4, "learning_rate": 2.876088286528687e-05, "loss": 1.4508, "step": 30486 }, { "epoch": 2.4, "learning_rate": 2.8753605570889614e-05, "loss": 1.4229, "step": 30487 }, { "epoch": 2.4, "learning_rate": 2.874632909968842e-05, "loss": 1.458, "step": 30488 }, { "epoch": 2.4, "learning_rate": 2.873905345173278e-05, "loss": 1.4481, "step": 30489 }, { "epoch": 2.4, "learning_rate": 2.8731778627072055e-05, "loss": 1.4789, "step": 30490 }, { "epoch": 2.4, "learning_rate": 2.8724504625755588e-05, "loss": 1.4518, "step": 30491 }, { "epoch": 2.4, "learning_rate": 2.8717231447832846e-05, "loss": 1.4539, "step": 30492 }, { "epoch": 2.4, "learning_rate": 2.870995909335318e-05, "loss": 1.4156, "step": 30493 }, { "epoch": 2.4, "learning_rate": 2.8702687562365906e-05, "loss": 1.453, "step": 30494 }, { "epoch": 2.4, "learning_rate": 2.86954168549205e-05, "loss": 1.4189, "step": 30495 }, { "epoch": 2.4, "learning_rate": 2.8688146971066272e-05, "loss": 1.4562, "step": 30496 }, { "epoch": 2.4, "learning_rate": 2.8680877910852535e-05, "loss": 1.471, "step": 30497 }, { "epoch": 2.4, "learning_rate": 2.867360967432868e-05, "loss": 1.453, "step": 30498 }, { "epoch": 2.4, "learning_rate": 2.8666342261544118e-05, "loss": 1.4446, "step": 30499 }, { "epoch": 2.4, "learning_rate": 2.8659075672548127e-05, "loss": 1.4464, "step": 30500 }, { "epoch": 2.4, "learning_rate": 2.865180990739e-05, "loss": 1.4788, "step": 30501 }, { "epoch": 2.4, "learning_rate": 2.8644544966119166e-05, "loss": 1.4331, "step": 30502 }, { "epoch": 2.4, "learning_rate": 2.8637280848784916e-05, "loss": 1.4372, "step": 30503 }, { "epoch": 2.4, "learning_rate": 2.863001755543653e-05, "loss": 1.4687, "step": 30504 }, { "epoch": 2.4, "learning_rate": 2.8622755086123332e-05, "loss": 1.4894, "step": 30505 }, { "epoch": 2.4, "learning_rate": 2.861549344089467e-05, "loss": 1.4275, "step": 30506 }, { "epoch": 2.4, "learning_rate": 2.860823261979982e-05, "loss": 1.446, "step": 30507 }, { "epoch": 2.4, "learning_rate": 2.860097262288806e-05, "loss": 1.4142, "step": 30508 }, { "epoch": 2.4, "learning_rate": 2.8593713450208727e-05, "loss": 1.4364, "step": 30509 }, { "epoch": 2.4, "learning_rate": 2.858645510181109e-05, "loss": 1.4162, "step": 30510 }, { "epoch": 2.4, "learning_rate": 2.8579197577744372e-05, "loss": 1.486, "step": 30511 }, { "epoch": 2.4, "learning_rate": 2.8571940878057937e-05, "loss": 1.4476, "step": 30512 }, { "epoch": 2.4, "learning_rate": 2.8564685002800975e-05, "loss": 1.442, "step": 30513 }, { "epoch": 2.4, "learning_rate": 2.855742995202283e-05, "loss": 1.4858, "step": 30514 }, { "epoch": 2.4, "learning_rate": 2.8550175725772684e-05, "loss": 1.4549, "step": 30515 }, { "epoch": 2.4, "learning_rate": 2.854292232409986e-05, "loss": 1.4175, "step": 30516 }, { "epoch": 2.4, "learning_rate": 2.853566974705357e-05, "loss": 1.4777, "step": 30517 }, { "epoch": 2.4, "learning_rate": 2.8528417994683007e-05, "loss": 1.4558, "step": 30518 }, { "epoch": 2.4, "learning_rate": 2.8521167067037498e-05, "loss": 1.4438, "step": 30519 }, { "epoch": 2.4, "learning_rate": 2.8513916964166222e-05, "loss": 1.5148, "step": 30520 }, { "epoch": 2.4, "learning_rate": 2.8506667686118374e-05, "loss": 1.4831, "step": 30521 }, { "epoch": 2.4, "learning_rate": 2.8499419232943245e-05, "loss": 1.4011, "step": 30522 }, { "epoch": 2.4, "learning_rate": 2.8492171604690013e-05, "loss": 1.4635, "step": 30523 }, { "epoch": 2.4, "learning_rate": 2.848492480140787e-05, "loss": 1.4385, "step": 30524 }, { "epoch": 2.4, "learning_rate": 2.8477678823145998e-05, "loss": 1.4525, "step": 30525 }, { "epoch": 2.4, "learning_rate": 2.8470433669953657e-05, "loss": 1.4055, "step": 30526 }, { "epoch": 2.4, "learning_rate": 2.8463189341880023e-05, "loss": 1.444, "step": 30527 }, { "epoch": 2.4, "learning_rate": 2.8455945838974204e-05, "loss": 1.4774, "step": 30528 }, { "epoch": 2.4, "learning_rate": 2.8448703161285464e-05, "loss": 1.4484, "step": 30529 }, { "epoch": 2.4, "learning_rate": 2.8441461308862963e-05, "loss": 1.3987, "step": 30530 }, { "epoch": 2.4, "learning_rate": 2.8434220281755875e-05, "loss": 1.4434, "step": 30531 }, { "epoch": 2.4, "learning_rate": 2.84269800800133e-05, "loss": 1.475, "step": 30532 }, { "epoch": 2.4, "learning_rate": 2.8419740703684497e-05, "loss": 1.5044, "step": 30533 }, { "epoch": 2.4, "learning_rate": 2.841250215281854e-05, "loss": 1.4209, "step": 30534 }, { "epoch": 2.4, "learning_rate": 2.8405264427464557e-05, "loss": 1.4228, "step": 30535 }, { "epoch": 2.4, "learning_rate": 2.839802752767178e-05, "loss": 1.4673, "step": 30536 }, { "epoch": 2.4, "learning_rate": 2.839079145348928e-05, "loss": 1.3593, "step": 30537 }, { "epoch": 2.4, "learning_rate": 2.8383556204966174e-05, "loss": 1.4354, "step": 30538 }, { "epoch": 2.4, "learning_rate": 2.8376321782151635e-05, "loss": 1.4433, "step": 30539 }, { "epoch": 2.4, "learning_rate": 2.836908818509474e-05, "loss": 1.4584, "step": 30540 }, { "epoch": 2.4, "learning_rate": 2.8361855413844635e-05, "loss": 1.4833, "step": 30541 }, { "epoch": 2.4, "learning_rate": 2.8354623468450366e-05, "loss": 1.4343, "step": 30542 }, { "epoch": 2.4, "learning_rate": 2.8347392348961105e-05, "loss": 1.4862, "step": 30543 }, { "epoch": 2.4, "learning_rate": 2.834016205542592e-05, "loss": 1.4772, "step": 30544 }, { "epoch": 2.4, "learning_rate": 2.8332932587893848e-05, "loss": 1.5024, "step": 30545 }, { "epoch": 2.4, "learning_rate": 2.8325703946414036e-05, "loss": 1.4586, "step": 30546 }, { "epoch": 2.4, "learning_rate": 2.8318476131035578e-05, "loss": 1.454, "step": 30547 }, { "epoch": 2.4, "learning_rate": 2.8311249141807534e-05, "loss": 1.4553, "step": 30548 }, { "epoch": 2.4, "learning_rate": 2.8304022978778902e-05, "loss": 1.4515, "step": 30549 }, { "epoch": 2.4, "learning_rate": 2.8296797641998836e-05, "loss": 1.4373, "step": 30550 }, { "epoch": 2.4, "learning_rate": 2.8289573131516353e-05, "loss": 1.4829, "step": 30551 }, { "epoch": 2.4, "learning_rate": 2.828234944738046e-05, "loss": 1.4328, "step": 30552 }, { "epoch": 2.4, "learning_rate": 2.82751265896403e-05, "loss": 1.4444, "step": 30553 }, { "epoch": 2.4, "learning_rate": 2.826790455834484e-05, "loss": 1.4649, "step": 30554 }, { "epoch": 2.4, "learning_rate": 2.82606833535431e-05, "loss": 1.4138, "step": 30555 }, { "epoch": 2.4, "learning_rate": 2.825346297528418e-05, "loss": 1.4992, "step": 30556 }, { "epoch": 2.4, "learning_rate": 2.8246243423617055e-05, "loss": 1.4769, "step": 30557 }, { "epoch": 2.4, "learning_rate": 2.823902469859075e-05, "loss": 1.4317, "step": 30558 }, { "epoch": 2.4, "learning_rate": 2.823180680025423e-05, "loss": 1.4547, "step": 30559 }, { "epoch": 2.4, "learning_rate": 2.8224589728656556e-05, "loss": 1.4087, "step": 30560 }, { "epoch": 2.4, "learning_rate": 2.821737348384675e-05, "loss": 1.4519, "step": 30561 }, { "epoch": 2.4, "learning_rate": 2.8210158065873727e-05, "loss": 1.4751, "step": 30562 }, { "epoch": 2.4, "learning_rate": 2.8202943474786566e-05, "loss": 1.4652, "step": 30563 }, { "epoch": 2.4, "learning_rate": 2.8195729710634206e-05, "loss": 1.4019, "step": 30564 }, { "epoch": 2.4, "learning_rate": 2.8188516773465632e-05, "loss": 1.4359, "step": 30565 }, { "epoch": 2.4, "learning_rate": 2.818130466332976e-05, "loss": 1.4799, "step": 30566 }, { "epoch": 2.41, "learning_rate": 2.8174093380275648e-05, "loss": 1.4196, "step": 30567 }, { "epoch": 2.41, "learning_rate": 2.8166882924352212e-05, "loss": 1.3812, "step": 30568 }, { "epoch": 2.41, "learning_rate": 2.8159673295608353e-05, "loss": 1.4665, "step": 30569 }, { "epoch": 2.41, "learning_rate": 2.815246449409313e-05, "loss": 1.4208, "step": 30570 }, { "epoch": 2.41, "learning_rate": 2.8145256519855436e-05, "loss": 1.5145, "step": 30571 }, { "epoch": 2.41, "learning_rate": 2.8138049372944166e-05, "loss": 1.4498, "step": 30572 }, { "epoch": 2.41, "learning_rate": 2.8130843053408313e-05, "loss": 1.4786, "step": 30573 }, { "epoch": 2.41, "learning_rate": 2.812363756129681e-05, "loss": 1.4135, "step": 30574 }, { "epoch": 2.41, "learning_rate": 2.811643289665849e-05, "loss": 1.4134, "step": 30575 }, { "epoch": 2.41, "learning_rate": 2.8109229059542328e-05, "loss": 1.4274, "step": 30576 }, { "epoch": 2.41, "learning_rate": 2.810202604999729e-05, "loss": 1.465, "step": 30577 }, { "epoch": 2.41, "learning_rate": 2.8094823868072226e-05, "loss": 1.4196, "step": 30578 }, { "epoch": 2.41, "learning_rate": 2.8087622513815978e-05, "loss": 1.4506, "step": 30579 }, { "epoch": 2.41, "learning_rate": 2.8080421987277558e-05, "loss": 1.5027, "step": 30580 }, { "epoch": 2.41, "learning_rate": 2.8073222288505776e-05, "loss": 1.489, "step": 30581 }, { "epoch": 2.41, "learning_rate": 2.8066023417549528e-05, "loss": 1.4914, "step": 30582 }, { "epoch": 2.41, "learning_rate": 2.8058825374457672e-05, "loss": 1.4544, "step": 30583 }, { "epoch": 2.41, "learning_rate": 2.8051628159279122e-05, "loss": 1.4387, "step": 30584 }, { "epoch": 2.41, "learning_rate": 2.804443177206272e-05, "loss": 1.4111, "step": 30585 }, { "epoch": 2.41, "learning_rate": 2.8037236212857294e-05, "loss": 1.455, "step": 30586 }, { "epoch": 2.41, "learning_rate": 2.8030041481711757e-05, "loss": 1.4562, "step": 30587 }, { "epoch": 2.41, "learning_rate": 2.8022847578674933e-05, "loss": 1.5018, "step": 30588 }, { "epoch": 2.41, "learning_rate": 2.801565450379564e-05, "loss": 1.4402, "step": 30589 }, { "epoch": 2.41, "learning_rate": 2.800846225712276e-05, "loss": 1.4319, "step": 30590 }, { "epoch": 2.41, "learning_rate": 2.80012708387051e-05, "loss": 1.4177, "step": 30591 }, { "epoch": 2.41, "learning_rate": 2.799408024859146e-05, "loss": 1.447, "step": 30592 }, { "epoch": 2.41, "learning_rate": 2.7986890486830676e-05, "loss": 1.4312, "step": 30593 }, { "epoch": 2.41, "learning_rate": 2.7979701553471608e-05, "loss": 1.4533, "step": 30594 }, { "epoch": 2.41, "learning_rate": 2.7972513448563044e-05, "loss": 1.4842, "step": 30595 }, { "epoch": 2.41, "learning_rate": 2.796532617215372e-05, "loss": 1.458, "step": 30596 }, { "epoch": 2.41, "learning_rate": 2.795813972429254e-05, "loss": 1.4564, "step": 30597 }, { "epoch": 2.41, "learning_rate": 2.7950954105028235e-05, "loss": 1.4773, "step": 30598 }, { "epoch": 2.41, "learning_rate": 2.7943769314409597e-05, "loss": 1.4494, "step": 30599 }, { "epoch": 2.41, "learning_rate": 2.7936585352485373e-05, "loss": 1.4611, "step": 30600 }, { "epoch": 2.41, "learning_rate": 2.792940221930441e-05, "loss": 1.442, "step": 30601 }, { "epoch": 2.41, "learning_rate": 2.7922219914915445e-05, "loss": 1.4758, "step": 30602 }, { "epoch": 2.41, "learning_rate": 2.7915038439367194e-05, "loss": 1.4665, "step": 30603 }, { "epoch": 2.41, "learning_rate": 2.79078577927085e-05, "loss": 1.5173, "step": 30604 }, { "epoch": 2.41, "learning_rate": 2.7900677974988088e-05, "loss": 1.4482, "step": 30605 }, { "epoch": 2.41, "learning_rate": 2.789349898625464e-05, "loss": 1.4369, "step": 30606 }, { "epoch": 2.41, "learning_rate": 2.788632082655695e-05, "loss": 1.4699, "step": 30607 }, { "epoch": 2.41, "learning_rate": 2.787914349594381e-05, "loss": 1.4669, "step": 30608 }, { "epoch": 2.41, "learning_rate": 2.7871966994463884e-05, "loss": 1.4615, "step": 30609 }, { "epoch": 2.41, "learning_rate": 2.7864791322165864e-05, "loss": 1.4755, "step": 30610 }, { "epoch": 2.41, "learning_rate": 2.7857616479098545e-05, "loss": 1.4699, "step": 30611 }, { "epoch": 2.41, "learning_rate": 2.785044246531062e-05, "loss": 1.4649, "step": 30612 }, { "epoch": 2.41, "learning_rate": 2.784326928085073e-05, "loss": 1.4734, "step": 30613 }, { "epoch": 2.41, "learning_rate": 2.783609692576768e-05, "loss": 1.4047, "step": 30614 }, { "epoch": 2.41, "learning_rate": 2.782892540011011e-05, "loss": 1.4708, "step": 30615 }, { "epoch": 2.41, "learning_rate": 2.7821754703926673e-05, "loss": 1.4758, "step": 30616 }, { "epoch": 2.41, "learning_rate": 2.781458483726616e-05, "loss": 1.4511, "step": 30617 }, { "epoch": 2.41, "learning_rate": 2.780741580017717e-05, "loss": 1.4079, "step": 30618 }, { "epoch": 2.41, "learning_rate": 2.7800247592708385e-05, "loss": 1.4519, "step": 30619 }, { "epoch": 2.41, "learning_rate": 2.779308021490847e-05, "loss": 1.4423, "step": 30620 }, { "epoch": 2.41, "learning_rate": 2.7785913666826115e-05, "loss": 1.4128, "step": 30621 }, { "epoch": 2.41, "learning_rate": 2.7778747948509982e-05, "loss": 1.4786, "step": 30622 }, { "epoch": 2.41, "learning_rate": 2.777158306000865e-05, "loss": 1.4536, "step": 30623 }, { "epoch": 2.41, "learning_rate": 2.776441900137083e-05, "loss": 1.4303, "step": 30624 }, { "epoch": 2.41, "learning_rate": 2.7757255772645182e-05, "loss": 1.4206, "step": 30625 }, { "epoch": 2.41, "learning_rate": 2.7750093373880317e-05, "loss": 1.4224, "step": 30626 }, { "epoch": 2.41, "learning_rate": 2.7742931805124813e-05, "loss": 1.4942, "step": 30627 }, { "epoch": 2.41, "learning_rate": 2.7735771066427363e-05, "loss": 1.4145, "step": 30628 }, { "epoch": 2.41, "learning_rate": 2.7728611157836568e-05, "loss": 1.4412, "step": 30629 }, { "epoch": 2.41, "learning_rate": 2.772145207940098e-05, "loss": 1.5129, "step": 30630 }, { "epoch": 2.41, "learning_rate": 2.7714293831169298e-05, "loss": 1.3949, "step": 30631 }, { "epoch": 2.41, "learning_rate": 2.7707136413190084e-05, "loss": 1.4725, "step": 30632 }, { "epoch": 2.41, "learning_rate": 2.769997982551188e-05, "loss": 1.4354, "step": 30633 }, { "epoch": 2.41, "learning_rate": 2.769282406818335e-05, "loss": 1.452, "step": 30634 }, { "epoch": 2.41, "learning_rate": 2.768566914125307e-05, "loss": 1.4555, "step": 30635 }, { "epoch": 2.41, "learning_rate": 2.7678515044769585e-05, "loss": 1.4562, "step": 30636 }, { "epoch": 2.41, "learning_rate": 2.7671361778781452e-05, "loss": 1.4903, "step": 30637 }, { "epoch": 2.41, "learning_rate": 2.766420934333729e-05, "loss": 1.4553, "step": 30638 }, { "epoch": 2.41, "learning_rate": 2.7657057738485623e-05, "loss": 1.4527, "step": 30639 }, { "epoch": 2.41, "learning_rate": 2.7649906964275027e-05, "loss": 1.4616, "step": 30640 }, { "epoch": 2.41, "learning_rate": 2.764275702075403e-05, "loss": 1.3787, "step": 30641 }, { "epoch": 2.41, "learning_rate": 2.7635607907971214e-05, "loss": 1.4286, "step": 30642 }, { "epoch": 2.41, "learning_rate": 2.76284596259751e-05, "loss": 1.4329, "step": 30643 }, { "epoch": 2.41, "learning_rate": 2.7621312174814175e-05, "loss": 1.4719, "step": 30644 }, { "epoch": 2.41, "learning_rate": 2.7614165554537043e-05, "loss": 1.4157, "step": 30645 }, { "epoch": 2.41, "learning_rate": 2.76070197651922e-05, "loss": 1.4971, "step": 30646 }, { "epoch": 2.41, "learning_rate": 2.759987480682811e-05, "loss": 1.5094, "step": 30647 }, { "epoch": 2.41, "learning_rate": 2.7592730679493347e-05, "loss": 1.4515, "step": 30648 }, { "epoch": 2.41, "learning_rate": 2.7585587383236408e-05, "loss": 1.4472, "step": 30649 }, { "epoch": 2.41, "learning_rate": 2.7578444918105734e-05, "loss": 1.4427, "step": 30650 }, { "epoch": 2.41, "learning_rate": 2.7571303284149894e-05, "loss": 1.493, "step": 30651 }, { "epoch": 2.41, "learning_rate": 2.7564162481417358e-05, "loss": 1.4683, "step": 30652 }, { "epoch": 2.41, "learning_rate": 2.7557022509956573e-05, "loss": 1.4703, "step": 30653 }, { "epoch": 2.41, "learning_rate": 2.7549883369816e-05, "loss": 1.4148, "step": 30654 }, { "epoch": 2.41, "learning_rate": 2.7542745061044153e-05, "loss": 1.4219, "step": 30655 }, { "epoch": 2.41, "learning_rate": 2.753560758368954e-05, "loss": 1.4228, "step": 30656 }, { "epoch": 2.41, "learning_rate": 2.7528470937800558e-05, "loss": 1.4585, "step": 30657 }, { "epoch": 2.41, "learning_rate": 2.7521335123425632e-05, "loss": 1.4268, "step": 30658 }, { "epoch": 2.41, "learning_rate": 2.751420014061329e-05, "loss": 1.4456, "step": 30659 }, { "epoch": 2.41, "learning_rate": 2.750706598941193e-05, "loss": 1.4333, "step": 30660 }, { "epoch": 2.41, "learning_rate": 2.749993266986996e-05, "loss": 1.4381, "step": 30661 }, { "epoch": 2.41, "learning_rate": 2.7492800182035897e-05, "loss": 1.4324, "step": 30662 }, { "epoch": 2.41, "learning_rate": 2.748566852595811e-05, "loss": 1.5095, "step": 30663 }, { "epoch": 2.41, "learning_rate": 2.7478537701684983e-05, "loss": 1.4791, "step": 30664 }, { "epoch": 2.41, "learning_rate": 2.747140770926501e-05, "loss": 1.4368, "step": 30665 }, { "epoch": 2.41, "learning_rate": 2.7464278548746548e-05, "loss": 1.4717, "step": 30666 }, { "epoch": 2.41, "learning_rate": 2.7457150220177997e-05, "loss": 1.444, "step": 30667 }, { "epoch": 2.41, "learning_rate": 2.7450022723607802e-05, "loss": 1.4254, "step": 30668 }, { "epoch": 2.41, "learning_rate": 2.744289605908432e-05, "loss": 1.3697, "step": 30669 }, { "epoch": 2.41, "learning_rate": 2.7435770226655914e-05, "loss": 1.4249, "step": 30670 }, { "epoch": 2.41, "learning_rate": 2.7428645226370978e-05, "loss": 1.4551, "step": 30671 }, { "epoch": 2.41, "learning_rate": 2.742152105827794e-05, "loss": 1.4554, "step": 30672 }, { "epoch": 2.41, "learning_rate": 2.7414397722425146e-05, "loss": 1.4583, "step": 30673 }, { "epoch": 2.41, "learning_rate": 2.7407275218860892e-05, "loss": 1.4061, "step": 30674 }, { "epoch": 2.41, "learning_rate": 2.7400153547633618e-05, "loss": 1.4783, "step": 30675 }, { "epoch": 2.41, "learning_rate": 2.7393032708791655e-05, "loss": 1.5087, "step": 30676 }, { "epoch": 2.41, "learning_rate": 2.738591270238335e-05, "loss": 1.4858, "step": 30677 }, { "epoch": 2.41, "learning_rate": 2.7378793528456978e-05, "loss": 1.4697, "step": 30678 }, { "epoch": 2.41, "learning_rate": 2.737167518706098e-05, "loss": 1.4209, "step": 30679 }, { "epoch": 2.41, "learning_rate": 2.7364557678243626e-05, "loss": 1.4523, "step": 30680 }, { "epoch": 2.41, "learning_rate": 2.735744100205322e-05, "loss": 1.4634, "step": 30681 }, { "epoch": 2.41, "learning_rate": 2.7350325158538143e-05, "loss": 1.4612, "step": 30682 }, { "epoch": 2.41, "learning_rate": 2.7343210147746676e-05, "loss": 1.444, "step": 30683 }, { "epoch": 2.41, "learning_rate": 2.733609596972709e-05, "loss": 1.4694, "step": 30684 }, { "epoch": 2.41, "learning_rate": 2.7328982624527752e-05, "loss": 1.4536, "step": 30685 }, { "epoch": 2.41, "learning_rate": 2.7321870112196888e-05, "loss": 1.4466, "step": 30686 }, { "epoch": 2.41, "learning_rate": 2.7314758432782858e-05, "loss": 1.4196, "step": 30687 }, { "epoch": 2.41, "learning_rate": 2.7307647586333893e-05, "loss": 1.4167, "step": 30688 }, { "epoch": 2.41, "learning_rate": 2.730053757289832e-05, "loss": 1.4294, "step": 30689 }, { "epoch": 2.41, "learning_rate": 2.7293428392524397e-05, "loss": 1.3839, "step": 30690 }, { "epoch": 2.41, "learning_rate": 2.728632004526034e-05, "loss": 1.4387, "step": 30691 }, { "epoch": 2.41, "learning_rate": 2.7279212531154477e-05, "loss": 1.4378, "step": 30692 }, { "epoch": 2.41, "learning_rate": 2.727210585025505e-05, "loss": 1.4461, "step": 30693 }, { "epoch": 2.42, "learning_rate": 2.726500000261029e-05, "loss": 1.4184, "step": 30694 }, { "epoch": 2.42, "learning_rate": 2.725789498826842e-05, "loss": 1.4787, "step": 30695 }, { "epoch": 2.42, "learning_rate": 2.725079080727774e-05, "loss": 1.4232, "step": 30696 }, { "epoch": 2.42, "learning_rate": 2.7243687459686443e-05, "loss": 1.5164, "step": 30697 }, { "epoch": 2.42, "learning_rate": 2.723658494554274e-05, "loss": 1.44, "step": 30698 }, { "epoch": 2.42, "learning_rate": 2.7229483264894925e-05, "loss": 1.4051, "step": 30699 }, { "epoch": 2.42, "learning_rate": 2.7222382417791144e-05, "loss": 1.4184, "step": 30700 }, { "epoch": 2.42, "learning_rate": 2.7215282404279608e-05, "loss": 1.4459, "step": 30701 }, { "epoch": 2.42, "learning_rate": 2.7208183224408547e-05, "loss": 1.4633, "step": 30702 }, { "epoch": 2.42, "learning_rate": 2.7201084878226205e-05, "loss": 1.4461, "step": 30703 }, { "epoch": 2.42, "learning_rate": 2.7193987365780724e-05, "loss": 1.4521, "step": 30704 }, { "epoch": 2.42, "learning_rate": 2.718689068712025e-05, "loss": 1.4431, "step": 30705 }, { "epoch": 2.42, "learning_rate": 2.7179794842293063e-05, "loss": 1.442, "step": 30706 }, { "epoch": 2.42, "learning_rate": 2.717269983134729e-05, "loss": 1.4022, "step": 30707 }, { "epoch": 2.42, "learning_rate": 2.7165605654331058e-05, "loss": 1.4569, "step": 30708 }, { "epoch": 2.42, "learning_rate": 2.7158512311292628e-05, "loss": 1.4566, "step": 30709 }, { "epoch": 2.42, "learning_rate": 2.71514198022801e-05, "loss": 1.4654, "step": 30710 }, { "epoch": 2.42, "learning_rate": 2.7144328127341646e-05, "loss": 1.4136, "step": 30711 }, { "epoch": 2.42, "learning_rate": 2.7137237286525364e-05, "loss": 1.4298, "step": 30712 }, { "epoch": 2.42, "learning_rate": 2.7130147279879484e-05, "loss": 1.4663, "step": 30713 }, { "epoch": 2.42, "learning_rate": 2.7123058107452096e-05, "loss": 1.4805, "step": 30714 }, { "epoch": 2.42, "learning_rate": 2.7115969769291295e-05, "loss": 1.4583, "step": 30715 }, { "epoch": 2.42, "learning_rate": 2.710888226544528e-05, "loss": 1.4694, "step": 30716 }, { "epoch": 2.42, "learning_rate": 2.7101795595962094e-05, "loss": 1.4479, "step": 30717 }, { "epoch": 2.42, "learning_rate": 2.709470976088995e-05, "loss": 1.4355, "step": 30718 }, { "epoch": 2.42, "learning_rate": 2.7087624760276855e-05, "loss": 1.4412, "step": 30719 }, { "epoch": 2.42, "learning_rate": 2.7080540594170992e-05, "loss": 1.4567, "step": 30720 }, { "epoch": 2.42, "learning_rate": 2.7073457262620434e-05, "loss": 1.4526, "step": 30721 }, { "epoch": 2.42, "learning_rate": 2.706637476567323e-05, "loss": 1.4386, "step": 30722 }, { "epoch": 2.42, "learning_rate": 2.7059293103377526e-05, "loss": 1.4826, "step": 30723 }, { "epoch": 2.42, "learning_rate": 2.70522122757814e-05, "loss": 1.443, "step": 30724 }, { "epoch": 2.42, "learning_rate": 2.704513228293284e-05, "loss": 1.4358, "step": 30725 }, { "epoch": 2.42, "learning_rate": 2.7038053124880032e-05, "loss": 1.4655, "step": 30726 }, { "epoch": 2.42, "learning_rate": 2.7030974801670984e-05, "loss": 1.4721, "step": 30727 }, { "epoch": 2.42, "learning_rate": 2.7023897313353726e-05, "loss": 1.4936, "step": 30728 }, { "epoch": 2.42, "learning_rate": 2.701682065997637e-05, "loss": 1.4362, "step": 30729 }, { "epoch": 2.42, "learning_rate": 2.700974484158694e-05, "loss": 1.4714, "step": 30730 }, { "epoch": 2.42, "learning_rate": 2.7002669858233467e-05, "loss": 1.4107, "step": 30731 }, { "epoch": 2.42, "learning_rate": 2.6995595709963947e-05, "loss": 1.4395, "step": 30732 }, { "epoch": 2.42, "learning_rate": 2.6988522396826456e-05, "loss": 1.4494, "step": 30733 }, { "epoch": 2.42, "learning_rate": 2.698144991886906e-05, "loss": 1.4905, "step": 30734 }, { "epoch": 2.42, "learning_rate": 2.697437827613973e-05, "loss": 1.453, "step": 30735 }, { "epoch": 2.42, "learning_rate": 2.6967307468686434e-05, "loss": 1.4689, "step": 30736 }, { "epoch": 2.42, "learning_rate": 2.6960237496557264e-05, "loss": 1.4519, "step": 30737 }, { "epoch": 2.42, "learning_rate": 2.69531683598002e-05, "loss": 1.4325, "step": 30738 }, { "epoch": 2.42, "learning_rate": 2.6946100058463165e-05, "loss": 1.4615, "step": 30739 }, { "epoch": 2.42, "learning_rate": 2.6939032592594247e-05, "loss": 1.4476, "step": 30740 }, { "epoch": 2.42, "learning_rate": 2.693196596224138e-05, "loss": 1.4581, "step": 30741 }, { "epoch": 2.42, "learning_rate": 2.692490016745252e-05, "loss": 1.4335, "step": 30742 }, { "epoch": 2.42, "learning_rate": 2.6917835208275702e-05, "loss": 1.4311, "step": 30743 }, { "epoch": 2.42, "learning_rate": 2.6910771084758874e-05, "loss": 1.4143, "step": 30744 }, { "epoch": 2.42, "learning_rate": 2.6903707796949936e-05, "loss": 1.4478, "step": 30745 }, { "epoch": 2.42, "learning_rate": 2.6896645344896928e-05, "loss": 1.4436, "step": 30746 }, { "epoch": 2.42, "learning_rate": 2.688958372864776e-05, "loss": 1.4843, "step": 30747 }, { "epoch": 2.42, "learning_rate": 2.6882522948250385e-05, "loss": 1.412, "step": 30748 }, { "epoch": 2.42, "learning_rate": 2.6875463003752657e-05, "loss": 1.4528, "step": 30749 }, { "epoch": 2.42, "learning_rate": 2.6868403895202674e-05, "loss": 1.4068, "step": 30750 }, { "epoch": 2.42, "learning_rate": 2.6861345622648278e-05, "loss": 1.479, "step": 30751 }, { "epoch": 2.42, "learning_rate": 2.6854288186137386e-05, "loss": 1.4555, "step": 30752 }, { "epoch": 2.42, "learning_rate": 2.6847231585717887e-05, "loss": 1.4795, "step": 30753 }, { "epoch": 2.42, "learning_rate": 2.6840175821437766e-05, "loss": 1.4581, "step": 30754 }, { "epoch": 2.42, "learning_rate": 2.6833120893344877e-05, "loss": 1.5232, "step": 30755 }, { "epoch": 2.42, "learning_rate": 2.682606680148709e-05, "loss": 1.4888, "step": 30756 }, { "epoch": 2.42, "learning_rate": 2.6819013545912376e-05, "loss": 1.4544, "step": 30757 }, { "epoch": 2.42, "learning_rate": 2.6811961126668587e-05, "loss": 1.4646, "step": 30758 }, { "epoch": 2.42, "learning_rate": 2.680490954380356e-05, "loss": 1.4566, "step": 30759 }, { "epoch": 2.42, "learning_rate": 2.679785879736526e-05, "loss": 1.5003, "step": 30760 }, { "epoch": 2.42, "learning_rate": 2.6790808887401504e-05, "loss": 1.4743, "step": 30761 }, { "epoch": 2.42, "learning_rate": 2.6783759813960116e-05, "loss": 1.4313, "step": 30762 }, { "epoch": 2.42, "learning_rate": 2.6776711577089053e-05, "loss": 1.4617, "step": 30763 }, { "epoch": 2.42, "learning_rate": 2.6769664176836102e-05, "loss": 1.4712, "step": 30764 }, { "epoch": 2.42, "learning_rate": 2.6762617613249103e-05, "loss": 1.4503, "step": 30765 }, { "epoch": 2.42, "learning_rate": 2.675557188637592e-05, "loss": 1.4549, "step": 30766 }, { "epoch": 2.42, "learning_rate": 2.674852699626443e-05, "loss": 1.4734, "step": 30767 }, { "epoch": 2.42, "learning_rate": 2.674148294296243e-05, "loss": 1.4585, "step": 30768 }, { "epoch": 2.42, "learning_rate": 2.6734439726517743e-05, "loss": 1.4416, "step": 30769 }, { "epoch": 2.42, "learning_rate": 2.6727397346978135e-05, "loss": 1.4484, "step": 30770 }, { "epoch": 2.42, "learning_rate": 2.672035580439152e-05, "loss": 1.39, "step": 30771 }, { "epoch": 2.42, "learning_rate": 2.6713315098805653e-05, "loss": 1.4283, "step": 30772 }, { "epoch": 2.42, "learning_rate": 2.6706275230268302e-05, "loss": 1.4667, "step": 30773 }, { "epoch": 2.42, "learning_rate": 2.6699236198827346e-05, "loss": 1.4877, "step": 30774 }, { "epoch": 2.42, "learning_rate": 2.6692198004530525e-05, "loss": 1.4758, "step": 30775 }, { "epoch": 2.42, "learning_rate": 2.6685160647425602e-05, "loss": 1.4785, "step": 30776 }, { "epoch": 2.42, "learning_rate": 2.6678124127560424e-05, "loss": 1.4711, "step": 30777 }, { "epoch": 2.42, "learning_rate": 2.6671088444982735e-05, "loss": 1.4768, "step": 30778 }, { "epoch": 2.42, "learning_rate": 2.6664053599740248e-05, "loss": 1.4744, "step": 30779 }, { "epoch": 2.42, "learning_rate": 2.665701959188079e-05, "loss": 1.4761, "step": 30780 }, { "epoch": 2.42, "learning_rate": 2.6649986421452125e-05, "loss": 1.3917, "step": 30781 }, { "epoch": 2.42, "learning_rate": 2.6642954088501976e-05, "loss": 1.4682, "step": 30782 }, { "epoch": 2.42, "learning_rate": 2.663592259307808e-05, "loss": 1.3911, "step": 30783 }, { "epoch": 2.42, "learning_rate": 2.6628891935228207e-05, "loss": 1.465, "step": 30784 }, { "epoch": 2.42, "learning_rate": 2.662186211500009e-05, "loss": 1.3407, "step": 30785 }, { "epoch": 2.42, "learning_rate": 2.661483313244141e-05, "loss": 1.4565, "step": 30786 }, { "epoch": 2.42, "learning_rate": 2.6607804987599956e-05, "loss": 1.4586, "step": 30787 }, { "epoch": 2.42, "learning_rate": 2.6600777680523412e-05, "loss": 1.4875, "step": 30788 }, { "epoch": 2.42, "learning_rate": 2.6593751211259486e-05, "loss": 1.4156, "step": 30789 }, { "epoch": 2.42, "learning_rate": 2.6586725579855837e-05, "loss": 1.4565, "step": 30790 }, { "epoch": 2.42, "learning_rate": 2.657970078636027e-05, "loss": 1.4205, "step": 30791 }, { "epoch": 2.42, "learning_rate": 2.657267683082044e-05, "loss": 1.449, "step": 30792 }, { "epoch": 2.42, "learning_rate": 2.6565653713283958e-05, "loss": 1.4684, "step": 30793 }, { "epoch": 2.42, "learning_rate": 2.6558631433798622e-05, "loss": 1.3862, "step": 30794 }, { "epoch": 2.42, "learning_rate": 2.655160999241206e-05, "loss": 1.4389, "step": 30795 }, { "epoch": 2.42, "learning_rate": 2.65445893891719e-05, "loss": 1.4373, "step": 30796 }, { "epoch": 2.42, "learning_rate": 2.6537569624125836e-05, "loss": 1.4996, "step": 30797 }, { "epoch": 2.42, "learning_rate": 2.65305506973216e-05, "loss": 1.4785, "step": 30798 }, { "epoch": 2.42, "learning_rate": 2.6523532608806786e-05, "loss": 1.4422, "step": 30799 }, { "epoch": 2.42, "learning_rate": 2.6516515358629003e-05, "loss": 1.4197, "step": 30800 }, { "epoch": 2.42, "learning_rate": 2.6509498946835965e-05, "loss": 1.3727, "step": 30801 }, { "epoch": 2.42, "learning_rate": 2.65024833734753e-05, "loss": 1.4207, "step": 30802 }, { "epoch": 2.42, "learning_rate": 2.6495468638594575e-05, "loss": 1.4327, "step": 30803 }, { "epoch": 2.42, "learning_rate": 2.6488454742241493e-05, "loss": 1.4127, "step": 30804 }, { "epoch": 2.42, "learning_rate": 2.6481441684463654e-05, "loss": 1.4123, "step": 30805 }, { "epoch": 2.42, "learning_rate": 2.6474429465308657e-05, "loss": 1.4364, "step": 30806 }, { "epoch": 2.42, "learning_rate": 2.6467418084824088e-05, "loss": 1.4618, "step": 30807 }, { "epoch": 2.42, "learning_rate": 2.6460407543057614e-05, "loss": 1.4309, "step": 30808 }, { "epoch": 2.42, "learning_rate": 2.64533978400568e-05, "loss": 1.4198, "step": 30809 }, { "epoch": 2.42, "learning_rate": 2.6446388975869188e-05, "loss": 1.4351, "step": 30810 }, { "epoch": 2.42, "learning_rate": 2.6439380950542455e-05, "loss": 1.4382, "step": 30811 }, { "epoch": 2.42, "learning_rate": 2.64323737641241e-05, "loss": 1.4412, "step": 30812 }, { "epoch": 2.42, "learning_rate": 2.642536741666178e-05, "loss": 1.4481, "step": 30813 }, { "epoch": 2.42, "learning_rate": 2.6418361908202978e-05, "loss": 1.4361, "step": 30814 }, { "epoch": 2.42, "learning_rate": 2.641135723879534e-05, "loss": 1.4628, "step": 30815 }, { "epoch": 2.42, "learning_rate": 2.6404353408486388e-05, "loss": 1.4628, "step": 30816 }, { "epoch": 2.42, "learning_rate": 2.6397350417323625e-05, "loss": 1.4278, "step": 30817 }, { "epoch": 2.42, "learning_rate": 2.639034826535468e-05, "loss": 1.4644, "step": 30818 }, { "epoch": 2.42, "learning_rate": 2.638334695262707e-05, "loss": 1.4848, "step": 30819 }, { "epoch": 2.42, "learning_rate": 2.637634647918827e-05, "loss": 1.4917, "step": 30820 }, { "epoch": 2.43, "learning_rate": 2.6369346845085887e-05, "loss": 1.4211, "step": 30821 }, { "epoch": 2.43, "learning_rate": 2.6362348050367433e-05, "loss": 1.4245, "step": 30822 }, { "epoch": 2.43, "learning_rate": 2.6355350095080385e-05, "loss": 1.433, "step": 30823 }, { "epoch": 2.43, "learning_rate": 2.6348352979272258e-05, "loss": 1.4539, "step": 30824 }, { "epoch": 2.43, "learning_rate": 2.634135670299061e-05, "loss": 1.4815, "step": 30825 }, { "epoch": 2.43, "learning_rate": 2.633436126628291e-05, "loss": 1.44, "step": 30826 }, { "epoch": 2.43, "learning_rate": 2.6327366669196566e-05, "loss": 1.4812, "step": 30827 }, { "epoch": 2.43, "learning_rate": 2.6320372911779237e-05, "loss": 1.4393, "step": 30828 }, { "epoch": 2.43, "learning_rate": 2.6313379994078338e-05, "loss": 1.4674, "step": 30829 }, { "epoch": 2.43, "learning_rate": 2.6306387916141312e-05, "loss": 1.4176, "step": 30830 }, { "epoch": 2.43, "learning_rate": 2.6299396678015627e-05, "loss": 1.452, "step": 30831 }, { "epoch": 2.43, "learning_rate": 2.6292406279748808e-05, "loss": 1.459, "step": 30832 }, { "epoch": 2.43, "learning_rate": 2.628541672138828e-05, "loss": 1.4337, "step": 30833 }, { "epoch": 2.43, "learning_rate": 2.627842800298146e-05, "loss": 1.4367, "step": 30834 }, { "epoch": 2.43, "learning_rate": 2.6271440124575893e-05, "loss": 1.4754, "step": 30835 }, { "epoch": 2.43, "learning_rate": 2.6264453086218956e-05, "loss": 1.4073, "step": 30836 }, { "epoch": 2.43, "learning_rate": 2.6257466887958063e-05, "loss": 1.43, "step": 30837 }, { "epoch": 2.43, "learning_rate": 2.625048152984072e-05, "loss": 1.434, "step": 30838 }, { "epoch": 2.43, "learning_rate": 2.6243497011914317e-05, "loss": 1.4319, "step": 30839 }, { "epoch": 2.43, "learning_rate": 2.623651333422624e-05, "loss": 1.4383, "step": 30840 }, { "epoch": 2.43, "learning_rate": 2.622953049682397e-05, "loss": 1.4613, "step": 30841 }, { "epoch": 2.43, "learning_rate": 2.6222548499754904e-05, "loss": 1.4486, "step": 30842 }, { "epoch": 2.43, "learning_rate": 2.621556734306637e-05, "loss": 1.4405, "step": 30843 }, { "epoch": 2.43, "learning_rate": 2.6208587026805828e-05, "loss": 1.5096, "step": 30844 }, { "epoch": 2.43, "learning_rate": 2.6201607551020708e-05, "loss": 1.4097, "step": 30845 }, { "epoch": 2.43, "learning_rate": 2.619462891575836e-05, "loss": 1.4683, "step": 30846 }, { "epoch": 2.43, "learning_rate": 2.6187651121066154e-05, "loss": 1.4101, "step": 30847 }, { "epoch": 2.43, "learning_rate": 2.6180674166991428e-05, "loss": 1.4715, "step": 30848 }, { "epoch": 2.43, "learning_rate": 2.6173698053581638e-05, "loss": 1.413, "step": 30849 }, { "epoch": 2.43, "learning_rate": 2.6166722780884114e-05, "loss": 1.4706, "step": 30850 }, { "epoch": 2.43, "learning_rate": 2.6159748348946154e-05, "loss": 1.4816, "step": 30851 }, { "epoch": 2.43, "learning_rate": 2.6152774757815215e-05, "loss": 1.4639, "step": 30852 }, { "epoch": 2.43, "learning_rate": 2.614580200753858e-05, "loss": 1.482, "step": 30853 }, { "epoch": 2.43, "learning_rate": 2.613883009816356e-05, "loss": 1.4868, "step": 30854 }, { "epoch": 2.43, "learning_rate": 2.6131859029737566e-05, "loss": 1.4247, "step": 30855 }, { "epoch": 2.43, "learning_rate": 2.6124888802307915e-05, "loss": 1.4353, "step": 30856 }, { "epoch": 2.43, "learning_rate": 2.6117919415921846e-05, "loss": 1.4219, "step": 30857 }, { "epoch": 2.43, "learning_rate": 2.611095087062679e-05, "loss": 1.4067, "step": 30858 }, { "epoch": 2.43, "learning_rate": 2.6103983166469977e-05, "loss": 1.4386, "step": 30859 }, { "epoch": 2.43, "learning_rate": 2.6097016303498784e-05, "loss": 1.4815, "step": 30860 }, { "epoch": 2.43, "learning_rate": 2.6090050281760427e-05, "loss": 1.4754, "step": 30861 }, { "epoch": 2.43, "learning_rate": 2.6083085101302298e-05, "loss": 1.4668, "step": 30862 }, { "epoch": 2.43, "learning_rate": 2.6076120762171627e-05, "loss": 1.4579, "step": 30863 }, { "epoch": 2.43, "learning_rate": 2.6069157264415724e-05, "loss": 1.4457, "step": 30864 }, { "epoch": 2.43, "learning_rate": 2.6062194608081805e-05, "loss": 1.49, "step": 30865 }, { "epoch": 2.43, "learning_rate": 2.605523279321723e-05, "loss": 1.4372, "step": 30866 }, { "epoch": 2.43, "learning_rate": 2.6048271819869227e-05, "loss": 1.4756, "step": 30867 }, { "epoch": 2.43, "learning_rate": 2.604131168808501e-05, "loss": 1.4803, "step": 30868 }, { "epoch": 2.43, "learning_rate": 2.6034352397911923e-05, "loss": 1.4304, "step": 30869 }, { "epoch": 2.43, "learning_rate": 2.602739394939718e-05, "loss": 1.4427, "step": 30870 }, { "epoch": 2.43, "learning_rate": 2.6020436342587975e-05, "loss": 1.4236, "step": 30871 }, { "epoch": 2.43, "learning_rate": 2.601347957753162e-05, "loss": 1.4352, "step": 30872 }, { "epoch": 2.43, "learning_rate": 2.600652365427533e-05, "loss": 1.4088, "step": 30873 }, { "epoch": 2.43, "learning_rate": 2.5999568572866282e-05, "loss": 1.4448, "step": 30874 }, { "epoch": 2.43, "learning_rate": 2.5992614333351718e-05, "loss": 1.4595, "step": 30875 }, { "epoch": 2.43, "learning_rate": 2.5985660935778925e-05, "loss": 1.4548, "step": 30876 }, { "epoch": 2.43, "learning_rate": 2.597870838019504e-05, "loss": 1.4454, "step": 30877 }, { "epoch": 2.43, "learning_rate": 2.5971756666647263e-05, "loss": 1.4429, "step": 30878 }, { "epoch": 2.43, "learning_rate": 2.596480579518284e-05, "loss": 1.4544, "step": 30879 }, { "epoch": 2.43, "learning_rate": 2.595785576584895e-05, "loss": 1.4191, "step": 30880 }, { "epoch": 2.43, "learning_rate": 2.5950906578692753e-05, "loss": 1.4506, "step": 30881 }, { "epoch": 2.43, "learning_rate": 2.5943958233761415e-05, "loss": 1.4743, "step": 30882 }, { "epoch": 2.43, "learning_rate": 2.5937010731102177e-05, "loss": 1.4595, "step": 30883 }, { "epoch": 2.43, "learning_rate": 2.5930064070762185e-05, "loss": 1.4246, "step": 30884 }, { "epoch": 2.43, "learning_rate": 2.5923118252788538e-05, "loss": 1.4545, "step": 30885 }, { "epoch": 2.43, "learning_rate": 2.591617327722848e-05, "loss": 1.4829, "step": 30886 }, { "epoch": 2.43, "learning_rate": 2.590922914412914e-05, "loss": 1.4258, "step": 30887 }, { "epoch": 2.43, "learning_rate": 2.5902285853537615e-05, "loss": 1.3898, "step": 30888 }, { "epoch": 2.43, "learning_rate": 2.589534340550113e-05, "loss": 1.4437, "step": 30889 }, { "epoch": 2.43, "learning_rate": 2.5888401800066733e-05, "loss": 1.4751, "step": 30890 }, { "epoch": 2.43, "learning_rate": 2.5881461037281636e-05, "loss": 1.5045, "step": 30891 }, { "epoch": 2.43, "learning_rate": 2.5874521117192885e-05, "loss": 1.4538, "step": 30892 }, { "epoch": 2.43, "learning_rate": 2.586758203984768e-05, "loss": 1.4576, "step": 30893 }, { "epoch": 2.43, "learning_rate": 2.5860643805293073e-05, "loss": 1.4926, "step": 30894 }, { "epoch": 2.43, "learning_rate": 2.585370641357617e-05, "loss": 1.4118, "step": 30895 }, { "epoch": 2.43, "learning_rate": 2.5846769864744128e-05, "loss": 1.4378, "step": 30896 }, { "epoch": 2.43, "learning_rate": 2.583983415884401e-05, "loss": 1.4555, "step": 30897 }, { "epoch": 2.43, "learning_rate": 2.5832899295922844e-05, "loss": 1.4351, "step": 30898 }, { "epoch": 2.43, "learning_rate": 2.5825965276027828e-05, "loss": 1.4262, "step": 30899 }, { "epoch": 2.43, "learning_rate": 2.581903209920597e-05, "loss": 1.482, "step": 30900 }, { "epoch": 2.43, "learning_rate": 2.5812099765504356e-05, "loss": 1.5204, "step": 30901 }, { "epoch": 2.43, "learning_rate": 2.5805168274970013e-05, "loss": 1.4415, "step": 30902 }, { "epoch": 2.43, "learning_rate": 2.579823762765008e-05, "loss": 1.4751, "step": 30903 }, { "epoch": 2.43, "learning_rate": 2.579130782359158e-05, "loss": 1.4701, "step": 30904 }, { "epoch": 2.43, "learning_rate": 2.5784378862841516e-05, "loss": 1.4334, "step": 30905 }, { "epoch": 2.43, "learning_rate": 2.577745074544697e-05, "loss": 1.4705, "step": 30906 }, { "epoch": 2.43, "learning_rate": 2.5770523471455025e-05, "loss": 1.461, "step": 30907 }, { "epoch": 2.43, "learning_rate": 2.5763597040912654e-05, "loss": 1.4641, "step": 30908 }, { "epoch": 2.43, "learning_rate": 2.575667145386687e-05, "loss": 1.4868, "step": 30909 }, { "epoch": 2.43, "learning_rate": 2.574974671036478e-05, "loss": 1.4182, "step": 30910 }, { "epoch": 2.43, "learning_rate": 2.574282281045331e-05, "loss": 1.4752, "step": 30911 }, { "epoch": 2.43, "learning_rate": 2.573589975417949e-05, "loss": 1.4199, "step": 30912 }, { "epoch": 2.43, "learning_rate": 2.5728977541590357e-05, "loss": 1.4746, "step": 30913 }, { "epoch": 2.43, "learning_rate": 2.5722056172732907e-05, "loss": 1.4059, "step": 30914 }, { "epoch": 2.43, "learning_rate": 2.5715135647654056e-05, "loss": 1.431, "step": 30915 }, { "epoch": 2.43, "learning_rate": 2.5708215966400896e-05, "loss": 1.4213, "step": 30916 }, { "epoch": 2.43, "learning_rate": 2.570129712902036e-05, "loss": 1.5146, "step": 30917 }, { "epoch": 2.43, "learning_rate": 2.5694379135559422e-05, "loss": 1.4754, "step": 30918 }, { "epoch": 2.43, "learning_rate": 2.5687461986065017e-05, "loss": 1.4885, "step": 30919 }, { "epoch": 2.43, "learning_rate": 2.568054568058417e-05, "loss": 1.4443, "step": 30920 }, { "epoch": 2.43, "learning_rate": 2.5673630219163825e-05, "loss": 1.454, "step": 30921 }, { "epoch": 2.43, "learning_rate": 2.5666715601850886e-05, "loss": 1.4652, "step": 30922 }, { "epoch": 2.43, "learning_rate": 2.5659801828692323e-05, "loss": 1.4477, "step": 30923 }, { "epoch": 2.43, "learning_rate": 2.5652888899735134e-05, "loss": 1.4224, "step": 30924 }, { "epoch": 2.43, "learning_rate": 2.5645976815026204e-05, "loss": 1.4938, "step": 30925 }, { "epoch": 2.43, "learning_rate": 2.5639065574612438e-05, "loss": 1.4419, "step": 30926 }, { "epoch": 2.43, "learning_rate": 2.563215517854082e-05, "loss": 1.4303, "step": 30927 }, { "epoch": 2.43, "learning_rate": 2.5625245626858242e-05, "loss": 1.4482, "step": 30928 }, { "epoch": 2.43, "learning_rate": 2.5618336919611572e-05, "loss": 1.4815, "step": 30929 }, { "epoch": 2.43, "learning_rate": 2.5611429056847782e-05, "loss": 1.4437, "step": 30930 }, { "epoch": 2.43, "learning_rate": 2.5604522038613757e-05, "loss": 1.4765, "step": 30931 }, { "epoch": 2.43, "learning_rate": 2.559761586495634e-05, "loss": 1.4707, "step": 30932 }, { "epoch": 2.43, "learning_rate": 2.5590710535922492e-05, "loss": 1.4883, "step": 30933 }, { "epoch": 2.43, "learning_rate": 2.5583806051559065e-05, "loss": 1.44, "step": 30934 }, { "epoch": 2.43, "learning_rate": 2.5576902411912947e-05, "loss": 1.4357, "step": 30935 }, { "epoch": 2.43, "learning_rate": 2.5569999617030957e-05, "loss": 1.4241, "step": 30936 }, { "epoch": 2.43, "learning_rate": 2.556309766696e-05, "loss": 1.435, "step": 30937 }, { "epoch": 2.43, "learning_rate": 2.5556196561746982e-05, "loss": 1.4677, "step": 30938 }, { "epoch": 2.43, "learning_rate": 2.5549296301438675e-05, "loss": 1.5214, "step": 30939 }, { "epoch": 2.43, "learning_rate": 2.5542396886081997e-05, "loss": 1.498, "step": 30940 }, { "epoch": 2.43, "learning_rate": 2.5535498315723783e-05, "loss": 1.4667, "step": 30941 }, { "epoch": 2.43, "learning_rate": 2.5528600590410843e-05, "loss": 1.4427, "step": 30942 }, { "epoch": 2.43, "learning_rate": 2.552170371018996e-05, "loss": 1.4534, "step": 30943 }, { "epoch": 2.43, "learning_rate": 2.5514807675108072e-05, "loss": 1.4458, "step": 30944 }, { "epoch": 2.43, "learning_rate": 2.550791248521194e-05, "loss": 1.3844, "step": 30945 }, { "epoch": 2.43, "learning_rate": 2.550101814054834e-05, "loss": 1.4548, "step": 30946 }, { "epoch": 2.43, "learning_rate": 2.549412464116417e-05, "loss": 1.4655, "step": 30947 }, { "epoch": 2.44, "learning_rate": 2.5487231987106176e-05, "loss": 1.4249, "step": 30948 }, { "epoch": 2.44, "learning_rate": 2.5480340178421138e-05, "loss": 1.4169, "step": 30949 }, { "epoch": 2.44, "learning_rate": 2.54734492151559e-05, "loss": 1.384, "step": 30950 }, { "epoch": 2.44, "learning_rate": 2.5466559097357224e-05, "loss": 1.4382, "step": 30951 }, { "epoch": 2.44, "learning_rate": 2.545966982507186e-05, "loss": 1.4267, "step": 30952 }, { "epoch": 2.44, "learning_rate": 2.54527813983466e-05, "loss": 1.4671, "step": 30953 }, { "epoch": 2.44, "learning_rate": 2.5445893817228274e-05, "loss": 1.4529, "step": 30954 }, { "epoch": 2.44, "learning_rate": 2.543900708176358e-05, "loss": 1.3741, "step": 30955 }, { "epoch": 2.44, "learning_rate": 2.543212119199926e-05, "loss": 1.4963, "step": 30956 }, { "epoch": 2.44, "learning_rate": 2.542523614798213e-05, "loss": 1.4821, "step": 30957 }, { "epoch": 2.44, "learning_rate": 2.5418351949758904e-05, "loss": 1.4846, "step": 30958 }, { "epoch": 2.44, "learning_rate": 2.5411468597376323e-05, "loss": 1.4329, "step": 30959 }, { "epoch": 2.44, "learning_rate": 2.5404586090881068e-05, "loss": 1.447, "step": 30960 }, { "epoch": 2.44, "learning_rate": 2.5397704430319954e-05, "loss": 1.4909, "step": 30961 }, { "epoch": 2.44, "learning_rate": 2.5390823615739675e-05, "loss": 1.4395, "step": 30962 }, { "epoch": 2.44, "learning_rate": 2.5383943647186894e-05, "loss": 1.4389, "step": 30963 }, { "epoch": 2.44, "learning_rate": 2.5377064524708406e-05, "loss": 1.4117, "step": 30964 }, { "epoch": 2.44, "learning_rate": 2.5370186248350878e-05, "loss": 1.4535, "step": 30965 }, { "epoch": 2.44, "learning_rate": 2.5363308818160965e-05, "loss": 1.4471, "step": 30966 }, { "epoch": 2.44, "learning_rate": 2.5356432234185454e-05, "loss": 1.4746, "step": 30967 }, { "epoch": 2.44, "learning_rate": 2.534955649647097e-05, "loss": 1.4278, "step": 30968 }, { "epoch": 2.44, "learning_rate": 2.534268160506419e-05, "loss": 1.4178, "step": 30969 }, { "epoch": 2.44, "learning_rate": 2.53358075600118e-05, "loss": 1.4324, "step": 30970 }, { "epoch": 2.44, "learning_rate": 2.532893436136051e-05, "loss": 1.4247, "step": 30971 }, { "epoch": 2.44, "learning_rate": 2.5322062009156964e-05, "loss": 1.4324, "step": 30972 }, { "epoch": 2.44, "learning_rate": 2.5315190503447792e-05, "loss": 1.3696, "step": 30973 }, { "epoch": 2.44, "learning_rate": 2.530831984427969e-05, "loss": 1.4624, "step": 30974 }, { "epoch": 2.44, "learning_rate": 2.5301450031699288e-05, "loss": 1.4522, "step": 30975 }, { "epoch": 2.44, "learning_rate": 2.5294581065753218e-05, "loss": 1.4471, "step": 30976 }, { "epoch": 2.44, "learning_rate": 2.5287712946488105e-05, "loss": 1.4429, "step": 30977 }, { "epoch": 2.44, "learning_rate": 2.5280845673950628e-05, "loss": 1.4567, "step": 30978 }, { "epoch": 2.44, "learning_rate": 2.5273979248187387e-05, "loss": 1.4604, "step": 30979 }, { "epoch": 2.44, "learning_rate": 2.5267113669244943e-05, "loss": 1.4744, "step": 30980 }, { "epoch": 2.44, "learning_rate": 2.5260248937170023e-05, "loss": 1.4235, "step": 30981 }, { "epoch": 2.44, "learning_rate": 2.525338505200916e-05, "loss": 1.4676, "step": 30982 }, { "epoch": 2.44, "learning_rate": 2.524652201380895e-05, "loss": 1.4656, "step": 30983 }, { "epoch": 2.44, "learning_rate": 2.5239659822616036e-05, "loss": 1.4951, "step": 30984 }, { "epoch": 2.44, "learning_rate": 2.523279847847695e-05, "loss": 1.4384, "step": 30985 }, { "epoch": 2.44, "learning_rate": 2.522593798143834e-05, "loss": 1.4574, "step": 30986 }, { "epoch": 2.44, "learning_rate": 2.5219078331546728e-05, "loss": 1.4261, "step": 30987 }, { "epoch": 2.44, "learning_rate": 2.521221952884875e-05, "loss": 1.4841, "step": 30988 }, { "epoch": 2.44, "learning_rate": 2.520536157339093e-05, "loss": 1.4591, "step": 30989 }, { "epoch": 2.44, "learning_rate": 2.5198504465219806e-05, "loss": 1.4249, "step": 30990 }, { "epoch": 2.44, "learning_rate": 2.5191648204382e-05, "loss": 1.4877, "step": 30991 }, { "epoch": 2.44, "learning_rate": 2.518479279092404e-05, "loss": 1.4322, "step": 30992 }, { "epoch": 2.44, "learning_rate": 2.5177938224892413e-05, "loss": 1.5093, "step": 30993 }, { "epoch": 2.44, "learning_rate": 2.5171084506333727e-05, "loss": 1.4259, "step": 30994 }, { "epoch": 2.44, "learning_rate": 2.5164231635294514e-05, "loss": 1.4517, "step": 30995 }, { "epoch": 2.44, "learning_rate": 2.5157379611821266e-05, "loss": 1.4154, "step": 30996 }, { "epoch": 2.44, "learning_rate": 2.515052843596048e-05, "loss": 1.4686, "step": 30997 }, { "epoch": 2.44, "learning_rate": 2.514367810775874e-05, "loss": 1.477, "step": 30998 }, { "epoch": 2.44, "learning_rate": 2.513682862726254e-05, "loss": 1.4516, "step": 30999 }, { "epoch": 2.44, "learning_rate": 2.5129979994518308e-05, "loss": 1.4581, "step": 31000 }, { "epoch": 2.44, "learning_rate": 2.5123132209572622e-05, "loss": 1.4445, "step": 31001 }, { "epoch": 2.44, "learning_rate": 2.511628527247198e-05, "loss": 1.4978, "step": 31002 }, { "epoch": 2.44, "learning_rate": 2.5109439183262863e-05, "loss": 1.4505, "step": 31003 }, { "epoch": 2.44, "learning_rate": 2.5102593941991683e-05, "loss": 1.463, "step": 31004 }, { "epoch": 2.44, "learning_rate": 2.5095749548705e-05, "loss": 1.4579, "step": 31005 }, { "epoch": 2.44, "learning_rate": 2.508890600344925e-05, "loss": 1.4673, "step": 31006 }, { "epoch": 2.44, "learning_rate": 2.508206330627087e-05, "loss": 1.3552, "step": 31007 }, { "epoch": 2.44, "learning_rate": 2.507522145721638e-05, "loss": 1.4734, "step": 31008 }, { "epoch": 2.44, "learning_rate": 2.5068380456332194e-05, "loss": 1.4252, "step": 31009 }, { "epoch": 2.44, "learning_rate": 2.5061540303664717e-05, "loss": 1.4531, "step": 31010 }, { "epoch": 2.44, "learning_rate": 2.5054700999260485e-05, "loss": 1.4635, "step": 31011 }, { "epoch": 2.44, "learning_rate": 2.5047862543165875e-05, "loss": 1.4349, "step": 31012 }, { "epoch": 2.44, "learning_rate": 2.504102493542732e-05, "loss": 1.4157, "step": 31013 }, { "epoch": 2.44, "learning_rate": 2.5034188176091206e-05, "loss": 1.4418, "step": 31014 }, { "epoch": 2.44, "learning_rate": 2.5027352265204043e-05, "loss": 1.4746, "step": 31015 }, { "epoch": 2.44, "learning_rate": 2.502051720281215e-05, "loss": 1.4889, "step": 31016 }, { "epoch": 2.44, "learning_rate": 2.5013682988962013e-05, "loss": 1.4645, "step": 31017 }, { "epoch": 2.44, "learning_rate": 2.500684962369996e-05, "loss": 1.4777, "step": 31018 }, { "epoch": 2.44, "learning_rate": 2.5000017107072467e-05, "loss": 1.4437, "step": 31019 }, { "epoch": 2.44, "learning_rate": 2.4993185439125867e-05, "loss": 1.4113, "step": 31020 }, { "epoch": 2.44, "learning_rate": 2.4986354619906523e-05, "loss": 1.4528, "step": 31021 }, { "epoch": 2.44, "learning_rate": 2.4979524649460865e-05, "loss": 1.4284, "step": 31022 }, { "epoch": 2.44, "learning_rate": 2.497269552783525e-05, "loss": 1.4583, "step": 31023 }, { "epoch": 2.44, "learning_rate": 2.4965867255076e-05, "loss": 1.4366, "step": 31024 }, { "epoch": 2.44, "learning_rate": 2.4959039831229555e-05, "loss": 1.4794, "step": 31025 }, { "epoch": 2.44, "learning_rate": 2.495221325634223e-05, "loss": 1.4681, "step": 31026 }, { "epoch": 2.44, "learning_rate": 2.494538753046032e-05, "loss": 1.4151, "step": 31027 }, { "epoch": 2.44, "learning_rate": 2.4938562653630255e-05, "loss": 1.4599, "step": 31028 }, { "epoch": 2.44, "learning_rate": 2.4931738625898335e-05, "loss": 1.464, "step": 31029 }, { "epoch": 2.44, "learning_rate": 2.49249154473109e-05, "loss": 1.4293, "step": 31030 }, { "epoch": 2.44, "learning_rate": 2.4918093117914236e-05, "loss": 1.4848, "step": 31031 }, { "epoch": 2.44, "learning_rate": 2.491127163775468e-05, "loss": 1.4835, "step": 31032 }, { "epoch": 2.44, "learning_rate": 2.490445100687859e-05, "loss": 1.5074, "step": 31033 }, { "epoch": 2.44, "learning_rate": 2.4897631225332253e-05, "loss": 1.4676, "step": 31034 }, { "epoch": 2.44, "learning_rate": 2.4890812293161937e-05, "loss": 1.4467, "step": 31035 }, { "epoch": 2.44, "learning_rate": 2.4883994210413987e-05, "loss": 1.4401, "step": 31036 }, { "epoch": 2.44, "learning_rate": 2.4877176977134684e-05, "loss": 1.4341, "step": 31037 }, { "epoch": 2.44, "learning_rate": 2.4870360593370255e-05, "loss": 1.4895, "step": 31038 }, { "epoch": 2.44, "learning_rate": 2.486354505916706e-05, "loss": 1.4766, "step": 31039 }, { "epoch": 2.44, "learning_rate": 2.4856730374571336e-05, "loss": 1.4426, "step": 31040 }, { "epoch": 2.44, "learning_rate": 2.4849916539629327e-05, "loss": 1.4208, "step": 31041 }, { "epoch": 2.44, "learning_rate": 2.4843103554387344e-05, "loss": 1.4267, "step": 31042 }, { "epoch": 2.44, "learning_rate": 2.4836291418891637e-05, "loss": 1.5063, "step": 31043 }, { "epoch": 2.44, "learning_rate": 2.4829480133188394e-05, "loss": 1.4997, "step": 31044 }, { "epoch": 2.44, "learning_rate": 2.4822669697323954e-05, "loss": 1.461, "step": 31045 }, { "epoch": 2.44, "learning_rate": 2.4815860111344495e-05, "loss": 1.4677, "step": 31046 }, { "epoch": 2.44, "learning_rate": 2.4809051375296225e-05, "loss": 1.4515, "step": 31047 }, { "epoch": 2.44, "learning_rate": 2.4802243489225426e-05, "loss": 1.4607, "step": 31048 }, { "epoch": 2.44, "learning_rate": 2.479543645317833e-05, "loss": 1.4816, "step": 31049 }, { "epoch": 2.44, "learning_rate": 2.4788630267201114e-05, "loss": 1.4487, "step": 31050 }, { "epoch": 2.44, "learning_rate": 2.478182493133998e-05, "loss": 1.4752, "step": 31051 }, { "epoch": 2.44, "learning_rate": 2.47750204456412e-05, "loss": 1.4499, "step": 31052 }, { "epoch": 2.44, "learning_rate": 2.4768216810150905e-05, "loss": 1.4564, "step": 31053 }, { "epoch": 2.44, "learning_rate": 2.4761414024915327e-05, "loss": 1.4563, "step": 31054 }, { "epoch": 2.44, "learning_rate": 2.475461208998058e-05, "loss": 1.439, "step": 31055 }, { "epoch": 2.44, "learning_rate": 2.474781100539294e-05, "loss": 1.4576, "step": 31056 }, { "epoch": 2.44, "learning_rate": 2.474101077119856e-05, "loss": 1.4357, "step": 31057 }, { "epoch": 2.44, "learning_rate": 2.4734211387443547e-05, "loss": 1.4416, "step": 31058 }, { "epoch": 2.44, "learning_rate": 2.472741285417415e-05, "loss": 1.4702, "step": 31059 }, { "epoch": 2.44, "learning_rate": 2.472061517143648e-05, "loss": 1.4213, "step": 31060 }, { "epoch": 2.44, "learning_rate": 2.4713818339276668e-05, "loss": 1.4458, "step": 31061 }, { "epoch": 2.44, "learning_rate": 2.470702235774093e-05, "loss": 1.4537, "step": 31062 }, { "epoch": 2.44, "learning_rate": 2.470022722687534e-05, "loss": 1.4429, "step": 31063 }, { "epoch": 2.44, "learning_rate": 2.4693432946726083e-05, "loss": 1.3762, "step": 31064 }, { "epoch": 2.44, "learning_rate": 2.4686639517339235e-05, "loss": 1.4444, "step": 31065 }, { "epoch": 2.44, "learning_rate": 2.4679846938760977e-05, "loss": 1.4428, "step": 31066 }, { "epoch": 2.44, "learning_rate": 2.4673055211037425e-05, "loss": 1.4566, "step": 31067 }, { "epoch": 2.44, "learning_rate": 2.4666264334214603e-05, "loss": 1.4824, "step": 31068 }, { "epoch": 2.44, "learning_rate": 2.4659474308338745e-05, "loss": 1.5117, "step": 31069 }, { "epoch": 2.44, "learning_rate": 2.4652685133455863e-05, "loss": 1.4178, "step": 31070 }, { "epoch": 2.44, "learning_rate": 2.464589680961209e-05, "loss": 1.4635, "step": 31071 }, { "epoch": 2.44, "learning_rate": 2.4639109336853464e-05, "loss": 1.4534, "step": 31072 }, { "epoch": 2.44, "learning_rate": 2.4632322715226138e-05, "loss": 1.4089, "step": 31073 }, { "epoch": 2.44, "learning_rate": 2.462553694477616e-05, "loss": 1.4325, "step": 31074 }, { "epoch": 2.45, "learning_rate": 2.4618752025549554e-05, "loss": 1.4531, "step": 31075 }, { "epoch": 2.45, "learning_rate": 2.461196795759249e-05, "loss": 1.3969, "step": 31076 }, { "epoch": 2.45, "learning_rate": 2.460518474095094e-05, "loss": 1.4551, "step": 31077 }, { "epoch": 2.45, "learning_rate": 2.459840237567097e-05, "loss": 1.4404, "step": 31078 }, { "epoch": 2.45, "learning_rate": 2.4591620861798634e-05, "loss": 1.4121, "step": 31079 }, { "epoch": 2.45, "learning_rate": 2.4584840199380034e-05, "loss": 1.4009, "step": 31080 }, { "epoch": 2.45, "learning_rate": 2.4578060388461156e-05, "loss": 1.4596, "step": 31081 }, { "epoch": 2.45, "learning_rate": 2.4571281429087997e-05, "loss": 1.418, "step": 31082 }, { "epoch": 2.45, "learning_rate": 2.456450332130665e-05, "loss": 1.437, "step": 31083 }, { "epoch": 2.45, "learning_rate": 2.4557726065163114e-05, "loss": 1.4418, "step": 31084 }, { "epoch": 2.45, "learning_rate": 2.455094966070335e-05, "loss": 1.4463, "step": 31085 }, { "epoch": 2.45, "learning_rate": 2.454417410797344e-05, "loss": 1.4751, "step": 31086 }, { "epoch": 2.45, "learning_rate": 2.4537399407019366e-05, "loss": 1.4386, "step": 31087 }, { "epoch": 2.45, "learning_rate": 2.4530625557887118e-05, "loss": 1.4884, "step": 31088 }, { "epoch": 2.45, "learning_rate": 2.452385256062263e-05, "loss": 1.4076, "step": 31089 }, { "epoch": 2.45, "learning_rate": 2.4517080415272002e-05, "loss": 1.4693, "step": 31090 }, { "epoch": 2.45, "learning_rate": 2.4510309121881122e-05, "loss": 1.4318, "step": 31091 }, { "epoch": 2.45, "learning_rate": 2.4503538680495977e-05, "loss": 1.4541, "step": 31092 }, { "epoch": 2.45, "learning_rate": 2.4496769091162576e-05, "loss": 1.4544, "step": 31093 }, { "epoch": 2.45, "learning_rate": 2.4490000353926853e-05, "loss": 1.401, "step": 31094 }, { "epoch": 2.45, "learning_rate": 2.4483232468834736e-05, "loss": 1.4023, "step": 31095 }, { "epoch": 2.45, "learning_rate": 2.44764654359322e-05, "loss": 1.4569, "step": 31096 }, { "epoch": 2.45, "learning_rate": 2.4469699255265235e-05, "loss": 1.4696, "step": 31097 }, { "epoch": 2.45, "learning_rate": 2.446293392687973e-05, "loss": 1.445, "step": 31098 }, { "epoch": 2.45, "learning_rate": 2.4456169450821584e-05, "loss": 1.4534, "step": 31099 }, { "epoch": 2.45, "learning_rate": 2.4449405827136825e-05, "loss": 1.461, "step": 31100 }, { "epoch": 2.45, "learning_rate": 2.4442643055871303e-05, "loss": 1.4793, "step": 31101 }, { "epoch": 2.45, "learning_rate": 2.4435881137070913e-05, "loss": 1.4723, "step": 31102 }, { "epoch": 2.45, "learning_rate": 2.442912007078163e-05, "loss": 1.4069, "step": 31103 }, { "epoch": 2.45, "learning_rate": 2.442235985704933e-05, "loss": 1.4546, "step": 31104 }, { "epoch": 2.45, "learning_rate": 2.441560049591986e-05, "loss": 1.4421, "step": 31105 }, { "epoch": 2.45, "learning_rate": 2.4408841987439214e-05, "loss": 1.4769, "step": 31106 }, { "epoch": 2.45, "learning_rate": 2.4402084331653217e-05, "loss": 1.4279, "step": 31107 }, { "epoch": 2.45, "learning_rate": 2.439532752860776e-05, "loss": 1.4573, "step": 31108 }, { "epoch": 2.45, "learning_rate": 2.4388571578348665e-05, "loss": 1.4767, "step": 31109 }, { "epoch": 2.45, "learning_rate": 2.4381816480921856e-05, "loss": 1.4604, "step": 31110 }, { "epoch": 2.45, "learning_rate": 2.4375062236373234e-05, "loss": 1.4026, "step": 31111 }, { "epoch": 2.45, "learning_rate": 2.4368308844748625e-05, "loss": 1.4333, "step": 31112 }, { "epoch": 2.45, "learning_rate": 2.436155630609381e-05, "loss": 1.4537, "step": 31113 }, { "epoch": 2.45, "learning_rate": 2.4354804620454738e-05, "loss": 1.4116, "step": 31114 }, { "epoch": 2.45, "learning_rate": 2.434805378787722e-05, "loss": 1.4354, "step": 31115 }, { "epoch": 2.45, "learning_rate": 2.434130380840702e-05, "loss": 1.4148, "step": 31116 }, { "epoch": 2.45, "learning_rate": 2.433455468209007e-05, "loss": 1.5019, "step": 31117 }, { "epoch": 2.45, "learning_rate": 2.4327806408972146e-05, "loss": 1.457, "step": 31118 }, { "epoch": 2.45, "learning_rate": 2.4321058989099012e-05, "loss": 1.4415, "step": 31119 }, { "epoch": 2.45, "learning_rate": 2.4314312422516587e-05, "loss": 1.4831, "step": 31120 }, { "epoch": 2.45, "learning_rate": 2.4307566709270626e-05, "loss": 1.4729, "step": 31121 }, { "epoch": 2.45, "learning_rate": 2.4300821849406866e-05, "loss": 1.4277, "step": 31122 }, { "epoch": 2.45, "learning_rate": 2.4294077842971216e-05, "loss": 1.4618, "step": 31123 }, { "epoch": 2.45, "learning_rate": 2.428733469000939e-05, "loss": 1.4431, "step": 31124 }, { "epoch": 2.45, "learning_rate": 2.4280592390567204e-05, "loss": 1.4488, "step": 31125 }, { "epoch": 2.45, "learning_rate": 2.427385094469034e-05, "loss": 1.4629, "step": 31126 }, { "epoch": 2.45, "learning_rate": 2.4267110352424718e-05, "loss": 1.4248, "step": 31127 }, { "epoch": 2.45, "learning_rate": 2.4260370613816025e-05, "loss": 1.4445, "step": 31128 }, { "epoch": 2.45, "learning_rate": 2.4253631728910045e-05, "loss": 1.4406, "step": 31129 }, { "epoch": 2.45, "learning_rate": 2.424689369775245e-05, "loss": 1.4342, "step": 31130 }, { "epoch": 2.45, "learning_rate": 2.424015652038911e-05, "loss": 1.3804, "step": 31131 }, { "epoch": 2.45, "learning_rate": 2.42334201968657e-05, "loss": 1.4492, "step": 31132 }, { "epoch": 2.45, "learning_rate": 2.422668472722792e-05, "loss": 1.5045, "step": 31133 }, { "epoch": 2.45, "learning_rate": 2.421995011152158e-05, "loss": 1.535, "step": 31134 }, { "epoch": 2.45, "learning_rate": 2.421321634979238e-05, "loss": 1.4892, "step": 31135 }, { "epoch": 2.45, "learning_rate": 2.4206483442085983e-05, "loss": 1.4522, "step": 31136 }, { "epoch": 2.45, "learning_rate": 2.4199751388448186e-05, "loss": 1.4347, "step": 31137 }, { "epoch": 2.45, "learning_rate": 2.4193020188924632e-05, "loss": 1.4378, "step": 31138 }, { "epoch": 2.45, "learning_rate": 2.418628984356104e-05, "loss": 1.4444, "step": 31139 }, { "epoch": 2.45, "learning_rate": 2.417956035240312e-05, "loss": 1.4625, "step": 31140 }, { "epoch": 2.45, "learning_rate": 2.4172831715496572e-05, "loss": 1.4585, "step": 31141 }, { "epoch": 2.45, "learning_rate": 2.4166103932887004e-05, "loss": 1.4234, "step": 31142 }, { "epoch": 2.45, "learning_rate": 2.4159377004620167e-05, "loss": 1.4099, "step": 31143 }, { "epoch": 2.45, "learning_rate": 2.415265093074174e-05, "loss": 1.4721, "step": 31144 }, { "epoch": 2.45, "learning_rate": 2.414592571129737e-05, "loss": 1.4552, "step": 31145 }, { "epoch": 2.45, "learning_rate": 2.413920134633272e-05, "loss": 1.4444, "step": 31146 }, { "epoch": 2.45, "learning_rate": 2.4132477835893387e-05, "loss": 1.5256, "step": 31147 }, { "epoch": 2.45, "learning_rate": 2.412575518002512e-05, "loss": 1.4059, "step": 31148 }, { "epoch": 2.45, "learning_rate": 2.4119033378773494e-05, "loss": 1.4617, "step": 31149 }, { "epoch": 2.45, "learning_rate": 2.4112312432184144e-05, "loss": 1.4292, "step": 31150 }, { "epoch": 2.45, "learning_rate": 2.4105592340302764e-05, "loss": 1.4498, "step": 31151 }, { "epoch": 2.45, "learning_rate": 2.4098873103174922e-05, "loss": 1.4317, "step": 31152 }, { "epoch": 2.45, "learning_rate": 2.4092154720846224e-05, "loss": 1.451, "step": 31153 }, { "epoch": 2.45, "learning_rate": 2.408543719336234e-05, "loss": 1.4842, "step": 31154 }, { "epoch": 2.45, "learning_rate": 2.407872052076886e-05, "loss": 1.4408, "step": 31155 }, { "epoch": 2.45, "learning_rate": 2.4072004703111343e-05, "loss": 1.4382, "step": 31156 }, { "epoch": 2.45, "learning_rate": 2.4065289740435424e-05, "loss": 1.4703, "step": 31157 }, { "epoch": 2.45, "learning_rate": 2.405857563278672e-05, "loss": 1.4315, "step": 31158 }, { "epoch": 2.45, "learning_rate": 2.4051862380210795e-05, "loss": 1.4623, "step": 31159 }, { "epoch": 2.45, "learning_rate": 2.404514998275318e-05, "loss": 1.4865, "step": 31160 }, { "epoch": 2.45, "learning_rate": 2.4038438440459522e-05, "loss": 1.4754, "step": 31161 }, { "epoch": 2.45, "learning_rate": 2.403172775337537e-05, "loss": 1.4601, "step": 31162 }, { "epoch": 2.45, "learning_rate": 2.402501792154623e-05, "loss": 1.4995, "step": 31163 }, { "epoch": 2.45, "learning_rate": 2.4018308945017724e-05, "loss": 1.4896, "step": 31164 }, { "epoch": 2.45, "learning_rate": 2.401160082383539e-05, "loss": 1.4523, "step": 31165 }, { "epoch": 2.45, "learning_rate": 2.4004893558044752e-05, "loss": 1.446, "step": 31166 }, { "epoch": 2.45, "learning_rate": 2.3998187147691315e-05, "loss": 1.3967, "step": 31167 }, { "epoch": 2.45, "learning_rate": 2.3991481592820698e-05, "loss": 1.3914, "step": 31168 }, { "epoch": 2.45, "learning_rate": 2.3984776893478395e-05, "loss": 1.4424, "step": 31169 }, { "epoch": 2.45, "learning_rate": 2.3978073049709873e-05, "loss": 1.4604, "step": 31170 }, { "epoch": 2.45, "learning_rate": 2.3971370061560708e-05, "loss": 1.4714, "step": 31171 }, { "epoch": 2.45, "learning_rate": 2.3964667929076414e-05, "loss": 1.4017, "step": 31172 }, { "epoch": 2.45, "learning_rate": 2.3957966652302424e-05, "loss": 1.4378, "step": 31173 }, { "epoch": 2.45, "learning_rate": 2.39512662312843e-05, "loss": 1.4352, "step": 31174 }, { "epoch": 2.45, "learning_rate": 2.3944566666067538e-05, "loss": 1.3578, "step": 31175 }, { "epoch": 2.45, "learning_rate": 2.393786795669762e-05, "loss": 1.464, "step": 31176 }, { "epoch": 2.45, "learning_rate": 2.393117010321996e-05, "loss": 1.4586, "step": 31177 }, { "epoch": 2.45, "learning_rate": 2.3924473105680137e-05, "loss": 1.4205, "step": 31178 }, { "epoch": 2.45, "learning_rate": 2.3917776964123547e-05, "loss": 1.4878, "step": 31179 }, { "epoch": 2.45, "learning_rate": 2.3911081678595655e-05, "loss": 1.5079, "step": 31180 }, { "epoch": 2.45, "learning_rate": 2.390438724914196e-05, "loss": 1.4287, "step": 31181 }, { "epoch": 2.45, "learning_rate": 2.3897693675807904e-05, "loss": 1.377, "step": 31182 }, { "epoch": 2.45, "learning_rate": 2.3891000958638905e-05, "loss": 1.48, "step": 31183 }, { "epoch": 2.45, "learning_rate": 2.3884309097680394e-05, "loss": 1.4446, "step": 31184 }, { "epoch": 2.45, "learning_rate": 2.3877618092977864e-05, "loss": 1.4572, "step": 31185 }, { "epoch": 2.45, "learning_rate": 2.3870927944576695e-05, "loss": 1.4076, "step": 31186 }, { "epoch": 2.45, "learning_rate": 2.386423865252229e-05, "loss": 1.429, "step": 31187 }, { "epoch": 2.45, "learning_rate": 2.385755021686014e-05, "loss": 1.46, "step": 31188 }, { "epoch": 2.45, "learning_rate": 2.385086263763556e-05, "loss": 1.4844, "step": 31189 }, { "epoch": 2.45, "learning_rate": 2.3844175914894065e-05, "loss": 1.4016, "step": 31190 }, { "epoch": 2.45, "learning_rate": 2.383749004868095e-05, "loss": 1.4753, "step": 31191 }, { "epoch": 2.45, "learning_rate": 2.3830805039041682e-05, "loss": 1.4942, "step": 31192 }, { "epoch": 2.45, "learning_rate": 2.3824120886021643e-05, "loss": 1.4451, "step": 31193 }, { "epoch": 2.45, "learning_rate": 2.3817437589666138e-05, "loss": 1.4295, "step": 31194 }, { "epoch": 2.45, "learning_rate": 2.3810755150020637e-05, "loss": 1.4035, "step": 31195 }, { "epoch": 2.45, "learning_rate": 2.3804073567130487e-05, "loss": 1.4272, "step": 31196 }, { "epoch": 2.45, "learning_rate": 2.3797392841040984e-05, "loss": 1.4546, "step": 31197 }, { "epoch": 2.45, "learning_rate": 2.3790712971797592e-05, "loss": 1.3829, "step": 31198 }, { "epoch": 2.45, "learning_rate": 2.378403395944559e-05, "loss": 1.4444, "step": 31199 }, { "epoch": 2.45, "learning_rate": 2.3777355804030362e-05, "loss": 1.4131, "step": 31200 }, { "epoch": 2.45, "learning_rate": 2.37706785055972e-05, "loss": 1.4353, "step": 31201 }, { "epoch": 2.46, "learning_rate": 2.376400206419149e-05, "loss": 1.4052, "step": 31202 }, { "epoch": 2.46, "learning_rate": 2.3757326479858556e-05, "loss": 1.4955, "step": 31203 }, { "epoch": 2.46, "learning_rate": 2.3750651752643667e-05, "loss": 1.435, "step": 31204 }, { "epoch": 2.46, "learning_rate": 2.3743977882592185e-05, "loss": 1.4441, "step": 31205 }, { "epoch": 2.46, "learning_rate": 2.3737304869749458e-05, "loss": 1.3819, "step": 31206 }, { "epoch": 2.46, "learning_rate": 2.3730632714160746e-05, "loss": 1.4665, "step": 31207 }, { "epoch": 2.46, "learning_rate": 2.3723961415871336e-05, "loss": 1.4526, "step": 31208 }, { "epoch": 2.46, "learning_rate": 2.3717290974926567e-05, "loss": 1.4552, "step": 31209 }, { "epoch": 2.46, "learning_rate": 2.371062139137171e-05, "loss": 1.4796, "step": 31210 }, { "epoch": 2.46, "learning_rate": 2.370395266525199e-05, "loss": 1.5206, "step": 31211 }, { "epoch": 2.46, "learning_rate": 2.3697284796612793e-05, "loss": 1.4784, "step": 31212 }, { "epoch": 2.46, "learning_rate": 2.369061778549931e-05, "loss": 1.4701, "step": 31213 }, { "epoch": 2.46, "learning_rate": 2.368395163195681e-05, "loss": 1.4006, "step": 31214 }, { "epoch": 2.46, "learning_rate": 2.3677286336030604e-05, "loss": 1.4659, "step": 31215 }, { "epoch": 2.46, "learning_rate": 2.3670621897765905e-05, "loss": 1.4319, "step": 31216 }, { "epoch": 2.46, "learning_rate": 2.3663958317207948e-05, "loss": 1.4842, "step": 31217 }, { "epoch": 2.46, "learning_rate": 2.3657295594402024e-05, "loss": 1.457, "step": 31218 }, { "epoch": 2.46, "learning_rate": 2.3650633729393336e-05, "loss": 1.4688, "step": 31219 }, { "epoch": 2.46, "learning_rate": 2.3643972722227094e-05, "loss": 1.438, "step": 31220 }, { "epoch": 2.46, "learning_rate": 2.3637312572948547e-05, "loss": 1.4195, "step": 31221 }, { "epoch": 2.46, "learning_rate": 2.363065328160294e-05, "loss": 1.4234, "step": 31222 }, { "epoch": 2.46, "learning_rate": 2.3623994848235473e-05, "loss": 1.4118, "step": 31223 }, { "epoch": 2.46, "learning_rate": 2.3617337272891325e-05, "loss": 1.4733, "step": 31224 }, { "epoch": 2.46, "learning_rate": 2.361068055561569e-05, "loss": 1.4802, "step": 31225 }, { "epoch": 2.46, "learning_rate": 2.3604024696453822e-05, "loss": 1.4538, "step": 31226 }, { "epoch": 2.46, "learning_rate": 2.359736969545088e-05, "loss": 1.4308, "step": 31227 }, { "epoch": 2.46, "learning_rate": 2.3590715552651995e-05, "loss": 1.4748, "step": 31228 }, { "epoch": 2.46, "learning_rate": 2.3584062268102434e-05, "loss": 1.4201, "step": 31229 }, { "epoch": 2.46, "learning_rate": 2.3577409841847324e-05, "loss": 1.4184, "step": 31230 }, { "epoch": 2.46, "learning_rate": 2.357075827393181e-05, "loss": 1.4058, "step": 31231 }, { "epoch": 2.46, "learning_rate": 2.3564107564401115e-05, "loss": 1.4445, "step": 31232 }, { "epoch": 2.46, "learning_rate": 2.355745771330034e-05, "loss": 1.468, "step": 31233 }, { "epoch": 2.46, "learning_rate": 2.355080872067463e-05, "loss": 1.4186, "step": 31234 }, { "epoch": 2.46, "learning_rate": 2.3544160586569172e-05, "loss": 1.5129, "step": 31235 }, { "epoch": 2.46, "learning_rate": 2.353751331102905e-05, "loss": 1.4643, "step": 31236 }, { "epoch": 2.46, "learning_rate": 2.353086689409946e-05, "loss": 1.4384, "step": 31237 }, { "epoch": 2.46, "learning_rate": 2.3524221335825465e-05, "loss": 1.4278, "step": 31238 }, { "epoch": 2.46, "learning_rate": 2.3517576636252235e-05, "loss": 1.4622, "step": 31239 }, { "epoch": 2.46, "learning_rate": 2.351093279542486e-05, "loss": 1.4463, "step": 31240 }, { "epoch": 2.46, "learning_rate": 2.3504289813388454e-05, "loss": 1.4627, "step": 31241 }, { "epoch": 2.46, "learning_rate": 2.349764769018809e-05, "loss": 1.4293, "step": 31242 }, { "epoch": 2.46, "learning_rate": 2.3491006425868903e-05, "loss": 1.4729, "step": 31243 }, { "epoch": 2.46, "learning_rate": 2.348436602047598e-05, "loss": 1.4093, "step": 31244 }, { "epoch": 2.46, "learning_rate": 2.347772647405437e-05, "loss": 1.4021, "step": 31245 }, { "epoch": 2.46, "learning_rate": 2.3471087786649202e-05, "loss": 1.4208, "step": 31246 }, { "epoch": 2.46, "learning_rate": 2.346444995830552e-05, "loss": 1.4934, "step": 31247 }, { "epoch": 2.46, "learning_rate": 2.345781298906836e-05, "loss": 1.4185, "step": 31248 }, { "epoch": 2.46, "learning_rate": 2.3451176878982848e-05, "loss": 1.4092, "step": 31249 }, { "epoch": 2.46, "learning_rate": 2.3444541628094017e-05, "loss": 1.4601, "step": 31250 }, { "epoch": 2.46, "learning_rate": 2.343790723644688e-05, "loss": 1.4554, "step": 31251 }, { "epoch": 2.46, "learning_rate": 2.34312737040865e-05, "loss": 1.4647, "step": 31252 }, { "epoch": 2.46, "learning_rate": 2.3424641031057962e-05, "loss": 1.4115, "step": 31253 }, { "epoch": 2.46, "learning_rate": 2.341800921740626e-05, "loss": 1.438, "step": 31254 }, { "epoch": 2.46, "learning_rate": 2.341137826317639e-05, "loss": 1.4265, "step": 31255 }, { "epoch": 2.46, "learning_rate": 2.3404748168413434e-05, "loss": 1.411, "step": 31256 }, { "epoch": 2.46, "learning_rate": 2.339811893316239e-05, "loss": 1.4131, "step": 31257 }, { "epoch": 2.46, "learning_rate": 2.339149055746824e-05, "loss": 1.438, "step": 31258 }, { "epoch": 2.46, "learning_rate": 2.3384863041375963e-05, "loss": 1.447, "step": 31259 }, { "epoch": 2.46, "learning_rate": 2.3378236384930638e-05, "loss": 1.5095, "step": 31260 }, { "epoch": 2.46, "learning_rate": 2.3371610588177214e-05, "loss": 1.4418, "step": 31261 }, { "epoch": 2.46, "learning_rate": 2.336498565116064e-05, "loss": 1.4122, "step": 31262 }, { "epoch": 2.46, "learning_rate": 2.335836157392596e-05, "loss": 1.4596, "step": 31263 }, { "epoch": 2.46, "learning_rate": 2.3351738356518125e-05, "loss": 1.4458, "step": 31264 }, { "epoch": 2.46, "learning_rate": 2.334511599898206e-05, "loss": 1.443, "step": 31265 }, { "epoch": 2.46, "learning_rate": 2.3338494501362786e-05, "loss": 1.4224, "step": 31266 }, { "epoch": 2.46, "learning_rate": 2.3331873863705214e-05, "loss": 1.4263, "step": 31267 }, { "epoch": 2.46, "learning_rate": 2.3325254086054356e-05, "loss": 1.4392, "step": 31268 }, { "epoch": 2.46, "learning_rate": 2.3318635168455063e-05, "loss": 1.4394, "step": 31269 }, { "epoch": 2.46, "learning_rate": 2.331201711095238e-05, "loss": 1.5033, "step": 31270 }, { "epoch": 2.46, "learning_rate": 2.330539991359119e-05, "loss": 1.4304, "step": 31271 }, { "epoch": 2.46, "learning_rate": 2.3298783576416385e-05, "loss": 1.4192, "step": 31272 }, { "epoch": 2.46, "learning_rate": 2.3292168099472937e-05, "loss": 1.4043, "step": 31273 }, { "epoch": 2.46, "learning_rate": 2.328555348280577e-05, "loss": 1.4287, "step": 31274 }, { "epoch": 2.46, "learning_rate": 2.3278939726459716e-05, "loss": 1.4253, "step": 31275 }, { "epoch": 2.46, "learning_rate": 2.327232683047976e-05, "loss": 1.4808, "step": 31276 }, { "epoch": 2.46, "learning_rate": 2.3265714794910776e-05, "loss": 1.4615, "step": 31277 }, { "epoch": 2.46, "learning_rate": 2.325910361979767e-05, "loss": 1.4306, "step": 31278 }, { "epoch": 2.46, "learning_rate": 2.3252493305185248e-05, "loss": 1.4141, "step": 31279 }, { "epoch": 2.46, "learning_rate": 2.3245883851118496e-05, "loss": 1.4562, "step": 31280 }, { "epoch": 2.46, "learning_rate": 2.323927525764226e-05, "loss": 1.4225, "step": 31281 }, { "epoch": 2.46, "learning_rate": 2.3232667524801335e-05, "loss": 1.4491, "step": 31282 }, { "epoch": 2.46, "learning_rate": 2.3226060652640656e-05, "loss": 1.4224, "step": 31283 }, { "epoch": 2.46, "learning_rate": 2.321945464120508e-05, "loss": 1.4639, "step": 31284 }, { "epoch": 2.46, "learning_rate": 2.3212849490539463e-05, "loss": 1.4592, "step": 31285 }, { "epoch": 2.46, "learning_rate": 2.32062452006886e-05, "loss": 1.4645, "step": 31286 }, { "epoch": 2.46, "learning_rate": 2.3199641771697386e-05, "loss": 1.4779, "step": 31287 }, { "epoch": 2.46, "learning_rate": 2.319303920361062e-05, "loss": 1.4229, "step": 31288 }, { "epoch": 2.46, "learning_rate": 2.3186437496473115e-05, "loss": 1.4488, "step": 31289 }, { "epoch": 2.46, "learning_rate": 2.3179836650329752e-05, "loss": 1.46, "step": 31290 }, { "epoch": 2.46, "learning_rate": 2.317323666522533e-05, "loss": 1.4377, "step": 31291 }, { "epoch": 2.46, "learning_rate": 2.316663754120458e-05, "loss": 1.4836, "step": 31292 }, { "epoch": 2.46, "learning_rate": 2.3160039278312416e-05, "loss": 1.4488, "step": 31293 }, { "epoch": 2.46, "learning_rate": 2.3153441876593597e-05, "loss": 1.4797, "step": 31294 }, { "epoch": 2.46, "learning_rate": 2.3146845336092895e-05, "loss": 1.4706, "step": 31295 }, { "epoch": 2.46, "learning_rate": 2.3140249656855087e-05, "loss": 1.4348, "step": 31296 }, { "epoch": 2.46, "learning_rate": 2.3133654838925005e-05, "loss": 1.4942, "step": 31297 }, { "epoch": 2.46, "learning_rate": 2.3127060882347392e-05, "loss": 1.4773, "step": 31298 }, { "epoch": 2.46, "learning_rate": 2.3120467787166986e-05, "loss": 1.4479, "step": 31299 }, { "epoch": 2.46, "learning_rate": 2.3113875553428597e-05, "loss": 1.4149, "step": 31300 }, { "epoch": 2.46, "learning_rate": 2.3107284181176987e-05, "loss": 1.4218, "step": 31301 }, { "epoch": 2.46, "learning_rate": 2.310069367045691e-05, "loss": 1.4829, "step": 31302 }, { "epoch": 2.46, "learning_rate": 2.309410402131306e-05, "loss": 1.4999, "step": 31303 }, { "epoch": 2.46, "learning_rate": 2.308751523379023e-05, "loss": 1.4297, "step": 31304 }, { "epoch": 2.46, "learning_rate": 2.308092730793316e-05, "loss": 1.3891, "step": 31305 }, { "epoch": 2.46, "learning_rate": 2.3074340243786494e-05, "loss": 1.4166, "step": 31306 }, { "epoch": 2.46, "learning_rate": 2.306775404139506e-05, "loss": 1.4152, "step": 31307 }, { "epoch": 2.46, "learning_rate": 2.306116870080354e-05, "loss": 1.4152, "step": 31308 }, { "epoch": 2.46, "learning_rate": 2.3054584222056583e-05, "loss": 1.4906, "step": 31309 }, { "epoch": 2.46, "learning_rate": 2.3048000605198986e-05, "loss": 1.4997, "step": 31310 }, { "epoch": 2.46, "learning_rate": 2.3041417850275395e-05, "loss": 1.42, "step": 31311 }, { "epoch": 2.46, "learning_rate": 2.3034835957330526e-05, "loss": 1.494, "step": 31312 }, { "epoch": 2.46, "learning_rate": 2.302825492640903e-05, "loss": 1.4129, "step": 31313 }, { "epoch": 2.46, "learning_rate": 2.302167475755563e-05, "loss": 1.4222, "step": 31314 }, { "epoch": 2.46, "learning_rate": 2.3015095450814962e-05, "loss": 1.4539, "step": 31315 }, { "epoch": 2.46, "learning_rate": 2.3008517006231725e-05, "loss": 1.4941, "step": 31316 }, { "epoch": 2.46, "learning_rate": 2.3001939423850595e-05, "loss": 1.3757, "step": 31317 }, { "epoch": 2.46, "learning_rate": 2.2995362703716226e-05, "loss": 1.4533, "step": 31318 }, { "epoch": 2.46, "learning_rate": 2.298878684587326e-05, "loss": 1.4786, "step": 31319 }, { "epoch": 2.46, "learning_rate": 2.298221185036631e-05, "loss": 1.4346, "step": 31320 }, { "epoch": 2.46, "learning_rate": 2.2975637717240065e-05, "loss": 1.4382, "step": 31321 }, { "epoch": 2.46, "learning_rate": 2.296906444653915e-05, "loss": 1.4275, "step": 31322 }, { "epoch": 2.46, "learning_rate": 2.296249203830816e-05, "loss": 1.405, "step": 31323 }, { "epoch": 2.46, "learning_rate": 2.2955920492591766e-05, "loss": 1.4492, "step": 31324 }, { "epoch": 2.46, "learning_rate": 2.2949349809434566e-05, "loss": 1.4717, "step": 31325 }, { "epoch": 2.46, "learning_rate": 2.2942779988881133e-05, "loss": 1.4796, "step": 31326 }, { "epoch": 2.46, "learning_rate": 2.2936211030976153e-05, "loss": 1.405, "step": 31327 }, { "epoch": 2.46, "learning_rate": 2.2929642935764175e-05, "loss": 1.4216, "step": 31328 }, { "epoch": 2.47, "learning_rate": 2.292307570328976e-05, "loss": 1.4538, "step": 31329 }, { "epoch": 2.47, "learning_rate": 2.2916509333597527e-05, "loss": 1.467, "step": 31330 }, { "epoch": 2.47, "learning_rate": 2.2909943826732102e-05, "loss": 1.479, "step": 31331 }, { "epoch": 2.47, "learning_rate": 2.2903379182738035e-05, "loss": 1.468, "step": 31332 }, { "epoch": 2.47, "learning_rate": 2.2896815401659857e-05, "loss": 1.4194, "step": 31333 }, { "epoch": 2.47, "learning_rate": 2.289025248354218e-05, "loss": 1.4243, "step": 31334 }, { "epoch": 2.47, "learning_rate": 2.288369042842954e-05, "loss": 1.4433, "step": 31335 }, { "epoch": 2.47, "learning_rate": 2.2877129236366513e-05, "loss": 1.4481, "step": 31336 }, { "epoch": 2.47, "learning_rate": 2.2870568907397567e-05, "loss": 1.4706, "step": 31337 }, { "epoch": 2.47, "learning_rate": 2.2864009441567367e-05, "loss": 1.5242, "step": 31338 }, { "epoch": 2.47, "learning_rate": 2.2857450838920356e-05, "loss": 1.4518, "step": 31339 }, { "epoch": 2.47, "learning_rate": 2.2850893099501068e-05, "loss": 1.4609, "step": 31340 }, { "epoch": 2.47, "learning_rate": 2.2844336223354083e-05, "loss": 1.4839, "step": 31341 }, { "epoch": 2.47, "learning_rate": 2.283778021052388e-05, "loss": 1.4364, "step": 31342 }, { "epoch": 2.47, "learning_rate": 2.283122506105495e-05, "loss": 1.4631, "step": 31343 }, { "epoch": 2.47, "learning_rate": 2.282467077499186e-05, "loss": 1.4382, "step": 31344 }, { "epoch": 2.47, "learning_rate": 2.2818117352379066e-05, "loss": 1.4232, "step": 31345 }, { "epoch": 2.47, "learning_rate": 2.2811564793261034e-05, "loss": 1.4044, "step": 31346 }, { "epoch": 2.47, "learning_rate": 2.2805013097682308e-05, "loss": 1.4361, "step": 31347 }, { "epoch": 2.47, "learning_rate": 2.2798462265687366e-05, "loss": 1.4452, "step": 31348 }, { "epoch": 2.47, "learning_rate": 2.2791912297320664e-05, "loss": 1.4355, "step": 31349 }, { "epoch": 2.47, "learning_rate": 2.278536319262666e-05, "loss": 1.4076, "step": 31350 }, { "epoch": 2.47, "learning_rate": 2.277881495164987e-05, "loss": 1.4407, "step": 31351 }, { "epoch": 2.47, "learning_rate": 2.277226757443471e-05, "loss": 1.4406, "step": 31352 }, { "epoch": 2.47, "learning_rate": 2.276572106102566e-05, "loss": 1.5, "step": 31353 }, { "epoch": 2.47, "learning_rate": 2.27591754114671e-05, "loss": 1.4339, "step": 31354 }, { "epoch": 2.47, "learning_rate": 2.2752630625803562e-05, "loss": 1.4077, "step": 31355 }, { "epoch": 2.47, "learning_rate": 2.274608670407943e-05, "loss": 1.5004, "step": 31356 }, { "epoch": 2.47, "learning_rate": 2.273954364633913e-05, "loss": 1.4149, "step": 31357 }, { "epoch": 2.47, "learning_rate": 2.2733001452627116e-05, "loss": 1.442, "step": 31358 }, { "epoch": 2.47, "learning_rate": 2.2726460122987812e-05, "loss": 1.4731, "step": 31359 }, { "epoch": 2.47, "learning_rate": 2.2719919657465552e-05, "loss": 1.4349, "step": 31360 }, { "epoch": 2.47, "learning_rate": 2.271338005610485e-05, "loss": 1.4738, "step": 31361 }, { "epoch": 2.47, "learning_rate": 2.270684131895001e-05, "loss": 1.4392, "step": 31362 }, { "epoch": 2.47, "learning_rate": 2.2700303446045502e-05, "loss": 1.4311, "step": 31363 }, { "epoch": 2.47, "learning_rate": 2.2693766437435668e-05, "loss": 1.4662, "step": 31364 }, { "epoch": 2.47, "learning_rate": 2.2687230293164914e-05, "loss": 1.3939, "step": 31365 }, { "epoch": 2.47, "learning_rate": 2.268069501327763e-05, "loss": 1.4371, "step": 31366 }, { "epoch": 2.47, "learning_rate": 2.2674160597818135e-05, "loss": 1.4451, "step": 31367 }, { "epoch": 2.47, "learning_rate": 2.266762704683084e-05, "loss": 1.4436, "step": 31368 }, { "epoch": 2.47, "learning_rate": 2.2661094360360117e-05, "loss": 1.3876, "step": 31369 }, { "epoch": 2.47, "learning_rate": 2.2654562538450233e-05, "loss": 1.4708, "step": 31370 }, { "epoch": 2.47, "learning_rate": 2.2648031581145638e-05, "loss": 1.4298, "step": 31371 }, { "epoch": 2.47, "learning_rate": 2.2641501488490625e-05, "loss": 1.4487, "step": 31372 }, { "epoch": 2.47, "learning_rate": 2.2634972260529533e-05, "loss": 1.4722, "step": 31373 }, { "epoch": 2.47, "learning_rate": 2.262844389730667e-05, "loss": 1.4405, "step": 31374 }, { "epoch": 2.47, "learning_rate": 2.2621916398866417e-05, "loss": 1.4915, "step": 31375 }, { "epoch": 2.47, "learning_rate": 2.2615389765253045e-05, "loss": 1.4387, "step": 31376 }, { "epoch": 2.47, "learning_rate": 2.2608863996510862e-05, "loss": 1.414, "step": 31377 }, { "epoch": 2.47, "learning_rate": 2.2602339092684184e-05, "loss": 1.4743, "step": 31378 }, { "epoch": 2.47, "learning_rate": 2.2595815053817362e-05, "loss": 1.444, "step": 31379 }, { "epoch": 2.47, "learning_rate": 2.258929187995464e-05, "loss": 1.4618, "step": 31380 }, { "epoch": 2.47, "learning_rate": 2.2582769571140268e-05, "loss": 1.4642, "step": 31381 }, { "epoch": 2.47, "learning_rate": 2.2576248127418628e-05, "loss": 1.4413, "step": 31382 }, { "epoch": 2.47, "learning_rate": 2.256972754883395e-05, "loss": 1.4722, "step": 31383 }, { "epoch": 2.47, "learning_rate": 2.2563207835430446e-05, "loss": 1.4308, "step": 31384 }, { "epoch": 2.47, "learning_rate": 2.2556688987252486e-05, "loss": 1.4667, "step": 31385 }, { "epoch": 2.47, "learning_rate": 2.255017100434428e-05, "loss": 1.4841, "step": 31386 }, { "epoch": 2.47, "learning_rate": 2.2543653886750028e-05, "loss": 1.4524, "step": 31387 }, { "epoch": 2.47, "learning_rate": 2.253713763451408e-05, "loss": 1.4574, "step": 31388 }, { "epoch": 2.47, "learning_rate": 2.253062224768063e-05, "loss": 1.4366, "step": 31389 }, { "epoch": 2.47, "learning_rate": 2.2524107726293895e-05, "loss": 1.4678, "step": 31390 }, { "epoch": 2.47, "learning_rate": 2.2517594070398104e-05, "loss": 1.3962, "step": 31391 }, { "epoch": 2.47, "learning_rate": 2.2511081280037525e-05, "loss": 1.4688, "step": 31392 }, { "epoch": 2.47, "learning_rate": 2.2504569355256318e-05, "loss": 1.4752, "step": 31393 }, { "epoch": 2.47, "learning_rate": 2.2498058296098753e-05, "loss": 1.4612, "step": 31394 }, { "epoch": 2.47, "learning_rate": 2.2491548102608993e-05, "loss": 1.4184, "step": 31395 }, { "epoch": 2.47, "learning_rate": 2.2485038774831282e-05, "loss": 1.4868, "step": 31396 }, { "epoch": 2.47, "learning_rate": 2.247853031280979e-05, "loss": 1.449, "step": 31397 }, { "epoch": 2.47, "learning_rate": 2.247202271658866e-05, "loss": 1.4589, "step": 31398 }, { "epoch": 2.47, "learning_rate": 2.246551598621216e-05, "loss": 1.4393, "step": 31399 }, { "epoch": 2.47, "learning_rate": 2.2459010121724442e-05, "loss": 1.4809, "step": 31400 }, { "epoch": 2.47, "learning_rate": 2.245250512316961e-05, "loss": 1.4773, "step": 31401 }, { "epoch": 2.47, "learning_rate": 2.244600099059192e-05, "loss": 1.4153, "step": 31402 }, { "epoch": 2.47, "learning_rate": 2.2439497724035506e-05, "loss": 1.4928, "step": 31403 }, { "epoch": 2.47, "learning_rate": 2.2432995323544454e-05, "loss": 1.4437, "step": 31404 }, { "epoch": 2.47, "learning_rate": 2.242649378916301e-05, "loss": 1.4445, "step": 31405 }, { "epoch": 2.47, "learning_rate": 2.2419993120935274e-05, "loss": 1.3964, "step": 31406 }, { "epoch": 2.47, "learning_rate": 2.241349331890539e-05, "loss": 1.4831, "step": 31407 }, { "epoch": 2.47, "learning_rate": 2.240699438311743e-05, "loss": 1.4319, "step": 31408 }, { "epoch": 2.47, "learning_rate": 2.2400496313615567e-05, "loss": 1.4518, "step": 31409 }, { "epoch": 2.47, "learning_rate": 2.2393999110443962e-05, "loss": 1.4279, "step": 31410 }, { "epoch": 2.47, "learning_rate": 2.2387502773646678e-05, "loss": 1.4922, "step": 31411 }, { "epoch": 2.47, "learning_rate": 2.2381007303267777e-05, "loss": 1.491, "step": 31412 }, { "epoch": 2.47, "learning_rate": 2.2374512699351466e-05, "loss": 1.4294, "step": 31413 }, { "epoch": 2.47, "learning_rate": 2.2368018961941785e-05, "loss": 1.4548, "step": 31414 }, { "epoch": 2.47, "learning_rate": 2.2361526091082788e-05, "loss": 1.4786, "step": 31415 }, { "epoch": 2.47, "learning_rate": 2.235503408681862e-05, "loss": 1.4356, "step": 31416 }, { "epoch": 2.47, "learning_rate": 2.2348542949193326e-05, "loss": 1.4123, "step": 31417 }, { "epoch": 2.47, "learning_rate": 2.234205267825096e-05, "loss": 1.4882, "step": 31418 }, { "epoch": 2.47, "learning_rate": 2.2335563274035635e-05, "loss": 1.4364, "step": 31419 }, { "epoch": 2.47, "learning_rate": 2.232907473659138e-05, "loss": 1.4224, "step": 31420 }, { "epoch": 2.47, "learning_rate": 2.2322587065962226e-05, "loss": 1.4108, "step": 31421 }, { "epoch": 2.47, "learning_rate": 2.2316100262192277e-05, "loss": 1.4266, "step": 31422 }, { "epoch": 2.47, "learning_rate": 2.2309614325325544e-05, "loss": 1.4847, "step": 31423 }, { "epoch": 2.47, "learning_rate": 2.230312925540607e-05, "loss": 1.4509, "step": 31424 }, { "epoch": 2.47, "learning_rate": 2.2296645052477813e-05, "loss": 1.452, "step": 31425 }, { "epoch": 2.47, "learning_rate": 2.2290161716584932e-05, "loss": 1.4188, "step": 31426 }, { "epoch": 2.47, "learning_rate": 2.2283679247771358e-05, "loss": 1.4809, "step": 31427 }, { "epoch": 2.47, "learning_rate": 2.227719764608111e-05, "loss": 1.4795, "step": 31428 }, { "epoch": 2.47, "learning_rate": 2.2270716911558227e-05, "loss": 1.4628, "step": 31429 }, { "epoch": 2.47, "learning_rate": 2.22642370442467e-05, "loss": 1.4754, "step": 31430 }, { "epoch": 2.47, "learning_rate": 2.225775804419051e-05, "loss": 1.4025, "step": 31431 }, { "epoch": 2.47, "learning_rate": 2.225127991143362e-05, "loss": 1.4776, "step": 31432 }, { "epoch": 2.47, "learning_rate": 2.2244802646020072e-05, "loss": 1.4261, "step": 31433 }, { "epoch": 2.47, "learning_rate": 2.2238326247993803e-05, "loss": 1.4071, "step": 31434 }, { "epoch": 2.47, "learning_rate": 2.2231850717398762e-05, "loss": 1.4763, "step": 31435 }, { "epoch": 2.47, "learning_rate": 2.2225376054279e-05, "loss": 1.449, "step": 31436 }, { "epoch": 2.47, "learning_rate": 2.2218902258678408e-05, "loss": 1.4067, "step": 31437 }, { "epoch": 2.47, "learning_rate": 2.2212429330640917e-05, "loss": 1.3928, "step": 31438 }, { "epoch": 2.47, "learning_rate": 2.220595727021055e-05, "loss": 1.4563, "step": 31439 }, { "epoch": 2.47, "learning_rate": 2.2199486077431166e-05, "loss": 1.4187, "step": 31440 }, { "epoch": 2.47, "learning_rate": 2.21930157523468e-05, "loss": 1.4265, "step": 31441 }, { "epoch": 2.47, "learning_rate": 2.2186546295001278e-05, "loss": 1.422, "step": 31442 }, { "epoch": 2.47, "learning_rate": 2.218007770543862e-05, "loss": 1.4687, "step": 31443 }, { "epoch": 2.47, "learning_rate": 2.2173609983702688e-05, "loss": 1.4877, "step": 31444 }, { "epoch": 2.47, "learning_rate": 2.2167143129837368e-05, "loss": 1.5046, "step": 31445 }, { "epoch": 2.47, "learning_rate": 2.2160677143886635e-05, "loss": 1.447, "step": 31446 }, { "epoch": 2.47, "learning_rate": 2.2154212025894358e-05, "loss": 1.4809, "step": 31447 }, { "epoch": 2.47, "learning_rate": 2.2147747775904433e-05, "loss": 1.451, "step": 31448 }, { "epoch": 2.47, "learning_rate": 2.2141284393960713e-05, "loss": 1.4609, "step": 31449 }, { "epoch": 2.47, "learning_rate": 2.2134821880107156e-05, "loss": 1.4542, "step": 31450 }, { "epoch": 2.47, "learning_rate": 2.2128360234387583e-05, "loss": 1.4567, "step": 31451 }, { "epoch": 2.47, "learning_rate": 2.2121899456845854e-05, "loss": 1.4444, "step": 31452 }, { "epoch": 2.47, "learning_rate": 2.2115439547525887e-05, "loss": 1.4196, "step": 31453 }, { "epoch": 2.47, "learning_rate": 2.2108980506471513e-05, "loss": 1.4553, "step": 31454 }, { "epoch": 2.47, "learning_rate": 2.2102522333726547e-05, "loss": 1.4706, "step": 31455 }, { "epoch": 2.47, "learning_rate": 2.2096065029334887e-05, "loss": 1.4444, "step": 31456 }, { "epoch": 2.48, "learning_rate": 2.208960859334038e-05, "loss": 1.4729, "step": 31457 }, { "epoch": 2.48, "learning_rate": 2.2083153025786858e-05, "loss": 1.382, "step": 31458 }, { "epoch": 2.48, "learning_rate": 2.2076698326718107e-05, "loss": 1.4258, "step": 31459 }, { "epoch": 2.48, "learning_rate": 2.2070244496178004e-05, "loss": 1.4344, "step": 31460 }, { "epoch": 2.48, "learning_rate": 2.2063791534210347e-05, "loss": 1.4591, "step": 31461 }, { "epoch": 2.48, "learning_rate": 2.20573394408589e-05, "loss": 1.4485, "step": 31462 }, { "epoch": 2.48, "learning_rate": 2.205088821616755e-05, "loss": 1.4714, "step": 31463 }, { "epoch": 2.48, "learning_rate": 2.2044437860180074e-05, "loss": 1.4634, "step": 31464 }, { "epoch": 2.48, "learning_rate": 2.203798837294024e-05, "loss": 1.4433, "step": 31465 }, { "epoch": 2.48, "learning_rate": 2.2031539754491827e-05, "loss": 1.492, "step": 31466 }, { "epoch": 2.48, "learning_rate": 2.202509200487867e-05, "loss": 1.4334, "step": 31467 }, { "epoch": 2.48, "learning_rate": 2.2018645124144512e-05, "loss": 1.4771, "step": 31468 }, { "epoch": 2.48, "learning_rate": 2.201219911233309e-05, "loss": 1.5031, "step": 31469 }, { "epoch": 2.48, "learning_rate": 2.200575396948825e-05, "loss": 1.4141, "step": 31470 }, { "epoch": 2.48, "learning_rate": 2.1999309695653705e-05, "loss": 1.4323, "step": 31471 }, { "epoch": 2.48, "learning_rate": 2.1992866290873172e-05, "loss": 1.4854, "step": 31472 }, { "epoch": 2.48, "learning_rate": 2.1986423755190452e-05, "loss": 1.4592, "step": 31473 }, { "epoch": 2.48, "learning_rate": 2.197998208864929e-05, "loss": 1.4428, "step": 31474 }, { "epoch": 2.48, "learning_rate": 2.1973541291293402e-05, "loss": 1.4875, "step": 31475 }, { "epoch": 2.48, "learning_rate": 2.1967101363166485e-05, "loss": 1.4377, "step": 31476 }, { "epoch": 2.48, "learning_rate": 2.196066230431234e-05, "loss": 1.4479, "step": 31477 }, { "epoch": 2.48, "learning_rate": 2.1954224114774628e-05, "loss": 1.4494, "step": 31478 }, { "epoch": 2.48, "learning_rate": 2.1947786794597032e-05, "loss": 1.4405, "step": 31479 }, { "epoch": 2.48, "learning_rate": 2.1941350343823355e-05, "loss": 1.4517, "step": 31480 }, { "epoch": 2.48, "learning_rate": 2.1934914762497223e-05, "loss": 1.5064, "step": 31481 }, { "epoch": 2.48, "learning_rate": 2.1928480050662322e-05, "loss": 1.4926, "step": 31482 }, { "epoch": 2.48, "learning_rate": 2.1922046208362397e-05, "loss": 1.4388, "step": 31483 }, { "epoch": 2.48, "learning_rate": 2.19156132356411e-05, "loss": 1.4738, "step": 31484 }, { "epoch": 2.48, "learning_rate": 2.1909181132542108e-05, "loss": 1.4349, "step": 31485 }, { "epoch": 2.48, "learning_rate": 2.1902749899109058e-05, "loss": 1.4591, "step": 31486 }, { "epoch": 2.48, "learning_rate": 2.1896319535385627e-05, "loss": 1.4646, "step": 31487 }, { "epoch": 2.48, "learning_rate": 2.188989004141555e-05, "loss": 1.4353, "step": 31488 }, { "epoch": 2.48, "learning_rate": 2.1883461417242404e-05, "loss": 1.4358, "step": 31489 }, { "epoch": 2.48, "learning_rate": 2.1877033662909842e-05, "loss": 1.4465, "step": 31490 }, { "epoch": 2.48, "learning_rate": 2.187060677846153e-05, "loss": 1.4633, "step": 31491 }, { "epoch": 2.48, "learning_rate": 2.1864180763941114e-05, "loss": 1.464, "step": 31492 }, { "epoch": 2.48, "learning_rate": 2.185775561939214e-05, "loss": 1.422, "step": 31493 }, { "epoch": 2.48, "learning_rate": 2.185133134485833e-05, "loss": 1.4525, "step": 31494 }, { "epoch": 2.48, "learning_rate": 2.1844907940383277e-05, "loss": 1.4552, "step": 31495 }, { "epoch": 2.48, "learning_rate": 2.1838485406010532e-05, "loss": 1.4253, "step": 31496 }, { "epoch": 2.48, "learning_rate": 2.183206374178379e-05, "loss": 1.4675, "step": 31497 }, { "epoch": 2.48, "learning_rate": 2.1825642947746586e-05, "loss": 1.4488, "step": 31498 }, { "epoch": 2.48, "learning_rate": 2.1819223023942517e-05, "loss": 1.4704, "step": 31499 }, { "epoch": 2.48, "learning_rate": 2.1812803970415216e-05, "loss": 1.4086, "step": 31500 }, { "epoch": 2.48, "learning_rate": 2.1806385787208248e-05, "loss": 1.4065, "step": 31501 }, { "epoch": 2.48, "learning_rate": 2.179996847436516e-05, "loss": 1.4512, "step": 31502 }, { "epoch": 2.48, "learning_rate": 2.179355203192947e-05, "loss": 1.4348, "step": 31503 }, { "epoch": 2.48, "learning_rate": 2.1787136459944886e-05, "loss": 1.4405, "step": 31504 }, { "epoch": 2.48, "learning_rate": 2.17807217584549e-05, "loss": 1.5202, "step": 31505 }, { "epoch": 2.48, "learning_rate": 2.1774307927503054e-05, "loss": 1.4465, "step": 31506 }, { "epoch": 2.48, "learning_rate": 2.176789496713285e-05, "loss": 1.4485, "step": 31507 }, { "epoch": 2.48, "learning_rate": 2.1761482877387914e-05, "loss": 1.4557, "step": 31508 }, { "epoch": 2.48, "learning_rate": 2.1755071658311752e-05, "loss": 1.4538, "step": 31509 }, { "epoch": 2.48, "learning_rate": 2.1748661309947842e-05, "loss": 1.3933, "step": 31510 }, { "epoch": 2.48, "learning_rate": 2.174225183233978e-05, "loss": 1.4251, "step": 31511 }, { "epoch": 2.48, "learning_rate": 2.173584322553105e-05, "loss": 1.4628, "step": 31512 }, { "epoch": 2.48, "learning_rate": 2.1729435489565123e-05, "loss": 1.4222, "step": 31513 }, { "epoch": 2.48, "learning_rate": 2.1723028624485573e-05, "loss": 1.4324, "step": 31514 }, { "epoch": 2.48, "learning_rate": 2.1716622630335883e-05, "loss": 1.4284, "step": 31515 }, { "epoch": 2.48, "learning_rate": 2.1710217507159487e-05, "loss": 1.4641, "step": 31516 }, { "epoch": 2.48, "learning_rate": 2.170381325499997e-05, "loss": 1.4711, "step": 31517 }, { "epoch": 2.48, "learning_rate": 2.169740987390074e-05, "loss": 1.4366, "step": 31518 }, { "epoch": 2.48, "learning_rate": 2.1691007363905282e-05, "loss": 1.4688, "step": 31519 }, { "epoch": 2.48, "learning_rate": 2.1684605725057065e-05, "loss": 1.4703, "step": 31520 }, { "epoch": 2.48, "learning_rate": 2.1678204957399598e-05, "loss": 1.4835, "step": 31521 }, { "epoch": 2.48, "learning_rate": 2.16718050609763e-05, "loss": 1.4336, "step": 31522 }, { "epoch": 2.48, "learning_rate": 2.1665406035830636e-05, "loss": 1.4134, "step": 31523 }, { "epoch": 2.48, "learning_rate": 2.1659007882006002e-05, "loss": 1.435, "step": 31524 }, { "epoch": 2.48, "learning_rate": 2.1652610599545933e-05, "loss": 1.4817, "step": 31525 }, { "epoch": 2.48, "learning_rate": 2.1646214188493794e-05, "loss": 1.4231, "step": 31526 }, { "epoch": 2.48, "learning_rate": 2.1639818648893e-05, "loss": 1.4525, "step": 31527 }, { "epoch": 2.48, "learning_rate": 2.163342398078703e-05, "loss": 1.3962, "step": 31528 }, { "epoch": 2.48, "learning_rate": 2.1627030184219285e-05, "loss": 1.4787, "step": 31529 }, { "epoch": 2.48, "learning_rate": 2.1620637259233114e-05, "loss": 1.3759, "step": 31530 }, { "epoch": 2.48, "learning_rate": 2.1614245205872015e-05, "loss": 1.4302, "step": 31531 }, { "epoch": 2.48, "learning_rate": 2.160785402417934e-05, "loss": 1.4427, "step": 31532 }, { "epoch": 2.48, "learning_rate": 2.1601463714198447e-05, "loss": 1.4243, "step": 31533 }, { "epoch": 2.48, "learning_rate": 2.159507427597279e-05, "loss": 1.4358, "step": 31534 }, { "epoch": 2.48, "learning_rate": 2.15886857095457e-05, "loss": 1.4531, "step": 31535 }, { "epoch": 2.48, "learning_rate": 2.158229801496059e-05, "loss": 1.4696, "step": 31536 }, { "epoch": 2.48, "learning_rate": 2.157591119226078e-05, "loss": 1.4197, "step": 31537 }, { "epoch": 2.48, "learning_rate": 2.15695252414897e-05, "loss": 1.4627, "step": 31538 }, { "epoch": 2.48, "learning_rate": 2.156314016269066e-05, "loss": 1.4382, "step": 31539 }, { "epoch": 2.48, "learning_rate": 2.1556755955907e-05, "loss": 1.41, "step": 31540 }, { "epoch": 2.48, "learning_rate": 2.1550372621182115e-05, "loss": 1.441, "step": 31541 }, { "epoch": 2.48, "learning_rate": 2.154399015855932e-05, "loss": 1.4881, "step": 31542 }, { "epoch": 2.48, "learning_rate": 2.1537608568081932e-05, "loss": 1.4699, "step": 31543 }, { "epoch": 2.48, "learning_rate": 2.1531227849793264e-05, "loss": 1.4397, "step": 31544 }, { "epoch": 2.48, "learning_rate": 2.15248480037367e-05, "loss": 1.4717, "step": 31545 }, { "epoch": 2.48, "learning_rate": 2.151846902995552e-05, "loss": 1.4866, "step": 31546 }, { "epoch": 2.48, "learning_rate": 2.1512090928492993e-05, "loss": 1.4554, "step": 31547 }, { "epoch": 2.48, "learning_rate": 2.1505713699392498e-05, "loss": 1.456, "step": 31548 }, { "epoch": 2.48, "learning_rate": 2.1499337342697296e-05, "loss": 1.3978, "step": 31549 }, { "epoch": 2.48, "learning_rate": 2.1492961858450662e-05, "loss": 1.4323, "step": 31550 }, { "epoch": 2.48, "learning_rate": 2.1486587246695893e-05, "loss": 1.4407, "step": 31551 }, { "epoch": 2.48, "learning_rate": 2.1480213507476297e-05, "loss": 1.4882, "step": 31552 }, { "epoch": 2.48, "learning_rate": 2.1473840640835143e-05, "loss": 1.4904, "step": 31553 }, { "epoch": 2.48, "learning_rate": 2.146746864681565e-05, "loss": 1.4944, "step": 31554 }, { "epoch": 2.48, "learning_rate": 2.1461097525461146e-05, "loss": 1.4592, "step": 31555 }, { "epoch": 2.48, "learning_rate": 2.1454727276814847e-05, "loss": 1.4496, "step": 31556 }, { "epoch": 2.48, "learning_rate": 2.144835790091999e-05, "loss": 1.4331, "step": 31557 }, { "epoch": 2.48, "learning_rate": 2.144198939781988e-05, "loss": 1.463, "step": 31558 }, { "epoch": 2.48, "learning_rate": 2.143562176755771e-05, "loss": 1.385, "step": 31559 }, { "epoch": 2.48, "learning_rate": 2.142925501017672e-05, "loss": 1.4214, "step": 31560 }, { "epoch": 2.48, "learning_rate": 2.14228891257201e-05, "loss": 1.424, "step": 31561 }, { "epoch": 2.48, "learning_rate": 2.1416524114231144e-05, "loss": 1.4198, "step": 31562 }, { "epoch": 2.48, "learning_rate": 2.1410159975753032e-05, "loss": 1.4325, "step": 31563 }, { "epoch": 2.48, "learning_rate": 2.140379671032895e-05, "loss": 1.4443, "step": 31564 }, { "epoch": 2.48, "learning_rate": 2.1397434318002148e-05, "loss": 1.5086, "step": 31565 }, { "epoch": 2.48, "learning_rate": 2.1391072798815755e-05, "loss": 1.4325, "step": 31566 }, { "epoch": 2.48, "learning_rate": 2.1384712152813056e-05, "loss": 1.4542, "step": 31567 }, { "epoch": 2.48, "learning_rate": 2.1378352380037145e-05, "loss": 1.473, "step": 31568 }, { "epoch": 2.48, "learning_rate": 2.1371993480531273e-05, "loss": 1.4411, "step": 31569 }, { "epoch": 2.48, "learning_rate": 2.1365635454338576e-05, "loss": 1.4254, "step": 31570 }, { "epoch": 2.48, "learning_rate": 2.1359278301502215e-05, "loss": 1.4197, "step": 31571 }, { "epoch": 2.48, "learning_rate": 2.135292202206537e-05, "loss": 1.4121, "step": 31572 }, { "epoch": 2.48, "learning_rate": 2.1346566616071213e-05, "loss": 1.4405, "step": 31573 }, { "epoch": 2.48, "learning_rate": 2.134021208356284e-05, "loss": 1.4223, "step": 31574 }, { "epoch": 2.48, "learning_rate": 2.133385842458345e-05, "loss": 1.4378, "step": 31575 }, { "epoch": 2.48, "learning_rate": 2.1327505639176157e-05, "loss": 1.4125, "step": 31576 }, { "epoch": 2.48, "learning_rate": 2.1321153727384095e-05, "loss": 1.5069, "step": 31577 }, { "epoch": 2.48, "learning_rate": 2.131480268925036e-05, "loss": 1.4593, "step": 31578 }, { "epoch": 2.48, "learning_rate": 2.130845252481812e-05, "loss": 1.4694, "step": 31579 }, { "epoch": 2.48, "learning_rate": 2.130210323413049e-05, "loss": 1.4719, "step": 31580 }, { "epoch": 2.48, "learning_rate": 2.1295754817230504e-05, "loss": 1.3869, "step": 31581 }, { "epoch": 2.48, "learning_rate": 2.1289407274161325e-05, "loss": 1.4418, "step": 31582 }, { "epoch": 2.48, "learning_rate": 2.1283060604966086e-05, "loss": 1.4911, "step": 31583 }, { "epoch": 2.49, "learning_rate": 2.1276714809687818e-05, "loss": 1.4466, "step": 31584 }, { "epoch": 2.49, "learning_rate": 2.1270369888369603e-05, "loss": 1.4468, "step": 31585 }, { "epoch": 2.49, "learning_rate": 2.1264025841054562e-05, "loss": 1.4379, "step": 31586 }, { "epoch": 2.49, "learning_rate": 2.1257682667785735e-05, "loss": 1.463, "step": 31587 }, { "epoch": 2.49, "learning_rate": 2.1251340368606177e-05, "loss": 1.4291, "step": 31588 }, { "epoch": 2.49, "learning_rate": 2.1244998943559004e-05, "loss": 1.4955, "step": 31589 }, { "epoch": 2.49, "learning_rate": 2.123865839268723e-05, "loss": 1.4593, "step": 31590 }, { "epoch": 2.49, "learning_rate": 2.123231871603387e-05, "loss": 1.4167, "step": 31591 }, { "epoch": 2.49, "learning_rate": 2.1225979913642038e-05, "loss": 1.4269, "step": 31592 }, { "epoch": 2.49, "learning_rate": 2.1219641985554752e-05, "loss": 1.4196, "step": 31593 }, { "epoch": 2.49, "learning_rate": 2.1213304931814996e-05, "loss": 1.4086, "step": 31594 }, { "epoch": 2.49, "learning_rate": 2.1206968752465847e-05, "loss": 1.4118, "step": 31595 }, { "epoch": 2.49, "learning_rate": 2.1200633447550324e-05, "loss": 1.4955, "step": 31596 }, { "epoch": 2.49, "learning_rate": 2.119429901711141e-05, "loss": 1.5025, "step": 31597 }, { "epoch": 2.49, "learning_rate": 2.1187965461192054e-05, "loss": 1.4213, "step": 31598 }, { "epoch": 2.49, "learning_rate": 2.11816327798354e-05, "loss": 1.4362, "step": 31599 }, { "epoch": 2.49, "learning_rate": 2.1175300973084386e-05, "loss": 1.4372, "step": 31600 }, { "epoch": 2.49, "learning_rate": 2.1168970040981976e-05, "loss": 1.4377, "step": 31601 }, { "epoch": 2.49, "learning_rate": 2.1162639983571134e-05, "loss": 1.4263, "step": 31602 }, { "epoch": 2.49, "learning_rate": 2.1156310800894893e-05, "loss": 1.4176, "step": 31603 }, { "epoch": 2.49, "learning_rate": 2.1149982492996204e-05, "loss": 1.3977, "step": 31604 }, { "epoch": 2.49, "learning_rate": 2.1143655059917995e-05, "loss": 1.4012, "step": 31605 }, { "epoch": 2.49, "learning_rate": 2.1137328501703288e-05, "loss": 1.4293, "step": 31606 }, { "epoch": 2.49, "learning_rate": 2.1131002818395028e-05, "loss": 1.466, "step": 31607 }, { "epoch": 2.49, "learning_rate": 2.1124678010036095e-05, "loss": 1.4627, "step": 31608 }, { "epoch": 2.49, "learning_rate": 2.1118354076669508e-05, "loss": 1.4242, "step": 31609 }, { "epoch": 2.49, "learning_rate": 2.1112031018338184e-05, "loss": 1.4692, "step": 31610 }, { "epoch": 2.49, "learning_rate": 2.1105708835085e-05, "loss": 1.5245, "step": 31611 }, { "epoch": 2.49, "learning_rate": 2.109938752695296e-05, "loss": 1.4377, "step": 31612 }, { "epoch": 2.49, "learning_rate": 2.1093067093984912e-05, "loss": 1.5022, "step": 31613 }, { "epoch": 2.49, "learning_rate": 2.1086747536223837e-05, "loss": 1.4226, "step": 31614 }, { "epoch": 2.49, "learning_rate": 2.1080428853712584e-05, "loss": 1.4771, "step": 31615 }, { "epoch": 2.49, "learning_rate": 2.1074111046494084e-05, "loss": 1.4189, "step": 31616 }, { "epoch": 2.49, "learning_rate": 2.106779411461124e-05, "loss": 1.428, "step": 31617 }, { "epoch": 2.49, "learning_rate": 2.106147805810692e-05, "loss": 1.455, "step": 31618 }, { "epoch": 2.49, "learning_rate": 2.105516287702398e-05, "loss": 1.3835, "step": 31619 }, { "epoch": 2.49, "learning_rate": 2.104884857140536e-05, "loss": 1.4902, "step": 31620 }, { "epoch": 2.49, "learning_rate": 2.1042535141293887e-05, "loss": 1.3797, "step": 31621 }, { "epoch": 2.49, "learning_rate": 2.1036222586732398e-05, "loss": 1.4447, "step": 31622 }, { "epoch": 2.49, "learning_rate": 2.102991090776384e-05, "loss": 1.4696, "step": 31623 }, { "epoch": 2.49, "learning_rate": 2.1023600104431014e-05, "loss": 1.4889, "step": 31624 }, { "epoch": 2.49, "learning_rate": 2.101729017677672e-05, "loss": 1.4829, "step": 31625 }, { "epoch": 2.49, "learning_rate": 2.1010981124843902e-05, "loss": 1.4335, "step": 31626 }, { "epoch": 2.49, "learning_rate": 2.1004672948675328e-05, "loss": 1.4058, "step": 31627 }, { "epoch": 2.49, "learning_rate": 2.0998365648313796e-05, "loss": 1.4389, "step": 31628 }, { "epoch": 2.49, "learning_rate": 2.0992059223802178e-05, "loss": 1.3863, "step": 31629 }, { "epoch": 2.49, "learning_rate": 2.098575367518333e-05, "loss": 1.4453, "step": 31630 }, { "epoch": 2.49, "learning_rate": 2.097944900250001e-05, "loss": 1.4523, "step": 31631 }, { "epoch": 2.49, "learning_rate": 2.0973145205794993e-05, "loss": 1.432, "step": 31632 }, { "epoch": 2.49, "learning_rate": 2.0966842285111167e-05, "loss": 1.4599, "step": 31633 }, { "epoch": 2.49, "learning_rate": 2.0960540240491264e-05, "loss": 1.4636, "step": 31634 }, { "epoch": 2.49, "learning_rate": 2.0954239071978078e-05, "loss": 1.3874, "step": 31635 }, { "epoch": 2.49, "learning_rate": 2.094793877961438e-05, "loss": 1.4772, "step": 31636 }, { "epoch": 2.49, "learning_rate": 2.0941639363442986e-05, "loss": 1.4481, "step": 31637 }, { "epoch": 2.49, "learning_rate": 2.0935340823506623e-05, "loss": 1.4315, "step": 31638 }, { "epoch": 2.49, "learning_rate": 2.0929043159848063e-05, "loss": 1.437, "step": 31639 }, { "epoch": 2.49, "learning_rate": 2.0922746372510085e-05, "loss": 1.4542, "step": 31640 }, { "epoch": 2.49, "learning_rate": 2.0916450461535455e-05, "loss": 1.4978, "step": 31641 }, { "epoch": 2.49, "learning_rate": 2.091015542696684e-05, "loss": 1.4368, "step": 31642 }, { "epoch": 2.49, "learning_rate": 2.0903861268847073e-05, "loss": 1.5311, "step": 31643 }, { "epoch": 2.49, "learning_rate": 2.0897567987218832e-05, "loss": 1.4616, "step": 31644 }, { "epoch": 2.49, "learning_rate": 2.089127558212484e-05, "loss": 1.433, "step": 31645 }, { "epoch": 2.49, "learning_rate": 2.0884984053607838e-05, "loss": 1.4361, "step": 31646 }, { "epoch": 2.49, "learning_rate": 2.0878693401710567e-05, "loss": 1.4567, "step": 31647 }, { "epoch": 2.49, "learning_rate": 2.087240362647572e-05, "loss": 1.4101, "step": 31648 }, { "epoch": 2.49, "learning_rate": 2.0866114727945964e-05, "loss": 1.4614, "step": 31649 }, { "epoch": 2.49, "learning_rate": 2.085982670616405e-05, "loss": 1.413, "step": 31650 }, { "epoch": 2.49, "learning_rate": 2.085353956117266e-05, "loss": 1.4072, "step": 31651 }, { "epoch": 2.49, "learning_rate": 2.0847253293014427e-05, "loss": 1.4825, "step": 31652 }, { "epoch": 2.49, "learning_rate": 2.0840967901732115e-05, "loss": 1.4027, "step": 31653 }, { "epoch": 2.49, "learning_rate": 2.083468338736834e-05, "loss": 1.4256, "step": 31654 }, { "epoch": 2.49, "learning_rate": 2.0828399749965786e-05, "loss": 1.4545, "step": 31655 }, { "epoch": 2.49, "learning_rate": 2.0822116989567083e-05, "loss": 1.4525, "step": 31656 }, { "epoch": 2.49, "learning_rate": 2.0815835106214968e-05, "loss": 1.4799, "step": 31657 }, { "epoch": 2.49, "learning_rate": 2.0809554099952018e-05, "loss": 1.4399, "step": 31658 }, { "epoch": 2.49, "learning_rate": 2.0803273970820887e-05, "loss": 1.4286, "step": 31659 }, { "epoch": 2.49, "learning_rate": 2.0796994718864222e-05, "loss": 1.4937, "step": 31660 }, { "epoch": 2.49, "learning_rate": 2.0790716344124707e-05, "loss": 1.4285, "step": 31661 }, { "epoch": 2.49, "learning_rate": 2.0784438846644923e-05, "loss": 1.456, "step": 31662 }, { "epoch": 2.49, "learning_rate": 2.0778162226467438e-05, "loss": 1.4366, "step": 31663 }, { "epoch": 2.49, "learning_rate": 2.077188648363498e-05, "loss": 1.4521, "step": 31664 }, { "epoch": 2.49, "learning_rate": 2.0765611618190086e-05, "loss": 1.4738, "step": 31665 }, { "epoch": 2.49, "learning_rate": 2.075933763017534e-05, "loss": 1.4147, "step": 31666 }, { "epoch": 2.49, "learning_rate": 2.07530645196334e-05, "loss": 1.4358, "step": 31667 }, { "epoch": 2.49, "learning_rate": 2.074679228660684e-05, "loss": 1.4209, "step": 31668 }, { "epoch": 2.49, "learning_rate": 2.074052093113819e-05, "loss": 1.5103, "step": 31669 }, { "epoch": 2.49, "learning_rate": 2.0734250453270097e-05, "loss": 1.4456, "step": 31670 }, { "epoch": 2.49, "learning_rate": 2.0727980853045113e-05, "loss": 1.4502, "step": 31671 }, { "epoch": 2.49, "learning_rate": 2.0721712130505803e-05, "loss": 1.4436, "step": 31672 }, { "epoch": 2.49, "learning_rate": 2.0715444285694698e-05, "loss": 1.4914, "step": 31673 }, { "epoch": 2.49, "learning_rate": 2.070917731865442e-05, "loss": 1.4083, "step": 31674 }, { "epoch": 2.49, "learning_rate": 2.070291122942746e-05, "loss": 1.4438, "step": 31675 }, { "epoch": 2.49, "learning_rate": 2.0696646018056357e-05, "loss": 1.3995, "step": 31676 }, { "epoch": 2.49, "learning_rate": 2.0690381684583672e-05, "loss": 1.4221, "step": 31677 }, { "epoch": 2.49, "learning_rate": 2.0684118229051976e-05, "loss": 1.4761, "step": 31678 }, { "epoch": 2.49, "learning_rate": 2.067785565150375e-05, "loss": 1.4891, "step": 31679 }, { "epoch": 2.49, "learning_rate": 2.067159395198149e-05, "loss": 1.4918, "step": 31680 }, { "epoch": 2.49, "learning_rate": 2.0665333130527767e-05, "loss": 1.4681, "step": 31681 }, { "epoch": 2.49, "learning_rate": 2.0659073187185045e-05, "loss": 1.4427, "step": 31682 }, { "epoch": 2.49, "learning_rate": 2.065281412199582e-05, "loss": 1.4238, "step": 31683 }, { "epoch": 2.49, "learning_rate": 2.0646555935002645e-05, "loss": 1.4811, "step": 31684 }, { "epoch": 2.49, "learning_rate": 2.064029862624797e-05, "loss": 1.4076, "step": 31685 }, { "epoch": 2.49, "learning_rate": 2.063404219577424e-05, "loss": 1.4673, "step": 31686 }, { "epoch": 2.49, "learning_rate": 2.062778664362401e-05, "loss": 1.4535, "step": 31687 }, { "epoch": 2.49, "learning_rate": 2.0621531969839728e-05, "loss": 1.4649, "step": 31688 }, { "epoch": 2.49, "learning_rate": 2.0615278174463822e-05, "loss": 1.4376, "step": 31689 }, { "epoch": 2.49, "learning_rate": 2.0609025257538765e-05, "loss": 1.4363, "step": 31690 }, { "epoch": 2.49, "learning_rate": 2.060277321910705e-05, "loss": 1.48, "step": 31691 }, { "epoch": 2.49, "learning_rate": 2.059652205921106e-05, "loss": 1.4845, "step": 31692 }, { "epoch": 2.49, "learning_rate": 2.059027177789327e-05, "loss": 1.5536, "step": 31693 }, { "epoch": 2.49, "learning_rate": 2.058402237519617e-05, "loss": 1.4346, "step": 31694 }, { "epoch": 2.49, "learning_rate": 2.057777385116213e-05, "loss": 1.4454, "step": 31695 }, { "epoch": 2.49, "learning_rate": 2.0571526205833576e-05, "loss": 1.3869, "step": 31696 }, { "epoch": 2.49, "learning_rate": 2.056527943925292e-05, "loss": 1.4444, "step": 31697 }, { "epoch": 2.49, "learning_rate": 2.05590335514626e-05, "loss": 1.4702, "step": 31698 }, { "epoch": 2.49, "learning_rate": 2.0552788542505038e-05, "loss": 1.4548, "step": 31699 }, { "epoch": 2.49, "learning_rate": 2.054654441242255e-05, "loss": 1.4448, "step": 31700 }, { "epoch": 2.49, "learning_rate": 2.0540301161257634e-05, "loss": 1.5172, "step": 31701 }, { "epoch": 2.49, "learning_rate": 2.053405878905262e-05, "loss": 1.4576, "step": 31702 }, { "epoch": 2.49, "learning_rate": 2.052781729584988e-05, "loss": 1.4572, "step": 31703 }, { "epoch": 2.49, "learning_rate": 2.0521576681691843e-05, "loss": 1.4713, "step": 31704 }, { "epoch": 2.49, "learning_rate": 2.0515336946620842e-05, "loss": 1.4418, "step": 31705 }, { "epoch": 2.49, "learning_rate": 2.050909809067921e-05, "loss": 1.4128, "step": 31706 }, { "epoch": 2.49, "learning_rate": 2.0502860113909398e-05, "loss": 1.4651, "step": 31707 }, { "epoch": 2.49, "learning_rate": 2.0496623016353654e-05, "loss": 1.412, "step": 31708 }, { "epoch": 2.49, "learning_rate": 2.049038679805441e-05, "loss": 1.4308, "step": 31709 }, { "epoch": 2.49, "learning_rate": 2.0484151459053933e-05, "loss": 1.4323, "step": 31710 }, { "epoch": 2.5, "learning_rate": 2.047791699939462e-05, "loss": 1.4594, "step": 31711 }, { "epoch": 2.5, "learning_rate": 2.0471683419118796e-05, "loss": 1.4133, "step": 31712 }, { "epoch": 2.5, "learning_rate": 2.046545071826875e-05, "loss": 1.4688, "step": 31713 }, { "epoch": 2.5, "learning_rate": 2.045921889688677e-05, "loss": 1.4195, "step": 31714 }, { "epoch": 2.5, "learning_rate": 2.0452987955015255e-05, "loss": 1.4448, "step": 31715 }, { "epoch": 2.5, "learning_rate": 2.0446757892696454e-05, "loss": 1.4839, "step": 31716 }, { "epoch": 2.5, "learning_rate": 2.0440528709972647e-05, "loss": 1.4222, "step": 31717 }, { "epoch": 2.5, "learning_rate": 2.043430040688619e-05, "loss": 1.4471, "step": 31718 }, { "epoch": 2.5, "learning_rate": 2.042807298347931e-05, "loss": 1.3916, "step": 31719 }, { "epoch": 2.5, "learning_rate": 2.0421846439794293e-05, "loss": 1.4299, "step": 31720 }, { "epoch": 2.5, "learning_rate": 2.0415620775873472e-05, "loss": 1.4305, "step": 31721 }, { "epoch": 2.5, "learning_rate": 2.0409395991759058e-05, "loss": 1.4238, "step": 31722 }, { "epoch": 2.5, "learning_rate": 2.0403172087493308e-05, "loss": 1.4599, "step": 31723 }, { "epoch": 2.5, "learning_rate": 2.0396949063118502e-05, "loss": 1.4482, "step": 31724 }, { "epoch": 2.5, "learning_rate": 2.0390726918676938e-05, "loss": 1.4571, "step": 31725 }, { "epoch": 2.5, "learning_rate": 2.0384505654210797e-05, "loss": 1.4363, "step": 31726 }, { "epoch": 2.5, "learning_rate": 2.03782852697623e-05, "loss": 1.4823, "step": 31727 }, { "epoch": 2.5, "learning_rate": 2.0372065765373745e-05, "loss": 1.4246, "step": 31728 }, { "epoch": 2.5, "learning_rate": 2.036584714108735e-05, "loss": 1.4225, "step": 31729 }, { "epoch": 2.5, "learning_rate": 2.0359629396945294e-05, "loss": 1.4583, "step": 31730 }, { "epoch": 2.5, "learning_rate": 2.0353412532989794e-05, "loss": 1.4297, "step": 31731 }, { "epoch": 2.5, "learning_rate": 2.0347196549263102e-05, "loss": 1.4291, "step": 31732 }, { "epoch": 2.5, "learning_rate": 2.0340981445807398e-05, "loss": 1.4382, "step": 31733 }, { "epoch": 2.5, "learning_rate": 2.033476722266485e-05, "loss": 1.3808, "step": 31734 }, { "epoch": 2.5, "learning_rate": 2.0328553879877692e-05, "loss": 1.4116, "step": 31735 }, { "epoch": 2.5, "learning_rate": 2.032234141748812e-05, "loss": 1.5003, "step": 31736 }, { "epoch": 2.5, "learning_rate": 2.0316129835538235e-05, "loss": 1.4597, "step": 31737 }, { "epoch": 2.5, "learning_rate": 2.0309919134070308e-05, "loss": 1.4052, "step": 31738 }, { "epoch": 2.5, "learning_rate": 2.0303709313126432e-05, "loss": 1.4671, "step": 31739 }, { "epoch": 2.5, "learning_rate": 2.029750037274881e-05, "loss": 1.3732, "step": 31740 }, { "epoch": 2.5, "learning_rate": 2.0291292312979573e-05, "loss": 1.4383, "step": 31741 }, { "epoch": 2.5, "learning_rate": 2.0285085133860905e-05, "loss": 1.4121, "step": 31742 }, { "epoch": 2.5, "learning_rate": 2.0278878835434925e-05, "loss": 1.4597, "step": 31743 }, { "epoch": 2.5, "learning_rate": 2.0272673417743747e-05, "loss": 1.4651, "step": 31744 }, { "epoch": 2.5, "learning_rate": 2.026646888082955e-05, "loss": 1.4776, "step": 31745 }, { "epoch": 2.5, "learning_rate": 2.026026522473444e-05, "loss": 1.4575, "step": 31746 }, { "epoch": 2.5, "learning_rate": 2.0254062449500513e-05, "loss": 1.4172, "step": 31747 }, { "epoch": 2.5, "learning_rate": 2.024786055516992e-05, "loss": 1.427, "step": 31748 }, { "epoch": 2.5, "learning_rate": 2.024165954178476e-05, "loss": 1.4698, "step": 31749 }, { "epoch": 2.5, "learning_rate": 2.0235459409387118e-05, "loss": 1.4417, "step": 31750 }, { "epoch": 2.5, "learning_rate": 2.0229260158019055e-05, "loss": 1.4566, "step": 31751 }, { "epoch": 2.5, "learning_rate": 2.0223061787722744e-05, "loss": 1.4617, "step": 31752 }, { "epoch": 2.5, "learning_rate": 2.021686429854023e-05, "loss": 1.4425, "step": 31753 }, { "epoch": 2.5, "learning_rate": 2.021066769051355e-05, "loss": 1.4418, "step": 31754 }, { "epoch": 2.5, "learning_rate": 2.0204471963684814e-05, "loss": 1.4192, "step": 31755 }, { "epoch": 2.5, "learning_rate": 2.019827711809613e-05, "loss": 1.4158, "step": 31756 }, { "epoch": 2.5, "learning_rate": 2.0192083153789507e-05, "loss": 1.4639, "step": 31757 }, { "epoch": 2.5, "learning_rate": 2.0185890070806966e-05, "loss": 1.4237, "step": 31758 }, { "epoch": 2.5, "learning_rate": 2.017969786919062e-05, "loss": 1.4499, "step": 31759 }, { "epoch": 2.5, "learning_rate": 2.0173506548982503e-05, "loss": 1.4328, "step": 31760 }, { "epoch": 2.5, "learning_rate": 2.0167316110224583e-05, "loss": 1.5092, "step": 31761 }, { "epoch": 2.5, "learning_rate": 2.0161126552958995e-05, "loss": 1.4577, "step": 31762 }, { "epoch": 2.5, "learning_rate": 2.0154937877227683e-05, "loss": 1.4297, "step": 31763 }, { "epoch": 2.5, "learning_rate": 2.0148750083072667e-05, "loss": 1.496, "step": 31764 }, { "epoch": 2.5, "learning_rate": 2.0142563170536014e-05, "loss": 1.436, "step": 31765 }, { "epoch": 2.5, "learning_rate": 2.0136377139659686e-05, "loss": 1.423, "step": 31766 }, { "epoch": 2.5, "learning_rate": 2.0130191990485706e-05, "loss": 1.4716, "step": 31767 }, { "epoch": 2.5, "learning_rate": 2.0124007723056003e-05, "loss": 1.4736, "step": 31768 }, { "epoch": 2.5, "learning_rate": 2.0117824337412676e-05, "loss": 1.4378, "step": 31769 }, { "epoch": 2.5, "learning_rate": 2.0111641833597593e-05, "loss": 1.4643, "step": 31770 }, { "epoch": 2.5, "learning_rate": 2.0105460211652818e-05, "loss": 1.4541, "step": 31771 }, { "epoch": 2.5, "learning_rate": 2.0099279471620256e-05, "loss": 1.4456, "step": 31772 }, { "epoch": 2.5, "learning_rate": 2.0093099613541935e-05, "loss": 1.476, "step": 31773 }, { "epoch": 2.5, "learning_rate": 2.0086920637459775e-05, "loss": 1.4346, "step": 31774 }, { "epoch": 2.5, "learning_rate": 2.0080742543415706e-05, "loss": 1.4019, "step": 31775 }, { "epoch": 2.5, "learning_rate": 2.007456533145173e-05, "loss": 1.4705, "step": 31776 }, { "epoch": 2.5, "learning_rate": 2.0068389001609765e-05, "loss": 1.4702, "step": 31777 }, { "epoch": 2.5, "learning_rate": 2.0062213553931688e-05, "loss": 1.4633, "step": 31778 }, { "epoch": 2.5, "learning_rate": 2.005603898845952e-05, "loss": 1.4492, "step": 31779 }, { "epoch": 2.5, "learning_rate": 2.004986530523513e-05, "loss": 1.4292, "step": 31780 }, { "epoch": 2.5, "learning_rate": 2.0043692504300412e-05, "loss": 1.4822, "step": 31781 }, { "epoch": 2.5, "learning_rate": 2.0037520585697337e-05, "loss": 1.4506, "step": 31782 }, { "epoch": 2.5, "learning_rate": 2.0031349549467786e-05, "loss": 1.4402, "step": 31783 }, { "epoch": 2.5, "learning_rate": 2.002517939565364e-05, "loss": 1.4509, "step": 31784 }, { "epoch": 2.5, "learning_rate": 2.001901012429677e-05, "loss": 1.4491, "step": 31785 }, { "epoch": 2.5, "learning_rate": 2.0012841735439106e-05, "loss": 1.4227, "step": 31786 }, { "epoch": 2.5, "learning_rate": 2.0006674229122532e-05, "loss": 1.5069, "step": 31787 }, { "epoch": 2.5, "learning_rate": 2.00005076053889e-05, "loss": 1.4738, "step": 31788 }, { "epoch": 2.5, "learning_rate": 1.9994341864280054e-05, "loss": 1.4315, "step": 31789 }, { "epoch": 2.5, "learning_rate": 1.998817700583792e-05, "loss": 1.4228, "step": 31790 }, { "epoch": 2.5, "learning_rate": 1.9982013030104305e-05, "loss": 1.4225, "step": 31791 }, { "epoch": 2.5, "learning_rate": 1.9975849937121047e-05, "loss": 1.437, "step": 31792 }, { "epoch": 2.5, "learning_rate": 1.9969687726930063e-05, "loss": 1.4363, "step": 31793 }, { "epoch": 2.5, "learning_rate": 1.9963526399573116e-05, "loss": 1.4539, "step": 31794 }, { "epoch": 2.5, "learning_rate": 1.995736595509204e-05, "loss": 1.3937, "step": 31795 }, { "epoch": 2.5, "learning_rate": 1.9951206393528725e-05, "loss": 1.4271, "step": 31796 }, { "epoch": 2.5, "learning_rate": 1.994504771492496e-05, "loss": 1.4918, "step": 31797 }, { "epoch": 2.5, "learning_rate": 1.9938889919322503e-05, "loss": 1.4293, "step": 31798 }, { "epoch": 2.5, "learning_rate": 1.9932733006763253e-05, "loss": 1.5098, "step": 31799 }, { "epoch": 2.5, "learning_rate": 1.9926576977288957e-05, "loss": 1.4085, "step": 31800 }, { "epoch": 2.5, "learning_rate": 1.992042183094143e-05, "loss": 1.4553, "step": 31801 }, { "epoch": 2.5, "learning_rate": 1.9914267567762393e-05, "loss": 1.4769, "step": 31802 }, { "epoch": 2.5, "learning_rate": 1.9908114187793745e-05, "loss": 1.4298, "step": 31803 }, { "epoch": 2.5, "learning_rate": 1.9901961691077217e-05, "loss": 1.4051, "step": 31804 }, { "epoch": 2.5, "learning_rate": 1.9895810077654545e-05, "loss": 1.481, "step": 31805 }, { "epoch": 2.5, "learning_rate": 1.988965934756756e-05, "loss": 1.4158, "step": 31806 }, { "epoch": 2.5, "learning_rate": 1.988350950085798e-05, "loss": 1.443, "step": 31807 }, { "epoch": 2.5, "learning_rate": 1.987736053756757e-05, "loss": 1.5291, "step": 31808 }, { "epoch": 2.5, "learning_rate": 1.987121245773805e-05, "loss": 1.4104, "step": 31809 }, { "epoch": 2.5, "learning_rate": 1.98650652614112e-05, "loss": 1.407, "step": 31810 }, { "epoch": 2.5, "learning_rate": 1.9858918948628755e-05, "loss": 1.4284, "step": 31811 }, { "epoch": 2.5, "learning_rate": 1.9852773519432398e-05, "loss": 1.4846, "step": 31812 }, { "epoch": 2.5, "learning_rate": 1.9846628973863928e-05, "loss": 1.4622, "step": 31813 }, { "epoch": 2.5, "learning_rate": 1.984048531196501e-05, "loss": 1.4456, "step": 31814 }, { "epoch": 2.5, "learning_rate": 1.9834342533777347e-05, "loss": 1.4303, "step": 31815 }, { "epoch": 2.5, "learning_rate": 1.982820063934269e-05, "loss": 1.4673, "step": 31816 }, { "epoch": 2.5, "learning_rate": 1.982205962870272e-05, "loss": 1.4382, "step": 31817 }, { "epoch": 2.5, "learning_rate": 1.9815919501899086e-05, "loss": 1.4923, "step": 31818 }, { "epoch": 2.5, "learning_rate": 1.980978025897354e-05, "loss": 1.4049, "step": 31819 }, { "epoch": 2.5, "learning_rate": 1.980364189996775e-05, "loss": 1.462, "step": 31820 }, { "epoch": 2.5, "learning_rate": 1.9797504424923394e-05, "loss": 1.4384, "step": 31821 }, { "epoch": 2.5, "learning_rate": 1.9791367833882095e-05, "loss": 1.4756, "step": 31822 }, { "epoch": 2.5, "learning_rate": 1.97852321268856e-05, "loss": 1.4175, "step": 31823 }, { "epoch": 2.5, "learning_rate": 1.9779097303975507e-05, "loss": 1.4425, "step": 31824 }, { "epoch": 2.5, "learning_rate": 1.977296336519347e-05, "loss": 1.4662, "step": 31825 }, { "epoch": 2.5, "learning_rate": 1.9766830310581134e-05, "loss": 1.4682, "step": 31826 }, { "epoch": 2.5, "learning_rate": 1.976069814018017e-05, "loss": 1.4459, "step": 31827 }, { "epoch": 2.5, "learning_rate": 1.975456685403221e-05, "loss": 1.4603, "step": 31828 }, { "epoch": 2.5, "learning_rate": 1.9748436452178822e-05, "loss": 1.4314, "step": 31829 }, { "epoch": 2.5, "learning_rate": 1.9742306934661706e-05, "loss": 1.4829, "step": 31830 }, { "epoch": 2.5, "learning_rate": 1.9736178301522444e-05, "loss": 1.4394, "step": 31831 }, { "epoch": 2.5, "learning_rate": 1.97300505528026e-05, "loss": 1.4333, "step": 31832 }, { "epoch": 2.5, "learning_rate": 1.9723923688543846e-05, "loss": 1.4801, "step": 31833 }, { "epoch": 2.5, "learning_rate": 1.971779770878778e-05, "loss": 1.4441, "step": 31834 }, { "epoch": 2.5, "learning_rate": 1.971167261357597e-05, "loss": 1.4705, "step": 31835 }, { "epoch": 2.5, "learning_rate": 1.970554840294998e-05, "loss": 1.4841, "step": 31836 }, { "epoch": 2.5, "learning_rate": 1.969942507695144e-05, "loss": 1.4166, "step": 31837 }, { "epoch": 2.51, "learning_rate": 1.9693302635621894e-05, "loss": 1.4398, "step": 31838 }, { "epoch": 2.51, "learning_rate": 1.9687181079002883e-05, "loss": 1.4521, "step": 31839 }, { "epoch": 2.51, "learning_rate": 1.9681060407136047e-05, "loss": 1.4716, "step": 31840 }, { "epoch": 2.51, "learning_rate": 1.967494062006288e-05, "loss": 1.4823, "step": 31841 }, { "epoch": 2.51, "learning_rate": 1.966882171782495e-05, "loss": 1.4931, "step": 31842 }, { "epoch": 2.51, "learning_rate": 1.966270370046376e-05, "loss": 1.4496, "step": 31843 }, { "epoch": 2.51, "learning_rate": 1.9656586568020927e-05, "loss": 1.4318, "step": 31844 }, { "epoch": 2.51, "learning_rate": 1.9650470320537947e-05, "loss": 1.4833, "step": 31845 }, { "epoch": 2.51, "learning_rate": 1.9644354958056292e-05, "loss": 1.461, "step": 31846 }, { "epoch": 2.51, "learning_rate": 1.9638240480617574e-05, "loss": 1.4184, "step": 31847 }, { "epoch": 2.51, "learning_rate": 1.963212688826326e-05, "loss": 1.4505, "step": 31848 }, { "epoch": 2.51, "learning_rate": 1.962601418103482e-05, "loss": 1.4946, "step": 31849 }, { "epoch": 2.51, "learning_rate": 1.961990235897382e-05, "loss": 1.4509, "step": 31850 }, { "epoch": 2.51, "learning_rate": 1.9613791422121743e-05, "loss": 1.439, "step": 31851 }, { "epoch": 2.51, "learning_rate": 1.960768137052009e-05, "loss": 1.4405, "step": 31852 }, { "epoch": 2.51, "learning_rate": 1.9601572204210274e-05, "loss": 1.3877, "step": 31853 }, { "epoch": 2.51, "learning_rate": 1.959546392323387e-05, "loss": 1.4546, "step": 31854 }, { "epoch": 2.51, "learning_rate": 1.958935652763228e-05, "loss": 1.4812, "step": 31855 }, { "epoch": 2.51, "learning_rate": 1.9583250017446987e-05, "loss": 1.4044, "step": 31856 }, { "epoch": 2.51, "learning_rate": 1.9577144392719467e-05, "loss": 1.4594, "step": 31857 }, { "epoch": 2.51, "learning_rate": 1.9571039653491187e-05, "loss": 1.464, "step": 31858 }, { "epoch": 2.51, "learning_rate": 1.9564935799803517e-05, "loss": 1.4971, "step": 31859 }, { "epoch": 2.51, "learning_rate": 1.9558832831698003e-05, "loss": 1.4729, "step": 31860 }, { "epoch": 2.51, "learning_rate": 1.9552730749216013e-05, "loss": 1.3664, "step": 31861 }, { "epoch": 2.51, "learning_rate": 1.9546629552398997e-05, "loss": 1.4431, "step": 31862 }, { "epoch": 2.51, "learning_rate": 1.9540529241288356e-05, "loss": 1.4458, "step": 31863 }, { "epoch": 2.51, "learning_rate": 1.9534429815925557e-05, "loss": 1.4882, "step": 31864 }, { "epoch": 2.51, "learning_rate": 1.952833127635195e-05, "loss": 1.448, "step": 31865 }, { "epoch": 2.51, "learning_rate": 1.9522233622609e-05, "loss": 1.4676, "step": 31866 }, { "epoch": 2.51, "learning_rate": 1.9516136854738046e-05, "loss": 1.4876, "step": 31867 }, { "epoch": 2.51, "learning_rate": 1.951004097278055e-05, "loss": 1.4282, "step": 31868 }, { "epoch": 2.51, "learning_rate": 1.9503945976777864e-05, "loss": 1.4602, "step": 31869 }, { "epoch": 2.51, "learning_rate": 1.9497851866771354e-05, "loss": 1.4812, "step": 31870 }, { "epoch": 2.51, "learning_rate": 1.9491758642802435e-05, "loss": 1.4279, "step": 31871 }, { "epoch": 2.51, "learning_rate": 1.9485666304912446e-05, "loss": 1.485, "step": 31872 }, { "epoch": 2.51, "learning_rate": 1.9479574853142733e-05, "loss": 1.4659, "step": 31873 }, { "epoch": 2.51, "learning_rate": 1.9473484287534714e-05, "loss": 1.4138, "step": 31874 }, { "epoch": 2.51, "learning_rate": 1.9467394608129706e-05, "loss": 1.4148, "step": 31875 }, { "epoch": 2.51, "learning_rate": 1.9461305814969026e-05, "loss": 1.4285, "step": 31876 }, { "epoch": 2.51, "learning_rate": 1.945521790809407e-05, "loss": 1.4995, "step": 31877 }, { "epoch": 2.51, "learning_rate": 1.9449130887546132e-05, "loss": 1.4865, "step": 31878 }, { "epoch": 2.51, "learning_rate": 1.944304475336657e-05, "loss": 1.4749, "step": 31879 }, { "epoch": 2.51, "learning_rate": 1.943695950559662e-05, "loss": 1.4486, "step": 31880 }, { "epoch": 2.51, "learning_rate": 1.943087514427772e-05, "loss": 1.389, "step": 31881 }, { "epoch": 2.51, "learning_rate": 1.9424791669451127e-05, "loss": 1.4641, "step": 31882 }, { "epoch": 2.51, "learning_rate": 1.9418709081158152e-05, "loss": 1.4648, "step": 31883 }, { "epoch": 2.51, "learning_rate": 1.941262737944004e-05, "loss": 1.4275, "step": 31884 }, { "epoch": 2.51, "learning_rate": 1.9406546564338155e-05, "loss": 1.3989, "step": 31885 }, { "epoch": 2.51, "learning_rate": 1.940046663589375e-05, "loss": 1.4641, "step": 31886 }, { "epoch": 2.51, "learning_rate": 1.9394387594148082e-05, "loss": 1.4875, "step": 31887 }, { "epoch": 2.51, "learning_rate": 1.9388309439142473e-05, "loss": 1.4505, "step": 31888 }, { "epoch": 2.51, "learning_rate": 1.9382232170918167e-05, "loss": 1.4032, "step": 31889 }, { "epoch": 2.51, "learning_rate": 1.937615578951639e-05, "loss": 1.501, "step": 31890 }, { "epoch": 2.51, "learning_rate": 1.9370080294978463e-05, "loss": 1.4877, "step": 31891 }, { "epoch": 2.51, "learning_rate": 1.9364005687345603e-05, "loss": 1.4367, "step": 31892 }, { "epoch": 2.51, "learning_rate": 1.9357931966659025e-05, "loss": 1.3743, "step": 31893 }, { "epoch": 2.51, "learning_rate": 1.935185913296003e-05, "loss": 1.4148, "step": 31894 }, { "epoch": 2.51, "learning_rate": 1.93457871862898e-05, "loss": 1.4492, "step": 31895 }, { "epoch": 2.51, "learning_rate": 1.9339716126689557e-05, "loss": 1.4277, "step": 31896 }, { "epoch": 2.51, "learning_rate": 1.9333645954200515e-05, "loss": 1.4524, "step": 31897 }, { "epoch": 2.51, "learning_rate": 1.932757666886396e-05, "loss": 1.4407, "step": 31898 }, { "epoch": 2.51, "learning_rate": 1.9321508270721054e-05, "loss": 1.469, "step": 31899 }, { "epoch": 2.51, "learning_rate": 1.9315440759812983e-05, "loss": 1.4045, "step": 31900 }, { "epoch": 2.51, "learning_rate": 1.9309374136180916e-05, "loss": 1.4803, "step": 31901 }, { "epoch": 2.51, "learning_rate": 1.9303308399866118e-05, "loss": 1.4823, "step": 31902 }, { "epoch": 2.51, "learning_rate": 1.9297243550909724e-05, "loss": 1.4427, "step": 31903 }, { "epoch": 2.51, "learning_rate": 1.9291179589352902e-05, "loss": 1.4534, "step": 31904 }, { "epoch": 2.51, "learning_rate": 1.9285116515236847e-05, "loss": 1.4325, "step": 31905 }, { "epoch": 2.51, "learning_rate": 1.9279054328602733e-05, "loss": 1.4217, "step": 31906 }, { "epoch": 2.51, "learning_rate": 1.9272993029491672e-05, "loss": 1.4462, "step": 31907 }, { "epoch": 2.51, "learning_rate": 1.9266932617944868e-05, "loss": 1.4233, "step": 31908 }, { "epoch": 2.51, "learning_rate": 1.9260873094003456e-05, "loss": 1.4613, "step": 31909 }, { "epoch": 2.51, "learning_rate": 1.925481445770853e-05, "loss": 1.4139, "step": 31910 }, { "epoch": 2.51, "learning_rate": 1.924875670910131e-05, "loss": 1.4384, "step": 31911 }, { "epoch": 2.51, "learning_rate": 1.924269984822283e-05, "loss": 1.5122, "step": 31912 }, { "epoch": 2.51, "learning_rate": 1.9236643875114294e-05, "loss": 1.4297, "step": 31913 }, { "epoch": 2.51, "learning_rate": 1.9230588789816748e-05, "loss": 1.4462, "step": 31914 }, { "epoch": 2.51, "learning_rate": 1.9224534592371375e-05, "loss": 1.4441, "step": 31915 }, { "epoch": 2.51, "learning_rate": 1.9218481282819246e-05, "loss": 1.447, "step": 31916 }, { "epoch": 2.51, "learning_rate": 1.921242886120143e-05, "loss": 1.4316, "step": 31917 }, { "epoch": 2.51, "learning_rate": 1.9206377327559086e-05, "loss": 1.4337, "step": 31918 }, { "epoch": 2.51, "learning_rate": 1.9200326681933254e-05, "loss": 1.4408, "step": 31919 }, { "epoch": 2.51, "learning_rate": 1.9194276924365014e-05, "loss": 1.4664, "step": 31920 }, { "epoch": 2.51, "learning_rate": 1.9188228054895423e-05, "loss": 1.4237, "step": 31921 }, { "epoch": 2.51, "learning_rate": 1.9182180073565607e-05, "loss": 1.4858, "step": 31922 }, { "epoch": 2.51, "learning_rate": 1.9176132980416603e-05, "loss": 1.4607, "step": 31923 }, { "epoch": 2.51, "learning_rate": 1.917008677548943e-05, "loss": 1.4484, "step": 31924 }, { "epoch": 2.51, "learning_rate": 1.9164041458825185e-05, "loss": 1.4608, "step": 31925 }, { "epoch": 2.51, "learning_rate": 1.9157997030464906e-05, "loss": 1.4546, "step": 31926 }, { "epoch": 2.51, "learning_rate": 1.9151953490449607e-05, "loss": 1.5011, "step": 31927 }, { "epoch": 2.51, "learning_rate": 1.9145910838820322e-05, "loss": 1.5167, "step": 31928 }, { "epoch": 2.51, "learning_rate": 1.913986907561812e-05, "loss": 1.4135, "step": 31929 }, { "epoch": 2.51, "learning_rate": 1.9133828200884e-05, "loss": 1.4969, "step": 31930 }, { "epoch": 2.51, "learning_rate": 1.912778821465893e-05, "loss": 1.5326, "step": 31931 }, { "epoch": 2.51, "learning_rate": 1.9121749116983992e-05, "loss": 1.4341, "step": 31932 }, { "epoch": 2.51, "learning_rate": 1.9115710907900157e-05, "loss": 1.4757, "step": 31933 }, { "epoch": 2.51, "learning_rate": 1.910967358744837e-05, "loss": 1.4345, "step": 31934 }, { "epoch": 2.51, "learning_rate": 1.910363715566972e-05, "loss": 1.4098, "step": 31935 }, { "epoch": 2.51, "learning_rate": 1.9097601612605125e-05, "loss": 1.452, "step": 31936 }, { "epoch": 2.51, "learning_rate": 1.909156695829558e-05, "loss": 1.4598, "step": 31937 }, { "epoch": 2.51, "learning_rate": 1.908553319278202e-05, "loss": 1.4366, "step": 31938 }, { "epoch": 2.51, "learning_rate": 1.9079500316105485e-05, "loss": 1.5198, "step": 31939 }, { "epoch": 2.51, "learning_rate": 1.9073468328306903e-05, "loss": 1.4775, "step": 31940 }, { "epoch": 2.51, "learning_rate": 1.9067437229427172e-05, "loss": 1.4269, "step": 31941 }, { "epoch": 2.51, "learning_rate": 1.9061407019507317e-05, "loss": 1.471, "step": 31942 }, { "epoch": 2.51, "learning_rate": 1.905537769858822e-05, "loss": 1.5256, "step": 31943 }, { "epoch": 2.51, "learning_rate": 1.9049349266710893e-05, "loss": 1.4601, "step": 31944 }, { "epoch": 2.51, "learning_rate": 1.904332172391618e-05, "loss": 1.4405, "step": 31945 }, { "epoch": 2.51, "learning_rate": 1.9037295070245067e-05, "loss": 1.4613, "step": 31946 }, { "epoch": 2.51, "learning_rate": 1.9031269305738467e-05, "loss": 1.3943, "step": 31947 }, { "epoch": 2.51, "learning_rate": 1.9025244430437227e-05, "loss": 1.4585, "step": 31948 }, { "epoch": 2.51, "learning_rate": 1.9019220444382345e-05, "loss": 1.4406, "step": 31949 }, { "epoch": 2.51, "learning_rate": 1.9013197347614656e-05, "loss": 1.4752, "step": 31950 }, { "epoch": 2.51, "learning_rate": 1.9007175140175064e-05, "loss": 1.444, "step": 31951 }, { "epoch": 2.51, "learning_rate": 1.900115382210448e-05, "loss": 1.4441, "step": 31952 }, { "epoch": 2.51, "learning_rate": 1.899513339344378e-05, "loss": 1.4548, "step": 31953 }, { "epoch": 2.51, "learning_rate": 1.898911385423382e-05, "loss": 1.4933, "step": 31954 }, { "epoch": 2.51, "learning_rate": 1.898309520451545e-05, "loss": 1.443, "step": 31955 }, { "epoch": 2.51, "learning_rate": 1.8977077444329603e-05, "loss": 1.4428, "step": 31956 }, { "epoch": 2.51, "learning_rate": 1.897106057371709e-05, "loss": 1.4355, "step": 31957 }, { "epoch": 2.51, "learning_rate": 1.8965044592718724e-05, "loss": 1.4902, "step": 31958 }, { "epoch": 2.51, "learning_rate": 1.8959029501375412e-05, "loss": 1.4368, "step": 31959 }, { "epoch": 2.51, "learning_rate": 1.8953015299727996e-05, "loss": 1.432, "step": 31960 }, { "epoch": 2.51, "learning_rate": 1.89470019878173e-05, "loss": 1.42, "step": 31961 }, { "epoch": 2.51, "learning_rate": 1.894098956568409e-05, "loss": 1.479, "step": 31962 }, { "epoch": 2.51, "learning_rate": 1.893497803336928e-05, "loss": 1.4209, "step": 31963 }, { "epoch": 2.51, "learning_rate": 1.892896739091364e-05, "loss": 1.4885, "step": 31964 }, { "epoch": 2.52, "learning_rate": 1.8922957638357955e-05, "loss": 1.4974, "step": 31965 }, { "epoch": 2.52, "learning_rate": 1.8916948775743073e-05, "loss": 1.4365, "step": 31966 }, { "epoch": 2.52, "learning_rate": 1.891094080310978e-05, "loss": 1.4809, "step": 31967 }, { "epoch": 2.52, "learning_rate": 1.8904933720498828e-05, "loss": 1.4595, "step": 31968 }, { "epoch": 2.52, "learning_rate": 1.8898927527951062e-05, "loss": 1.4201, "step": 31969 }, { "epoch": 2.52, "learning_rate": 1.889292222550722e-05, "loss": 1.5028, "step": 31970 }, { "epoch": 2.52, "learning_rate": 1.8886917813208076e-05, "loss": 1.4689, "step": 31971 }, { "epoch": 2.52, "learning_rate": 1.8880914291094418e-05, "loss": 1.447, "step": 31972 }, { "epoch": 2.52, "learning_rate": 1.8874911659207004e-05, "loss": 1.4453, "step": 31973 }, { "epoch": 2.52, "learning_rate": 1.8868909917586566e-05, "loss": 1.4356, "step": 31974 }, { "epoch": 2.52, "learning_rate": 1.8862909066273806e-05, "loss": 1.4787, "step": 31975 }, { "epoch": 2.52, "learning_rate": 1.885690910530959e-05, "loss": 1.4517, "step": 31976 }, { "epoch": 2.52, "learning_rate": 1.8850910034734605e-05, "loss": 1.4896, "step": 31977 }, { "epoch": 2.52, "learning_rate": 1.884491185458955e-05, "loss": 1.447, "step": 31978 }, { "epoch": 2.52, "learning_rate": 1.883891456491514e-05, "loss": 1.4559, "step": 31979 }, { "epoch": 2.52, "learning_rate": 1.8832918165752164e-05, "loss": 1.4453, "step": 31980 }, { "epoch": 2.52, "learning_rate": 1.882692265714127e-05, "loss": 1.3889, "step": 31981 }, { "epoch": 2.52, "learning_rate": 1.8820928039123155e-05, "loss": 1.4508, "step": 31982 }, { "epoch": 2.52, "learning_rate": 1.8814934311738595e-05, "loss": 1.4263, "step": 31983 }, { "epoch": 2.52, "learning_rate": 1.8808941475028217e-05, "loss": 1.4944, "step": 31984 }, { "epoch": 2.52, "learning_rate": 1.8802949529032706e-05, "loss": 1.5354, "step": 31985 }, { "epoch": 2.52, "learning_rate": 1.87969584737928e-05, "loss": 1.4878, "step": 31986 }, { "epoch": 2.52, "learning_rate": 1.8790968309349147e-05, "loss": 1.4882, "step": 31987 }, { "epoch": 2.52, "learning_rate": 1.878497903574238e-05, "loss": 1.4301, "step": 31988 }, { "epoch": 2.52, "learning_rate": 1.877899065301322e-05, "loss": 1.4213, "step": 31989 }, { "epoch": 2.52, "learning_rate": 1.8773003161202265e-05, "loss": 1.4187, "step": 31990 }, { "epoch": 2.52, "learning_rate": 1.8767016560350234e-05, "loss": 1.4727, "step": 31991 }, { "epoch": 2.52, "learning_rate": 1.8761030850497726e-05, "loss": 1.4716, "step": 31992 }, { "epoch": 2.52, "learning_rate": 1.875504603168541e-05, "loss": 1.4096, "step": 31993 }, { "epoch": 2.52, "learning_rate": 1.8749062103953903e-05, "loss": 1.4491, "step": 31994 }, { "epoch": 2.52, "learning_rate": 1.8743079067343842e-05, "loss": 1.4827, "step": 31995 }, { "epoch": 2.52, "learning_rate": 1.8737096921895806e-05, "loss": 1.4609, "step": 31996 }, { "epoch": 2.52, "learning_rate": 1.873111566765048e-05, "loss": 1.4707, "step": 31997 }, { "epoch": 2.52, "learning_rate": 1.8725135304648437e-05, "loss": 1.4421, "step": 31998 }, { "epoch": 2.52, "learning_rate": 1.8719155832930237e-05, "loss": 1.4626, "step": 31999 }, { "epoch": 2.52, "learning_rate": 1.871317725253657e-05, "loss": 1.4421, "step": 32000 }, { "epoch": 2.52, "learning_rate": 1.8707199563507967e-05, "loss": 1.4212, "step": 32001 }, { "epoch": 2.52, "learning_rate": 1.8701222765885e-05, "loss": 1.4518, "step": 32002 }, { "epoch": 2.52, "learning_rate": 1.8695246859708314e-05, "loss": 1.4519, "step": 32003 }, { "epoch": 2.52, "learning_rate": 1.8689271845018427e-05, "loss": 1.4856, "step": 32004 }, { "epoch": 2.52, "learning_rate": 1.868329772185591e-05, "loss": 1.4433, "step": 32005 }, { "epoch": 2.52, "learning_rate": 1.8677324490261315e-05, "loss": 1.4778, "step": 32006 }, { "epoch": 2.52, "learning_rate": 1.8671352150275253e-05, "loss": 1.4003, "step": 32007 }, { "epoch": 2.52, "learning_rate": 1.8665380701938248e-05, "loss": 1.4653, "step": 32008 }, { "epoch": 2.52, "learning_rate": 1.8659410145290782e-05, "loss": 1.461, "step": 32009 }, { "epoch": 2.52, "learning_rate": 1.865344048037349e-05, "loss": 1.448, "step": 32010 }, { "epoch": 2.52, "learning_rate": 1.8647471707226837e-05, "loss": 1.4669, "step": 32011 }, { "epoch": 2.52, "learning_rate": 1.8641503825891373e-05, "loss": 1.4688, "step": 32012 }, { "epoch": 2.52, "learning_rate": 1.863553683640759e-05, "loss": 1.471, "step": 32013 }, { "epoch": 2.52, "learning_rate": 1.862957073881603e-05, "loss": 1.4664, "step": 32014 }, { "epoch": 2.52, "learning_rate": 1.86236055331572e-05, "loss": 1.4565, "step": 32015 }, { "epoch": 2.52, "learning_rate": 1.8617641219471547e-05, "loss": 1.4754, "step": 32016 }, { "epoch": 2.52, "learning_rate": 1.8611677797799656e-05, "loss": 1.4995, "step": 32017 }, { "epoch": 2.52, "learning_rate": 1.860571526818195e-05, "loss": 1.4531, "step": 32018 }, { "epoch": 2.52, "learning_rate": 1.8599753630658902e-05, "loss": 1.4192, "step": 32019 }, { "epoch": 2.52, "learning_rate": 1.8593792885271043e-05, "loss": 1.4719, "step": 32020 }, { "epoch": 2.52, "learning_rate": 1.858783303205883e-05, "loss": 1.4275, "step": 32021 }, { "epoch": 2.52, "learning_rate": 1.858187407106267e-05, "loss": 1.4196, "step": 32022 }, { "epoch": 2.52, "learning_rate": 1.857591600232306e-05, "loss": 1.4617, "step": 32023 }, { "epoch": 2.52, "learning_rate": 1.856995882588047e-05, "loss": 1.4539, "step": 32024 }, { "epoch": 2.52, "learning_rate": 1.8564002541775354e-05, "loss": 1.4463, "step": 32025 }, { "epoch": 2.52, "learning_rate": 1.8558047150048088e-05, "loss": 1.4001, "step": 32026 }, { "epoch": 2.52, "learning_rate": 1.855209265073918e-05, "loss": 1.4503, "step": 32027 }, { "epoch": 2.52, "learning_rate": 1.854613904388903e-05, "loss": 1.4499, "step": 32028 }, { "epoch": 2.52, "learning_rate": 1.854018632953802e-05, "loss": 1.3729, "step": 32029 }, { "epoch": 2.52, "learning_rate": 1.8534234507726618e-05, "loss": 1.4096, "step": 32030 }, { "epoch": 2.52, "learning_rate": 1.852828357849523e-05, "loss": 1.436, "step": 32031 }, { "epoch": 2.52, "learning_rate": 1.8522333541884233e-05, "loss": 1.3967, "step": 32032 }, { "epoch": 2.52, "learning_rate": 1.8516384397934016e-05, "loss": 1.443, "step": 32033 }, { "epoch": 2.52, "learning_rate": 1.851043614668501e-05, "loss": 1.4903, "step": 32034 }, { "epoch": 2.52, "learning_rate": 1.8504488788177584e-05, "loss": 1.4491, "step": 32035 }, { "epoch": 2.52, "learning_rate": 1.849854232245209e-05, "loss": 1.4741, "step": 32036 }, { "epoch": 2.52, "learning_rate": 1.849259674954895e-05, "loss": 1.4279, "step": 32037 }, { "epoch": 2.52, "learning_rate": 1.848665206950847e-05, "loss": 1.3821, "step": 32038 }, { "epoch": 2.52, "learning_rate": 1.848070828237108e-05, "loss": 1.4772, "step": 32039 }, { "epoch": 2.52, "learning_rate": 1.8474765388177076e-05, "loss": 1.4412, "step": 32040 }, { "epoch": 2.52, "learning_rate": 1.8468823386966875e-05, "loss": 1.3938, "step": 32041 }, { "epoch": 2.52, "learning_rate": 1.8462882278780762e-05, "loss": 1.4291, "step": 32042 }, { "epoch": 2.52, "learning_rate": 1.845694206365907e-05, "loss": 1.4098, "step": 32043 }, { "epoch": 2.52, "learning_rate": 1.845100274164217e-05, "loss": 1.4706, "step": 32044 }, { "epoch": 2.52, "learning_rate": 1.8445064312770374e-05, "loss": 1.4162, "step": 32045 }, { "epoch": 2.52, "learning_rate": 1.8439126777083956e-05, "loss": 1.5098, "step": 32046 }, { "epoch": 2.52, "learning_rate": 1.8433190134623298e-05, "loss": 1.416, "step": 32047 }, { "epoch": 2.52, "learning_rate": 1.8427254385428685e-05, "loss": 1.4068, "step": 32048 }, { "epoch": 2.52, "learning_rate": 1.8421319529540402e-05, "loss": 1.4494, "step": 32049 }, { "epoch": 2.52, "learning_rate": 1.8415385566998714e-05, "loss": 1.494, "step": 32050 }, { "epoch": 2.52, "learning_rate": 1.8409452497843973e-05, "loss": 1.4699, "step": 32051 }, { "epoch": 2.52, "learning_rate": 1.8403520322116434e-05, "loss": 1.4701, "step": 32052 }, { "epoch": 2.52, "learning_rate": 1.839758903985634e-05, "loss": 1.4668, "step": 32053 }, { "epoch": 2.52, "learning_rate": 1.8391658651103985e-05, "loss": 1.4563, "step": 32054 }, { "epoch": 2.52, "learning_rate": 1.8385729155899682e-05, "loss": 1.4928, "step": 32055 }, { "epoch": 2.52, "learning_rate": 1.8379800554283646e-05, "loss": 1.4748, "step": 32056 }, { "epoch": 2.52, "learning_rate": 1.83738728462961e-05, "loss": 1.4912, "step": 32057 }, { "epoch": 2.52, "learning_rate": 1.8367946031977344e-05, "loss": 1.4761, "step": 32058 }, { "epoch": 2.52, "learning_rate": 1.836202011136761e-05, "loss": 1.4171, "step": 32059 }, { "epoch": 2.52, "learning_rate": 1.8356095084507066e-05, "loss": 1.4506, "step": 32060 }, { "epoch": 2.52, "learning_rate": 1.8350170951436033e-05, "loss": 1.4574, "step": 32061 }, { "epoch": 2.52, "learning_rate": 1.8344247712194675e-05, "loss": 1.4716, "step": 32062 }, { "epoch": 2.52, "learning_rate": 1.83383253668232e-05, "loss": 1.4444, "step": 32063 }, { "epoch": 2.52, "learning_rate": 1.8332403915361864e-05, "loss": 1.4657, "step": 32064 }, { "epoch": 2.52, "learning_rate": 1.8326483357850846e-05, "loss": 1.4948, "step": 32065 }, { "epoch": 2.52, "learning_rate": 1.832056369433036e-05, "loss": 1.4301, "step": 32066 }, { "epoch": 2.52, "learning_rate": 1.8314644924840523e-05, "loss": 1.4215, "step": 32067 }, { "epoch": 2.52, "learning_rate": 1.8308727049421618e-05, "loss": 1.4523, "step": 32068 }, { "epoch": 2.52, "learning_rate": 1.8302810068113766e-05, "loss": 1.3938, "step": 32069 }, { "epoch": 2.52, "learning_rate": 1.8296893980957135e-05, "loss": 1.4089, "step": 32070 }, { "epoch": 2.52, "learning_rate": 1.8290978787991957e-05, "loss": 1.4282, "step": 32071 }, { "epoch": 2.52, "learning_rate": 1.828506448925835e-05, "loss": 1.4434, "step": 32072 }, { "epoch": 2.52, "learning_rate": 1.8279151084796467e-05, "loss": 1.4129, "step": 32073 }, { "epoch": 2.52, "learning_rate": 1.8273238574646427e-05, "loss": 1.3885, "step": 32074 }, { "epoch": 2.52, "learning_rate": 1.8267326958848426e-05, "loss": 1.4104, "step": 32075 }, { "epoch": 2.52, "learning_rate": 1.8261416237442605e-05, "loss": 1.4688, "step": 32076 }, { "epoch": 2.52, "learning_rate": 1.8255506410469013e-05, "loss": 1.4438, "step": 32077 }, { "epoch": 2.52, "learning_rate": 1.8249597477967865e-05, "loss": 1.4289, "step": 32078 }, { "epoch": 2.52, "learning_rate": 1.8243689439979246e-05, "loss": 1.4367, "step": 32079 }, { "epoch": 2.52, "learning_rate": 1.8237782296543247e-05, "loss": 1.4392, "step": 32080 }, { "epoch": 2.52, "learning_rate": 1.823187604770001e-05, "loss": 1.4579, "step": 32081 }, { "epoch": 2.52, "learning_rate": 1.8225970693489627e-05, "loss": 1.3934, "step": 32082 }, { "epoch": 2.52, "learning_rate": 1.8220066233952146e-05, "loss": 1.4447, "step": 32083 }, { "epoch": 2.52, "learning_rate": 1.8214162669127736e-05, "loss": 1.4449, "step": 32084 }, { "epoch": 2.52, "learning_rate": 1.8208259999056396e-05, "loss": 1.4388, "step": 32085 }, { "epoch": 2.52, "learning_rate": 1.8202358223778263e-05, "loss": 1.4761, "step": 32086 }, { "epoch": 2.52, "learning_rate": 1.819645734333337e-05, "loss": 1.4519, "step": 32087 }, { "epoch": 2.52, "learning_rate": 1.819055735776182e-05, "loss": 1.4626, "step": 32088 }, { "epoch": 2.52, "learning_rate": 1.8184658267103665e-05, "loss": 1.4222, "step": 32089 }, { "epoch": 2.52, "learning_rate": 1.8178760071398918e-05, "loss": 1.4816, "step": 32090 }, { "epoch": 2.52, "learning_rate": 1.8172862770687617e-05, "loss": 1.441, "step": 32091 }, { "epoch": 2.53, "learning_rate": 1.8166966365009866e-05, "loss": 1.4655, "step": 32092 }, { "epoch": 2.53, "learning_rate": 1.8161070854405664e-05, "loss": 1.4725, "step": 32093 }, { "epoch": 2.53, "learning_rate": 1.8155176238914994e-05, "loss": 1.4211, "step": 32094 }, { "epoch": 2.53, "learning_rate": 1.8149282518577958e-05, "loss": 1.4235, "step": 32095 }, { "epoch": 2.53, "learning_rate": 1.814338969343454e-05, "loss": 1.4331, "step": 32096 }, { "epoch": 2.53, "learning_rate": 1.8137497763524693e-05, "loss": 1.4555, "step": 32097 }, { "epoch": 2.53, "learning_rate": 1.813160672888852e-05, "loss": 1.5239, "step": 32098 }, { "epoch": 2.53, "learning_rate": 1.8125716589565952e-05, "loss": 1.4282, "step": 32099 }, { "epoch": 2.53, "learning_rate": 1.811982734559696e-05, "loss": 1.4628, "step": 32100 }, { "epoch": 2.53, "learning_rate": 1.8113938997021578e-05, "loss": 1.4941, "step": 32101 }, { "epoch": 2.53, "learning_rate": 1.8108051543879787e-05, "loss": 1.435, "step": 32102 }, { "epoch": 2.53, "learning_rate": 1.8102164986211542e-05, "loss": 1.4468, "step": 32103 }, { "epoch": 2.53, "learning_rate": 1.8096279324056778e-05, "loss": 1.4733, "step": 32104 }, { "epoch": 2.53, "learning_rate": 1.809039455745553e-05, "loss": 1.4431, "step": 32105 }, { "epoch": 2.53, "learning_rate": 1.8084510686447694e-05, "loss": 1.4467, "step": 32106 }, { "epoch": 2.53, "learning_rate": 1.8078627711073247e-05, "loss": 1.3905, "step": 32107 }, { "epoch": 2.53, "learning_rate": 1.807274563137208e-05, "loss": 1.4156, "step": 32108 }, { "epoch": 2.53, "learning_rate": 1.8066864447384205e-05, "loss": 1.435, "step": 32109 }, { "epoch": 2.53, "learning_rate": 1.80609841591495e-05, "loss": 1.4092, "step": 32110 }, { "epoch": 2.53, "learning_rate": 1.8055104766707885e-05, "loss": 1.4228, "step": 32111 }, { "epoch": 2.53, "learning_rate": 1.8049226270099326e-05, "loss": 1.4628, "step": 32112 }, { "epoch": 2.53, "learning_rate": 1.8043348669363696e-05, "loss": 1.3984, "step": 32113 }, { "epoch": 2.53, "learning_rate": 1.803747196454087e-05, "loss": 1.4489, "step": 32114 }, { "epoch": 2.53, "learning_rate": 1.803159615567083e-05, "loss": 1.5089, "step": 32115 }, { "epoch": 2.53, "learning_rate": 1.8025721242793402e-05, "loss": 1.4625, "step": 32116 }, { "epoch": 2.53, "learning_rate": 1.801984722594852e-05, "loss": 1.4586, "step": 32117 }, { "epoch": 2.53, "learning_rate": 1.8013974105176006e-05, "loss": 1.4351, "step": 32118 }, { "epoch": 2.53, "learning_rate": 1.8008101880515808e-05, "loss": 1.4379, "step": 32119 }, { "epoch": 2.53, "learning_rate": 1.8002230552007764e-05, "loss": 1.4636, "step": 32120 }, { "epoch": 2.53, "learning_rate": 1.7996360119691688e-05, "loss": 1.4226, "step": 32121 }, { "epoch": 2.53, "learning_rate": 1.799049058360752e-05, "loss": 1.4334, "step": 32122 }, { "epoch": 2.53, "learning_rate": 1.7984621943795075e-05, "loss": 1.4219, "step": 32123 }, { "epoch": 2.53, "learning_rate": 1.7978754200294153e-05, "loss": 1.3798, "step": 32124 }, { "epoch": 2.53, "learning_rate": 1.7972887353144678e-05, "loss": 1.4346, "step": 32125 }, { "epoch": 2.53, "learning_rate": 1.7967021402386444e-05, "loss": 1.3801, "step": 32126 }, { "epoch": 2.53, "learning_rate": 1.7961156348059258e-05, "loss": 1.4346, "step": 32127 }, { "epoch": 2.53, "learning_rate": 1.7955292190202934e-05, "loss": 1.4253, "step": 32128 }, { "epoch": 2.53, "learning_rate": 1.7949428928857327e-05, "loss": 1.4455, "step": 32129 }, { "epoch": 2.53, "learning_rate": 1.794356656406224e-05, "loss": 1.4743, "step": 32130 }, { "epoch": 2.53, "learning_rate": 1.7937705095857417e-05, "loss": 1.4475, "step": 32131 }, { "epoch": 2.53, "learning_rate": 1.79318445242827e-05, "loss": 1.4633, "step": 32132 }, { "epoch": 2.53, "learning_rate": 1.792598484937792e-05, "loss": 1.4355, "step": 32133 }, { "epoch": 2.53, "learning_rate": 1.7920126071182815e-05, "loss": 1.4338, "step": 32134 }, { "epoch": 2.53, "learning_rate": 1.7914268189737137e-05, "loss": 1.4294, "step": 32135 }, { "epoch": 2.53, "learning_rate": 1.7908411205080713e-05, "loss": 1.4607, "step": 32136 }, { "epoch": 2.53, "learning_rate": 1.7902555117253287e-05, "loss": 1.4431, "step": 32137 }, { "epoch": 2.53, "learning_rate": 1.7896699926294572e-05, "loss": 1.4576, "step": 32138 }, { "epoch": 2.53, "learning_rate": 1.7890845632244404e-05, "loss": 1.4479, "step": 32139 }, { "epoch": 2.53, "learning_rate": 1.7884992235142486e-05, "loss": 1.4156, "step": 32140 }, { "epoch": 2.53, "learning_rate": 1.7879139735028537e-05, "loss": 1.4654, "step": 32141 }, { "epoch": 2.53, "learning_rate": 1.7873288131942354e-05, "loss": 1.4928, "step": 32142 }, { "epoch": 2.53, "learning_rate": 1.7867437425923625e-05, "loss": 1.4753, "step": 32143 }, { "epoch": 2.53, "learning_rate": 1.7861587617012087e-05, "loss": 1.4714, "step": 32144 }, { "epoch": 2.53, "learning_rate": 1.78557387052474e-05, "loss": 1.4411, "step": 32145 }, { "epoch": 2.53, "learning_rate": 1.784989069066936e-05, "loss": 1.4875, "step": 32146 }, { "epoch": 2.53, "learning_rate": 1.7844043573317647e-05, "loss": 1.444, "step": 32147 }, { "epoch": 2.53, "learning_rate": 1.783819735323191e-05, "loss": 1.4627, "step": 32148 }, { "epoch": 2.53, "learning_rate": 1.7832352030451886e-05, "loss": 1.4882, "step": 32149 }, { "epoch": 2.53, "learning_rate": 1.7826507605017276e-05, "loss": 1.4395, "step": 32150 }, { "epoch": 2.53, "learning_rate": 1.782066407696775e-05, "loss": 1.4295, "step": 32151 }, { "epoch": 2.53, "learning_rate": 1.7814821446342943e-05, "loss": 1.4263, "step": 32152 }, { "epoch": 2.53, "learning_rate": 1.780897971318257e-05, "loss": 1.4443, "step": 32153 }, { "epoch": 2.53, "learning_rate": 1.7803138877526285e-05, "loss": 1.4511, "step": 32154 }, { "epoch": 2.53, "learning_rate": 1.7797298939413706e-05, "loss": 1.4404, "step": 32155 }, { "epoch": 2.53, "learning_rate": 1.7791459898884535e-05, "loss": 1.4692, "step": 32156 }, { "epoch": 2.53, "learning_rate": 1.778562175597841e-05, "loss": 1.4442, "step": 32157 }, { "epoch": 2.53, "learning_rate": 1.7779784510734906e-05, "loss": 1.445, "step": 32158 }, { "epoch": 2.53, "learning_rate": 1.7773948163193736e-05, "loss": 1.4739, "step": 32159 }, { "epoch": 2.53, "learning_rate": 1.776811271339448e-05, "loss": 1.4012, "step": 32160 }, { "epoch": 2.53, "learning_rate": 1.776227816137677e-05, "loss": 1.4935, "step": 32161 }, { "epoch": 2.53, "learning_rate": 1.7756444507180197e-05, "loss": 1.4845, "step": 32162 }, { "epoch": 2.53, "learning_rate": 1.7750611750844373e-05, "loss": 1.4759, "step": 32163 }, { "epoch": 2.53, "learning_rate": 1.7744779892408955e-05, "loss": 1.4559, "step": 32164 }, { "epoch": 2.53, "learning_rate": 1.7738948931913494e-05, "loss": 1.4793, "step": 32165 }, { "epoch": 2.53, "learning_rate": 1.7733118869397555e-05, "loss": 1.4597, "step": 32166 }, { "epoch": 2.53, "learning_rate": 1.772728970490076e-05, "loss": 1.4585, "step": 32167 }, { "epoch": 2.53, "learning_rate": 1.772146143846269e-05, "loss": 1.4295, "step": 32168 }, { "epoch": 2.53, "learning_rate": 1.771563407012287e-05, "loss": 1.4382, "step": 32169 }, { "epoch": 2.53, "learning_rate": 1.7709807599920928e-05, "loss": 1.4443, "step": 32170 }, { "epoch": 2.53, "learning_rate": 1.7703982027896386e-05, "loss": 1.4732, "step": 32171 }, { "epoch": 2.53, "learning_rate": 1.769815735408876e-05, "loss": 1.4485, "step": 32172 }, { "epoch": 2.53, "learning_rate": 1.7692333578537672e-05, "loss": 1.4404, "step": 32173 }, { "epoch": 2.53, "learning_rate": 1.7686510701282617e-05, "loss": 1.4922, "step": 32174 }, { "epoch": 2.53, "learning_rate": 1.7680688722363123e-05, "loss": 1.4543, "step": 32175 }, { "epoch": 2.53, "learning_rate": 1.767486764181875e-05, "loss": 1.4582, "step": 32176 }, { "epoch": 2.53, "learning_rate": 1.7669047459689007e-05, "loss": 1.4081, "step": 32177 }, { "epoch": 2.53, "learning_rate": 1.7663228176013406e-05, "loss": 1.4864, "step": 32178 }, { "epoch": 2.53, "learning_rate": 1.76574097908314e-05, "loss": 1.4739, "step": 32179 }, { "epoch": 2.53, "learning_rate": 1.765159230418261e-05, "loss": 1.4202, "step": 32180 }, { "epoch": 2.53, "learning_rate": 1.7645775716106453e-05, "loss": 1.4946, "step": 32181 }, { "epoch": 2.53, "learning_rate": 1.763996002664243e-05, "loss": 1.434, "step": 32182 }, { "epoch": 2.53, "learning_rate": 1.763414523583006e-05, "loss": 1.4537, "step": 32183 }, { "epoch": 2.53, "learning_rate": 1.7628331343708796e-05, "loss": 1.4246, "step": 32184 }, { "epoch": 2.53, "learning_rate": 1.762251835031812e-05, "loss": 1.4554, "step": 32185 }, { "epoch": 2.53, "learning_rate": 1.7616706255697454e-05, "loss": 1.4636, "step": 32186 }, { "epoch": 2.53, "learning_rate": 1.761089505988633e-05, "loss": 1.4523, "step": 32187 }, { "epoch": 2.53, "learning_rate": 1.7605084762924186e-05, "loss": 1.3838, "step": 32188 }, { "epoch": 2.53, "learning_rate": 1.7599275364850407e-05, "loss": 1.4278, "step": 32189 }, { "epoch": 2.53, "learning_rate": 1.759346686570451e-05, "loss": 1.4498, "step": 32190 }, { "epoch": 2.53, "learning_rate": 1.7587659265525912e-05, "loss": 1.457, "step": 32191 }, { "epoch": 2.53, "learning_rate": 1.7581852564354015e-05, "loss": 1.4394, "step": 32192 }, { "epoch": 2.53, "learning_rate": 1.757604676222829e-05, "loss": 1.4678, "step": 32193 }, { "epoch": 2.53, "learning_rate": 1.7570241859188123e-05, "loss": 1.4002, "step": 32194 }, { "epoch": 2.53, "learning_rate": 1.7564437855272913e-05, "loss": 1.4903, "step": 32195 }, { "epoch": 2.53, "learning_rate": 1.7558634750522075e-05, "loss": 1.4372, "step": 32196 }, { "epoch": 2.53, "learning_rate": 1.7552832544975055e-05, "loss": 1.4761, "step": 32197 }, { "epoch": 2.53, "learning_rate": 1.7547031238671213e-05, "loss": 1.4835, "step": 32198 }, { "epoch": 2.53, "learning_rate": 1.75412308316499e-05, "loss": 1.467, "step": 32199 }, { "epoch": 2.53, "learning_rate": 1.7535431323950556e-05, "loss": 1.4624, "step": 32200 }, { "epoch": 2.53, "learning_rate": 1.7529632715612546e-05, "loss": 1.4798, "step": 32201 }, { "epoch": 2.53, "learning_rate": 1.7523835006675225e-05, "loss": 1.407, "step": 32202 }, { "epoch": 2.53, "learning_rate": 1.7518038197177925e-05, "loss": 1.4468, "step": 32203 }, { "epoch": 2.53, "learning_rate": 1.7512242287160066e-05, "loss": 1.4454, "step": 32204 }, { "epoch": 2.53, "learning_rate": 1.7506447276660985e-05, "loss": 1.4502, "step": 32205 }, { "epoch": 2.53, "learning_rate": 1.7500653165719965e-05, "loss": 1.4651, "step": 32206 }, { "epoch": 2.53, "learning_rate": 1.749485995437642e-05, "loss": 1.4133, "step": 32207 }, { "epoch": 2.53, "learning_rate": 1.7489067642669662e-05, "loss": 1.3928, "step": 32208 }, { "epoch": 2.53, "learning_rate": 1.748327623063897e-05, "loss": 1.4168, "step": 32209 }, { "epoch": 2.53, "learning_rate": 1.7477485718323698e-05, "loss": 1.4815, "step": 32210 }, { "epoch": 2.53, "learning_rate": 1.747169610576321e-05, "loss": 1.4279, "step": 32211 }, { "epoch": 2.53, "learning_rate": 1.7465907392996763e-05, "loss": 1.455, "step": 32212 }, { "epoch": 2.53, "learning_rate": 1.746011958006364e-05, "loss": 1.4751, "step": 32213 }, { "epoch": 2.53, "learning_rate": 1.7454332667003197e-05, "loss": 1.4396, "step": 32214 }, { "epoch": 2.53, "learning_rate": 1.744854665385468e-05, "loss": 1.4287, "step": 32215 }, { "epoch": 2.53, "learning_rate": 1.7442761540657358e-05, "loss": 1.4284, "step": 32216 }, { "epoch": 2.53, "learning_rate": 1.7436977327450567e-05, "loss": 1.4288, "step": 32217 }, { "epoch": 2.53, "learning_rate": 1.7431194014273546e-05, "loss": 1.4065, "step": 32218 }, { "epoch": 2.54, "learning_rate": 1.7425411601165562e-05, "loss": 1.4756, "step": 32219 }, { "epoch": 2.54, "learning_rate": 1.741963008816583e-05, "loss": 1.453, "step": 32220 }, { "epoch": 2.54, "learning_rate": 1.741384947531369e-05, "loss": 1.4597, "step": 32221 }, { "epoch": 2.54, "learning_rate": 1.7408069762648342e-05, "loss": 1.4344, "step": 32222 }, { "epoch": 2.54, "learning_rate": 1.7402290950209e-05, "loss": 1.4442, "step": 32223 }, { "epoch": 2.54, "learning_rate": 1.7396513038034958e-05, "loss": 1.4639, "step": 32224 }, { "epoch": 2.54, "learning_rate": 1.7390736026165415e-05, "loss": 1.4583, "step": 32225 }, { "epoch": 2.54, "learning_rate": 1.738495991463955e-05, "loss": 1.4227, "step": 32226 }, { "epoch": 2.54, "learning_rate": 1.737918470349664e-05, "loss": 1.4048, "step": 32227 }, { "epoch": 2.54, "learning_rate": 1.7373410392775916e-05, "loss": 1.4645, "step": 32228 }, { "epoch": 2.54, "learning_rate": 1.736763698251653e-05, "loss": 1.4652, "step": 32229 }, { "epoch": 2.54, "learning_rate": 1.736186447275767e-05, "loss": 1.431, "step": 32230 }, { "epoch": 2.54, "learning_rate": 1.73560928635386e-05, "loss": 1.4261, "step": 32231 }, { "epoch": 2.54, "learning_rate": 1.7350322154898446e-05, "loss": 1.4589, "step": 32232 }, { "epoch": 2.54, "learning_rate": 1.7344552346876365e-05, "loss": 1.4259, "step": 32233 }, { "epoch": 2.54, "learning_rate": 1.733878343951162e-05, "loss": 1.4086, "step": 32234 }, { "epoch": 2.54, "learning_rate": 1.7333015432843312e-05, "loss": 1.4488, "step": 32235 }, { "epoch": 2.54, "learning_rate": 1.7327248326910588e-05, "loss": 1.4072, "step": 32236 }, { "epoch": 2.54, "learning_rate": 1.7321482121752666e-05, "loss": 1.5135, "step": 32237 }, { "epoch": 2.54, "learning_rate": 1.731571681740867e-05, "loss": 1.4318, "step": 32238 }, { "epoch": 2.54, "learning_rate": 1.7309952413917717e-05, "loss": 1.3922, "step": 32239 }, { "epoch": 2.54, "learning_rate": 1.7304188911318957e-05, "loss": 1.4261, "step": 32240 }, { "epoch": 2.54, "learning_rate": 1.7298426309651544e-05, "loss": 1.512, "step": 32241 }, { "epoch": 2.54, "learning_rate": 1.7292664608954543e-05, "loss": 1.4327, "step": 32242 }, { "epoch": 2.54, "learning_rate": 1.728690380926716e-05, "loss": 1.4269, "step": 32243 }, { "epoch": 2.54, "learning_rate": 1.7281143910628432e-05, "loss": 1.442, "step": 32244 }, { "epoch": 2.54, "learning_rate": 1.7275384913077523e-05, "loss": 1.4772, "step": 32245 }, { "epoch": 2.54, "learning_rate": 1.7269626816653503e-05, "loss": 1.4252, "step": 32246 }, { "epoch": 2.54, "learning_rate": 1.7263869621395443e-05, "loss": 1.4494, "step": 32247 }, { "epoch": 2.54, "learning_rate": 1.725811332734249e-05, "loss": 1.4303, "step": 32248 }, { "epoch": 2.54, "learning_rate": 1.7252357934533707e-05, "loss": 1.3363, "step": 32249 }, { "epoch": 2.54, "learning_rate": 1.7246603443008118e-05, "loss": 1.4312, "step": 32250 }, { "epoch": 2.54, "learning_rate": 1.724084985280486e-05, "loss": 1.4686, "step": 32251 }, { "epoch": 2.54, "learning_rate": 1.7235097163962958e-05, "loss": 1.4769, "step": 32252 }, { "epoch": 2.54, "learning_rate": 1.7229345376521474e-05, "loss": 1.4261, "step": 32253 }, { "epoch": 2.54, "learning_rate": 1.7223594490519483e-05, "loss": 1.4302, "step": 32254 }, { "epoch": 2.54, "learning_rate": 1.7217844505996016e-05, "loss": 1.443, "step": 32255 }, { "epoch": 2.54, "learning_rate": 1.7212095422990107e-05, "loss": 1.4889, "step": 32256 }, { "epoch": 2.54, "learning_rate": 1.7206347241540762e-05, "loss": 1.4858, "step": 32257 }, { "epoch": 2.54, "learning_rate": 1.7200599961687035e-05, "loss": 1.3917, "step": 32258 }, { "epoch": 2.54, "learning_rate": 1.719485358346799e-05, "loss": 1.4643, "step": 32259 }, { "epoch": 2.54, "learning_rate": 1.7189108106922578e-05, "loss": 1.4929, "step": 32260 }, { "epoch": 2.54, "learning_rate": 1.7183363532089822e-05, "loss": 1.44, "step": 32261 }, { "epoch": 2.54, "learning_rate": 1.7177619859008758e-05, "loss": 1.4562, "step": 32262 }, { "epoch": 2.54, "learning_rate": 1.717187708771835e-05, "loss": 1.4345, "step": 32263 }, { "epoch": 2.54, "learning_rate": 1.716613521825759e-05, "loss": 1.4327, "step": 32264 }, { "epoch": 2.54, "learning_rate": 1.716039425066547e-05, "loss": 1.4678, "step": 32265 }, { "epoch": 2.54, "learning_rate": 1.715465418498099e-05, "loss": 1.3999, "step": 32266 }, { "epoch": 2.54, "learning_rate": 1.7148915021243036e-05, "loss": 1.4682, "step": 32267 }, { "epoch": 2.54, "learning_rate": 1.714317675949069e-05, "loss": 1.4621, "step": 32268 }, { "epoch": 2.54, "learning_rate": 1.7137439399762864e-05, "loss": 1.4132, "step": 32269 }, { "epoch": 2.54, "learning_rate": 1.7131702942098463e-05, "loss": 1.4375, "step": 32270 }, { "epoch": 2.54, "learning_rate": 1.7125967386536504e-05, "loss": 1.4347, "step": 32271 }, { "epoch": 2.54, "learning_rate": 1.7120232733115906e-05, "loss": 1.4961, "step": 32272 }, { "epoch": 2.54, "learning_rate": 1.7114498981875556e-05, "loss": 1.3846, "step": 32273 }, { "epoch": 2.54, "learning_rate": 1.710876613285444e-05, "loss": 1.4736, "step": 32274 }, { "epoch": 2.54, "learning_rate": 1.710303418609149e-05, "loss": 1.434, "step": 32275 }, { "epoch": 2.54, "learning_rate": 1.7097303141625594e-05, "loss": 1.4238, "step": 32276 }, { "epoch": 2.54, "learning_rate": 1.709157299949569e-05, "loss": 1.4617, "step": 32277 }, { "epoch": 2.54, "learning_rate": 1.7085843759740607e-05, "loss": 1.4296, "step": 32278 }, { "epoch": 2.54, "learning_rate": 1.708011542239934e-05, "loss": 1.4381, "step": 32279 }, { "epoch": 2.54, "learning_rate": 1.707438798751073e-05, "loss": 1.4415, "step": 32280 }, { "epoch": 2.54, "learning_rate": 1.7068661455113653e-05, "loss": 1.4141, "step": 32281 }, { "epoch": 2.54, "learning_rate": 1.7062935825247027e-05, "loss": 1.4248, "step": 32282 }, { "epoch": 2.54, "learning_rate": 1.70572110979497e-05, "loss": 1.4462, "step": 32283 }, { "epoch": 2.54, "learning_rate": 1.7051487273260515e-05, "loss": 1.4402, "step": 32284 }, { "epoch": 2.54, "learning_rate": 1.7045764351218404e-05, "loss": 1.5021, "step": 32285 }, { "epoch": 2.54, "learning_rate": 1.7040042331862187e-05, "loss": 1.4734, "step": 32286 }, { "epoch": 2.54, "learning_rate": 1.7034321215230677e-05, "loss": 1.4656, "step": 32287 }, { "epoch": 2.54, "learning_rate": 1.702860100136277e-05, "loss": 1.4173, "step": 32288 }, { "epoch": 2.54, "learning_rate": 1.7022881690297256e-05, "loss": 1.4287, "step": 32289 }, { "epoch": 2.54, "learning_rate": 1.7017163282073033e-05, "loss": 1.4601, "step": 32290 }, { "epoch": 2.54, "learning_rate": 1.7011445776728844e-05, "loss": 1.4705, "step": 32291 }, { "epoch": 2.54, "learning_rate": 1.7005729174303593e-05, "loss": 1.5031, "step": 32292 }, { "epoch": 2.54, "learning_rate": 1.7000013474836037e-05, "loss": 1.4429, "step": 32293 }, { "epoch": 2.54, "learning_rate": 1.699429867836496e-05, "loss": 1.4944, "step": 32294 }, { "epoch": 2.54, "learning_rate": 1.698858478492923e-05, "loss": 1.4575, "step": 32295 }, { "epoch": 2.54, "learning_rate": 1.6982871794567608e-05, "loss": 1.3894, "step": 32296 }, { "epoch": 2.54, "learning_rate": 1.6977159707318893e-05, "loss": 1.4613, "step": 32297 }, { "epoch": 2.54, "learning_rate": 1.6971448523221816e-05, "loss": 1.4164, "step": 32298 }, { "epoch": 2.54, "learning_rate": 1.6965738242315208e-05, "loss": 1.4634, "step": 32299 }, { "epoch": 2.54, "learning_rate": 1.6960028864637843e-05, "loss": 1.41, "step": 32300 }, { "epoch": 2.54, "learning_rate": 1.695432039022842e-05, "loss": 1.4144, "step": 32301 }, { "epoch": 2.54, "learning_rate": 1.6948612819125778e-05, "loss": 1.4299, "step": 32302 }, { "epoch": 2.54, "learning_rate": 1.6942906151368636e-05, "loss": 1.497, "step": 32303 }, { "epoch": 2.54, "learning_rate": 1.6937200386995707e-05, "loss": 1.4532, "step": 32304 }, { "epoch": 2.54, "learning_rate": 1.693149552604575e-05, "loss": 1.4833, "step": 32305 }, { "epoch": 2.54, "learning_rate": 1.6925791568557535e-05, "loss": 1.4488, "step": 32306 }, { "epoch": 2.54, "learning_rate": 1.692008851456976e-05, "loss": 1.472, "step": 32307 }, { "epoch": 2.54, "learning_rate": 1.6914386364121107e-05, "loss": 1.4569, "step": 32308 }, { "epoch": 2.54, "learning_rate": 1.690868511725037e-05, "loss": 1.4191, "step": 32309 }, { "epoch": 2.54, "learning_rate": 1.6902984773996214e-05, "loss": 1.4241, "step": 32310 }, { "epoch": 2.54, "learning_rate": 1.689728533439731e-05, "loss": 1.4946, "step": 32311 }, { "epoch": 2.54, "learning_rate": 1.6891586798492407e-05, "loss": 1.3673, "step": 32312 }, { "epoch": 2.54, "learning_rate": 1.6885889166320178e-05, "loss": 1.3875, "step": 32313 }, { "epoch": 2.54, "learning_rate": 1.6880192437919303e-05, "loss": 1.4244, "step": 32314 }, { "epoch": 2.54, "learning_rate": 1.687449661332844e-05, "loss": 1.4481, "step": 32315 }, { "epoch": 2.54, "learning_rate": 1.6868801692586308e-05, "loss": 1.4642, "step": 32316 }, { "epoch": 2.54, "learning_rate": 1.6863107675731542e-05, "loss": 1.4658, "step": 32317 }, { "epoch": 2.54, "learning_rate": 1.6857414562802772e-05, "loss": 1.4626, "step": 32318 }, { "epoch": 2.54, "learning_rate": 1.685172235383871e-05, "loss": 1.4676, "step": 32319 }, { "epoch": 2.54, "learning_rate": 1.684603104887795e-05, "loss": 1.4357, "step": 32320 }, { "epoch": 2.54, "learning_rate": 1.6840340647959183e-05, "loss": 1.4847, "step": 32321 }, { "epoch": 2.54, "learning_rate": 1.683465115112101e-05, "loss": 1.4456, "step": 32322 }, { "epoch": 2.54, "learning_rate": 1.682896255840208e-05, "loss": 1.3916, "step": 32323 }, { "epoch": 2.54, "learning_rate": 1.6823274869841e-05, "loss": 1.4503, "step": 32324 }, { "epoch": 2.54, "learning_rate": 1.6817588085476375e-05, "loss": 1.425, "step": 32325 }, { "epoch": 2.54, "learning_rate": 1.681190220534685e-05, "loss": 1.4485, "step": 32326 }, { "epoch": 2.54, "learning_rate": 1.6806217229491016e-05, "loss": 1.4401, "step": 32327 }, { "epoch": 2.54, "learning_rate": 1.6800533157947436e-05, "loss": 1.4194, "step": 32328 }, { "epoch": 2.54, "learning_rate": 1.6794849990754755e-05, "loss": 1.4368, "step": 32329 }, { "epoch": 2.54, "learning_rate": 1.6789167727951534e-05, "loss": 1.5148, "step": 32330 }, { "epoch": 2.54, "learning_rate": 1.678348636957635e-05, "loss": 1.4447, "step": 32331 }, { "epoch": 2.54, "learning_rate": 1.6777805915667764e-05, "loss": 1.4511, "step": 32332 }, { "epoch": 2.54, "learning_rate": 1.6772126366264364e-05, "loss": 1.4345, "step": 32333 }, { "epoch": 2.54, "learning_rate": 1.6766447721404725e-05, "loss": 1.494, "step": 32334 }, { "epoch": 2.54, "learning_rate": 1.6760769981127342e-05, "loss": 1.4732, "step": 32335 }, { "epoch": 2.54, "learning_rate": 1.6755093145470806e-05, "loss": 1.3974, "step": 32336 }, { "epoch": 2.54, "learning_rate": 1.674941721447368e-05, "loss": 1.4778, "step": 32337 }, { "epoch": 2.54, "learning_rate": 1.674374218817449e-05, "loss": 1.4761, "step": 32338 }, { "epoch": 2.54, "learning_rate": 1.6738068066611722e-05, "loss": 1.4293, "step": 32339 }, { "epoch": 2.54, "learning_rate": 1.6732394849823954e-05, "loss": 1.4756, "step": 32340 }, { "epoch": 2.54, "learning_rate": 1.672672253784968e-05, "loss": 1.454, "step": 32341 }, { "epoch": 2.54, "learning_rate": 1.6721051130727397e-05, "loss": 1.4336, "step": 32342 }, { "epoch": 2.54, "learning_rate": 1.6715380628495646e-05, "loss": 1.4319, "step": 32343 }, { "epoch": 2.54, "learning_rate": 1.6709711031192907e-05, "loss": 1.4593, "step": 32344 }, { "epoch": 2.54, "learning_rate": 1.6704042338857654e-05, "loss": 1.4414, "step": 32345 }, { "epoch": 2.55, "learning_rate": 1.6698374551528422e-05, "loss": 1.4389, "step": 32346 }, { "epoch": 2.55, "learning_rate": 1.6692707669243662e-05, "loss": 1.4522, "step": 32347 }, { "epoch": 2.55, "learning_rate": 1.6687041692041825e-05, "loss": 1.418, "step": 32348 }, { "epoch": 2.55, "learning_rate": 1.668137661996142e-05, "loss": 1.461, "step": 32349 }, { "epoch": 2.55, "learning_rate": 1.6675712453040925e-05, "loss": 1.4604, "step": 32350 }, { "epoch": 2.55, "learning_rate": 1.6670049191318748e-05, "loss": 1.4446, "step": 32351 }, { "epoch": 2.55, "learning_rate": 1.6664386834833305e-05, "loss": 1.4736, "step": 32352 }, { "epoch": 2.55, "learning_rate": 1.665872538362315e-05, "loss": 1.433, "step": 32353 }, { "epoch": 2.55, "learning_rate": 1.665306483772667e-05, "loss": 1.4602, "step": 32354 }, { "epoch": 2.55, "learning_rate": 1.66474051971823e-05, "loss": 1.508, "step": 32355 }, { "epoch": 2.55, "learning_rate": 1.664174646202841e-05, "loss": 1.4707, "step": 32356 }, { "epoch": 2.55, "learning_rate": 1.6636088632303517e-05, "loss": 1.4507, "step": 32357 }, { "epoch": 2.55, "learning_rate": 1.6630431708045978e-05, "loss": 1.4706, "step": 32358 }, { "epoch": 2.55, "learning_rate": 1.6624775689294174e-05, "loss": 1.432, "step": 32359 }, { "epoch": 2.55, "learning_rate": 1.6619120576086575e-05, "loss": 1.4481, "step": 32360 }, { "epoch": 2.55, "learning_rate": 1.6613466368461554e-05, "loss": 1.442, "step": 32361 }, { "epoch": 2.55, "learning_rate": 1.6607813066457442e-05, "loss": 1.5083, "step": 32362 }, { "epoch": 2.55, "learning_rate": 1.6602160670112697e-05, "loss": 1.4707, "step": 32363 }, { "epoch": 2.55, "learning_rate": 1.6596509179465665e-05, "loss": 1.4769, "step": 32364 }, { "epoch": 2.55, "learning_rate": 1.6590858594554705e-05, "loss": 1.4355, "step": 32365 }, { "epoch": 2.55, "learning_rate": 1.6585208915418203e-05, "loss": 1.4771, "step": 32366 }, { "epoch": 2.55, "learning_rate": 1.6579560142094524e-05, "loss": 1.456, "step": 32367 }, { "epoch": 2.55, "learning_rate": 1.657391227462197e-05, "loss": 1.4954, "step": 32368 }, { "epoch": 2.55, "learning_rate": 1.6568265313038914e-05, "loss": 1.3981, "step": 32369 }, { "epoch": 2.55, "learning_rate": 1.6562619257383743e-05, "loss": 1.4977, "step": 32370 }, { "epoch": 2.55, "learning_rate": 1.6556974107694737e-05, "loss": 1.3972, "step": 32371 }, { "epoch": 2.55, "learning_rate": 1.6551329864010237e-05, "loss": 1.3905, "step": 32372 }, { "epoch": 2.55, "learning_rate": 1.6545686526368545e-05, "loss": 1.4192, "step": 32373 }, { "epoch": 2.55, "learning_rate": 1.654004409480803e-05, "loss": 1.452, "step": 32374 }, { "epoch": 2.55, "learning_rate": 1.6534402569366946e-05, "loss": 1.4552, "step": 32375 }, { "epoch": 2.55, "learning_rate": 1.652876195008361e-05, "loss": 1.4369, "step": 32376 }, { "epoch": 2.55, "learning_rate": 1.652312223699634e-05, "loss": 1.4743, "step": 32377 }, { "epoch": 2.55, "learning_rate": 1.6517483430143408e-05, "loss": 1.4393, "step": 32378 }, { "epoch": 2.55, "learning_rate": 1.6511845529563084e-05, "loss": 1.4327, "step": 32379 }, { "epoch": 2.55, "learning_rate": 1.6506208535293686e-05, "loss": 1.4112, "step": 32380 }, { "epoch": 2.55, "learning_rate": 1.6500572447373468e-05, "loss": 1.4282, "step": 32381 }, { "epoch": 2.55, "learning_rate": 1.6494937265840662e-05, "loss": 1.4736, "step": 32382 }, { "epoch": 2.55, "learning_rate": 1.648930299073356e-05, "loss": 1.4524, "step": 32383 }, { "epoch": 2.55, "learning_rate": 1.6483669622090427e-05, "loss": 1.4424, "step": 32384 }, { "epoch": 2.55, "learning_rate": 1.647803715994952e-05, "loss": 1.4716, "step": 32385 }, { "epoch": 2.55, "learning_rate": 1.6472405604349004e-05, "loss": 1.5036, "step": 32386 }, { "epoch": 2.55, "learning_rate": 1.6466774955327216e-05, "loss": 1.4642, "step": 32387 }, { "epoch": 2.55, "learning_rate": 1.6461145212922328e-05, "loss": 1.4372, "step": 32388 }, { "epoch": 2.55, "learning_rate": 1.6455516377172573e-05, "loss": 1.436, "step": 32389 }, { "epoch": 2.55, "learning_rate": 1.6449888448116137e-05, "loss": 1.4397, "step": 32390 }, { "epoch": 2.55, "learning_rate": 1.6444261425791294e-05, "loss": 1.4315, "step": 32391 }, { "epoch": 2.55, "learning_rate": 1.643863531023621e-05, "loss": 1.4753, "step": 32392 }, { "epoch": 2.55, "learning_rate": 1.6433010101489052e-05, "loss": 1.446, "step": 32393 }, { "epoch": 2.55, "learning_rate": 1.6427385799588077e-05, "loss": 1.5026, "step": 32394 }, { "epoch": 2.55, "learning_rate": 1.6421762404571452e-05, "loss": 1.4716, "step": 32395 }, { "epoch": 2.55, "learning_rate": 1.64161399164773e-05, "loss": 1.4526, "step": 32396 }, { "epoch": 2.55, "learning_rate": 1.6410518335343885e-05, "loss": 1.4286, "step": 32397 }, { "epoch": 2.55, "learning_rate": 1.6404897661209316e-05, "loss": 1.4286, "step": 32398 }, { "epoch": 2.55, "learning_rate": 1.639927789411174e-05, "loss": 1.3563, "step": 32399 }, { "epoch": 2.55, "learning_rate": 1.6393659034089346e-05, "loss": 1.4419, "step": 32400 }, { "epoch": 2.55, "learning_rate": 1.638804108118032e-05, "loss": 1.4318, "step": 32401 }, { "epoch": 2.55, "learning_rate": 1.638242403542275e-05, "loss": 1.4249, "step": 32402 }, { "epoch": 2.55, "learning_rate": 1.637680789685475e-05, "loss": 1.4683, "step": 32403 }, { "epoch": 2.55, "learning_rate": 1.637119266551451e-05, "loss": 1.5127, "step": 32404 }, { "epoch": 2.55, "learning_rate": 1.6365578341440134e-05, "loss": 1.4796, "step": 32405 }, { "epoch": 2.55, "learning_rate": 1.6359964924669704e-05, "loss": 1.3922, "step": 32406 }, { "epoch": 2.55, "learning_rate": 1.635435241524141e-05, "loss": 1.4912, "step": 32407 }, { "epoch": 2.55, "learning_rate": 1.634874081319329e-05, "loss": 1.4626, "step": 32408 }, { "epoch": 2.55, "learning_rate": 1.6343130118563476e-05, "loss": 1.4465, "step": 32409 }, { "epoch": 2.55, "learning_rate": 1.6337520331390018e-05, "loss": 1.4062, "step": 32410 }, { "epoch": 2.55, "learning_rate": 1.633191145171108e-05, "loss": 1.3992, "step": 32411 }, { "epoch": 2.55, "learning_rate": 1.6326303479564682e-05, "loss": 1.4629, "step": 32412 }, { "epoch": 2.55, "learning_rate": 1.6320696414988875e-05, "loss": 1.4631, "step": 32413 }, { "epoch": 2.55, "learning_rate": 1.6315090258021823e-05, "loss": 1.4665, "step": 32414 }, { "epoch": 2.55, "learning_rate": 1.6309485008701494e-05, "loss": 1.4488, "step": 32415 }, { "epoch": 2.55, "learning_rate": 1.6303880667066012e-05, "loss": 1.4386, "step": 32416 }, { "epoch": 2.55, "learning_rate": 1.629827723315339e-05, "loss": 1.4185, "step": 32417 }, { "epoch": 2.55, "learning_rate": 1.6292674707001684e-05, "loss": 1.4212, "step": 32418 }, { "epoch": 2.55, "learning_rate": 1.628707308864895e-05, "loss": 1.4094, "step": 32419 }, { "epoch": 2.55, "learning_rate": 1.628147237813317e-05, "loss": 1.4498, "step": 32420 }, { "epoch": 2.55, "learning_rate": 1.6275872575492434e-05, "loss": 1.4646, "step": 32421 }, { "epoch": 2.55, "learning_rate": 1.6270273680764705e-05, "loss": 1.4444, "step": 32422 }, { "epoch": 2.55, "learning_rate": 1.626467569398801e-05, "loss": 1.4508, "step": 32423 }, { "epoch": 2.55, "learning_rate": 1.62590786152004e-05, "loss": 1.4386, "step": 32424 }, { "epoch": 2.55, "learning_rate": 1.6253482444439824e-05, "loss": 1.4427, "step": 32425 }, { "epoch": 2.55, "learning_rate": 1.6247887181744307e-05, "loss": 1.421, "step": 32426 }, { "epoch": 2.55, "learning_rate": 1.6242292827151797e-05, "loss": 1.4525, "step": 32427 }, { "epoch": 2.55, "learning_rate": 1.6236699380700317e-05, "loss": 1.4424, "step": 32428 }, { "epoch": 2.55, "learning_rate": 1.6231106842427854e-05, "loss": 1.4003, "step": 32429 }, { "epoch": 2.55, "learning_rate": 1.622551521237231e-05, "loss": 1.4606, "step": 32430 }, { "epoch": 2.55, "learning_rate": 1.62199244905717e-05, "loss": 1.4367, "step": 32431 }, { "epoch": 2.55, "learning_rate": 1.6214334677064017e-05, "loss": 1.4257, "step": 32432 }, { "epoch": 2.55, "learning_rate": 1.620874577188716e-05, "loss": 1.4184, "step": 32433 }, { "epoch": 2.55, "learning_rate": 1.6203157775079067e-05, "loss": 1.437, "step": 32434 }, { "epoch": 2.55, "learning_rate": 1.6197570686677725e-05, "loss": 1.412, "step": 32435 }, { "epoch": 2.55, "learning_rate": 1.6191984506721035e-05, "loss": 1.4659, "step": 32436 }, { "epoch": 2.55, "learning_rate": 1.61863992352469e-05, "loss": 1.4935, "step": 32437 }, { "epoch": 2.55, "learning_rate": 1.618081487229329e-05, "loss": 1.4292, "step": 32438 }, { "epoch": 2.55, "learning_rate": 1.617523141789811e-05, "loss": 1.4503, "step": 32439 }, { "epoch": 2.55, "learning_rate": 1.6169648872099227e-05, "loss": 1.4613, "step": 32440 }, { "epoch": 2.55, "learning_rate": 1.6164067234934613e-05, "loss": 1.4803, "step": 32441 }, { "epoch": 2.55, "learning_rate": 1.615848650644212e-05, "loss": 1.5, "step": 32442 }, { "epoch": 2.55, "learning_rate": 1.6152906686659634e-05, "loss": 1.4196, "step": 32443 }, { "epoch": 2.55, "learning_rate": 1.6147327775625025e-05, "loss": 1.42, "step": 32444 }, { "epoch": 2.55, "learning_rate": 1.614174977337623e-05, "loss": 1.4866, "step": 32445 }, { "epoch": 2.55, "learning_rate": 1.613617267995105e-05, "loss": 1.4047, "step": 32446 }, { "epoch": 2.55, "learning_rate": 1.613059649538739e-05, "loss": 1.4337, "step": 32447 }, { "epoch": 2.55, "learning_rate": 1.6125021219723118e-05, "loss": 1.4734, "step": 32448 }, { "epoch": 2.55, "learning_rate": 1.611944685299609e-05, "loss": 1.4729, "step": 32449 }, { "epoch": 2.55, "learning_rate": 1.6113873395244138e-05, "loss": 1.4672, "step": 32450 }, { "epoch": 2.55, "learning_rate": 1.610830084650507e-05, "loss": 1.4507, "step": 32451 }, { "epoch": 2.55, "learning_rate": 1.6102729206816765e-05, "loss": 1.4366, "step": 32452 }, { "epoch": 2.55, "learning_rate": 1.6097158476217055e-05, "loss": 1.4576, "step": 32453 }, { "epoch": 2.55, "learning_rate": 1.6091588654743716e-05, "loss": 1.4187, "step": 32454 }, { "epoch": 2.55, "learning_rate": 1.6086019742434604e-05, "loss": 1.4446, "step": 32455 }, { "epoch": 2.55, "learning_rate": 1.6080451739327537e-05, "loss": 1.4436, "step": 32456 }, { "epoch": 2.55, "learning_rate": 1.6074884645460255e-05, "loss": 1.4247, "step": 32457 }, { "epoch": 2.55, "learning_rate": 1.6069318460870645e-05, "loss": 1.4874, "step": 32458 }, { "epoch": 2.55, "learning_rate": 1.6063753185596457e-05, "loss": 1.3946, "step": 32459 }, { "epoch": 2.55, "learning_rate": 1.605818881967543e-05, "loss": 1.4628, "step": 32460 }, { "epoch": 2.55, "learning_rate": 1.6052625363145428e-05, "loss": 1.5079, "step": 32461 }, { "epoch": 2.55, "learning_rate": 1.6047062816044142e-05, "loss": 1.4431, "step": 32462 }, { "epoch": 2.55, "learning_rate": 1.604150117840941e-05, "loss": 1.4601, "step": 32463 }, { "epoch": 2.55, "learning_rate": 1.6035940450278916e-05, "loss": 1.4341, "step": 32464 }, { "epoch": 2.55, "learning_rate": 1.6030380631690514e-05, "loss": 1.431, "step": 32465 }, { "epoch": 2.55, "learning_rate": 1.6024821722681873e-05, "loss": 1.4626, "step": 32466 }, { "epoch": 2.55, "learning_rate": 1.601926372329078e-05, "loss": 1.4429, "step": 32467 }, { "epoch": 2.55, "learning_rate": 1.6013706633554907e-05, "loss": 1.4427, "step": 32468 }, { "epoch": 2.55, "learning_rate": 1.600815045351207e-05, "loss": 1.4196, "step": 32469 }, { "epoch": 2.55, "learning_rate": 1.600259518319994e-05, "loss": 1.4345, "step": 32470 }, { "epoch": 2.55, "learning_rate": 1.5997040822656205e-05, "loss": 1.4658, "step": 32471 }, { "epoch": 2.55, "learning_rate": 1.5991487371918647e-05, "loss": 1.4314, "step": 32472 }, { "epoch": 2.56, "learning_rate": 1.5985934831024945e-05, "loss": 1.4512, "step": 32473 }, { "epoch": 2.56, "learning_rate": 1.598038320001276e-05, "loss": 1.3844, "step": 32474 }, { "epoch": 2.56, "learning_rate": 1.5974832478919847e-05, "loss": 1.5001, "step": 32475 }, { "epoch": 2.56, "learning_rate": 1.5969282667783846e-05, "loss": 1.4566, "step": 32476 }, { "epoch": 2.56, "learning_rate": 1.596373376664244e-05, "loss": 1.4218, "step": 32477 }, { "epoch": 2.56, "learning_rate": 1.59581857755333e-05, "loss": 1.4358, "step": 32478 }, { "epoch": 2.56, "learning_rate": 1.5952638694494146e-05, "loss": 1.4503, "step": 32479 }, { "epoch": 2.56, "learning_rate": 1.5947092523562598e-05, "loss": 1.4503, "step": 32480 }, { "epoch": 2.56, "learning_rate": 1.5941547262776276e-05, "loss": 1.4056, "step": 32481 }, { "epoch": 2.56, "learning_rate": 1.593600291217292e-05, "loss": 1.4782, "step": 32482 }, { "epoch": 2.56, "learning_rate": 1.593045947179011e-05, "loss": 1.4393, "step": 32483 }, { "epoch": 2.56, "learning_rate": 1.59249169416655e-05, "loss": 1.4148, "step": 32484 }, { "epoch": 2.56, "learning_rate": 1.5919375321836664e-05, "loss": 1.4471, "step": 32485 }, { "epoch": 2.56, "learning_rate": 1.5913834612341337e-05, "loss": 1.5213, "step": 32486 }, { "epoch": 2.56, "learning_rate": 1.5908294813217053e-05, "loss": 1.4709, "step": 32487 }, { "epoch": 2.56, "learning_rate": 1.5902755924501435e-05, "loss": 1.4879, "step": 32488 }, { "epoch": 2.56, "learning_rate": 1.5897217946232138e-05, "loss": 1.4663, "step": 32489 }, { "epoch": 2.56, "learning_rate": 1.589168087844671e-05, "loss": 1.4352, "step": 32490 }, { "epoch": 2.56, "learning_rate": 1.588614472118274e-05, "loss": 1.4188, "step": 32491 }, { "epoch": 2.56, "learning_rate": 1.588060947447787e-05, "loss": 1.4922, "step": 32492 }, { "epoch": 2.56, "learning_rate": 1.5875075138369627e-05, "loss": 1.4286, "step": 32493 }, { "epoch": 2.56, "learning_rate": 1.5869541712895617e-05, "loss": 1.4395, "step": 32494 }, { "epoch": 2.56, "learning_rate": 1.586400919809338e-05, "loss": 1.4807, "step": 32495 }, { "epoch": 2.56, "learning_rate": 1.5858477594000534e-05, "loss": 1.3964, "step": 32496 }, { "epoch": 2.56, "learning_rate": 1.5852946900654583e-05, "loss": 1.4342, "step": 32497 }, { "epoch": 2.56, "learning_rate": 1.584741711809308e-05, "loss": 1.4875, "step": 32498 }, { "epoch": 2.56, "learning_rate": 1.5841888246353612e-05, "loss": 1.4361, "step": 32499 }, { "epoch": 2.56, "learning_rate": 1.583636028547368e-05, "loss": 1.4575, "step": 32500 }, { "epoch": 2.56, "learning_rate": 1.5830833235490793e-05, "loss": 1.4611, "step": 32501 }, { "epoch": 2.56, "learning_rate": 1.5825307096442546e-05, "loss": 1.4543, "step": 32502 }, { "epoch": 2.56, "learning_rate": 1.5819781868366416e-05, "loss": 1.4794, "step": 32503 }, { "epoch": 2.56, "learning_rate": 1.581425755129992e-05, "loss": 1.4544, "step": 32504 }, { "epoch": 2.56, "learning_rate": 1.5808734145280526e-05, "loss": 1.449, "step": 32505 }, { "epoch": 2.56, "learning_rate": 1.5803211650345827e-05, "loss": 1.4415, "step": 32506 }, { "epoch": 2.56, "learning_rate": 1.5797690066533254e-05, "loss": 1.4168, "step": 32507 }, { "epoch": 2.56, "learning_rate": 1.5792169393880278e-05, "loss": 1.4822, "step": 32508 }, { "epoch": 2.56, "learning_rate": 1.5786649632424404e-05, "loss": 1.4311, "step": 32509 }, { "epoch": 2.56, "learning_rate": 1.578113078220315e-05, "loss": 1.4255, "step": 32510 }, { "epoch": 2.56, "learning_rate": 1.5775612843253938e-05, "loss": 1.4235, "step": 32511 }, { "epoch": 2.56, "learning_rate": 1.577009581561422e-05, "loss": 1.4604, "step": 32512 }, { "epoch": 2.56, "learning_rate": 1.576457969932152e-05, "loss": 1.4806, "step": 32513 }, { "epoch": 2.56, "learning_rate": 1.575906449441323e-05, "loss": 1.4607, "step": 32514 }, { "epoch": 2.56, "learning_rate": 1.5753550200926784e-05, "loss": 1.4444, "step": 32515 }, { "epoch": 2.56, "learning_rate": 1.5748036818899677e-05, "loss": 1.3905, "step": 32516 }, { "epoch": 2.56, "learning_rate": 1.5742524348369333e-05, "loss": 1.4516, "step": 32517 }, { "epoch": 2.56, "learning_rate": 1.5737012789373105e-05, "loss": 1.3773, "step": 32518 }, { "epoch": 2.56, "learning_rate": 1.573150214194851e-05, "loss": 1.4616, "step": 32519 }, { "epoch": 2.56, "learning_rate": 1.572599240613292e-05, "loss": 1.4408, "step": 32520 }, { "epoch": 2.56, "learning_rate": 1.5720483581963737e-05, "loss": 1.4701, "step": 32521 }, { "epoch": 2.56, "learning_rate": 1.571497566947835e-05, "loss": 1.418, "step": 32522 }, { "epoch": 2.56, "learning_rate": 1.5709468668714197e-05, "loss": 1.4034, "step": 32523 }, { "epoch": 2.56, "learning_rate": 1.5703962579708644e-05, "loss": 1.4345, "step": 32524 }, { "epoch": 2.56, "learning_rate": 1.569845740249905e-05, "loss": 1.4629, "step": 32525 }, { "epoch": 2.56, "learning_rate": 1.569295313712281e-05, "loss": 1.4348, "step": 32526 }, { "epoch": 2.56, "learning_rate": 1.5687449783617334e-05, "loss": 1.4043, "step": 32527 }, { "epoch": 2.56, "learning_rate": 1.568194734201994e-05, "loss": 1.4124, "step": 32528 }, { "epoch": 2.56, "learning_rate": 1.5676445812367983e-05, "loss": 1.4621, "step": 32529 }, { "epoch": 2.56, "learning_rate": 1.5670945194698864e-05, "loss": 1.4156, "step": 32530 }, { "epoch": 2.56, "learning_rate": 1.5665445489049906e-05, "loss": 1.4578, "step": 32531 }, { "epoch": 2.56, "learning_rate": 1.565994669545839e-05, "loss": 1.4174, "step": 32532 }, { "epoch": 2.56, "learning_rate": 1.5654448813961744e-05, "loss": 1.4275, "step": 32533 }, { "epoch": 2.56, "learning_rate": 1.5648951844597268e-05, "loss": 1.466, "step": 32534 }, { "epoch": 2.56, "learning_rate": 1.5643455787402214e-05, "loss": 1.4407, "step": 32535 }, { "epoch": 2.56, "learning_rate": 1.5637960642413988e-05, "loss": 1.4638, "step": 32536 }, { "epoch": 2.56, "learning_rate": 1.5632466409669857e-05, "loss": 1.4693, "step": 32537 }, { "epoch": 2.56, "learning_rate": 1.5626973089207146e-05, "loss": 1.4587, "step": 32538 }, { "epoch": 2.56, "learning_rate": 1.5621480681063087e-05, "loss": 1.3954, "step": 32539 }, { "epoch": 2.56, "learning_rate": 1.5615989185275034e-05, "loss": 1.4322, "step": 32540 }, { "epoch": 2.56, "learning_rate": 1.5610498601880277e-05, "loss": 1.4983, "step": 32541 }, { "epoch": 2.56, "learning_rate": 1.560500893091607e-05, "loss": 1.4489, "step": 32542 }, { "epoch": 2.56, "learning_rate": 1.5599520172419662e-05, "loss": 1.3997, "step": 32543 }, { "epoch": 2.56, "learning_rate": 1.559403232642836e-05, "loss": 1.4291, "step": 32544 }, { "epoch": 2.56, "learning_rate": 1.558854539297943e-05, "loss": 1.507, "step": 32545 }, { "epoch": 2.56, "learning_rate": 1.5583059372110045e-05, "loss": 1.4502, "step": 32546 }, { "epoch": 2.56, "learning_rate": 1.5577574263857563e-05, "loss": 1.4653, "step": 32547 }, { "epoch": 2.56, "learning_rate": 1.5572090068259162e-05, "loss": 1.4489, "step": 32548 }, { "epoch": 2.56, "learning_rate": 1.5566606785352053e-05, "loss": 1.4333, "step": 32549 }, { "epoch": 2.56, "learning_rate": 1.5561124415173536e-05, "loss": 1.4094, "step": 32550 }, { "epoch": 2.56, "learning_rate": 1.5555642957760783e-05, "loss": 1.4405, "step": 32551 }, { "epoch": 2.56, "learning_rate": 1.5550162413150998e-05, "loss": 1.4377, "step": 32552 }, { "epoch": 2.56, "learning_rate": 1.5544682781381444e-05, "loss": 1.4676, "step": 32553 }, { "epoch": 2.56, "learning_rate": 1.5539204062489303e-05, "loss": 1.4286, "step": 32554 }, { "epoch": 2.56, "learning_rate": 1.5533726256511752e-05, "loss": 1.4431, "step": 32555 }, { "epoch": 2.56, "learning_rate": 1.552824936348595e-05, "loss": 1.4988, "step": 32556 }, { "epoch": 2.56, "learning_rate": 1.5522773383449165e-05, "loss": 1.3952, "step": 32557 }, { "epoch": 2.56, "learning_rate": 1.5517298316438552e-05, "loss": 1.466, "step": 32558 }, { "epoch": 2.56, "learning_rate": 1.5511824162491248e-05, "loss": 1.4542, "step": 32559 }, { "epoch": 2.56, "learning_rate": 1.5506350921644455e-05, "loss": 1.4492, "step": 32560 }, { "epoch": 2.56, "learning_rate": 1.5500878593935328e-05, "loss": 1.3659, "step": 32561 }, { "epoch": 2.56, "learning_rate": 1.549540717940102e-05, "loss": 1.5246, "step": 32562 }, { "epoch": 2.56, "learning_rate": 1.5489936678078633e-05, "loss": 1.4515, "step": 32563 }, { "epoch": 2.56, "learning_rate": 1.5484467090005376e-05, "loss": 1.4508, "step": 32564 }, { "epoch": 2.56, "learning_rate": 1.5478998415218363e-05, "loss": 1.4389, "step": 32565 }, { "epoch": 2.56, "learning_rate": 1.5473530653754668e-05, "loss": 1.4443, "step": 32566 }, { "epoch": 2.56, "learning_rate": 1.546806380565151e-05, "loss": 1.426, "step": 32567 }, { "epoch": 2.56, "learning_rate": 1.5462597870945943e-05, "loss": 1.4076, "step": 32568 }, { "epoch": 2.56, "learning_rate": 1.5457132849675086e-05, "loss": 1.5049, "step": 32569 }, { "epoch": 2.56, "learning_rate": 1.5451668741876062e-05, "loss": 1.4308, "step": 32570 }, { "epoch": 2.56, "learning_rate": 1.5446205547585955e-05, "loss": 1.3974, "step": 32571 }, { "epoch": 2.56, "learning_rate": 1.5440743266841837e-05, "loss": 1.4617, "step": 32572 }, { "epoch": 2.56, "learning_rate": 1.543528189968081e-05, "loss": 1.4673, "step": 32573 }, { "epoch": 2.56, "learning_rate": 1.5429821446140002e-05, "loss": 1.4327, "step": 32574 }, { "epoch": 2.56, "learning_rate": 1.5424361906256438e-05, "loss": 1.4748, "step": 32575 }, { "epoch": 2.56, "learning_rate": 1.5418903280067162e-05, "loss": 1.4782, "step": 32576 }, { "epoch": 2.56, "learning_rate": 1.5413445567609294e-05, "loss": 1.4232, "step": 32577 }, { "epoch": 2.56, "learning_rate": 1.5407988768919853e-05, "loss": 1.4735, "step": 32578 }, { "epoch": 2.56, "learning_rate": 1.5402532884035894e-05, "loss": 1.4151, "step": 32579 }, { "epoch": 2.56, "learning_rate": 1.5397077912994438e-05, "loss": 1.4633, "step": 32580 }, { "epoch": 2.56, "learning_rate": 1.539162385583257e-05, "loss": 1.4822, "step": 32581 }, { "epoch": 2.56, "learning_rate": 1.5386170712587293e-05, "loss": 1.4494, "step": 32582 }, { "epoch": 2.56, "learning_rate": 1.5380718483295613e-05, "loss": 1.456, "step": 32583 }, { "epoch": 2.56, "learning_rate": 1.537526716799458e-05, "loss": 1.4293, "step": 32584 }, { "epoch": 2.56, "learning_rate": 1.5369816766721187e-05, "loss": 1.4445, "step": 32585 }, { "epoch": 2.56, "learning_rate": 1.5364367279512417e-05, "loss": 1.4562, "step": 32586 }, { "epoch": 2.56, "learning_rate": 1.5358918706405345e-05, "loss": 1.4641, "step": 32587 }, { "epoch": 2.56, "learning_rate": 1.5353471047436866e-05, "loss": 1.4425, "step": 32588 }, { "epoch": 2.56, "learning_rate": 1.534802430264404e-05, "loss": 1.4029, "step": 32589 }, { "epoch": 2.56, "learning_rate": 1.5342578472063805e-05, "loss": 1.4413, "step": 32590 }, { "epoch": 2.56, "learning_rate": 1.533713355573316e-05, "loss": 1.3982, "step": 32591 }, { "epoch": 2.56, "learning_rate": 1.533168955368908e-05, "loss": 1.4699, "step": 32592 }, { "epoch": 2.56, "learning_rate": 1.5326246465968482e-05, "loss": 1.4329, "step": 32593 }, { "epoch": 2.56, "learning_rate": 1.532080429260839e-05, "loss": 1.5017, "step": 32594 }, { "epoch": 2.56, "learning_rate": 1.5315363033645705e-05, "loss": 1.4083, "step": 32595 }, { "epoch": 2.56, "learning_rate": 1.5309922689117384e-05, "loss": 1.4545, "step": 32596 }, { "epoch": 2.56, "learning_rate": 1.5304483259060323e-05, "loss": 1.451, "step": 32597 }, { "epoch": 2.56, "learning_rate": 1.529904474351152e-05, "loss": 1.4296, "step": 32598 }, { "epoch": 2.56, "learning_rate": 1.5293607142507884e-05, "loss": 1.3928, "step": 32599 }, { "epoch": 2.57, "learning_rate": 1.5288170456086278e-05, "loss": 1.453, "step": 32600 }, { "epoch": 2.57, "learning_rate": 1.528273468428367e-05, "loss": 1.468, "step": 32601 }, { "epoch": 2.57, "learning_rate": 1.5277299827136964e-05, "loss": 1.4668, "step": 32602 }, { "epoch": 2.57, "learning_rate": 1.5271865884683026e-05, "loss": 1.3954, "step": 32603 }, { "epoch": 2.57, "learning_rate": 1.5266432856958748e-05, "loss": 1.4064, "step": 32604 }, { "epoch": 2.57, "learning_rate": 1.5261000744001084e-05, "loss": 1.4432, "step": 32605 }, { "epoch": 2.57, "learning_rate": 1.5255569545846868e-05, "loss": 1.4365, "step": 32606 }, { "epoch": 2.57, "learning_rate": 1.525013926253294e-05, "loss": 1.3994, "step": 32607 }, { "epoch": 2.57, "learning_rate": 1.5244709894096252e-05, "loss": 1.4479, "step": 32608 }, { "epoch": 2.57, "learning_rate": 1.523928144057361e-05, "loss": 1.4556, "step": 32609 }, { "epoch": 2.57, "learning_rate": 1.5233853902001846e-05, "loss": 1.4702, "step": 32610 }, { "epoch": 2.57, "learning_rate": 1.522842727841787e-05, "loss": 1.489, "step": 32611 }, { "epoch": 2.57, "learning_rate": 1.52230015698585e-05, "loss": 1.4529, "step": 32612 }, { "epoch": 2.57, "learning_rate": 1.5217576776360558e-05, "loss": 1.4497, "step": 32613 }, { "epoch": 2.57, "learning_rate": 1.521215289796091e-05, "loss": 1.4605, "step": 32614 }, { "epoch": 2.57, "learning_rate": 1.5206729934696348e-05, "loss": 1.3837, "step": 32615 }, { "epoch": 2.57, "learning_rate": 1.5201307886603725e-05, "loss": 1.3836, "step": 32616 }, { "epoch": 2.57, "learning_rate": 1.5195886753719794e-05, "loss": 1.4036, "step": 32617 }, { "epoch": 2.57, "learning_rate": 1.5190466536081442e-05, "loss": 1.4264, "step": 32618 }, { "epoch": 2.57, "learning_rate": 1.5185047233725389e-05, "loss": 1.4456, "step": 32619 }, { "epoch": 2.57, "learning_rate": 1.5179628846688507e-05, "loss": 1.4703, "step": 32620 }, { "epoch": 2.57, "learning_rate": 1.51742113750075e-05, "loss": 1.4063, "step": 32621 }, { "epoch": 2.57, "learning_rate": 1.5168794818719238e-05, "loss": 1.4358, "step": 32622 }, { "epoch": 2.57, "learning_rate": 1.5163379177860441e-05, "loss": 1.5084, "step": 32623 }, { "epoch": 2.57, "learning_rate": 1.5157964452467863e-05, "loss": 1.5137, "step": 32624 }, { "epoch": 2.57, "learning_rate": 1.5152550642578343e-05, "loss": 1.4284, "step": 32625 }, { "epoch": 2.57, "learning_rate": 1.5147137748228565e-05, "loss": 1.4454, "step": 32626 }, { "epoch": 2.57, "learning_rate": 1.5141725769455288e-05, "loss": 1.452, "step": 32627 }, { "epoch": 2.57, "learning_rate": 1.5136314706295293e-05, "loss": 1.4601, "step": 32628 }, { "epoch": 2.57, "learning_rate": 1.5130904558785306e-05, "loss": 1.4783, "step": 32629 }, { "epoch": 2.57, "learning_rate": 1.5125495326962011e-05, "loss": 1.4196, "step": 32630 }, { "epoch": 2.57, "learning_rate": 1.5120087010862214e-05, "loss": 1.469, "step": 32631 }, { "epoch": 2.57, "learning_rate": 1.5114679610522584e-05, "loss": 1.4634, "step": 32632 }, { "epoch": 2.57, "learning_rate": 1.5109273125979843e-05, "loss": 1.4157, "step": 32633 }, { "epoch": 2.57, "learning_rate": 1.5103867557270676e-05, "loss": 1.4506, "step": 32634 }, { "epoch": 2.57, "learning_rate": 1.5098462904431807e-05, "loss": 1.4786, "step": 32635 }, { "epoch": 2.57, "learning_rate": 1.5093059167499955e-05, "loss": 1.4274, "step": 32636 }, { "epoch": 2.57, "learning_rate": 1.5087656346511772e-05, "loss": 1.4303, "step": 32637 }, { "epoch": 2.57, "learning_rate": 1.5082254441503949e-05, "loss": 1.4143, "step": 32638 }, { "epoch": 2.57, "learning_rate": 1.507685345251317e-05, "loss": 1.412, "step": 32639 }, { "epoch": 2.57, "learning_rate": 1.5071453379576109e-05, "loss": 1.4198, "step": 32640 }, { "epoch": 2.57, "learning_rate": 1.5066054222729384e-05, "loss": 1.465, "step": 32641 }, { "epoch": 2.57, "learning_rate": 1.5060655982009734e-05, "loss": 1.4229, "step": 32642 }, { "epoch": 2.57, "learning_rate": 1.5055258657453744e-05, "loss": 1.4172, "step": 32643 }, { "epoch": 2.57, "learning_rate": 1.504986224909807e-05, "loss": 1.4333, "step": 32644 }, { "epoch": 2.57, "learning_rate": 1.5044466756979367e-05, "loss": 1.5021, "step": 32645 }, { "epoch": 2.57, "learning_rate": 1.503907218113427e-05, "loss": 1.4159, "step": 32646 }, { "epoch": 2.57, "learning_rate": 1.5033678521599368e-05, "loss": 1.4773, "step": 32647 }, { "epoch": 2.57, "learning_rate": 1.5028285778411348e-05, "loss": 1.4405, "step": 32648 }, { "epoch": 2.57, "learning_rate": 1.5022893951606763e-05, "loss": 1.4336, "step": 32649 }, { "epoch": 2.57, "learning_rate": 1.5017503041222234e-05, "loss": 1.4351, "step": 32650 }, { "epoch": 2.57, "learning_rate": 1.501211304729435e-05, "loss": 1.4593, "step": 32651 }, { "epoch": 2.57, "learning_rate": 1.5006723969859763e-05, "loss": 1.4573, "step": 32652 }, { "epoch": 2.57, "learning_rate": 1.5001335808955029e-05, "loss": 1.4541, "step": 32653 }, { "epoch": 2.57, "learning_rate": 1.4995948564616717e-05, "loss": 1.4362, "step": 32654 }, { "epoch": 2.57, "learning_rate": 1.4990562236881398e-05, "loss": 1.4948, "step": 32655 }, { "epoch": 2.57, "learning_rate": 1.4985176825785677e-05, "loss": 1.44, "step": 32656 }, { "epoch": 2.57, "learning_rate": 1.4979792331366092e-05, "loss": 1.4315, "step": 32657 }, { "epoch": 2.57, "learning_rate": 1.4974408753659195e-05, "loss": 1.4124, "step": 32658 }, { "epoch": 2.57, "learning_rate": 1.4969026092701559e-05, "loss": 1.4576, "step": 32659 }, { "epoch": 2.57, "learning_rate": 1.4963644348529735e-05, "loss": 1.4268, "step": 32660 }, { "epoch": 2.57, "learning_rate": 1.4958263521180197e-05, "loss": 1.4586, "step": 32661 }, { "epoch": 2.57, "learning_rate": 1.4952883610689581e-05, "loss": 1.4461, "step": 32662 }, { "epoch": 2.57, "learning_rate": 1.494750461709434e-05, "loss": 1.4177, "step": 32663 }, { "epoch": 2.57, "learning_rate": 1.4942126540430998e-05, "loss": 1.4954, "step": 32664 }, { "epoch": 2.57, "learning_rate": 1.4936749380736107e-05, "loss": 1.4011, "step": 32665 }, { "epoch": 2.57, "learning_rate": 1.4931373138046138e-05, "loss": 1.415, "step": 32666 }, { "epoch": 2.57, "learning_rate": 1.4925997812397627e-05, "loss": 1.4682, "step": 32667 }, { "epoch": 2.57, "learning_rate": 1.4920623403827015e-05, "loss": 1.448, "step": 32668 }, { "epoch": 2.57, "learning_rate": 1.491524991237087e-05, "loss": 1.4346, "step": 32669 }, { "epoch": 2.57, "learning_rate": 1.490987733806563e-05, "loss": 1.4639, "step": 32670 }, { "epoch": 2.57, "learning_rate": 1.4904505680947748e-05, "loss": 1.4541, "step": 32671 }, { "epoch": 2.57, "learning_rate": 1.489913494105373e-05, "loss": 1.4445, "step": 32672 }, { "epoch": 2.57, "learning_rate": 1.4893765118420048e-05, "loss": 1.4469, "step": 32673 }, { "epoch": 2.57, "learning_rate": 1.4888396213083137e-05, "loss": 1.4693, "step": 32674 }, { "epoch": 2.57, "learning_rate": 1.4883028225079435e-05, "loss": 1.4805, "step": 32675 }, { "epoch": 2.57, "learning_rate": 1.4877661154445431e-05, "loss": 1.5403, "step": 32676 }, { "epoch": 2.57, "learning_rate": 1.4872295001217526e-05, "loss": 1.386, "step": 32677 }, { "epoch": 2.57, "learning_rate": 1.4866929765432162e-05, "loss": 1.4953, "step": 32678 }, { "epoch": 2.57, "learning_rate": 1.486156544712579e-05, "loss": 1.52, "step": 32679 }, { "epoch": 2.57, "learning_rate": 1.4856202046334814e-05, "loss": 1.4584, "step": 32680 }, { "epoch": 2.57, "learning_rate": 1.4850839563095623e-05, "loss": 1.4162, "step": 32681 }, { "epoch": 2.57, "learning_rate": 1.4845477997444654e-05, "loss": 1.3912, "step": 32682 }, { "epoch": 2.57, "learning_rate": 1.4840117349418328e-05, "loss": 1.4601, "step": 32683 }, { "epoch": 2.57, "learning_rate": 1.4834757619053018e-05, "loss": 1.4465, "step": 32684 }, { "epoch": 2.57, "learning_rate": 1.4829398806385073e-05, "loss": 1.484, "step": 32685 }, { "epoch": 2.57, "learning_rate": 1.4824040911450952e-05, "loss": 1.4311, "step": 32686 }, { "epoch": 2.57, "learning_rate": 1.4818683934287007e-05, "loss": 1.4932, "step": 32687 }, { "epoch": 2.57, "learning_rate": 1.4813327874929559e-05, "loss": 1.4562, "step": 32688 }, { "epoch": 2.57, "learning_rate": 1.4807972733415047e-05, "loss": 1.4504, "step": 32689 }, { "epoch": 2.57, "learning_rate": 1.480261850977979e-05, "loss": 1.4916, "step": 32690 }, { "epoch": 2.57, "learning_rate": 1.479726520406016e-05, "loss": 1.4083, "step": 32691 }, { "epoch": 2.57, "learning_rate": 1.4791912816292445e-05, "loss": 1.4271, "step": 32692 }, { "epoch": 2.57, "learning_rate": 1.4786561346513066e-05, "loss": 1.4738, "step": 32693 }, { "epoch": 2.57, "learning_rate": 1.4781210794758308e-05, "loss": 1.4875, "step": 32694 }, { "epoch": 2.57, "learning_rate": 1.4775861161064494e-05, "loss": 1.4191, "step": 32695 }, { "epoch": 2.57, "learning_rate": 1.477051244546798e-05, "loss": 1.45, "step": 32696 }, { "epoch": 2.57, "learning_rate": 1.4765164648005052e-05, "loss": 1.4399, "step": 32697 }, { "epoch": 2.57, "learning_rate": 1.4759817768712012e-05, "loss": 1.4387, "step": 32698 }, { "epoch": 2.57, "learning_rate": 1.4754471807625168e-05, "loss": 1.4668, "step": 32699 }, { "epoch": 2.57, "learning_rate": 1.4749126764780856e-05, "loss": 1.4223, "step": 32700 }, { "epoch": 2.57, "learning_rate": 1.4743782640215345e-05, "loss": 1.4498, "step": 32701 }, { "epoch": 2.57, "learning_rate": 1.4738439433964877e-05, "loss": 1.4368, "step": 32702 }, { "epoch": 2.57, "learning_rate": 1.4733097146065787e-05, "loss": 1.4323, "step": 32703 }, { "epoch": 2.57, "learning_rate": 1.4727755776554312e-05, "loss": 1.4922, "step": 32704 }, { "epoch": 2.57, "learning_rate": 1.4722415325466707e-05, "loss": 1.4208, "step": 32705 }, { "epoch": 2.57, "learning_rate": 1.4717075792839278e-05, "loss": 1.4555, "step": 32706 }, { "epoch": 2.57, "learning_rate": 1.4711737178708261e-05, "loss": 1.4616, "step": 32707 }, { "epoch": 2.57, "learning_rate": 1.4706399483109876e-05, "loss": 1.4401, "step": 32708 }, { "epoch": 2.57, "learning_rate": 1.4701062706080346e-05, "loss": 1.4476, "step": 32709 }, { "epoch": 2.57, "learning_rate": 1.4695726847655976e-05, "loss": 1.4431, "step": 32710 }, { "epoch": 2.57, "learning_rate": 1.469039190787295e-05, "loss": 1.4459, "step": 32711 }, { "epoch": 2.57, "learning_rate": 1.468505788676746e-05, "loss": 1.3787, "step": 32712 }, { "epoch": 2.57, "learning_rate": 1.4679724784375757e-05, "loss": 1.4907, "step": 32713 }, { "epoch": 2.57, "learning_rate": 1.4674392600734063e-05, "loss": 1.4337, "step": 32714 }, { "epoch": 2.57, "learning_rate": 1.4669061335878584e-05, "loss": 1.4728, "step": 32715 }, { "epoch": 2.57, "learning_rate": 1.4663730989845457e-05, "loss": 1.4657, "step": 32716 }, { "epoch": 2.57, "learning_rate": 1.4658401562670952e-05, "loss": 1.4542, "step": 32717 }, { "epoch": 2.57, "learning_rate": 1.4653073054391207e-05, "loss": 1.4417, "step": 32718 }, { "epoch": 2.57, "learning_rate": 1.464774546504236e-05, "loss": 1.4393, "step": 32719 }, { "epoch": 2.57, "learning_rate": 1.4642418794660681e-05, "loss": 1.4119, "step": 32720 }, { "epoch": 2.57, "learning_rate": 1.463709304328226e-05, "loss": 1.4319, "step": 32721 }, { "epoch": 2.57, "learning_rate": 1.4631768210943268e-05, "loss": 1.496, "step": 32722 }, { "epoch": 2.57, "learning_rate": 1.462644429767989e-05, "loss": 1.4281, "step": 32723 }, { "epoch": 2.57, "learning_rate": 1.462112130352825e-05, "loss": 1.4594, "step": 32724 }, { "epoch": 2.57, "learning_rate": 1.461579922852445e-05, "loss": 1.4621, "step": 32725 }, { "epoch": 2.57, "learning_rate": 1.4610478072704695e-05, "loss": 1.4547, "step": 32726 }, { "epoch": 2.58, "learning_rate": 1.4605157836105092e-05, "loss": 1.3533, "step": 32727 }, { "epoch": 2.58, "learning_rate": 1.4599838518761742e-05, "loss": 1.3802, "step": 32728 }, { "epoch": 2.58, "learning_rate": 1.4594520120710718e-05, "loss": 1.4193, "step": 32729 }, { "epoch": 2.58, "learning_rate": 1.4589202641988224e-05, "loss": 1.4774, "step": 32730 }, { "epoch": 2.58, "learning_rate": 1.4583886082630313e-05, "loss": 1.4404, "step": 32731 }, { "epoch": 2.58, "learning_rate": 1.457857044267311e-05, "loss": 1.4449, "step": 32732 }, { "epoch": 2.58, "learning_rate": 1.4573255722152632e-05, "loss": 1.4383, "step": 32733 }, { "epoch": 2.58, "learning_rate": 1.4567941921105052e-05, "loss": 1.4543, "step": 32734 }, { "epoch": 2.58, "learning_rate": 1.456262903956641e-05, "loss": 1.5027, "step": 32735 }, { "epoch": 2.58, "learning_rate": 1.455731707757274e-05, "loss": 1.4125, "step": 32736 }, { "epoch": 2.58, "learning_rate": 1.455200603516018e-05, "loss": 1.4157, "step": 32737 }, { "epoch": 2.58, "learning_rate": 1.4546695912364753e-05, "loss": 1.473, "step": 32738 }, { "epoch": 2.58, "learning_rate": 1.454138670922248e-05, "loss": 1.463, "step": 32739 }, { "epoch": 2.58, "learning_rate": 1.4536078425769466e-05, "loss": 1.4087, "step": 32740 }, { "epoch": 2.58, "learning_rate": 1.453077106204173e-05, "loss": 1.4525, "step": 32741 }, { "epoch": 2.58, "learning_rate": 1.4525464618075261e-05, "loss": 1.4227, "step": 32742 }, { "epoch": 2.58, "learning_rate": 1.4520159093906164e-05, "loss": 1.4651, "step": 32743 }, { "epoch": 2.58, "learning_rate": 1.4514854489570427e-05, "loss": 1.5297, "step": 32744 }, { "epoch": 2.58, "learning_rate": 1.450955080510402e-05, "loss": 1.4407, "step": 32745 }, { "epoch": 2.58, "learning_rate": 1.4504248040542999e-05, "loss": 1.4404, "step": 32746 }, { "epoch": 2.58, "learning_rate": 1.4498946195923383e-05, "loss": 1.4225, "step": 32747 }, { "epoch": 2.58, "learning_rate": 1.4493645271281162e-05, "loss": 1.4525, "step": 32748 }, { "epoch": 2.58, "learning_rate": 1.448834526665229e-05, "loss": 1.4915, "step": 32749 }, { "epoch": 2.58, "learning_rate": 1.4483046182072755e-05, "loss": 1.4463, "step": 32750 }, { "epoch": 2.58, "learning_rate": 1.4477748017578595e-05, "loss": 1.43, "step": 32751 }, { "epoch": 2.58, "learning_rate": 1.4472450773205712e-05, "loss": 1.4527, "step": 32752 }, { "epoch": 2.58, "learning_rate": 1.4467154448990082e-05, "loss": 1.4696, "step": 32753 }, { "epoch": 2.58, "learning_rate": 1.4461859044967721e-05, "loss": 1.4066, "step": 32754 }, { "epoch": 2.58, "learning_rate": 1.4456564561174521e-05, "loss": 1.4254, "step": 32755 }, { "epoch": 2.58, "learning_rate": 1.4451270997646437e-05, "loss": 1.4356, "step": 32756 }, { "epoch": 2.58, "learning_rate": 1.4445978354419436e-05, "loss": 1.4659, "step": 32757 }, { "epoch": 2.58, "learning_rate": 1.4440686631529441e-05, "loss": 1.4435, "step": 32758 }, { "epoch": 2.58, "learning_rate": 1.4435395829012342e-05, "loss": 1.4257, "step": 32759 }, { "epoch": 2.58, "learning_rate": 1.4430105946904108e-05, "loss": 1.4447, "step": 32760 }, { "epoch": 2.58, "learning_rate": 1.4424816985240662e-05, "loss": 1.4196, "step": 32761 }, { "epoch": 2.58, "learning_rate": 1.441952894405789e-05, "loss": 1.4606, "step": 32762 }, { "epoch": 2.58, "learning_rate": 1.4414241823391665e-05, "loss": 1.495, "step": 32763 }, { "epoch": 2.58, "learning_rate": 1.4408955623277956e-05, "loss": 1.4353, "step": 32764 }, { "epoch": 2.58, "learning_rate": 1.4403670343752604e-05, "loss": 1.4177, "step": 32765 }, { "epoch": 2.58, "learning_rate": 1.4398385984851496e-05, "loss": 1.4768, "step": 32766 }, { "epoch": 2.58, "learning_rate": 1.4393102546610502e-05, "loss": 1.4719, "step": 32767 }, { "epoch": 2.58, "learning_rate": 1.4387820029065528e-05, "loss": 1.4597, "step": 32768 }, { "epoch": 2.58, "learning_rate": 1.4382538432252428e-05, "loss": 1.4689, "step": 32769 }, { "epoch": 2.58, "learning_rate": 1.4377257756207006e-05, "loss": 1.4613, "step": 32770 }, { "epoch": 2.58, "learning_rate": 1.4371978000965201e-05, "loss": 1.4105, "step": 32771 }, { "epoch": 2.58, "learning_rate": 1.4366699166562817e-05, "loss": 1.4487, "step": 32772 }, { "epoch": 2.58, "learning_rate": 1.4361421253035677e-05, "loss": 1.4292, "step": 32773 }, { "epoch": 2.58, "learning_rate": 1.435614426041965e-05, "loss": 1.4869, "step": 32774 }, { "epoch": 2.58, "learning_rate": 1.4350868188750558e-05, "loss": 1.4802, "step": 32775 }, { "epoch": 2.58, "learning_rate": 1.434559303806419e-05, "loss": 1.4576, "step": 32776 }, { "epoch": 2.58, "learning_rate": 1.4340318808396385e-05, "loss": 1.4122, "step": 32777 }, { "epoch": 2.58, "learning_rate": 1.433504549978296e-05, "loss": 1.3959, "step": 32778 }, { "epoch": 2.58, "learning_rate": 1.4329773112259723e-05, "loss": 1.4512, "step": 32779 }, { "epoch": 2.58, "learning_rate": 1.432450164586243e-05, "loss": 1.3803, "step": 32780 }, { "epoch": 2.58, "learning_rate": 1.4319231100626933e-05, "loss": 1.4137, "step": 32781 }, { "epoch": 2.58, "learning_rate": 1.431396147658897e-05, "loss": 1.4529, "step": 32782 }, { "epoch": 2.58, "learning_rate": 1.4308692773784313e-05, "loss": 1.4088, "step": 32783 }, { "epoch": 2.58, "learning_rate": 1.4303424992248786e-05, "loss": 1.3772, "step": 32784 }, { "epoch": 2.58, "learning_rate": 1.4298158132018106e-05, "loss": 1.4096, "step": 32785 }, { "epoch": 2.58, "learning_rate": 1.4292892193128047e-05, "loss": 1.3887, "step": 32786 }, { "epoch": 2.58, "learning_rate": 1.428762717561433e-05, "loss": 1.4315, "step": 32787 }, { "epoch": 2.58, "learning_rate": 1.428236307951276e-05, "loss": 1.4537, "step": 32788 }, { "epoch": 2.58, "learning_rate": 1.4277099904859058e-05, "loss": 1.421, "step": 32789 }, { "epoch": 2.58, "learning_rate": 1.4271837651688927e-05, "loss": 1.4428, "step": 32790 }, { "epoch": 2.58, "learning_rate": 1.4266576320038125e-05, "loss": 1.4524, "step": 32791 }, { "epoch": 2.58, "learning_rate": 1.4261315909942356e-05, "loss": 1.4353, "step": 32792 }, { "epoch": 2.58, "learning_rate": 1.4256056421437357e-05, "loss": 1.4604, "step": 32793 }, { "epoch": 2.58, "learning_rate": 1.4250797854558816e-05, "loss": 1.4785, "step": 32794 }, { "epoch": 2.58, "learning_rate": 1.4245540209342454e-05, "loss": 1.4112, "step": 32795 }, { "epoch": 2.58, "learning_rate": 1.4240283485823978e-05, "loss": 1.4785, "step": 32796 }, { "epoch": 2.58, "learning_rate": 1.4235027684039025e-05, "loss": 1.4061, "step": 32797 }, { "epoch": 2.58, "learning_rate": 1.4229772804023332e-05, "loss": 1.4784, "step": 32798 }, { "epoch": 2.58, "learning_rate": 1.4224518845812554e-05, "loss": 1.4553, "step": 32799 }, { "epoch": 2.58, "learning_rate": 1.4219265809442349e-05, "loss": 1.4116, "step": 32800 }, { "epoch": 2.58, "learning_rate": 1.4214013694948417e-05, "loss": 1.3998, "step": 32801 }, { "epoch": 2.58, "learning_rate": 1.4208762502366416e-05, "loss": 1.4612, "step": 32802 }, { "epoch": 2.58, "learning_rate": 1.4203512231731967e-05, "loss": 1.4681, "step": 32803 }, { "epoch": 2.58, "learning_rate": 1.4198262883080708e-05, "loss": 1.4606, "step": 32804 }, { "epoch": 2.58, "learning_rate": 1.4193014456448326e-05, "loss": 1.4854, "step": 32805 }, { "epoch": 2.58, "learning_rate": 1.4187766951870444e-05, "loss": 1.4929, "step": 32806 }, { "epoch": 2.58, "learning_rate": 1.4182520369382633e-05, "loss": 1.4351, "step": 32807 }, { "epoch": 2.58, "learning_rate": 1.4177274709020565e-05, "loss": 1.5063, "step": 32808 }, { "epoch": 2.58, "learning_rate": 1.4172029970819875e-05, "loss": 1.4655, "step": 32809 }, { "epoch": 2.58, "learning_rate": 1.4166786154816157e-05, "loss": 1.4275, "step": 32810 }, { "epoch": 2.58, "learning_rate": 1.416154326104496e-05, "loss": 1.4501, "step": 32811 }, { "epoch": 2.58, "learning_rate": 1.415630128954196e-05, "loss": 1.4291, "step": 32812 }, { "epoch": 2.58, "learning_rate": 1.415106024034271e-05, "loss": 1.4457, "step": 32813 }, { "epoch": 2.58, "learning_rate": 1.4145820113482748e-05, "loss": 1.4733, "step": 32814 }, { "epoch": 2.58, "learning_rate": 1.4140580908997746e-05, "loss": 1.4532, "step": 32815 }, { "epoch": 2.58, "learning_rate": 1.4135342626923225e-05, "loss": 1.437, "step": 32816 }, { "epoch": 2.58, "learning_rate": 1.4130105267294705e-05, "loss": 1.4412, "step": 32817 }, { "epoch": 2.58, "learning_rate": 1.4124868830147828e-05, "loss": 1.4527, "step": 32818 }, { "epoch": 2.58, "learning_rate": 1.4119633315518114e-05, "loss": 1.472, "step": 32819 }, { "epoch": 2.58, "learning_rate": 1.41143987234411e-05, "loss": 1.4639, "step": 32820 }, { "epoch": 2.58, "learning_rate": 1.4109165053952309e-05, "loss": 1.4411, "step": 32821 }, { "epoch": 2.58, "learning_rate": 1.4103932307087312e-05, "loss": 1.4443, "step": 32822 }, { "epoch": 2.58, "learning_rate": 1.4098700482881614e-05, "loss": 1.4717, "step": 32823 }, { "epoch": 2.58, "learning_rate": 1.409346958137072e-05, "loss": 1.4801, "step": 32824 }, { "epoch": 2.58, "learning_rate": 1.4088239602590218e-05, "loss": 1.4169, "step": 32825 }, { "epoch": 2.58, "learning_rate": 1.4083010546575546e-05, "loss": 1.4371, "step": 32826 }, { "epoch": 2.58, "learning_rate": 1.4077782413362243e-05, "loss": 1.4871, "step": 32827 }, { "epoch": 2.58, "learning_rate": 1.4072555202985747e-05, "loss": 1.4392, "step": 32828 }, { "epoch": 2.58, "learning_rate": 1.4067328915481629e-05, "loss": 1.4133, "step": 32829 }, { "epoch": 2.58, "learning_rate": 1.4062103550885328e-05, "loss": 1.4238, "step": 32830 }, { "epoch": 2.58, "learning_rate": 1.40568791092323e-05, "loss": 1.4512, "step": 32831 }, { "epoch": 2.58, "learning_rate": 1.4051655590558081e-05, "loss": 1.4269, "step": 32832 }, { "epoch": 2.58, "learning_rate": 1.4046432994898094e-05, "loss": 1.479, "step": 32833 }, { "epoch": 2.58, "learning_rate": 1.404121132228776e-05, "loss": 1.4149, "step": 32834 }, { "epoch": 2.58, "learning_rate": 1.4035990572762617e-05, "loss": 1.3975, "step": 32835 }, { "epoch": 2.58, "learning_rate": 1.4030770746358056e-05, "loss": 1.4556, "step": 32836 }, { "epoch": 2.58, "learning_rate": 1.4025551843109512e-05, "loss": 1.4769, "step": 32837 }, { "epoch": 2.58, "learning_rate": 1.4020333863052457e-05, "loss": 1.4576, "step": 32838 }, { "epoch": 2.58, "learning_rate": 1.4015116806222266e-05, "loss": 1.4371, "step": 32839 }, { "epoch": 2.58, "learning_rate": 1.4009900672654406e-05, "loss": 1.5019, "step": 32840 }, { "epoch": 2.58, "learning_rate": 1.4004685462384251e-05, "loss": 1.4645, "step": 32841 }, { "epoch": 2.58, "learning_rate": 1.3999471175447274e-05, "loss": 1.483, "step": 32842 }, { "epoch": 2.58, "learning_rate": 1.3994257811878828e-05, "loss": 1.4755, "step": 32843 }, { "epoch": 2.58, "learning_rate": 1.398904537171432e-05, "loss": 1.4384, "step": 32844 }, { "epoch": 2.58, "learning_rate": 1.39838338549891e-05, "loss": 1.4331, "step": 32845 }, { "epoch": 2.58, "learning_rate": 1.397862326173863e-05, "loss": 1.4592, "step": 32846 }, { "epoch": 2.58, "learning_rate": 1.3973413591998245e-05, "loss": 1.4338, "step": 32847 }, { "epoch": 2.58, "learning_rate": 1.3968204845803283e-05, "loss": 1.454, "step": 32848 }, { "epoch": 2.58, "learning_rate": 1.3962997023189165e-05, "loss": 1.4748, "step": 32849 }, { "epoch": 2.58, "learning_rate": 1.3957790124191232e-05, "loss": 1.4412, "step": 32850 }, { "epoch": 2.58, "learning_rate": 1.3952584148844802e-05, "loss": 1.4626, "step": 32851 }, { "epoch": 2.58, "learning_rate": 1.3947379097185268e-05, "loss": 1.4744, "step": 32852 }, { "epoch": 2.58, "learning_rate": 1.3942174969247949e-05, "loss": 1.4594, "step": 32853 }, { "epoch": 2.58, "learning_rate": 1.3936971765068167e-05, "loss": 1.3956, "step": 32854 }, { "epoch": 2.59, "learning_rate": 1.3931769484681244e-05, "loss": 1.4763, "step": 32855 }, { "epoch": 2.59, "learning_rate": 1.3926568128122567e-05, "loss": 1.4238, "step": 32856 }, { "epoch": 2.59, "learning_rate": 1.3921367695427377e-05, "loss": 1.4291, "step": 32857 }, { "epoch": 2.59, "learning_rate": 1.3916168186630994e-05, "loss": 1.4082, "step": 32858 }, { "epoch": 2.59, "learning_rate": 1.3910969601768757e-05, "loss": 1.447, "step": 32859 }, { "epoch": 2.59, "learning_rate": 1.3905771940875921e-05, "loss": 1.4523, "step": 32860 }, { "epoch": 2.59, "learning_rate": 1.3900575203987808e-05, "loss": 1.4257, "step": 32861 }, { "epoch": 2.59, "learning_rate": 1.3895379391139656e-05, "loss": 1.4168, "step": 32862 }, { "epoch": 2.59, "learning_rate": 1.3890184502366785e-05, "loss": 1.4892, "step": 32863 }, { "epoch": 2.59, "learning_rate": 1.3884990537704454e-05, "loss": 1.436, "step": 32864 }, { "epoch": 2.59, "learning_rate": 1.38797974971879e-05, "loss": 1.4544, "step": 32865 }, { "epoch": 2.59, "learning_rate": 1.3874605380852427e-05, "loss": 1.4344, "step": 32866 }, { "epoch": 2.59, "learning_rate": 1.3869414188733257e-05, "loss": 1.3928, "step": 32867 }, { "epoch": 2.59, "learning_rate": 1.3864223920865631e-05, "loss": 1.449, "step": 32868 }, { "epoch": 2.59, "learning_rate": 1.3859034577284816e-05, "loss": 1.4041, "step": 32869 }, { "epoch": 2.59, "learning_rate": 1.3853846158026021e-05, "loss": 1.4657, "step": 32870 }, { "epoch": 2.59, "learning_rate": 1.3848658663124468e-05, "loss": 1.4408, "step": 32871 }, { "epoch": 2.59, "learning_rate": 1.3843472092615376e-05, "loss": 1.4285, "step": 32872 }, { "epoch": 2.59, "learning_rate": 1.3838286446534002e-05, "loss": 1.4372, "step": 32873 }, { "epoch": 2.59, "learning_rate": 1.3833101724915519e-05, "loss": 1.4631, "step": 32874 }, { "epoch": 2.59, "learning_rate": 1.3827917927795113e-05, "loss": 1.4606, "step": 32875 }, { "epoch": 2.59, "learning_rate": 1.3822735055208006e-05, "loss": 1.4172, "step": 32876 }, { "epoch": 2.59, "learning_rate": 1.3817553107189405e-05, "loss": 1.488, "step": 32877 }, { "epoch": 2.59, "learning_rate": 1.3812372083774432e-05, "loss": 1.4447, "step": 32878 }, { "epoch": 2.59, "learning_rate": 1.3807191984998307e-05, "loss": 1.5076, "step": 32879 }, { "epoch": 2.59, "learning_rate": 1.3802012810896218e-05, "loss": 1.499, "step": 32880 }, { "epoch": 2.59, "learning_rate": 1.379683456150329e-05, "loss": 1.4639, "step": 32881 }, { "epoch": 2.59, "learning_rate": 1.3791657236854659e-05, "loss": 1.4456, "step": 32882 }, { "epoch": 2.59, "learning_rate": 1.3786480836985547e-05, "loss": 1.4248, "step": 32883 }, { "epoch": 2.59, "learning_rate": 1.3781305361931044e-05, "loss": 1.4349, "step": 32884 }, { "epoch": 2.59, "learning_rate": 1.3776130811726289e-05, "loss": 1.4429, "step": 32885 }, { "epoch": 2.59, "learning_rate": 1.3770957186406434e-05, "loss": 1.413, "step": 32886 }, { "epoch": 2.59, "learning_rate": 1.3765784486006637e-05, "loss": 1.4541, "step": 32887 }, { "epoch": 2.59, "learning_rate": 1.376061271056197e-05, "loss": 1.5028, "step": 32888 }, { "epoch": 2.59, "learning_rate": 1.3755441860107535e-05, "loss": 1.4519, "step": 32889 }, { "epoch": 2.59, "learning_rate": 1.3750271934678492e-05, "loss": 1.4353, "step": 32890 }, { "epoch": 2.59, "learning_rate": 1.374510293430991e-05, "loss": 1.441, "step": 32891 }, { "epoch": 2.59, "learning_rate": 1.3739934859036878e-05, "loss": 1.4583, "step": 32892 }, { "epoch": 2.59, "learning_rate": 1.37347677088945e-05, "loss": 1.4511, "step": 32893 }, { "epoch": 2.59, "learning_rate": 1.3729601483917869e-05, "loss": 1.402, "step": 32894 }, { "epoch": 2.59, "learning_rate": 1.3724436184142002e-05, "loss": 1.4401, "step": 32895 }, { "epoch": 2.59, "learning_rate": 1.371927180960204e-05, "loss": 1.4148, "step": 32896 }, { "epoch": 2.59, "learning_rate": 1.371410836033302e-05, "loss": 1.4375, "step": 32897 }, { "epoch": 2.59, "learning_rate": 1.370894583637e-05, "loss": 1.4858, "step": 32898 }, { "epoch": 2.59, "learning_rate": 1.3703784237747983e-05, "loss": 1.3696, "step": 32899 }, { "epoch": 2.59, "learning_rate": 1.3698623564502093e-05, "loss": 1.4369, "step": 32900 }, { "epoch": 2.59, "learning_rate": 1.3693463816667334e-05, "loss": 1.4227, "step": 32901 }, { "epoch": 2.59, "learning_rate": 1.3688304994278709e-05, "loss": 1.4336, "step": 32902 }, { "epoch": 2.59, "learning_rate": 1.3683147097371262e-05, "loss": 1.4419, "step": 32903 }, { "epoch": 2.59, "learning_rate": 1.367799012598006e-05, "loss": 1.5171, "step": 32904 }, { "epoch": 2.59, "learning_rate": 1.3672834080140078e-05, "loss": 1.4022, "step": 32905 }, { "epoch": 2.59, "learning_rate": 1.3667678959886285e-05, "loss": 1.468, "step": 32906 }, { "epoch": 2.59, "learning_rate": 1.3662524765253741e-05, "loss": 1.4398, "step": 32907 }, { "epoch": 2.59, "learning_rate": 1.3657371496277413e-05, "loss": 1.4594, "step": 32908 }, { "epoch": 2.59, "learning_rate": 1.3652219152992278e-05, "loss": 1.442, "step": 32909 }, { "epoch": 2.59, "learning_rate": 1.3647067735433353e-05, "loss": 1.4239, "step": 32910 }, { "epoch": 2.59, "learning_rate": 1.3641917243635597e-05, "loss": 1.4137, "step": 32911 }, { "epoch": 2.59, "learning_rate": 1.3636767677633947e-05, "loss": 1.4573, "step": 32912 }, { "epoch": 2.59, "learning_rate": 1.3631619037463409e-05, "loss": 1.4662, "step": 32913 }, { "epoch": 2.59, "learning_rate": 1.3626471323158939e-05, "loss": 1.4503, "step": 32914 }, { "epoch": 2.59, "learning_rate": 1.3621324534755457e-05, "loss": 1.474, "step": 32915 }, { "epoch": 2.59, "learning_rate": 1.3616178672287902e-05, "loss": 1.4748, "step": 32916 }, { "epoch": 2.59, "learning_rate": 1.3611033735791266e-05, "loss": 1.4676, "step": 32917 }, { "epoch": 2.59, "learning_rate": 1.36058897253004e-05, "loss": 1.4499, "step": 32918 }, { "epoch": 2.59, "learning_rate": 1.3600746640850313e-05, "loss": 1.455, "step": 32919 }, { "epoch": 2.59, "learning_rate": 1.3595604482475859e-05, "loss": 1.4892, "step": 32920 }, { "epoch": 2.59, "learning_rate": 1.3590463250212008e-05, "loss": 1.4085, "step": 32921 }, { "epoch": 2.59, "learning_rate": 1.3585322944093618e-05, "loss": 1.4884, "step": 32922 }, { "epoch": 2.59, "learning_rate": 1.3580183564155594e-05, "loss": 1.4436, "step": 32923 }, { "epoch": 2.59, "learning_rate": 1.3575045110432858e-05, "loss": 1.3982, "step": 32924 }, { "epoch": 2.59, "learning_rate": 1.3569907582960281e-05, "loss": 1.4398, "step": 32925 }, { "epoch": 2.59, "learning_rate": 1.3564770981772722e-05, "loss": 1.4241, "step": 32926 }, { "epoch": 2.59, "learning_rate": 1.3559635306905098e-05, "loss": 1.459, "step": 32927 }, { "epoch": 2.59, "learning_rate": 1.3554500558392268e-05, "loss": 1.4469, "step": 32928 }, { "epoch": 2.59, "learning_rate": 1.3549366736269035e-05, "loss": 1.4111, "step": 32929 }, { "epoch": 2.59, "learning_rate": 1.354423384057034e-05, "loss": 1.4965, "step": 32930 }, { "epoch": 2.59, "learning_rate": 1.3539101871331004e-05, "loss": 1.4359, "step": 32931 }, { "epoch": 2.59, "learning_rate": 1.353397082858585e-05, "loss": 1.4594, "step": 32932 }, { "epoch": 2.59, "learning_rate": 1.3528840712369665e-05, "loss": 1.4364, "step": 32933 }, { "epoch": 2.59, "learning_rate": 1.3523711522717407e-05, "loss": 1.4338, "step": 32934 }, { "epoch": 2.59, "learning_rate": 1.3518583259663828e-05, "loss": 1.4884, "step": 32935 }, { "epoch": 2.59, "learning_rate": 1.3513455923243738e-05, "loss": 1.4272, "step": 32936 }, { "epoch": 2.59, "learning_rate": 1.3508329513491973e-05, "loss": 1.4486, "step": 32937 }, { "epoch": 2.59, "learning_rate": 1.3503204030443337e-05, "loss": 1.4395, "step": 32938 }, { "epoch": 2.59, "learning_rate": 1.3498079474132623e-05, "loss": 1.3722, "step": 32939 }, { "epoch": 2.59, "learning_rate": 1.3492955844594583e-05, "loss": 1.4616, "step": 32940 }, { "epoch": 2.59, "learning_rate": 1.3487833141864073e-05, "loss": 1.4757, "step": 32941 }, { "epoch": 2.59, "learning_rate": 1.348271136597585e-05, "loss": 1.418, "step": 32942 }, { "epoch": 2.59, "learning_rate": 1.3477590516964654e-05, "loss": 1.4508, "step": 32943 }, { "epoch": 2.59, "learning_rate": 1.3472470594865287e-05, "loss": 1.4017, "step": 32944 }, { "epoch": 2.59, "learning_rate": 1.3467351599712522e-05, "loss": 1.45, "step": 32945 }, { "epoch": 2.59, "learning_rate": 1.3462233531541067e-05, "loss": 1.4985, "step": 32946 }, { "epoch": 2.59, "learning_rate": 1.3457116390385709e-05, "loss": 1.3775, "step": 32947 }, { "epoch": 2.59, "learning_rate": 1.3452000176281203e-05, "loss": 1.4624, "step": 32948 }, { "epoch": 2.59, "learning_rate": 1.3446884889262222e-05, "loss": 1.4347, "step": 32949 }, { "epoch": 2.59, "learning_rate": 1.3441770529363539e-05, "loss": 1.4073, "step": 32950 }, { "epoch": 2.59, "learning_rate": 1.343665709661989e-05, "loss": 1.4304, "step": 32951 }, { "epoch": 2.59, "learning_rate": 1.3431544591065984e-05, "loss": 1.3994, "step": 32952 }, { "epoch": 2.59, "learning_rate": 1.342643301273651e-05, "loss": 1.5001, "step": 32953 }, { "epoch": 2.59, "learning_rate": 1.3421322361666204e-05, "loss": 1.4526, "step": 32954 }, { "epoch": 2.59, "learning_rate": 1.3416212637889757e-05, "loss": 1.4345, "step": 32955 }, { "epoch": 2.59, "learning_rate": 1.3411103841441857e-05, "loss": 1.4068, "step": 32956 }, { "epoch": 2.59, "learning_rate": 1.3405995972357142e-05, "loss": 1.4082, "step": 32957 }, { "epoch": 2.59, "learning_rate": 1.3400889030670369e-05, "loss": 1.4403, "step": 32958 }, { "epoch": 2.59, "learning_rate": 1.3395783016416178e-05, "loss": 1.4523, "step": 32959 }, { "epoch": 2.59, "learning_rate": 1.3390677929629223e-05, "loss": 1.4575, "step": 32960 }, { "epoch": 2.59, "learning_rate": 1.3385573770344177e-05, "loss": 1.4408, "step": 32961 }, { "epoch": 2.59, "learning_rate": 1.3380470538595711e-05, "loss": 1.4386, "step": 32962 }, { "epoch": 2.59, "learning_rate": 1.3375368234418431e-05, "loss": 1.4311, "step": 32963 }, { "epoch": 2.59, "learning_rate": 1.3370266857847046e-05, "loss": 1.442, "step": 32964 }, { "epoch": 2.59, "learning_rate": 1.3365166408916106e-05, "loss": 1.4949, "step": 32965 }, { "epoch": 2.59, "learning_rate": 1.3360066887660303e-05, "loss": 1.4181, "step": 32966 }, { "epoch": 2.59, "learning_rate": 1.3354968294114226e-05, "loss": 1.4883, "step": 32967 }, { "epoch": 2.59, "learning_rate": 1.3349870628312532e-05, "loss": 1.4755, "step": 32968 }, { "epoch": 2.59, "learning_rate": 1.3344773890289823e-05, "loss": 1.4365, "step": 32969 }, { "epoch": 2.59, "learning_rate": 1.333967808008064e-05, "loss": 1.4333, "step": 32970 }, { "epoch": 2.59, "learning_rate": 1.3334583197719656e-05, "loss": 1.4554, "step": 32971 }, { "epoch": 2.59, "learning_rate": 1.3329489243241442e-05, "loss": 1.4559, "step": 32972 }, { "epoch": 2.59, "learning_rate": 1.3324396216680572e-05, "loss": 1.4768, "step": 32973 }, { "epoch": 2.59, "learning_rate": 1.33193041180716e-05, "loss": 1.4664, "step": 32974 }, { "epoch": 2.59, "learning_rate": 1.3314212947449149e-05, "loss": 1.4691, "step": 32975 }, { "epoch": 2.59, "learning_rate": 1.3309122704847774e-05, "loss": 1.4624, "step": 32976 }, { "epoch": 2.59, "learning_rate": 1.3304033390301983e-05, "loss": 1.4173, "step": 32977 }, { "epoch": 2.59, "learning_rate": 1.3298945003846396e-05, "loss": 1.4319, "step": 32978 }, { "epoch": 2.59, "learning_rate": 1.3293857545515551e-05, "loss": 1.477, "step": 32979 }, { "epoch": 2.59, "learning_rate": 1.328877101534394e-05, "loss": 1.4624, "step": 32980 }, { "epoch": 2.59, "learning_rate": 1.3283685413366119e-05, "loss": 1.4423, "step": 32981 }, { "epoch": 2.6, "learning_rate": 1.3278600739616657e-05, "loss": 1.4816, "step": 32982 }, { "epoch": 2.6, "learning_rate": 1.3273516994130062e-05, "loss": 1.4357, "step": 32983 }, { "epoch": 2.6, "learning_rate": 1.326843417694079e-05, "loss": 1.4576, "step": 32984 }, { "epoch": 2.6, "learning_rate": 1.3263352288083428e-05, "loss": 1.384, "step": 32985 }, { "epoch": 2.6, "learning_rate": 1.3258271327592451e-05, "loss": 1.468, "step": 32986 }, { "epoch": 2.6, "learning_rate": 1.325319129550233e-05, "loss": 1.4084, "step": 32987 }, { "epoch": 2.6, "learning_rate": 1.3248112191847588e-05, "loss": 1.4841, "step": 32988 }, { "epoch": 2.6, "learning_rate": 1.3243034016662712e-05, "loss": 1.4281, "step": 32989 }, { "epoch": 2.6, "learning_rate": 1.3237956769982128e-05, "loss": 1.4622, "step": 32990 }, { "epoch": 2.6, "learning_rate": 1.3232880451840388e-05, "loss": 1.4741, "step": 32991 }, { "epoch": 2.6, "learning_rate": 1.3227805062271902e-05, "loss": 1.4394, "step": 32992 }, { "epoch": 2.6, "learning_rate": 1.3222730601311154e-05, "loss": 1.3981, "step": 32993 }, { "epoch": 2.6, "learning_rate": 1.3217657068992537e-05, "loss": 1.4773, "step": 32994 }, { "epoch": 2.6, "learning_rate": 1.321258446535059e-05, "loss": 1.3958, "step": 32995 }, { "epoch": 2.6, "learning_rate": 1.3207512790419684e-05, "loss": 1.4459, "step": 32996 }, { "epoch": 2.6, "learning_rate": 1.3202442044234308e-05, "loss": 1.4609, "step": 32997 }, { "epoch": 2.6, "learning_rate": 1.3197372226828817e-05, "loss": 1.4281, "step": 32998 }, { "epoch": 2.6, "learning_rate": 1.3192303338237704e-05, "loss": 1.4466, "step": 32999 }, { "epoch": 2.6, "learning_rate": 1.3187235378495353e-05, "loss": 1.4055, "step": 33000 }, { "epoch": 2.6, "learning_rate": 1.3182168347636157e-05, "loss": 1.4632, "step": 33001 }, { "epoch": 2.6, "learning_rate": 1.3177102245694571e-05, "loss": 1.4703, "step": 33002 }, { "epoch": 2.6, "learning_rate": 1.3172037072704932e-05, "loss": 1.4172, "step": 33003 }, { "epoch": 2.6, "learning_rate": 1.316697282870165e-05, "loss": 1.4873, "step": 33004 }, { "epoch": 2.6, "learning_rate": 1.3161909513719126e-05, "loss": 1.4586, "step": 33005 }, { "epoch": 2.6, "learning_rate": 1.315684712779172e-05, "loss": 1.4753, "step": 33006 }, { "epoch": 2.6, "learning_rate": 1.3151785670953785e-05, "loss": 1.5135, "step": 33007 }, { "epoch": 2.6, "learning_rate": 1.3146725143239728e-05, "loss": 1.4366, "step": 33008 }, { "epoch": 2.6, "learning_rate": 1.3141665544683889e-05, "loss": 1.4237, "step": 33009 }, { "epoch": 2.6, "learning_rate": 1.3136606875320604e-05, "loss": 1.4215, "step": 33010 }, { "epoch": 2.6, "learning_rate": 1.3131549135184216e-05, "loss": 1.461, "step": 33011 }, { "epoch": 2.6, "learning_rate": 1.312649232430908e-05, "loss": 1.4543, "step": 33012 }, { "epoch": 2.6, "learning_rate": 1.3121436442729549e-05, "loss": 1.4267, "step": 33013 }, { "epoch": 2.6, "learning_rate": 1.3116381490479932e-05, "loss": 1.4683, "step": 33014 }, { "epoch": 2.6, "learning_rate": 1.3111327467594535e-05, "loss": 1.4211, "step": 33015 }, { "epoch": 2.6, "learning_rate": 1.3106274374107694e-05, "loss": 1.484, "step": 33016 }, { "epoch": 2.6, "learning_rate": 1.3101222210053703e-05, "loss": 1.4886, "step": 33017 }, { "epoch": 2.6, "learning_rate": 1.3096170975466847e-05, "loss": 1.4589, "step": 33018 }, { "epoch": 2.6, "learning_rate": 1.3091120670381467e-05, "loss": 1.4149, "step": 33019 }, { "epoch": 2.6, "learning_rate": 1.3086071294831819e-05, "loss": 1.4413, "step": 33020 }, { "epoch": 2.6, "learning_rate": 1.3081022848852158e-05, "loss": 1.4292, "step": 33021 }, { "epoch": 2.6, "learning_rate": 1.307597533247684e-05, "loss": 1.4248, "step": 33022 }, { "epoch": 2.6, "learning_rate": 1.3070928745740072e-05, "loss": 1.4645, "step": 33023 }, { "epoch": 2.6, "learning_rate": 1.306588308867611e-05, "loss": 1.4337, "step": 33024 }, { "epoch": 2.6, "learning_rate": 1.3060838361319276e-05, "loss": 1.4808, "step": 33025 }, { "epoch": 2.6, "learning_rate": 1.3055794563703758e-05, "loss": 1.497, "step": 33026 }, { "epoch": 2.6, "learning_rate": 1.305075169586383e-05, "loss": 1.4767, "step": 33027 }, { "epoch": 2.6, "learning_rate": 1.3045709757833684e-05, "loss": 1.4741, "step": 33028 }, { "epoch": 2.6, "learning_rate": 1.3040668749647638e-05, "loss": 1.4408, "step": 33029 }, { "epoch": 2.6, "learning_rate": 1.3035628671339865e-05, "loss": 1.5025, "step": 33030 }, { "epoch": 2.6, "learning_rate": 1.303058952294459e-05, "loss": 1.4477, "step": 33031 }, { "epoch": 2.6, "learning_rate": 1.3025551304496002e-05, "loss": 1.3662, "step": 33032 }, { "epoch": 2.6, "learning_rate": 1.3020514016028355e-05, "loss": 1.4492, "step": 33033 }, { "epoch": 2.6, "learning_rate": 1.301547765757584e-05, "loss": 1.5008, "step": 33034 }, { "epoch": 2.6, "learning_rate": 1.3010442229172597e-05, "loss": 1.4269, "step": 33035 }, { "epoch": 2.6, "learning_rate": 1.300540773085288e-05, "loss": 1.4358, "step": 33036 }, { "epoch": 2.6, "learning_rate": 1.3000374162650862e-05, "loss": 1.4365, "step": 33037 }, { "epoch": 2.6, "learning_rate": 1.299534152460065e-05, "loss": 1.4536, "step": 33038 }, { "epoch": 2.6, "learning_rate": 1.29903098167365e-05, "loss": 1.4952, "step": 33039 }, { "epoch": 2.6, "learning_rate": 1.298527903909255e-05, "loss": 1.4743, "step": 33040 }, { "epoch": 2.6, "learning_rate": 1.2980249191702908e-05, "loss": 1.4267, "step": 33041 }, { "epoch": 2.6, "learning_rate": 1.2975220274601778e-05, "loss": 1.4297, "step": 33042 }, { "epoch": 2.6, "learning_rate": 1.2970192287823267e-05, "loss": 1.4525, "step": 33043 }, { "epoch": 2.6, "learning_rate": 1.2965165231401565e-05, "loss": 1.4187, "step": 33044 }, { "epoch": 2.6, "learning_rate": 1.2960139105370726e-05, "loss": 1.4263, "step": 33045 }, { "epoch": 2.6, "learning_rate": 1.2955113909764957e-05, "loss": 1.4387, "step": 33046 }, { "epoch": 2.6, "learning_rate": 1.2950089644618334e-05, "loss": 1.4261, "step": 33047 }, { "epoch": 2.6, "learning_rate": 1.2945066309964957e-05, "loss": 1.4532, "step": 33048 }, { "epoch": 2.6, "learning_rate": 1.2940043905838954e-05, "loss": 1.4065, "step": 33049 }, { "epoch": 2.6, "learning_rate": 1.2935022432274428e-05, "loss": 1.4296, "step": 33050 }, { "epoch": 2.6, "learning_rate": 1.2930001889305452e-05, "loss": 1.4486, "step": 33051 }, { "epoch": 2.6, "learning_rate": 1.29249822769661e-05, "loss": 1.448, "step": 33052 }, { "epoch": 2.6, "learning_rate": 1.291996359529051e-05, "loss": 1.4209, "step": 33053 }, { "epoch": 2.6, "learning_rate": 1.2914945844312708e-05, "loss": 1.4668, "step": 33054 }, { "epoch": 2.6, "learning_rate": 1.2909929024066745e-05, "loss": 1.4442, "step": 33055 }, { "epoch": 2.6, "learning_rate": 1.2904913134586747e-05, "loss": 1.4796, "step": 33056 }, { "epoch": 2.6, "learning_rate": 1.2899898175906737e-05, "loss": 1.4795, "step": 33057 }, { "epoch": 2.6, "learning_rate": 1.289488414806072e-05, "loss": 1.4727, "step": 33058 }, { "epoch": 2.6, "learning_rate": 1.2889871051082784e-05, "loss": 1.5212, "step": 33059 }, { "epoch": 2.6, "learning_rate": 1.2884858885006987e-05, "loss": 1.4357, "step": 33060 }, { "epoch": 2.6, "learning_rate": 1.2879847649867337e-05, "loss": 1.4827, "step": 33061 }, { "epoch": 2.6, "learning_rate": 1.2874837345697819e-05, "loss": 1.4437, "step": 33062 }, { "epoch": 2.6, "learning_rate": 1.2869827972532509e-05, "loss": 1.4881, "step": 33063 }, { "epoch": 2.6, "learning_rate": 1.2864819530405395e-05, "loss": 1.4337, "step": 33064 }, { "epoch": 2.6, "learning_rate": 1.2859812019350469e-05, "loss": 1.4623, "step": 33065 }, { "epoch": 2.6, "learning_rate": 1.285480543940175e-05, "loss": 1.4889, "step": 33066 }, { "epoch": 2.6, "learning_rate": 1.2849799790593213e-05, "loss": 1.4127, "step": 33067 }, { "epoch": 2.6, "learning_rate": 1.2844795072958847e-05, "loss": 1.4177, "step": 33068 }, { "epoch": 2.6, "learning_rate": 1.2839791286532624e-05, "loss": 1.4742, "step": 33069 }, { "epoch": 2.6, "learning_rate": 1.2834788431348552e-05, "loss": 1.4704, "step": 33070 }, { "epoch": 2.6, "learning_rate": 1.2829786507440554e-05, "loss": 1.4279, "step": 33071 }, { "epoch": 2.6, "learning_rate": 1.28247855148426e-05, "loss": 1.4858, "step": 33072 }, { "epoch": 2.6, "learning_rate": 1.2819785453588682e-05, "loss": 1.4401, "step": 33073 }, { "epoch": 2.6, "learning_rate": 1.2814786323712706e-05, "loss": 1.4414, "step": 33074 }, { "epoch": 2.6, "learning_rate": 1.2809788125248593e-05, "loss": 1.446, "step": 33075 }, { "epoch": 2.6, "learning_rate": 1.2804790858230336e-05, "loss": 1.5283, "step": 33076 }, { "epoch": 2.6, "learning_rate": 1.2799794522691837e-05, "loss": 1.4332, "step": 33077 }, { "epoch": 2.6, "learning_rate": 1.2794799118667038e-05, "loss": 1.4488, "step": 33078 }, { "epoch": 2.6, "learning_rate": 1.278980464618981e-05, "loss": 1.4109, "step": 33079 }, { "epoch": 2.6, "learning_rate": 1.2784811105294113e-05, "loss": 1.4567, "step": 33080 }, { "epoch": 2.6, "learning_rate": 1.2779818496013815e-05, "loss": 1.4173, "step": 33081 }, { "epoch": 2.6, "learning_rate": 1.2774826818382811e-05, "loss": 1.4541, "step": 33082 }, { "epoch": 2.6, "learning_rate": 1.2769836072435035e-05, "loss": 1.4396, "step": 33083 }, { "epoch": 2.6, "learning_rate": 1.2764846258204348e-05, "loss": 1.4453, "step": 33084 }, { "epoch": 2.6, "learning_rate": 1.2759857375724603e-05, "loss": 1.4878, "step": 33085 }, { "epoch": 2.6, "learning_rate": 1.2754869425029673e-05, "loss": 1.3883, "step": 33086 }, { "epoch": 2.6, "learning_rate": 1.2749882406153466e-05, "loss": 1.4459, "step": 33087 }, { "epoch": 2.6, "learning_rate": 1.2744896319129822e-05, "loss": 1.3688, "step": 33088 }, { "epoch": 2.6, "learning_rate": 1.2739911163992561e-05, "loss": 1.4771, "step": 33089 }, { "epoch": 2.6, "learning_rate": 1.2734926940775574e-05, "loss": 1.5112, "step": 33090 }, { "epoch": 2.6, "learning_rate": 1.272994364951267e-05, "loss": 1.4309, "step": 33091 }, { "epoch": 2.6, "learning_rate": 1.2724961290237717e-05, "loss": 1.4991, "step": 33092 }, { "epoch": 2.6, "learning_rate": 1.2719979862984508e-05, "loss": 1.4131, "step": 33093 }, { "epoch": 2.6, "learning_rate": 1.2714999367786883e-05, "loss": 1.4563, "step": 33094 }, { "epoch": 2.6, "learning_rate": 1.2710019804678661e-05, "loss": 1.4663, "step": 33095 }, { "epoch": 2.6, "learning_rate": 1.270504117369362e-05, "loss": 1.4705, "step": 33096 }, { "epoch": 2.6, "learning_rate": 1.2700063474865613e-05, "loss": 1.4679, "step": 33097 }, { "epoch": 2.6, "learning_rate": 1.2695086708228398e-05, "loss": 1.4518, "step": 33098 }, { "epoch": 2.6, "learning_rate": 1.2690110873815746e-05, "loss": 1.4317, "step": 33099 }, { "epoch": 2.6, "learning_rate": 1.2685135971661498e-05, "loss": 1.4494, "step": 33100 }, { "epoch": 2.6, "learning_rate": 1.268016200179941e-05, "loss": 1.4499, "step": 33101 }, { "epoch": 2.6, "learning_rate": 1.2675188964263206e-05, "loss": 1.4276, "step": 33102 }, { "epoch": 2.6, "learning_rate": 1.2670216859086707e-05, "loss": 1.4306, "step": 33103 }, { "epoch": 2.6, "learning_rate": 1.2665245686303655e-05, "loss": 1.4616, "step": 33104 }, { "epoch": 2.6, "learning_rate": 1.2660275445947805e-05, "loss": 1.4449, "step": 33105 }, { "epoch": 2.6, "learning_rate": 1.2655306138052828e-05, "loss": 1.4769, "step": 33106 }, { "epoch": 2.6, "learning_rate": 1.2650337762652602e-05, "loss": 1.4679, "step": 33107 }, { "epoch": 2.6, "learning_rate": 1.2645370319780762e-05, "loss": 1.4894, "step": 33108 }, { "epoch": 2.61, "learning_rate": 1.2640403809471083e-05, "loss": 1.4347, "step": 33109 }, { "epoch": 2.61, "learning_rate": 1.2635438231757222e-05, "loss": 1.4661, "step": 33110 }, { "epoch": 2.61, "learning_rate": 1.2630473586672951e-05, "loss": 1.4615, "step": 33111 }, { "epoch": 2.61, "learning_rate": 1.262550987425196e-05, "loss": 1.4069, "step": 33112 }, { "epoch": 2.61, "learning_rate": 1.262054709452794e-05, "loss": 1.437, "step": 33113 }, { "epoch": 2.61, "learning_rate": 1.2615585247534593e-05, "loss": 1.4516, "step": 33114 }, { "epoch": 2.61, "learning_rate": 1.261062433330563e-05, "loss": 1.4592, "step": 33115 }, { "epoch": 2.61, "learning_rate": 1.2605664351874673e-05, "loss": 1.4427, "step": 33116 }, { "epoch": 2.61, "learning_rate": 1.260070530327546e-05, "loss": 1.4491, "step": 33117 }, { "epoch": 2.61, "learning_rate": 1.2595747187541633e-05, "loss": 1.463, "step": 33118 }, { "epoch": 2.61, "learning_rate": 1.259079000470683e-05, "loss": 1.4524, "step": 33119 }, { "epoch": 2.61, "learning_rate": 1.2585833754804775e-05, "loss": 1.42, "step": 33120 }, { "epoch": 2.61, "learning_rate": 1.2580878437869057e-05, "loss": 1.3941, "step": 33121 }, { "epoch": 2.61, "learning_rate": 1.2575924053933317e-05, "loss": 1.4379, "step": 33122 }, { "epoch": 2.61, "learning_rate": 1.2570970603031227e-05, "loss": 1.4605, "step": 33123 }, { "epoch": 2.61, "learning_rate": 1.2566018085196428e-05, "loss": 1.4478, "step": 33124 }, { "epoch": 2.61, "learning_rate": 1.2561066500462525e-05, "loss": 1.4409, "step": 33125 }, { "epoch": 2.61, "learning_rate": 1.255611584886314e-05, "loss": 1.4394, "step": 33126 }, { "epoch": 2.61, "learning_rate": 1.255116613043185e-05, "loss": 1.465, "step": 33127 }, { "epoch": 2.61, "learning_rate": 1.2546217345202308e-05, "loss": 1.4051, "step": 33128 }, { "epoch": 2.61, "learning_rate": 1.2541269493208107e-05, "loss": 1.4446, "step": 33129 }, { "epoch": 2.61, "learning_rate": 1.2536322574482816e-05, "loss": 1.4654, "step": 33130 }, { "epoch": 2.61, "learning_rate": 1.2531376589060043e-05, "loss": 1.5024, "step": 33131 }, { "epoch": 2.61, "learning_rate": 1.2526431536973363e-05, "loss": 1.4542, "step": 33132 }, { "epoch": 2.61, "learning_rate": 1.2521487418256331e-05, "loss": 1.4906, "step": 33133 }, { "epoch": 2.61, "learning_rate": 1.2516544232942554e-05, "loss": 1.4667, "step": 33134 }, { "epoch": 2.61, "learning_rate": 1.2511601981065572e-05, "loss": 1.5069, "step": 33135 }, { "epoch": 2.61, "learning_rate": 1.2506660662658907e-05, "loss": 1.4216, "step": 33136 }, { "epoch": 2.61, "learning_rate": 1.2501720277756183e-05, "loss": 1.4554, "step": 33137 }, { "epoch": 2.61, "learning_rate": 1.2496780826390857e-05, "loss": 1.417, "step": 33138 }, { "epoch": 2.61, "learning_rate": 1.249184230859655e-05, "loss": 1.4269, "step": 33139 }, { "epoch": 2.61, "learning_rate": 1.248690472440672e-05, "loss": 1.4377, "step": 33140 }, { "epoch": 2.61, "learning_rate": 1.2481968073854941e-05, "loss": 1.4574, "step": 33141 }, { "epoch": 2.61, "learning_rate": 1.2477032356974719e-05, "loss": 1.4265, "step": 33142 }, { "epoch": 2.61, "learning_rate": 1.2472097573799545e-05, "loss": 1.4202, "step": 33143 }, { "epoch": 2.61, "learning_rate": 1.2467163724362922e-05, "loss": 1.422, "step": 33144 }, { "epoch": 2.61, "learning_rate": 1.2462230808698375e-05, "loss": 1.3917, "step": 33145 }, { "epoch": 2.61, "learning_rate": 1.245729882683938e-05, "loss": 1.4438, "step": 33146 }, { "epoch": 2.61, "learning_rate": 1.2452367778819405e-05, "loss": 1.4446, "step": 33147 }, { "epoch": 2.61, "learning_rate": 1.2447437664671978e-05, "loss": 1.4497, "step": 33148 }, { "epoch": 2.61, "learning_rate": 1.2442508484430536e-05, "loss": 1.4203, "step": 33149 }, { "epoch": 2.61, "learning_rate": 1.243758023812852e-05, "loss": 1.4536, "step": 33150 }, { "epoch": 2.61, "learning_rate": 1.2432652925799452e-05, "loss": 1.4576, "step": 33151 }, { "epoch": 2.61, "learning_rate": 1.2427726547476758e-05, "loss": 1.4422, "step": 33152 }, { "epoch": 2.61, "learning_rate": 1.2422801103193841e-05, "loss": 1.4359, "step": 33153 }, { "epoch": 2.61, "learning_rate": 1.2417876592984195e-05, "loss": 1.4272, "step": 33154 }, { "epoch": 2.61, "learning_rate": 1.2412953016881271e-05, "loss": 1.4939, "step": 33155 }, { "epoch": 2.61, "learning_rate": 1.2408030374918466e-05, "loss": 1.4506, "step": 33156 }, { "epoch": 2.61, "learning_rate": 1.240310866712918e-05, "loss": 1.4867, "step": 33157 }, { "epoch": 2.61, "learning_rate": 1.2398187893546874e-05, "loss": 1.4221, "step": 33158 }, { "epoch": 2.61, "learning_rate": 1.2393268054204936e-05, "loss": 1.4017, "step": 33159 }, { "epoch": 2.61, "learning_rate": 1.2388349149136756e-05, "loss": 1.5081, "step": 33160 }, { "epoch": 2.61, "learning_rate": 1.2383431178375757e-05, "loss": 1.49, "step": 33161 }, { "epoch": 2.61, "learning_rate": 1.2378514141955331e-05, "loss": 1.4922, "step": 33162 }, { "epoch": 2.61, "learning_rate": 1.237359803990885e-05, "loss": 1.4264, "step": 33163 }, { "epoch": 2.61, "learning_rate": 1.2368682872269653e-05, "loss": 1.431, "step": 33164 }, { "epoch": 2.61, "learning_rate": 1.236376863907118e-05, "loss": 1.4905, "step": 33165 }, { "epoch": 2.61, "learning_rate": 1.2358855340346757e-05, "loss": 1.3934, "step": 33166 }, { "epoch": 2.61, "learning_rate": 1.2353942976129722e-05, "loss": 1.4796, "step": 33167 }, { "epoch": 2.61, "learning_rate": 1.2349031546453497e-05, "loss": 1.485, "step": 33168 }, { "epoch": 2.61, "learning_rate": 1.234412105135134e-05, "loss": 1.4431, "step": 33169 }, { "epoch": 2.61, "learning_rate": 1.2339211490856676e-05, "loss": 1.4485, "step": 33170 }, { "epoch": 2.61, "learning_rate": 1.2334302865002777e-05, "loss": 1.4425, "step": 33171 }, { "epoch": 2.61, "learning_rate": 1.2329395173822998e-05, "loss": 1.42, "step": 33172 }, { "epoch": 2.61, "learning_rate": 1.2324488417350664e-05, "loss": 1.4256, "step": 33173 }, { "epoch": 2.61, "learning_rate": 1.231958259561905e-05, "loss": 1.4351, "step": 33174 }, { "epoch": 2.61, "learning_rate": 1.2314677708661524e-05, "loss": 1.4452, "step": 33175 }, { "epoch": 2.61, "learning_rate": 1.2309773756511349e-05, "loss": 1.4181, "step": 33176 }, { "epoch": 2.61, "learning_rate": 1.2304870739201795e-05, "loss": 1.4171, "step": 33177 }, { "epoch": 2.61, "learning_rate": 1.2299968656766218e-05, "loss": 1.461, "step": 33178 }, { "epoch": 2.61, "learning_rate": 1.229506750923786e-05, "loss": 1.4399, "step": 33179 }, { "epoch": 2.61, "learning_rate": 1.2290167296650011e-05, "loss": 1.444, "step": 33180 }, { "epoch": 2.61, "learning_rate": 1.2285268019035893e-05, "loss": 1.3954, "step": 33181 }, { "epoch": 2.61, "learning_rate": 1.2280369676428847e-05, "loss": 1.4186, "step": 33182 }, { "epoch": 2.61, "learning_rate": 1.227547226886208e-05, "loss": 1.4068, "step": 33183 }, { "epoch": 2.61, "learning_rate": 1.2270575796368831e-05, "loss": 1.4515, "step": 33184 }, { "epoch": 2.61, "learning_rate": 1.2265680258982357e-05, "loss": 1.4256, "step": 33185 }, { "epoch": 2.61, "learning_rate": 1.2260785656735949e-05, "loss": 1.4428, "step": 33186 }, { "epoch": 2.61, "learning_rate": 1.225589198966278e-05, "loss": 1.4364, "step": 33187 }, { "epoch": 2.61, "learning_rate": 1.2250999257796074e-05, "loss": 1.466, "step": 33188 }, { "epoch": 2.61, "learning_rate": 1.2246107461169103e-05, "loss": 1.4197, "step": 33189 }, { "epoch": 2.61, "learning_rate": 1.2241216599815024e-05, "loss": 1.4673, "step": 33190 }, { "epoch": 2.61, "learning_rate": 1.2236326673767045e-05, "loss": 1.4725, "step": 33191 }, { "epoch": 2.61, "learning_rate": 1.223143768305842e-05, "loss": 1.4643, "step": 33192 }, { "epoch": 2.61, "learning_rate": 1.2226549627722293e-05, "loss": 1.4298, "step": 33193 }, { "epoch": 2.61, "learning_rate": 1.2221662507791835e-05, "loss": 1.4611, "step": 33194 }, { "epoch": 2.61, "learning_rate": 1.2216776323300286e-05, "loss": 1.4964, "step": 33195 }, { "epoch": 2.61, "learning_rate": 1.221189107428079e-05, "loss": 1.448, "step": 33196 }, { "epoch": 2.61, "learning_rate": 1.220700676076653e-05, "loss": 1.4281, "step": 33197 }, { "epoch": 2.61, "learning_rate": 1.2202123382790619e-05, "loss": 1.4853, "step": 33198 }, { "epoch": 2.61, "learning_rate": 1.2197240940386261e-05, "loss": 1.441, "step": 33199 }, { "epoch": 2.61, "learning_rate": 1.2192359433586596e-05, "loss": 1.4073, "step": 33200 }, { "epoch": 2.61, "learning_rate": 1.2187478862424716e-05, "loss": 1.4335, "step": 33201 }, { "epoch": 2.61, "learning_rate": 1.2182599226933858e-05, "loss": 1.4247, "step": 33202 }, { "epoch": 2.61, "learning_rate": 1.21777205271471e-05, "loss": 1.4896, "step": 33203 }, { "epoch": 2.61, "learning_rate": 1.2172842763097545e-05, "loss": 1.436, "step": 33204 }, { "epoch": 2.61, "learning_rate": 1.2167965934818319e-05, "loss": 1.4253, "step": 33205 }, { "epoch": 2.61, "learning_rate": 1.216309004234256e-05, "loss": 1.4266, "step": 33206 }, { "epoch": 2.61, "learning_rate": 1.215821508570336e-05, "loss": 1.4684, "step": 33207 }, { "epoch": 2.61, "learning_rate": 1.2153341064933791e-05, "loss": 1.4156, "step": 33208 }, { "epoch": 2.61, "learning_rate": 1.2148467980066978e-05, "loss": 1.4743, "step": 33209 }, { "epoch": 2.61, "learning_rate": 1.2143595831135994e-05, "loss": 1.4395, "step": 33210 }, { "epoch": 2.61, "learning_rate": 1.2138724618173912e-05, "loss": 1.4754, "step": 33211 }, { "epoch": 2.61, "learning_rate": 1.2133854341213823e-05, "loss": 1.4355, "step": 33212 }, { "epoch": 2.61, "learning_rate": 1.2128985000288782e-05, "loss": 1.4568, "step": 33213 }, { "epoch": 2.61, "learning_rate": 1.2124116595431832e-05, "loss": 1.4339, "step": 33214 }, { "epoch": 2.61, "learning_rate": 1.2119249126676062e-05, "loss": 1.4409, "step": 33215 }, { "epoch": 2.61, "learning_rate": 1.2114382594054478e-05, "loss": 1.4312, "step": 33216 }, { "epoch": 2.61, "learning_rate": 1.2109516997600172e-05, "loss": 1.4677, "step": 33217 }, { "epoch": 2.61, "learning_rate": 1.2104652337346116e-05, "loss": 1.4893, "step": 33218 }, { "epoch": 2.61, "learning_rate": 1.2099788613325418e-05, "loss": 1.4474, "step": 33219 }, { "epoch": 2.61, "learning_rate": 1.209492582557105e-05, "loss": 1.4716, "step": 33220 }, { "epoch": 2.61, "learning_rate": 1.2090063974116021e-05, "loss": 1.4471, "step": 33221 }, { "epoch": 2.61, "learning_rate": 1.2085203058993337e-05, "loss": 1.4735, "step": 33222 }, { "epoch": 2.61, "learning_rate": 1.2080343080236037e-05, "loss": 1.4579, "step": 33223 }, { "epoch": 2.61, "learning_rate": 1.2075484037877099e-05, "loss": 1.4759, "step": 33224 }, { "epoch": 2.61, "learning_rate": 1.207062593194949e-05, "loss": 1.3864, "step": 33225 }, { "epoch": 2.61, "learning_rate": 1.2065768762486238e-05, "loss": 1.4314, "step": 33226 }, { "epoch": 2.61, "learning_rate": 1.20609125295203e-05, "loss": 1.4382, "step": 33227 }, { "epoch": 2.61, "learning_rate": 1.2056057233084614e-05, "loss": 1.4793, "step": 33228 }, { "epoch": 2.61, "learning_rate": 1.2051202873212206e-05, "loss": 1.4198, "step": 33229 }, { "epoch": 2.61, "learning_rate": 1.2046349449936e-05, "loss": 1.4044, "step": 33230 }, { "epoch": 2.61, "learning_rate": 1.2041496963288933e-05, "loss": 1.4188, "step": 33231 }, { "epoch": 2.61, "learning_rate": 1.2036645413303964e-05, "loss": 1.4771, "step": 33232 }, { "epoch": 2.61, "learning_rate": 1.2031794800014066e-05, "loss": 1.4516, "step": 33233 }, { "epoch": 2.61, "learning_rate": 1.2026945123452131e-05, "loss": 1.4243, "step": 33234 }, { "epoch": 2.61, "learning_rate": 1.2022096383651097e-05, "loss": 1.4097, "step": 33235 }, { "epoch": 2.62, "learning_rate": 1.201724858064389e-05, "loss": 1.4527, "step": 33236 }, { "epoch": 2.62, "learning_rate": 1.2012401714463433e-05, "loss": 1.4675, "step": 33237 }, { "epoch": 2.62, "learning_rate": 1.2007555785142613e-05, "loss": 1.4227, "step": 33238 }, { "epoch": 2.62, "learning_rate": 1.2002710792714325e-05, "loss": 1.4386, "step": 33239 }, { "epoch": 2.62, "learning_rate": 1.1997866737211493e-05, "loss": 1.4632, "step": 33240 }, { "epoch": 2.62, "learning_rate": 1.1993023618666986e-05, "loss": 1.3934, "step": 33241 }, { "epoch": 2.62, "learning_rate": 1.1988181437113681e-05, "loss": 1.4369, "step": 33242 }, { "epoch": 2.62, "learning_rate": 1.1983340192584467e-05, "loss": 1.4635, "step": 33243 }, { "epoch": 2.62, "learning_rate": 1.1978499885112236e-05, "loss": 1.4212, "step": 33244 }, { "epoch": 2.62, "learning_rate": 1.1973660514729776e-05, "loss": 1.4126, "step": 33245 }, { "epoch": 2.62, "learning_rate": 1.1968822081470031e-05, "loss": 1.4785, "step": 33246 }, { "epoch": 2.62, "learning_rate": 1.1963984585365805e-05, "loss": 1.4788, "step": 33247 }, { "epoch": 2.62, "learning_rate": 1.1959148026449922e-05, "loss": 1.4101, "step": 33248 }, { "epoch": 2.62, "learning_rate": 1.1954312404755239e-05, "loss": 1.4699, "step": 33249 }, { "epoch": 2.62, "learning_rate": 1.1949477720314631e-05, "loss": 1.4304, "step": 33250 }, { "epoch": 2.62, "learning_rate": 1.194464397316089e-05, "loss": 1.4212, "step": 33251 }, { "epoch": 2.62, "learning_rate": 1.1939811163326801e-05, "loss": 1.439, "step": 33252 }, { "epoch": 2.62, "learning_rate": 1.1934979290845242e-05, "loss": 1.4203, "step": 33253 }, { "epoch": 2.62, "learning_rate": 1.193014835574897e-05, "loss": 1.402, "step": 33254 }, { "epoch": 2.62, "learning_rate": 1.1925318358070773e-05, "loss": 1.4226, "step": 33255 }, { "epoch": 2.62, "learning_rate": 1.1920489297843493e-05, "loss": 1.4486, "step": 33256 }, { "epoch": 2.62, "learning_rate": 1.1915661175099905e-05, "loss": 1.43, "step": 33257 }, { "epoch": 2.62, "learning_rate": 1.1910833989872765e-05, "loss": 1.4662, "step": 33258 }, { "epoch": 2.62, "learning_rate": 1.1906007742194829e-05, "loss": 1.4458, "step": 33259 }, { "epoch": 2.62, "learning_rate": 1.1901182432098921e-05, "loss": 1.4126, "step": 33260 }, { "epoch": 2.62, "learning_rate": 1.1896358059617784e-05, "loss": 1.4858, "step": 33261 }, { "epoch": 2.62, "learning_rate": 1.1891534624784139e-05, "loss": 1.4244, "step": 33262 }, { "epoch": 2.62, "learning_rate": 1.188671212763076e-05, "loss": 1.4632, "step": 33263 }, { "epoch": 2.62, "learning_rate": 1.1881890568190406e-05, "loss": 1.3876, "step": 33264 }, { "epoch": 2.62, "learning_rate": 1.1877069946495798e-05, "loss": 1.4583, "step": 33265 }, { "epoch": 2.62, "learning_rate": 1.187225026257963e-05, "loss": 1.4568, "step": 33266 }, { "epoch": 2.62, "learning_rate": 1.186743151647469e-05, "loss": 1.5062, "step": 33267 }, { "epoch": 2.62, "learning_rate": 1.1862613708213654e-05, "loss": 1.4513, "step": 33268 }, { "epoch": 2.62, "learning_rate": 1.1857796837829225e-05, "loss": 1.4474, "step": 33269 }, { "epoch": 2.62, "learning_rate": 1.1852980905354147e-05, "loss": 1.4436, "step": 33270 }, { "epoch": 2.62, "learning_rate": 1.1848165910821095e-05, "loss": 1.4899, "step": 33271 }, { "epoch": 2.62, "learning_rate": 1.1843351854262723e-05, "loss": 1.4398, "step": 33272 }, { "epoch": 2.62, "learning_rate": 1.1838538735711789e-05, "loss": 1.452, "step": 33273 }, { "epoch": 2.62, "learning_rate": 1.1833726555200918e-05, "loss": 1.4186, "step": 33274 }, { "epoch": 2.62, "learning_rate": 1.1828915312762815e-05, "loss": 1.4927, "step": 33275 }, { "epoch": 2.62, "learning_rate": 1.182410500843009e-05, "loss": 1.4225, "step": 33276 }, { "epoch": 2.62, "learning_rate": 1.1819295642235466e-05, "loss": 1.4605, "step": 33277 }, { "epoch": 2.62, "learning_rate": 1.1814487214211566e-05, "loss": 1.4552, "step": 33278 }, { "epoch": 2.62, "learning_rate": 1.180967972439103e-05, "loss": 1.4338, "step": 33279 }, { "epoch": 2.62, "learning_rate": 1.18048731728065e-05, "loss": 1.4886, "step": 33280 }, { "epoch": 2.62, "learning_rate": 1.1800067559490634e-05, "loss": 1.439, "step": 33281 }, { "epoch": 2.62, "learning_rate": 1.179526288447607e-05, "loss": 1.4546, "step": 33282 }, { "epoch": 2.62, "learning_rate": 1.179045914779535e-05, "loss": 1.4898, "step": 33283 }, { "epoch": 2.62, "learning_rate": 1.1785656349481182e-05, "loss": 1.3988, "step": 33284 }, { "epoch": 2.62, "learning_rate": 1.1780854489566138e-05, "loss": 1.4108, "step": 33285 }, { "epoch": 2.62, "learning_rate": 1.1776053568082777e-05, "loss": 1.4667, "step": 33286 }, { "epoch": 2.62, "learning_rate": 1.1771253585063773e-05, "loss": 1.4585, "step": 33287 }, { "epoch": 2.62, "learning_rate": 1.176645454054168e-05, "loss": 1.4205, "step": 33288 }, { "epoch": 2.62, "learning_rate": 1.1761656434549043e-05, "loss": 1.4202, "step": 33289 }, { "epoch": 2.62, "learning_rate": 1.1756859267118484e-05, "loss": 1.4947, "step": 33290 }, { "epoch": 2.62, "learning_rate": 1.1752063038282578e-05, "loss": 1.4321, "step": 33291 }, { "epoch": 2.62, "learning_rate": 1.174726774807388e-05, "loss": 1.4811, "step": 33292 }, { "epoch": 2.62, "learning_rate": 1.1742473396524899e-05, "loss": 1.4592, "step": 33293 }, { "epoch": 2.62, "learning_rate": 1.1737679983668258e-05, "loss": 1.4916, "step": 33294 }, { "epoch": 2.62, "learning_rate": 1.1732887509536449e-05, "loss": 1.4682, "step": 33295 }, { "epoch": 2.62, "learning_rate": 1.1728095974162044e-05, "loss": 1.3975, "step": 33296 }, { "epoch": 2.62, "learning_rate": 1.1723305377577552e-05, "loss": 1.4814, "step": 33297 }, { "epoch": 2.62, "learning_rate": 1.171851571981553e-05, "loss": 1.3994, "step": 33298 }, { "epoch": 2.62, "learning_rate": 1.1713727000908468e-05, "loss": 1.4316, "step": 33299 }, { "epoch": 2.62, "learning_rate": 1.1708939220888875e-05, "loss": 1.4791, "step": 33300 }, { "epoch": 2.62, "learning_rate": 1.170415237978929e-05, "loss": 1.4242, "step": 33301 }, { "epoch": 2.62, "learning_rate": 1.1699366477642186e-05, "loss": 1.4108, "step": 33302 }, { "epoch": 2.62, "learning_rate": 1.169458151448004e-05, "loss": 1.4721, "step": 33303 }, { "epoch": 2.62, "learning_rate": 1.1689797490335389e-05, "loss": 1.4121, "step": 33304 }, { "epoch": 2.62, "learning_rate": 1.1685014405240695e-05, "loss": 1.4591, "step": 33305 }, { "epoch": 2.62, "learning_rate": 1.1680232259228395e-05, "loss": 1.472, "step": 33306 }, { "epoch": 2.62, "learning_rate": 1.1675451052331015e-05, "loss": 1.476, "step": 33307 }, { "epoch": 2.62, "learning_rate": 1.1670670784580977e-05, "loss": 1.3924, "step": 33308 }, { "epoch": 2.62, "learning_rate": 1.1665891456010756e-05, "loss": 1.4494, "step": 33309 }, { "epoch": 2.62, "learning_rate": 1.1661113066652761e-05, "loss": 1.433, "step": 33310 }, { "epoch": 2.62, "learning_rate": 1.1656335616539481e-05, "loss": 1.4576, "step": 33311 }, { "epoch": 2.62, "learning_rate": 1.165155910570334e-05, "loss": 1.4676, "step": 33312 }, { "epoch": 2.62, "learning_rate": 1.1646783534176763e-05, "loss": 1.4785, "step": 33313 }, { "epoch": 2.62, "learning_rate": 1.1642008901992189e-05, "loss": 1.4364, "step": 33314 }, { "epoch": 2.62, "learning_rate": 1.1637235209182027e-05, "loss": 1.4317, "step": 33315 }, { "epoch": 2.62, "learning_rate": 1.1632462455778685e-05, "loss": 1.4398, "step": 33316 }, { "epoch": 2.62, "learning_rate": 1.1627690641814535e-05, "loss": 1.428, "step": 33317 }, { "epoch": 2.62, "learning_rate": 1.1622919767322036e-05, "loss": 1.4232, "step": 33318 }, { "epoch": 2.62, "learning_rate": 1.1618149832333545e-05, "loss": 1.4572, "step": 33319 }, { "epoch": 2.62, "learning_rate": 1.161338083688142e-05, "loss": 1.4597, "step": 33320 }, { "epoch": 2.62, "learning_rate": 1.16086127809981e-05, "loss": 1.4017, "step": 33321 }, { "epoch": 2.62, "learning_rate": 1.1603845664715928e-05, "loss": 1.4383, "step": 33322 }, { "epoch": 2.62, "learning_rate": 1.1599079488067258e-05, "loss": 1.4416, "step": 33323 }, { "epoch": 2.62, "learning_rate": 1.1594314251084469e-05, "loss": 1.4559, "step": 33324 }, { "epoch": 2.62, "learning_rate": 1.1589549953799914e-05, "loss": 1.4438, "step": 33325 }, { "epoch": 2.62, "learning_rate": 1.158478659624592e-05, "loss": 1.4809, "step": 33326 }, { "epoch": 2.62, "learning_rate": 1.1580024178454827e-05, "loss": 1.4245, "step": 33327 }, { "epoch": 2.62, "learning_rate": 1.1575262700459026e-05, "loss": 1.4468, "step": 33328 }, { "epoch": 2.62, "learning_rate": 1.157050216229079e-05, "loss": 1.3753, "step": 33329 }, { "epoch": 2.62, "learning_rate": 1.1565742563982427e-05, "loss": 1.4104, "step": 33330 }, { "epoch": 2.62, "learning_rate": 1.1560983905566295e-05, "loss": 1.4581, "step": 33331 }, { "epoch": 2.62, "learning_rate": 1.1556226187074701e-05, "loss": 1.4223, "step": 33332 }, { "epoch": 2.62, "learning_rate": 1.1551469408539921e-05, "loss": 1.4567, "step": 33333 }, { "epoch": 2.62, "learning_rate": 1.1546713569994243e-05, "loss": 1.4615, "step": 33334 }, { "epoch": 2.62, "learning_rate": 1.1541958671469993e-05, "loss": 1.4417, "step": 33335 }, { "epoch": 2.62, "learning_rate": 1.1537204712999443e-05, "loss": 1.4154, "step": 33336 }, { "epoch": 2.62, "learning_rate": 1.1532451694614836e-05, "loss": 1.513, "step": 33337 }, { "epoch": 2.62, "learning_rate": 1.1527699616348497e-05, "loss": 1.4544, "step": 33338 }, { "epoch": 2.62, "learning_rate": 1.1522948478232646e-05, "loss": 1.4393, "step": 33339 }, { "epoch": 2.62, "learning_rate": 1.1518198280299545e-05, "loss": 1.4454, "step": 33340 }, { "epoch": 2.62, "learning_rate": 1.1513449022581483e-05, "loss": 1.4481, "step": 33341 }, { "epoch": 2.62, "learning_rate": 1.1508700705110651e-05, "loss": 1.418, "step": 33342 }, { "epoch": 2.62, "learning_rate": 1.1503953327919341e-05, "loss": 1.4463, "step": 33343 }, { "epoch": 2.62, "learning_rate": 1.1499206891039742e-05, "loss": 1.4844, "step": 33344 }, { "epoch": 2.62, "learning_rate": 1.1494461394504113e-05, "loss": 1.4737, "step": 33345 }, { "epoch": 2.62, "learning_rate": 1.1489716838344659e-05, "loss": 1.4425, "step": 33346 }, { "epoch": 2.62, "learning_rate": 1.1484973222593574e-05, "loss": 1.4269, "step": 33347 }, { "epoch": 2.62, "learning_rate": 1.1480230547283098e-05, "loss": 1.4287, "step": 33348 }, { "epoch": 2.62, "learning_rate": 1.1475488812445405e-05, "loss": 1.4372, "step": 33349 }, { "epoch": 2.62, "learning_rate": 1.1470748018112719e-05, "loss": 1.4578, "step": 33350 }, { "epoch": 2.62, "learning_rate": 1.146600816431718e-05, "loss": 1.486, "step": 33351 }, { "epoch": 2.62, "learning_rate": 1.1461269251091015e-05, "loss": 1.3577, "step": 33352 }, { "epoch": 2.62, "learning_rate": 1.145653127846638e-05, "loss": 1.4566, "step": 33353 }, { "epoch": 2.62, "learning_rate": 1.1451794246475415e-05, "loss": 1.4551, "step": 33354 }, { "epoch": 2.62, "learning_rate": 1.144705815515033e-05, "loss": 1.4771, "step": 33355 }, { "epoch": 2.62, "learning_rate": 1.144232300452328e-05, "loss": 1.4081, "step": 33356 }, { "epoch": 2.62, "learning_rate": 1.1437588794626357e-05, "loss": 1.438, "step": 33357 }, { "epoch": 2.62, "learning_rate": 1.1432855525491735e-05, "loss": 1.5003, "step": 33358 }, { "epoch": 2.62, "learning_rate": 1.142812319715159e-05, "loss": 1.4508, "step": 33359 }, { "epoch": 2.62, "learning_rate": 1.142339180963801e-05, "loss": 1.4584, "step": 33360 }, { "epoch": 2.62, "learning_rate": 1.1418661362983106e-05, "loss": 1.4498, "step": 33361 }, { "epoch": 2.62, "learning_rate": 1.141393185721905e-05, "loss": 1.4418, "step": 33362 }, { "epoch": 2.63, "learning_rate": 1.1409203292377917e-05, "loss": 1.4359, "step": 33363 }, { "epoch": 2.63, "learning_rate": 1.140447566849178e-05, "loss": 1.4076, "step": 33364 }, { "epoch": 2.63, "learning_rate": 1.1399748985592799e-05, "loss": 1.471, "step": 33365 }, { "epoch": 2.63, "learning_rate": 1.139502324371303e-05, "loss": 1.4293, "step": 33366 }, { "epoch": 2.63, "learning_rate": 1.1390298442884549e-05, "loss": 1.4737, "step": 33367 }, { "epoch": 2.63, "learning_rate": 1.1385574583139462e-05, "loss": 1.4161, "step": 33368 }, { "epoch": 2.63, "learning_rate": 1.1380851664509843e-05, "loss": 1.4523, "step": 33369 }, { "epoch": 2.63, "learning_rate": 1.1376129687027734e-05, "loss": 1.4709, "step": 33370 }, { "epoch": 2.63, "learning_rate": 1.1371408650725194e-05, "loss": 1.4369, "step": 33371 }, { "epoch": 2.63, "learning_rate": 1.1366688555634296e-05, "loss": 1.424, "step": 33372 }, { "epoch": 2.63, "learning_rate": 1.1361969401787064e-05, "loss": 1.4266, "step": 33373 }, { "epoch": 2.63, "learning_rate": 1.1357251189215588e-05, "loss": 1.4069, "step": 33374 }, { "epoch": 2.63, "learning_rate": 1.1352533917951828e-05, "loss": 1.4695, "step": 33375 }, { "epoch": 2.63, "learning_rate": 1.1347817588027875e-05, "loss": 1.4601, "step": 33376 }, { "epoch": 2.63, "learning_rate": 1.1343102199475734e-05, "loss": 1.4404, "step": 33377 }, { "epoch": 2.63, "learning_rate": 1.1338387752327382e-05, "loss": 1.5036, "step": 33378 }, { "epoch": 2.63, "learning_rate": 1.1333674246614876e-05, "loss": 1.4573, "step": 33379 }, { "epoch": 2.63, "learning_rate": 1.1328961682370208e-05, "loss": 1.4493, "step": 33380 }, { "epoch": 2.63, "learning_rate": 1.1324250059625333e-05, "loss": 1.4887, "step": 33381 }, { "epoch": 2.63, "learning_rate": 1.1319539378412312e-05, "loss": 1.4427, "step": 33382 }, { "epoch": 2.63, "learning_rate": 1.1314829638763085e-05, "loss": 1.4627, "step": 33383 }, { "epoch": 2.63, "learning_rate": 1.131012084070959e-05, "loss": 1.4002, "step": 33384 }, { "epoch": 2.63, "learning_rate": 1.1305412984283874e-05, "loss": 1.4131, "step": 33385 }, { "epoch": 2.63, "learning_rate": 1.1300706069517873e-05, "loss": 1.4688, "step": 33386 }, { "epoch": 2.63, "learning_rate": 1.129600009644353e-05, "loss": 1.5071, "step": 33387 }, { "epoch": 2.63, "learning_rate": 1.129129506509277e-05, "loss": 1.4567, "step": 33388 }, { "epoch": 2.63, "learning_rate": 1.1286590975497583e-05, "loss": 1.3918, "step": 33389 }, { "epoch": 2.63, "learning_rate": 1.1281887827689929e-05, "loss": 1.4172, "step": 33390 }, { "epoch": 2.63, "learning_rate": 1.1277185621701695e-05, "loss": 1.4397, "step": 33391 }, { "epoch": 2.63, "learning_rate": 1.1272484357564776e-05, "loss": 1.4068, "step": 33392 }, { "epoch": 2.63, "learning_rate": 1.1267784035311178e-05, "loss": 1.3761, "step": 33393 }, { "epoch": 2.63, "learning_rate": 1.126308465497276e-05, "loss": 1.4928, "step": 33394 }, { "epoch": 2.63, "learning_rate": 1.125838621658141e-05, "loss": 1.4341, "step": 33395 }, { "epoch": 2.63, "learning_rate": 1.125368872016909e-05, "loss": 1.4345, "step": 33396 }, { "epoch": 2.63, "learning_rate": 1.124899216576764e-05, "loss": 1.4496, "step": 33397 }, { "epoch": 2.63, "learning_rate": 1.124429655340895e-05, "loss": 1.4106, "step": 33398 }, { "epoch": 2.63, "learning_rate": 1.1239601883124944e-05, "loss": 1.4463, "step": 33399 }, { "epoch": 2.63, "learning_rate": 1.1234908154947447e-05, "loss": 1.4616, "step": 33400 }, { "epoch": 2.63, "learning_rate": 1.1230215368908335e-05, "loss": 1.4866, "step": 33401 }, { "epoch": 2.63, "learning_rate": 1.1225523525039514e-05, "loss": 1.4231, "step": 33402 }, { "epoch": 2.63, "learning_rate": 1.1220832623372795e-05, "loss": 1.4536, "step": 33403 }, { "epoch": 2.63, "learning_rate": 1.1216142663940048e-05, "loss": 1.4557, "step": 33404 }, { "epoch": 2.63, "learning_rate": 1.1211453646773033e-05, "loss": 1.4729, "step": 33405 }, { "epoch": 2.63, "learning_rate": 1.1206765571903725e-05, "loss": 1.4542, "step": 33406 }, { "epoch": 2.63, "learning_rate": 1.1202078439363881e-05, "loss": 1.4813, "step": 33407 }, { "epoch": 2.63, "learning_rate": 1.1197392249185343e-05, "loss": 1.4561, "step": 33408 }, { "epoch": 2.63, "learning_rate": 1.119270700139987e-05, "loss": 1.4532, "step": 33409 }, { "epoch": 2.63, "learning_rate": 1.118802269603935e-05, "loss": 1.389, "step": 33410 }, { "epoch": 2.63, "learning_rate": 1.118333933313556e-05, "loss": 1.4577, "step": 33411 }, { "epoch": 2.63, "learning_rate": 1.1178656912720257e-05, "loss": 1.4325, "step": 33412 }, { "epoch": 2.63, "learning_rate": 1.1173975434825283e-05, "loss": 1.4351, "step": 33413 }, { "epoch": 2.63, "learning_rate": 1.1169294899482429e-05, "loss": 1.4469, "step": 33414 }, { "epoch": 2.63, "learning_rate": 1.1164615306723401e-05, "loss": 1.4283, "step": 33415 }, { "epoch": 2.63, "learning_rate": 1.1159936656580059e-05, "loss": 1.4715, "step": 33416 }, { "epoch": 2.63, "learning_rate": 1.1155258949084112e-05, "loss": 1.4389, "step": 33417 }, { "epoch": 2.63, "learning_rate": 1.1150582184267332e-05, "loss": 1.4504, "step": 33418 }, { "epoch": 2.63, "learning_rate": 1.1145906362161477e-05, "loss": 1.4698, "step": 33419 }, { "epoch": 2.63, "learning_rate": 1.1141231482798308e-05, "loss": 1.4556, "step": 33420 }, { "epoch": 2.63, "learning_rate": 1.113655754620953e-05, "loss": 1.4868, "step": 33421 }, { "epoch": 2.63, "learning_rate": 1.1131884552426884e-05, "loss": 1.4741, "step": 33422 }, { "epoch": 2.63, "learning_rate": 1.112721250148213e-05, "loss": 1.4831, "step": 33423 }, { "epoch": 2.63, "learning_rate": 1.1122541393406976e-05, "loss": 1.4501, "step": 33424 }, { "epoch": 2.63, "learning_rate": 1.1117871228233093e-05, "loss": 1.4348, "step": 33425 }, { "epoch": 2.63, "learning_rate": 1.1113202005992244e-05, "loss": 1.4791, "step": 33426 }, { "epoch": 2.63, "learning_rate": 1.1108533726716117e-05, "loss": 1.4012, "step": 33427 }, { "epoch": 2.63, "learning_rate": 1.1103866390436406e-05, "loss": 1.4088, "step": 33428 }, { "epoch": 2.63, "learning_rate": 1.1099199997184766e-05, "loss": 1.4644, "step": 33429 }, { "epoch": 2.63, "learning_rate": 1.1094534546992923e-05, "loss": 1.4243, "step": 33430 }, { "epoch": 2.63, "learning_rate": 1.1089870039892551e-05, "loss": 1.4119, "step": 33431 }, { "epoch": 2.63, "learning_rate": 1.108520647591526e-05, "loss": 1.4193, "step": 33432 }, { "epoch": 2.63, "learning_rate": 1.1080543855092789e-05, "loss": 1.4311, "step": 33433 }, { "epoch": 2.63, "learning_rate": 1.1075882177456763e-05, "loss": 1.4943, "step": 33434 }, { "epoch": 2.63, "learning_rate": 1.1071221443038808e-05, "loss": 1.4194, "step": 33435 }, { "epoch": 2.63, "learning_rate": 1.1066561651870598e-05, "loss": 1.4426, "step": 33436 }, { "epoch": 2.63, "learning_rate": 1.106190280398379e-05, "loss": 1.4016, "step": 33437 }, { "epoch": 2.63, "learning_rate": 1.1057244899409978e-05, "loss": 1.4096, "step": 33438 }, { "epoch": 2.63, "learning_rate": 1.1052587938180785e-05, "loss": 1.4339, "step": 33439 }, { "epoch": 2.63, "learning_rate": 1.1047931920327868e-05, "loss": 1.4542, "step": 33440 }, { "epoch": 2.63, "learning_rate": 1.1043276845882804e-05, "loss": 1.4467, "step": 33441 }, { "epoch": 2.63, "learning_rate": 1.1038622714877183e-05, "loss": 1.3961, "step": 33442 }, { "epoch": 2.63, "learning_rate": 1.1033969527342662e-05, "loss": 1.4596, "step": 33443 }, { "epoch": 2.63, "learning_rate": 1.1029317283310785e-05, "loss": 1.4611, "step": 33444 }, { "epoch": 2.63, "learning_rate": 1.1024665982813175e-05, "loss": 1.4615, "step": 33445 }, { "epoch": 2.63, "learning_rate": 1.102001562588134e-05, "loss": 1.4447, "step": 33446 }, { "epoch": 2.63, "learning_rate": 1.1015366212546955e-05, "loss": 1.3961, "step": 33447 }, { "epoch": 2.63, "learning_rate": 1.1010717742841512e-05, "loss": 1.4673, "step": 33448 }, { "epoch": 2.63, "learning_rate": 1.1006070216796586e-05, "loss": 1.4965, "step": 33449 }, { "epoch": 2.63, "learning_rate": 1.1001423634443751e-05, "loss": 1.4707, "step": 33450 }, { "epoch": 2.63, "learning_rate": 1.0996777995814566e-05, "loss": 1.465, "step": 33451 }, { "epoch": 2.63, "learning_rate": 1.0992133300940502e-05, "loss": 1.4571, "step": 33452 }, { "epoch": 2.63, "learning_rate": 1.0987489549853157e-05, "loss": 1.4086, "step": 33453 }, { "epoch": 2.63, "learning_rate": 1.0982846742584051e-05, "loss": 1.4663, "step": 33454 }, { "epoch": 2.63, "learning_rate": 1.0978204879164726e-05, "loss": 1.4249, "step": 33455 }, { "epoch": 2.63, "learning_rate": 1.0973563959626624e-05, "loss": 1.4147, "step": 33456 }, { "epoch": 2.63, "learning_rate": 1.0968923984001338e-05, "loss": 1.4653, "step": 33457 }, { "epoch": 2.63, "learning_rate": 1.0964284952320324e-05, "loss": 1.4452, "step": 33458 }, { "epoch": 2.63, "learning_rate": 1.0959646864615074e-05, "loss": 1.5085, "step": 33459 }, { "epoch": 2.63, "learning_rate": 1.0955009720917113e-05, "loss": 1.4832, "step": 33460 }, { "epoch": 2.63, "learning_rate": 1.0950373521257915e-05, "loss": 1.4811, "step": 33461 }, { "epoch": 2.63, "learning_rate": 1.0945738265668941e-05, "loss": 1.4636, "step": 33462 }, { "epoch": 2.63, "learning_rate": 1.094110395418163e-05, "loss": 1.4637, "step": 33463 }, { "epoch": 2.63, "learning_rate": 1.0936470586827523e-05, "loss": 1.4339, "step": 33464 }, { "epoch": 2.63, "learning_rate": 1.0931838163638029e-05, "loss": 1.5104, "step": 33465 }, { "epoch": 2.63, "learning_rate": 1.092720668464459e-05, "loss": 1.4567, "step": 33466 }, { "epoch": 2.63, "learning_rate": 1.0922576149878698e-05, "loss": 1.4559, "step": 33467 }, { "epoch": 2.63, "learning_rate": 1.0917946559371743e-05, "loss": 1.4681, "step": 33468 }, { "epoch": 2.63, "learning_rate": 1.0913317913155201e-05, "loss": 1.4625, "step": 33469 }, { "epoch": 2.63, "learning_rate": 1.0908690211260446e-05, "loss": 1.4705, "step": 33470 }, { "epoch": 2.63, "learning_rate": 1.090406345371897e-05, "loss": 1.4034, "step": 33471 }, { "epoch": 2.63, "learning_rate": 1.0899437640562114e-05, "loss": 1.4446, "step": 33472 }, { "epoch": 2.63, "learning_rate": 1.0894812771821321e-05, "loss": 1.464, "step": 33473 }, { "epoch": 2.63, "learning_rate": 1.089018884752798e-05, "loss": 1.4658, "step": 33474 }, { "epoch": 2.63, "learning_rate": 1.0885565867713503e-05, "loss": 1.4191, "step": 33475 }, { "epoch": 2.63, "learning_rate": 1.0880943832409244e-05, "loss": 1.4176, "step": 33476 }, { "epoch": 2.63, "learning_rate": 1.087632274164663e-05, "loss": 1.4719, "step": 33477 }, { "epoch": 2.63, "learning_rate": 1.0871702595457005e-05, "loss": 1.4867, "step": 33478 }, { "epoch": 2.63, "learning_rate": 1.0867083393871723e-05, "loss": 1.3905, "step": 33479 }, { "epoch": 2.63, "learning_rate": 1.0862465136922177e-05, "loss": 1.4375, "step": 33480 }, { "epoch": 2.63, "learning_rate": 1.085784782463971e-05, "loss": 1.427, "step": 33481 }, { "epoch": 2.63, "learning_rate": 1.0853231457055678e-05, "loss": 1.4633, "step": 33482 }, { "epoch": 2.63, "learning_rate": 1.0848616034201375e-05, "loss": 1.4108, "step": 33483 }, { "epoch": 2.63, "learning_rate": 1.0844001556108222e-05, "loss": 1.3903, "step": 33484 }, { "epoch": 2.63, "learning_rate": 1.08393880228075e-05, "loss": 1.4432, "step": 33485 }, { "epoch": 2.63, "learning_rate": 1.0834775434330545e-05, "loss": 1.4345, "step": 33486 }, { "epoch": 2.63, "learning_rate": 1.0830163790708635e-05, "loss": 1.4307, "step": 33487 }, { "epoch": 2.63, "learning_rate": 1.0825553091973143e-05, "loss": 1.423, "step": 33488 }, { "epoch": 2.63, "learning_rate": 1.0820943338155347e-05, "loss": 1.449, "step": 33489 }, { "epoch": 2.64, "learning_rate": 1.081633452928652e-05, "loss": 1.4319, "step": 33490 }, { "epoch": 2.64, "learning_rate": 1.0811726665397985e-05, "loss": 1.4314, "step": 33491 }, { "epoch": 2.64, "learning_rate": 1.080711974652102e-05, "loss": 1.4301, "step": 33492 }, { "epoch": 2.64, "learning_rate": 1.0802513772686866e-05, "loss": 1.4851, "step": 33493 }, { "epoch": 2.64, "learning_rate": 1.0797908743926865e-05, "loss": 1.4468, "step": 33494 }, { "epoch": 2.64, "learning_rate": 1.079330466027224e-05, "loss": 1.3995, "step": 33495 }, { "epoch": 2.64, "learning_rate": 1.0788701521754233e-05, "loss": 1.4615, "step": 33496 }, { "epoch": 2.64, "learning_rate": 1.078409932840414e-05, "loss": 1.4251, "step": 33497 }, { "epoch": 2.64, "learning_rate": 1.0779498080253196e-05, "loss": 1.4642, "step": 33498 }, { "epoch": 2.64, "learning_rate": 1.0774897777332597e-05, "loss": 1.4842, "step": 33499 }, { "epoch": 2.64, "learning_rate": 1.0770298419673618e-05, "loss": 1.4336, "step": 33500 }, { "epoch": 2.64, "learning_rate": 1.0765700007307498e-05, "loss": 1.4288, "step": 33501 }, { "epoch": 2.64, "learning_rate": 1.0761102540265449e-05, "loss": 1.3825, "step": 33502 }, { "epoch": 2.64, "learning_rate": 1.0756506018578676e-05, "loss": 1.4391, "step": 33503 }, { "epoch": 2.64, "learning_rate": 1.0751910442278338e-05, "loss": 1.4196, "step": 33504 }, { "epoch": 2.64, "learning_rate": 1.0747315811395729e-05, "loss": 1.4621, "step": 33505 }, { "epoch": 2.64, "learning_rate": 1.0742722125962005e-05, "loss": 1.4637, "step": 33506 }, { "epoch": 2.64, "learning_rate": 1.0738129386008309e-05, "loss": 1.4677, "step": 33507 }, { "epoch": 2.64, "learning_rate": 1.0733537591565899e-05, "loss": 1.3819, "step": 33508 }, { "epoch": 2.64, "learning_rate": 1.0728946742665917e-05, "loss": 1.4268, "step": 33509 }, { "epoch": 2.64, "learning_rate": 1.0724356839339504e-05, "loss": 1.4324, "step": 33510 }, { "epoch": 2.64, "learning_rate": 1.0719767881617868e-05, "loss": 1.4499, "step": 33511 }, { "epoch": 2.64, "learning_rate": 1.0715179869532153e-05, "loss": 1.4485, "step": 33512 }, { "epoch": 2.64, "learning_rate": 1.0710592803113466e-05, "loss": 1.4195, "step": 33513 }, { "epoch": 2.64, "learning_rate": 1.0706006682393014e-05, "loss": 1.4504, "step": 33514 }, { "epoch": 2.64, "learning_rate": 1.0701421507401892e-05, "loss": 1.4305, "step": 33515 }, { "epoch": 2.64, "learning_rate": 1.0696837278171271e-05, "loss": 1.4188, "step": 33516 }, { "epoch": 2.64, "learning_rate": 1.0692253994732231e-05, "loss": 1.4695, "step": 33517 }, { "epoch": 2.64, "learning_rate": 1.0687671657115926e-05, "loss": 1.4866, "step": 33518 }, { "epoch": 2.64, "learning_rate": 1.068309026535345e-05, "loss": 1.3972, "step": 33519 }, { "epoch": 2.64, "learning_rate": 1.0678509819475927e-05, "loss": 1.4301, "step": 33520 }, { "epoch": 2.64, "learning_rate": 1.06739303195144e-05, "loss": 1.4208, "step": 33521 }, { "epoch": 2.64, "learning_rate": 1.0669351765500011e-05, "loss": 1.4364, "step": 33522 }, { "epoch": 2.64, "learning_rate": 1.066477415746385e-05, "loss": 1.5127, "step": 33523 }, { "epoch": 2.64, "learning_rate": 1.0660197495436962e-05, "loss": 1.4389, "step": 33524 }, { "epoch": 2.64, "learning_rate": 1.0655621779450451e-05, "loss": 1.5089, "step": 33525 }, { "epoch": 2.64, "learning_rate": 1.0651047009535379e-05, "loss": 1.4454, "step": 33526 }, { "epoch": 2.64, "learning_rate": 1.064647318572277e-05, "loss": 1.488, "step": 33527 }, { "epoch": 2.64, "learning_rate": 1.0641900308043732e-05, "loss": 1.4406, "step": 33528 }, { "epoch": 2.64, "learning_rate": 1.0637328376529292e-05, "loss": 1.4179, "step": 33529 }, { "epoch": 2.64, "learning_rate": 1.0632757391210456e-05, "loss": 1.4248, "step": 33530 }, { "epoch": 2.64, "learning_rate": 1.0628187352118283e-05, "loss": 1.4578, "step": 33531 }, { "epoch": 2.64, "learning_rate": 1.062361825928385e-05, "loss": 1.4475, "step": 33532 }, { "epoch": 2.64, "learning_rate": 1.0619050112738115e-05, "loss": 1.4519, "step": 33533 }, { "epoch": 2.64, "learning_rate": 1.0614482912512101e-05, "loss": 1.4483, "step": 33534 }, { "epoch": 2.64, "learning_rate": 1.0609916658636835e-05, "loss": 1.4718, "step": 33535 }, { "epoch": 2.64, "learning_rate": 1.0605351351143327e-05, "loss": 1.4553, "step": 33536 }, { "epoch": 2.64, "learning_rate": 1.0600786990062531e-05, "loss": 1.4008, "step": 33537 }, { "epoch": 2.64, "learning_rate": 1.0596223575425495e-05, "loss": 1.4646, "step": 33538 }, { "epoch": 2.64, "learning_rate": 1.0591661107263173e-05, "loss": 1.4276, "step": 33539 }, { "epoch": 2.64, "learning_rate": 1.058709958560654e-05, "loss": 1.4623, "step": 33540 }, { "epoch": 2.64, "learning_rate": 1.0582539010486524e-05, "loss": 1.4115, "step": 33541 }, { "epoch": 2.64, "learning_rate": 1.0577979381934165e-05, "loss": 1.4311, "step": 33542 }, { "epoch": 2.64, "learning_rate": 1.057342069998039e-05, "loss": 1.4469, "step": 33543 }, { "epoch": 2.64, "learning_rate": 1.0568862964656122e-05, "loss": 1.4693, "step": 33544 }, { "epoch": 2.64, "learning_rate": 1.0564306175992355e-05, "loss": 1.4524, "step": 33545 }, { "epoch": 2.64, "learning_rate": 1.0559750334019979e-05, "loss": 1.4854, "step": 33546 }, { "epoch": 2.64, "learning_rate": 1.055519543876997e-05, "loss": 1.492, "step": 33547 }, { "epoch": 2.64, "learning_rate": 1.0550641490273204e-05, "loss": 1.4866, "step": 33548 }, { "epoch": 2.64, "learning_rate": 1.0546088488560672e-05, "loss": 1.465, "step": 33549 }, { "epoch": 2.64, "learning_rate": 1.0541536433663218e-05, "loss": 1.4745, "step": 33550 }, { "epoch": 2.64, "learning_rate": 1.0536985325611764e-05, "loss": 1.4601, "step": 33551 }, { "epoch": 2.64, "learning_rate": 1.0532435164437237e-05, "loss": 1.464, "step": 33552 }, { "epoch": 2.64, "learning_rate": 1.0527885950170495e-05, "loss": 1.4665, "step": 33553 }, { "epoch": 2.64, "learning_rate": 1.0523337682842432e-05, "loss": 1.4516, "step": 33554 }, { "epoch": 2.64, "learning_rate": 1.0518790362483953e-05, "loss": 1.5118, "step": 33555 }, { "epoch": 2.64, "learning_rate": 1.051424398912592e-05, "loss": 1.4266, "step": 33556 }, { "epoch": 2.64, "learning_rate": 1.0509698562799207e-05, "loss": 1.4024, "step": 33557 }, { "epoch": 2.64, "learning_rate": 1.0505154083534623e-05, "loss": 1.4867, "step": 33558 }, { "epoch": 2.64, "learning_rate": 1.0500610551363093e-05, "loss": 1.4641, "step": 33559 }, { "epoch": 2.64, "learning_rate": 1.0496067966315441e-05, "loss": 1.4289, "step": 33560 }, { "epoch": 2.64, "learning_rate": 1.0491526328422462e-05, "loss": 1.5082, "step": 33561 }, { "epoch": 2.64, "learning_rate": 1.0486985637715045e-05, "loss": 1.4627, "step": 33562 }, { "epoch": 2.64, "learning_rate": 1.0482445894224034e-05, "loss": 1.424, "step": 33563 }, { "epoch": 2.64, "learning_rate": 1.047790709798022e-05, "loss": 1.4398, "step": 33564 }, { "epoch": 2.64, "learning_rate": 1.0473369249014395e-05, "loss": 1.4279, "step": 33565 }, { "epoch": 2.64, "learning_rate": 1.046883234735742e-05, "loss": 1.4682, "step": 33566 }, { "epoch": 2.64, "learning_rate": 1.0464296393040067e-05, "loss": 1.4287, "step": 33567 }, { "epoch": 2.64, "learning_rate": 1.045976138609313e-05, "loss": 1.4679, "step": 33568 }, { "epoch": 2.64, "learning_rate": 1.0455227326547417e-05, "loss": 1.4072, "step": 33569 }, { "epoch": 2.64, "learning_rate": 1.0450694214433702e-05, "loss": 1.4368, "step": 33570 }, { "epoch": 2.64, "learning_rate": 1.0446162049782763e-05, "loss": 1.4348, "step": 33571 }, { "epoch": 2.64, "learning_rate": 1.0441630832625375e-05, "loss": 1.4418, "step": 33572 }, { "epoch": 2.64, "learning_rate": 1.0437100562992295e-05, "loss": 1.4229, "step": 33573 }, { "epoch": 2.64, "learning_rate": 1.04325712409143e-05, "loss": 1.3811, "step": 33574 }, { "epoch": 2.64, "learning_rate": 1.0428042866422098e-05, "loss": 1.428, "step": 33575 }, { "epoch": 2.64, "learning_rate": 1.0423515439546481e-05, "loss": 1.4425, "step": 33576 }, { "epoch": 2.64, "learning_rate": 1.0418988960318175e-05, "loss": 1.4638, "step": 33577 }, { "epoch": 2.64, "learning_rate": 1.0414463428767872e-05, "loss": 1.4427, "step": 33578 }, { "epoch": 2.64, "learning_rate": 1.0409938844926363e-05, "loss": 1.4013, "step": 33579 }, { "epoch": 2.64, "learning_rate": 1.0405415208824341e-05, "loss": 1.3921, "step": 33580 }, { "epoch": 2.64, "learning_rate": 1.0400892520492516e-05, "loss": 1.3948, "step": 33581 }, { "epoch": 2.64, "learning_rate": 1.039637077996156e-05, "loss": 1.3979, "step": 33582 }, { "epoch": 2.64, "learning_rate": 1.0391849987262252e-05, "loss": 1.432, "step": 33583 }, { "epoch": 2.64, "learning_rate": 1.0387330142425216e-05, "loss": 1.407, "step": 33584 }, { "epoch": 2.64, "learning_rate": 1.038281124548116e-05, "loss": 1.4175, "step": 33585 }, { "epoch": 2.64, "learning_rate": 1.0378293296460777e-05, "loss": 1.4717, "step": 33586 }, { "epoch": 2.64, "learning_rate": 1.0373776295394743e-05, "loss": 1.4757, "step": 33587 }, { "epoch": 2.64, "learning_rate": 1.0369260242313681e-05, "loss": 1.491, "step": 33588 }, { "epoch": 2.64, "learning_rate": 1.036474513724832e-05, "loss": 1.4492, "step": 33589 }, { "epoch": 2.64, "learning_rate": 1.0360230980229283e-05, "loss": 1.4816, "step": 33590 }, { "epoch": 2.64, "learning_rate": 1.0355717771287197e-05, "loss": 1.4347, "step": 33591 }, { "epoch": 2.64, "learning_rate": 1.0351205510452737e-05, "loss": 1.4259, "step": 33592 }, { "epoch": 2.64, "learning_rate": 1.0346694197756512e-05, "loss": 1.41, "step": 33593 }, { "epoch": 2.64, "learning_rate": 1.0342183833229194e-05, "loss": 1.4231, "step": 33594 }, { "epoch": 2.64, "learning_rate": 1.0337674416901348e-05, "loss": 1.449, "step": 33595 }, { "epoch": 2.64, "learning_rate": 1.0333165948803646e-05, "loss": 1.4305, "step": 33596 }, { "epoch": 2.64, "learning_rate": 1.032865842896668e-05, "loss": 1.3954, "step": 33597 }, { "epoch": 2.64, "learning_rate": 1.0324151857421042e-05, "loss": 1.5157, "step": 33598 }, { "epoch": 2.64, "learning_rate": 1.0319646234197293e-05, "loss": 1.4249, "step": 33599 }, { "epoch": 2.64, "learning_rate": 1.0315141559326107e-05, "loss": 1.4449, "step": 33600 }, { "epoch": 2.64, "learning_rate": 1.0310637832838026e-05, "loss": 1.3824, "step": 33601 }, { "epoch": 2.64, "learning_rate": 1.0306135054763592e-05, "loss": 1.432, "step": 33602 }, { "epoch": 2.64, "learning_rate": 1.0301633225133433e-05, "loss": 1.5024, "step": 33603 }, { "epoch": 2.64, "learning_rate": 1.0297132343978104e-05, "loss": 1.4718, "step": 33604 }, { "epoch": 2.64, "learning_rate": 1.0292632411328133e-05, "loss": 1.429, "step": 33605 }, { "epoch": 2.64, "learning_rate": 1.0288133427214095e-05, "loss": 1.4443, "step": 33606 }, { "epoch": 2.64, "learning_rate": 1.028363539166655e-05, "loss": 1.445, "step": 33607 }, { "epoch": 2.64, "learning_rate": 1.027913830471599e-05, "loss": 1.524, "step": 33608 }, { "epoch": 2.64, "learning_rate": 1.0274642166392971e-05, "loss": 1.466, "step": 33609 }, { "epoch": 2.64, "learning_rate": 1.0270146976728055e-05, "loss": 1.4743, "step": 33610 }, { "epoch": 2.64, "learning_rate": 1.0265652735751716e-05, "loss": 1.4548, "step": 33611 }, { "epoch": 2.64, "learning_rate": 1.0261159443494481e-05, "loss": 1.4593, "step": 33612 }, { "epoch": 2.64, "learning_rate": 1.0256667099986875e-05, "loss": 1.4365, "step": 33613 }, { "epoch": 2.64, "learning_rate": 1.0252175705259374e-05, "loss": 1.4388, "step": 33614 }, { "epoch": 2.64, "learning_rate": 1.0247685259342487e-05, "loss": 1.4542, "step": 33615 }, { "epoch": 2.64, "learning_rate": 1.024319576226667e-05, "loss": 1.4485, "step": 33616 }, { "epoch": 2.65, "learning_rate": 1.023870721406247e-05, "loss": 1.4816, "step": 33617 }, { "epoch": 2.65, "learning_rate": 1.0234219614760309e-05, "loss": 1.4611, "step": 33618 }, { "epoch": 2.65, "learning_rate": 1.022973296439063e-05, "loss": 1.4611, "step": 33619 }, { "epoch": 2.65, "learning_rate": 1.0225247262983976e-05, "loss": 1.4654, "step": 33620 }, { "epoch": 2.65, "learning_rate": 1.0220762510570757e-05, "loss": 1.4461, "step": 33621 }, { "epoch": 2.65, "learning_rate": 1.021627870718138e-05, "loss": 1.4513, "step": 33622 }, { "epoch": 2.65, "learning_rate": 1.0211795852846372e-05, "loss": 1.4302, "step": 33623 }, { "epoch": 2.65, "learning_rate": 1.0207313947596124e-05, "loss": 1.4215, "step": 33624 }, { "epoch": 2.65, "learning_rate": 1.0202832991461063e-05, "loss": 1.4597, "step": 33625 }, { "epoch": 2.65, "learning_rate": 1.0198352984471598e-05, "loss": 1.4592, "step": 33626 }, { "epoch": 2.65, "learning_rate": 1.0193873926658202e-05, "loss": 1.4619, "step": 33627 }, { "epoch": 2.65, "learning_rate": 1.0189395818051255e-05, "loss": 1.4387, "step": 33628 }, { "epoch": 2.65, "learning_rate": 1.0184918658681113e-05, "loss": 1.4306, "step": 33629 }, { "epoch": 2.65, "learning_rate": 1.0180442448578252e-05, "loss": 1.4014, "step": 33630 }, { "epoch": 2.65, "learning_rate": 1.0175967187773032e-05, "loss": 1.4816, "step": 33631 }, { "epoch": 2.65, "learning_rate": 1.0171492876295812e-05, "loss": 1.3753, "step": 33632 }, { "epoch": 2.65, "learning_rate": 1.0167019514177e-05, "loss": 1.3818, "step": 33633 }, { "epoch": 2.65, "learning_rate": 1.0162547101446971e-05, "loss": 1.4623, "step": 33634 }, { "epoch": 2.65, "learning_rate": 1.0158075638136088e-05, "loss": 1.4311, "step": 33635 }, { "epoch": 2.65, "learning_rate": 1.0153605124274656e-05, "loss": 1.4541, "step": 33636 }, { "epoch": 2.65, "learning_rate": 1.0149135559893118e-05, "loss": 1.443, "step": 33637 }, { "epoch": 2.65, "learning_rate": 1.014466694502175e-05, "loss": 1.4283, "step": 33638 }, { "epoch": 2.65, "learning_rate": 1.0140199279690896e-05, "loss": 1.4563, "step": 33639 }, { "epoch": 2.65, "learning_rate": 1.0135732563930948e-05, "loss": 1.4468, "step": 33640 }, { "epoch": 2.65, "learning_rate": 1.0131266797772148e-05, "loss": 1.4313, "step": 33641 }, { "epoch": 2.65, "learning_rate": 1.0126801981244903e-05, "loss": 1.4527, "step": 33642 }, { "epoch": 2.65, "learning_rate": 1.0122338114379442e-05, "loss": 1.4695, "step": 33643 }, { "epoch": 2.65, "learning_rate": 1.0117875197206155e-05, "loss": 1.405, "step": 33644 }, { "epoch": 2.65, "learning_rate": 1.0113413229755286e-05, "loss": 1.4257, "step": 33645 }, { "epoch": 2.65, "learning_rate": 1.0108952212057143e-05, "loss": 1.4727, "step": 33646 }, { "epoch": 2.65, "learning_rate": 1.0104492144142018e-05, "loss": 1.422, "step": 33647 }, { "epoch": 2.65, "learning_rate": 1.0100033026040205e-05, "loss": 1.4362, "step": 33648 }, { "epoch": 2.65, "learning_rate": 1.009557485778193e-05, "loss": 1.4615, "step": 33649 }, { "epoch": 2.65, "learning_rate": 1.0091117639397534e-05, "loss": 1.4371, "step": 33650 }, { "epoch": 2.65, "learning_rate": 1.0086661370917226e-05, "loss": 1.4188, "step": 33651 }, { "epoch": 2.65, "learning_rate": 1.0082206052371283e-05, "loss": 1.4549, "step": 33652 }, { "epoch": 2.65, "learning_rate": 1.0077751683789932e-05, "loss": 1.4619, "step": 33653 }, { "epoch": 2.65, "learning_rate": 1.0073298265203444e-05, "loss": 1.4561, "step": 33654 }, { "epoch": 2.65, "learning_rate": 1.006884579664205e-05, "loss": 1.4959, "step": 33655 }, { "epoch": 2.65, "learning_rate": 1.006439427813594e-05, "loss": 1.4351, "step": 33656 }, { "epoch": 2.65, "learning_rate": 1.0059943709715374e-05, "loss": 1.5092, "step": 33657 }, { "epoch": 2.65, "learning_rate": 1.0055494091410594e-05, "loss": 1.4173, "step": 33658 }, { "epoch": 2.65, "learning_rate": 1.0051045423251775e-05, "loss": 1.4087, "step": 33659 }, { "epoch": 2.65, "learning_rate": 1.004659770526911e-05, "loss": 1.4216, "step": 33660 }, { "epoch": 2.65, "learning_rate": 1.0042150937492827e-05, "loss": 1.4428, "step": 33661 }, { "epoch": 2.65, "learning_rate": 1.0037705119953115e-05, "loss": 1.4352, "step": 33662 }, { "epoch": 2.65, "learning_rate": 1.003326025268012e-05, "loss": 1.4552, "step": 33663 }, { "epoch": 2.65, "learning_rate": 1.0028816335704065e-05, "loss": 1.414, "step": 33664 }, { "epoch": 2.65, "learning_rate": 1.0024373369055111e-05, "loss": 1.4497, "step": 33665 }, { "epoch": 2.65, "learning_rate": 1.00199313527634e-05, "loss": 1.4273, "step": 33666 }, { "epoch": 2.65, "learning_rate": 1.0015490286859124e-05, "loss": 1.4574, "step": 33667 }, { "epoch": 2.65, "learning_rate": 1.0011050171372409e-05, "loss": 1.4508, "step": 33668 }, { "epoch": 2.65, "learning_rate": 1.0006611006333432e-05, "loss": 1.431, "step": 33669 }, { "epoch": 2.65, "learning_rate": 1.0002172791772268e-05, "loss": 1.4342, "step": 33670 }, { "epoch": 2.65, "learning_rate": 9.997735527719126e-06, "loss": 1.4086, "step": 33671 }, { "epoch": 2.65, "learning_rate": 9.993299214204082e-06, "loss": 1.4174, "step": 33672 }, { "epoch": 2.65, "learning_rate": 9.988863851257294e-06, "loss": 1.4552, "step": 33673 }, { "epoch": 2.65, "learning_rate": 9.984429438908826e-06, "loss": 1.4408, "step": 33674 }, { "epoch": 2.65, "learning_rate": 9.979995977188849e-06, "loss": 1.4944, "step": 33675 }, { "epoch": 2.65, "learning_rate": 9.975563466127423e-06, "loss": 1.4423, "step": 33676 }, { "epoch": 2.65, "learning_rate": 9.971131905754626e-06, "loss": 1.5106, "step": 33677 }, { "epoch": 2.65, "learning_rate": 9.966701296100599e-06, "loss": 1.471, "step": 33678 }, { "epoch": 2.65, "learning_rate": 9.962271637195385e-06, "loss": 1.4213, "step": 33679 }, { "epoch": 2.65, "learning_rate": 9.957842929069043e-06, "loss": 1.4162, "step": 33680 }, { "epoch": 2.65, "learning_rate": 9.9534151717517e-06, "loss": 1.4055, "step": 33681 }, { "epoch": 2.65, "learning_rate": 9.94898836527338e-06, "loss": 1.4425, "step": 33682 }, { "epoch": 2.65, "learning_rate": 9.944562509664111e-06, "loss": 1.4619, "step": 33683 }, { "epoch": 2.65, "learning_rate": 9.940137604954002e-06, "loss": 1.4498, "step": 33684 }, { "epoch": 2.65, "learning_rate": 9.935713651173078e-06, "loss": 1.4245, "step": 33685 }, { "epoch": 2.65, "learning_rate": 9.931290648351348e-06, "loss": 1.5091, "step": 33686 }, { "epoch": 2.65, "learning_rate": 9.926868596518839e-06, "loss": 1.4291, "step": 33687 }, { "epoch": 2.65, "learning_rate": 9.922447495705594e-06, "loss": 1.4503, "step": 33688 }, { "epoch": 2.65, "learning_rate": 9.918027345941653e-06, "loss": 1.4272, "step": 33689 }, { "epoch": 2.65, "learning_rate": 9.913608147256979e-06, "loss": 1.395, "step": 33690 }, { "epoch": 2.65, "learning_rate": 9.90918989968163e-06, "loss": 1.5035, "step": 33691 }, { "epoch": 2.65, "learning_rate": 9.904772603245564e-06, "loss": 1.4007, "step": 33692 }, { "epoch": 2.65, "learning_rate": 9.900356257978792e-06, "loss": 1.4856, "step": 33693 }, { "epoch": 2.65, "learning_rate": 9.895940863911255e-06, "loss": 1.4612, "step": 33694 }, { "epoch": 2.65, "learning_rate": 9.891526421072981e-06, "loss": 1.3875, "step": 33695 }, { "epoch": 2.65, "learning_rate": 9.887112929493946e-06, "loss": 1.386, "step": 33696 }, { "epoch": 2.65, "learning_rate": 9.882700389204056e-06, "loss": 1.4442, "step": 33697 }, { "epoch": 2.65, "learning_rate": 9.878288800233325e-06, "loss": 1.437, "step": 33698 }, { "epoch": 2.65, "learning_rate": 9.873878162611693e-06, "loss": 1.4654, "step": 33699 }, { "epoch": 2.65, "learning_rate": 9.869468476369085e-06, "loss": 1.4257, "step": 33700 }, { "epoch": 2.65, "learning_rate": 9.865059741535464e-06, "loss": 1.4343, "step": 33701 }, { "epoch": 2.65, "learning_rate": 9.860651958140769e-06, "loss": 1.4852, "step": 33702 }, { "epoch": 2.65, "learning_rate": 9.856245126214879e-06, "loss": 1.4205, "step": 33703 }, { "epoch": 2.65, "learning_rate": 9.851839245787751e-06, "loss": 1.4131, "step": 33704 }, { "epoch": 2.65, "learning_rate": 9.847434316889313e-06, "loss": 1.4988, "step": 33705 }, { "epoch": 2.65, "learning_rate": 9.843030339549456e-06, "loss": 1.4458, "step": 33706 }, { "epoch": 2.65, "learning_rate": 9.838627313798058e-06, "loss": 1.4508, "step": 33707 }, { "epoch": 2.65, "learning_rate": 9.834225239665045e-06, "loss": 1.4675, "step": 33708 }, { "epoch": 2.65, "learning_rate": 9.829824117180308e-06, "loss": 1.4509, "step": 33709 }, { "epoch": 2.65, "learning_rate": 9.825423946373707e-06, "loss": 1.4439, "step": 33710 }, { "epoch": 2.65, "learning_rate": 9.821024727275101e-06, "loss": 1.4086, "step": 33711 }, { "epoch": 2.65, "learning_rate": 9.8166264599144e-06, "loss": 1.453, "step": 33712 }, { "epoch": 2.65, "learning_rate": 9.812229144321448e-06, "loss": 1.4333, "step": 33713 }, { "epoch": 2.65, "learning_rate": 9.80783278052607e-06, "loss": 1.4513, "step": 33714 }, { "epoch": 2.65, "learning_rate": 9.803437368558175e-06, "loss": 1.4936, "step": 33715 }, { "epoch": 2.65, "learning_rate": 9.799042908447558e-06, "loss": 1.4592, "step": 33716 }, { "epoch": 2.65, "learning_rate": 9.794649400224059e-06, "loss": 1.3954, "step": 33717 }, { "epoch": 2.65, "learning_rate": 9.790256843917538e-06, "loss": 1.4496, "step": 33718 }, { "epoch": 2.65, "learning_rate": 9.785865239557789e-06, "loss": 1.4831, "step": 33719 }, { "epoch": 2.65, "learning_rate": 9.781474587174654e-06, "loss": 1.3866, "step": 33720 }, { "epoch": 2.65, "learning_rate": 9.777084886797893e-06, "loss": 1.4452, "step": 33721 }, { "epoch": 2.65, "learning_rate": 9.77269613845738e-06, "loss": 1.4379, "step": 33722 }, { "epoch": 2.65, "learning_rate": 9.768308342182862e-06, "loss": 1.4566, "step": 33723 }, { "epoch": 2.65, "learning_rate": 9.763921498004145e-06, "loss": 1.4048, "step": 33724 }, { "epoch": 2.65, "learning_rate": 9.759535605951007e-06, "loss": 1.3951, "step": 33725 }, { "epoch": 2.65, "learning_rate": 9.755150666053258e-06, "loss": 1.4755, "step": 33726 }, { "epoch": 2.65, "learning_rate": 9.750766678340622e-06, "loss": 1.4148, "step": 33727 }, { "epoch": 2.65, "learning_rate": 9.746383642842876e-06, "loss": 1.5063, "step": 33728 }, { "epoch": 2.65, "learning_rate": 9.742001559589796e-06, "loss": 1.4342, "step": 33729 }, { "epoch": 2.65, "learning_rate": 9.737620428611142e-06, "loss": 1.4151, "step": 33730 }, { "epoch": 2.65, "learning_rate": 9.733240249936608e-06, "loss": 1.4308, "step": 33731 }, { "epoch": 2.65, "learning_rate": 9.728861023595986e-06, "loss": 1.4875, "step": 33732 }, { "epoch": 2.65, "learning_rate": 9.724482749619e-06, "loss": 1.4187, "step": 33733 }, { "epoch": 2.65, "learning_rate": 9.720105428035329e-06, "loss": 1.4724, "step": 33734 }, { "epoch": 2.65, "learning_rate": 9.715729058874733e-06, "loss": 1.4353, "step": 33735 }, { "epoch": 2.65, "learning_rate": 9.711353642166953e-06, "loss": 1.3895, "step": 33736 }, { "epoch": 2.65, "learning_rate": 9.706979177941666e-06, "loss": 1.4741, "step": 33737 }, { "epoch": 2.65, "learning_rate": 9.702605666228547e-06, "loss": 1.4158, "step": 33738 }, { "epoch": 2.65, "learning_rate": 9.698233107057324e-06, "loss": 1.4074, "step": 33739 }, { "epoch": 2.65, "learning_rate": 9.693861500457672e-06, "loss": 1.4527, "step": 33740 }, { "epoch": 2.65, "learning_rate": 9.689490846459269e-06, "loss": 1.4534, "step": 33741 }, { "epoch": 2.65, "learning_rate": 9.685121145091806e-06, "loss": 1.3879, "step": 33742 }, { "epoch": 2.65, "learning_rate": 9.680752396384928e-06, "loss": 1.4525, "step": 33743 }, { "epoch": 2.66, "learning_rate": 9.676384600368292e-06, "loss": 1.4243, "step": 33744 }, { "epoch": 2.66, "learning_rate": 9.672017757071594e-06, "loss": 1.5051, "step": 33745 }, { "epoch": 2.66, "learning_rate": 9.667651866524456e-06, "loss": 1.4702, "step": 33746 }, { "epoch": 2.66, "learning_rate": 9.663286928756525e-06, "loss": 1.4815, "step": 33747 }, { "epoch": 2.66, "learning_rate": 9.658922943797393e-06, "loss": 1.4576, "step": 33748 }, { "epoch": 2.66, "learning_rate": 9.654559911676767e-06, "loss": 1.4475, "step": 33749 }, { "epoch": 2.66, "learning_rate": 9.650197832424212e-06, "loss": 1.4056, "step": 33750 }, { "epoch": 2.66, "learning_rate": 9.645836706069348e-06, "loss": 1.5023, "step": 33751 }, { "epoch": 2.66, "learning_rate": 9.641476532641807e-06, "loss": 1.4431, "step": 33752 }, { "epoch": 2.66, "learning_rate": 9.637117312171194e-06, "loss": 1.4612, "step": 33753 }, { "epoch": 2.66, "learning_rate": 9.632759044687105e-06, "loss": 1.4564, "step": 33754 }, { "epoch": 2.66, "learning_rate": 9.628401730219098e-06, "loss": 1.4569, "step": 33755 }, { "epoch": 2.66, "learning_rate": 9.624045368796801e-06, "loss": 1.481, "step": 33756 }, { "epoch": 2.66, "learning_rate": 9.619689960449772e-06, "loss": 1.4449, "step": 33757 }, { "epoch": 2.66, "learning_rate": 9.615335505207555e-06, "loss": 1.4601, "step": 33758 }, { "epoch": 2.66, "learning_rate": 9.61098200309976e-06, "loss": 1.4478, "step": 33759 }, { "epoch": 2.66, "learning_rate": 9.606629454155929e-06, "loss": 1.4466, "step": 33760 }, { "epoch": 2.66, "learning_rate": 9.60227785840557e-06, "loss": 1.4381, "step": 33761 }, { "epoch": 2.66, "learning_rate": 9.597927215878316e-06, "loss": 1.4527, "step": 33762 }, { "epoch": 2.66, "learning_rate": 9.593577526603635e-06, "loss": 1.4527, "step": 33763 }, { "epoch": 2.66, "learning_rate": 9.589228790611093e-06, "loss": 1.4979, "step": 33764 }, { "epoch": 2.66, "learning_rate": 9.584881007930161e-06, "loss": 1.4267, "step": 33765 }, { "epoch": 2.66, "learning_rate": 9.580534178590421e-06, "loss": 1.4654, "step": 33766 }, { "epoch": 2.66, "learning_rate": 9.57618830262138e-06, "loss": 1.4308, "step": 33767 }, { "epoch": 2.66, "learning_rate": 9.571843380052512e-06, "loss": 1.3759, "step": 33768 }, { "epoch": 2.66, "learning_rate": 9.567499410913332e-06, "loss": 1.4309, "step": 33769 }, { "epoch": 2.66, "learning_rate": 9.563156395233345e-06, "loss": 1.4499, "step": 33770 }, { "epoch": 2.66, "learning_rate": 9.55881433304203e-06, "loss": 1.4162, "step": 33771 }, { "epoch": 2.66, "learning_rate": 9.554473224368847e-06, "loss": 1.4829, "step": 33772 }, { "epoch": 2.66, "learning_rate": 9.550133069243304e-06, "loss": 1.3951, "step": 33773 }, { "epoch": 2.66, "learning_rate": 9.545793867694846e-06, "loss": 1.4609, "step": 33774 }, { "epoch": 2.66, "learning_rate": 9.541455619752913e-06, "loss": 1.4153, "step": 33775 }, { "epoch": 2.66, "learning_rate": 9.537118325447019e-06, "loss": 1.4231, "step": 33776 }, { "epoch": 2.66, "learning_rate": 9.53278198480657e-06, "loss": 1.44, "step": 33777 }, { "epoch": 2.66, "learning_rate": 9.528446597860995e-06, "loss": 1.4643, "step": 33778 }, { "epoch": 2.66, "learning_rate": 9.52411216463977e-06, "loss": 1.4447, "step": 33779 }, { "epoch": 2.66, "learning_rate": 9.519778685172303e-06, "loss": 1.4666, "step": 33780 }, { "epoch": 2.66, "learning_rate": 9.515446159488021e-06, "loss": 1.4658, "step": 33781 }, { "epoch": 2.66, "learning_rate": 9.511114587616286e-06, "loss": 1.478, "step": 33782 }, { "epoch": 2.66, "learning_rate": 9.506783969586606e-06, "loss": 1.4174, "step": 33783 }, { "epoch": 2.66, "learning_rate": 9.502454305428326e-06, "loss": 1.4543, "step": 33784 }, { "epoch": 2.66, "learning_rate": 9.498125595170836e-06, "loss": 1.4167, "step": 33785 }, { "epoch": 2.66, "learning_rate": 9.493797838843532e-06, "loss": 1.4736, "step": 33786 }, { "epoch": 2.66, "learning_rate": 9.48947103647582e-06, "loss": 1.4722, "step": 33787 }, { "epoch": 2.66, "learning_rate": 9.485145188097066e-06, "loss": 1.4287, "step": 33788 }, { "epoch": 2.66, "learning_rate": 9.480820293736591e-06, "loss": 1.4866, "step": 33789 }, { "epoch": 2.66, "learning_rate": 9.47649635342384e-06, "loss": 1.4637, "step": 33790 }, { "epoch": 2.66, "learning_rate": 9.472173367188124e-06, "loss": 1.4414, "step": 33791 }, { "epoch": 2.66, "learning_rate": 9.467851335058786e-06, "loss": 1.4718, "step": 33792 }, { "epoch": 2.66, "learning_rate": 9.463530257065217e-06, "loss": 1.4093, "step": 33793 }, { "epoch": 2.66, "learning_rate": 9.45921013323671e-06, "loss": 1.4375, "step": 33794 }, { "epoch": 2.66, "learning_rate": 9.45489096360258e-06, "loss": 1.4476, "step": 33795 }, { "epoch": 2.66, "learning_rate": 9.450572748192214e-06, "loss": 1.4182, "step": 33796 }, { "epoch": 2.66, "learning_rate": 9.446255487034893e-06, "loss": 1.462, "step": 33797 }, { "epoch": 2.66, "learning_rate": 9.441939180159924e-06, "loss": 1.4321, "step": 33798 }, { "epoch": 2.66, "learning_rate": 9.437623827596603e-06, "loss": 1.4217, "step": 33799 }, { "epoch": 2.66, "learning_rate": 9.433309429374285e-06, "loss": 1.404, "step": 33800 }, { "epoch": 2.66, "learning_rate": 9.42899598552222e-06, "loss": 1.4053, "step": 33801 }, { "epoch": 2.66, "learning_rate": 9.424683496069663e-06, "loss": 1.4788, "step": 33802 }, { "epoch": 2.66, "learning_rate": 9.420371961045958e-06, "loss": 1.4719, "step": 33803 }, { "epoch": 2.66, "learning_rate": 9.416061380480367e-06, "loss": 1.484, "step": 33804 }, { "epoch": 2.66, "learning_rate": 9.411751754402113e-06, "loss": 1.42, "step": 33805 }, { "epoch": 2.66, "learning_rate": 9.407443082840476e-06, "loss": 1.4395, "step": 33806 }, { "epoch": 2.66, "learning_rate": 9.403135365824732e-06, "loss": 1.489, "step": 33807 }, { "epoch": 2.66, "learning_rate": 9.398828603384124e-06, "loss": 1.4397, "step": 33808 }, { "epoch": 2.66, "learning_rate": 9.394522795547843e-06, "loss": 1.4603, "step": 33809 }, { "epoch": 2.66, "learning_rate": 9.390217942345186e-06, "loss": 1.4674, "step": 33810 }, { "epoch": 2.66, "learning_rate": 9.385914043805343e-06, "loss": 1.4888, "step": 33811 }, { "epoch": 2.66, "learning_rate": 9.381611099957542e-06, "loss": 1.4268, "step": 33812 }, { "epoch": 2.66, "learning_rate": 9.377309110830994e-06, "loss": 1.4264, "step": 33813 }, { "epoch": 2.66, "learning_rate": 9.373008076454924e-06, "loss": 1.4241, "step": 33814 }, { "epoch": 2.66, "learning_rate": 9.368707996858544e-06, "loss": 1.4122, "step": 33815 }, { "epoch": 2.66, "learning_rate": 9.36440887207101e-06, "loss": 1.4681, "step": 33816 }, { "epoch": 2.66, "learning_rate": 9.360110702121537e-06, "loss": 1.4156, "step": 33817 }, { "epoch": 2.66, "learning_rate": 9.355813487039315e-06, "loss": 1.4777, "step": 33818 }, { "epoch": 2.66, "learning_rate": 9.351517226853472e-06, "loss": 1.4331, "step": 33819 }, { "epoch": 2.66, "learning_rate": 9.347221921593234e-06, "loss": 1.4742, "step": 33820 }, { "epoch": 2.66, "learning_rate": 9.342927571287745e-06, "loss": 1.4545, "step": 33821 }, { "epoch": 2.66, "learning_rate": 9.338634175966164e-06, "loss": 1.4852, "step": 33822 }, { "epoch": 2.66, "learning_rate": 9.334341735657602e-06, "loss": 1.4178, "step": 33823 }, { "epoch": 2.66, "learning_rate": 9.330050250391253e-06, "loss": 1.4627, "step": 33824 }, { "epoch": 2.66, "learning_rate": 9.32575972019624e-06, "loss": 1.4899, "step": 33825 }, { "epoch": 2.66, "learning_rate": 9.321470145101662e-06, "loss": 1.4348, "step": 33826 }, { "epoch": 2.66, "learning_rate": 9.317181525136691e-06, "loss": 1.4141, "step": 33827 }, { "epoch": 2.66, "learning_rate": 9.312893860330439e-06, "loss": 1.4098, "step": 33828 }, { "epoch": 2.66, "learning_rate": 9.308607150711949e-06, "loss": 1.429, "step": 33829 }, { "epoch": 2.66, "learning_rate": 9.3043213963104e-06, "loss": 1.5152, "step": 33830 }, { "epoch": 2.66, "learning_rate": 9.300036597154881e-06, "loss": 1.4673, "step": 33831 }, { "epoch": 2.66, "learning_rate": 9.295752753274471e-06, "loss": 1.4765, "step": 33832 }, { "epoch": 2.66, "learning_rate": 9.29146986469823e-06, "loss": 1.4199, "step": 33833 }, { "epoch": 2.66, "learning_rate": 9.28718793145527e-06, "loss": 1.4456, "step": 33834 }, { "epoch": 2.66, "learning_rate": 9.282906953574664e-06, "loss": 1.4503, "step": 33835 }, { "epoch": 2.66, "learning_rate": 9.278626931085442e-06, "loss": 1.4645, "step": 33836 }, { "epoch": 2.66, "learning_rate": 9.274347864016712e-06, "loss": 1.4515, "step": 33837 }, { "epoch": 2.66, "learning_rate": 9.270069752397485e-06, "loss": 1.4252, "step": 33838 }, { "epoch": 2.66, "learning_rate": 9.265792596256837e-06, "loss": 1.4553, "step": 33839 }, { "epoch": 2.66, "learning_rate": 9.26151639562378e-06, "loss": 1.4359, "step": 33840 }, { "epoch": 2.66, "learning_rate": 9.257241150527373e-06, "loss": 1.4232, "step": 33841 }, { "epoch": 2.66, "learning_rate": 9.252966860996624e-06, "loss": 1.4105, "step": 33842 }, { "epoch": 2.66, "learning_rate": 9.248693527060547e-06, "loss": 1.4562, "step": 33843 }, { "epoch": 2.66, "learning_rate": 9.244421148748183e-06, "loss": 1.4306, "step": 33844 }, { "epoch": 2.66, "learning_rate": 9.240149726088508e-06, "loss": 1.4233, "step": 33845 }, { "epoch": 2.66, "learning_rate": 9.235879259110552e-06, "loss": 1.4777, "step": 33846 }, { "epoch": 2.66, "learning_rate": 9.231609747843288e-06, "loss": 1.4163, "step": 33847 }, { "epoch": 2.66, "learning_rate": 9.22734119231573e-06, "loss": 1.4229, "step": 33848 }, { "epoch": 2.66, "learning_rate": 9.223073592556834e-06, "loss": 1.4495, "step": 33849 }, { "epoch": 2.66, "learning_rate": 9.218806948595547e-06, "loss": 1.4392, "step": 33850 }, { "epoch": 2.66, "learning_rate": 9.214541260460912e-06, "loss": 1.4415, "step": 33851 }, { "epoch": 2.66, "learning_rate": 9.210276528181853e-06, "loss": 1.4725, "step": 33852 }, { "epoch": 2.66, "learning_rate": 9.206012751787285e-06, "loss": 1.4268, "step": 33853 }, { "epoch": 2.66, "learning_rate": 9.20174993130623e-06, "loss": 1.4577, "step": 33854 }, { "epoch": 2.66, "learning_rate": 9.197488066767584e-06, "loss": 1.4406, "step": 33855 }, { "epoch": 2.66, "learning_rate": 9.193227158200273e-06, "loss": 1.4876, "step": 33856 }, { "epoch": 2.66, "learning_rate": 9.188967205633275e-06, "loss": 1.4151, "step": 33857 }, { "epoch": 2.66, "learning_rate": 9.184708209095466e-06, "loss": 1.4271, "step": 33858 }, { "epoch": 2.66, "learning_rate": 9.180450168615806e-06, "loss": 1.4117, "step": 33859 }, { "epoch": 2.66, "learning_rate": 9.176193084223138e-06, "loss": 1.4436, "step": 33860 }, { "epoch": 2.66, "learning_rate": 9.171936955946407e-06, "loss": 1.4773, "step": 33861 }, { "epoch": 2.66, "learning_rate": 9.167681783814523e-06, "loss": 1.434, "step": 33862 }, { "epoch": 2.66, "learning_rate": 9.16342756785638e-06, "loss": 1.466, "step": 33863 }, { "epoch": 2.66, "learning_rate": 9.159174308100819e-06, "loss": 1.4038, "step": 33864 }, { "epoch": 2.66, "learning_rate": 9.154922004576754e-06, "loss": 1.4842, "step": 33865 }, { "epoch": 2.66, "learning_rate": 9.150670657313058e-06, "loss": 1.3945, "step": 33866 }, { "epoch": 2.66, "learning_rate": 9.146420266338544e-06, "loss": 1.3676, "step": 33867 }, { "epoch": 2.66, "learning_rate": 9.142170831682139e-06, "loss": 1.454, "step": 33868 }, { "epoch": 2.66, "learning_rate": 9.137922353372652e-06, "loss": 1.4671, "step": 33869 }, { "epoch": 2.66, "learning_rate": 9.133674831438926e-06, "loss": 1.4094, "step": 33870 }, { "epoch": 2.67, "learning_rate": 9.129428265909838e-06, "loss": 1.5145, "step": 33871 }, { "epoch": 2.67, "learning_rate": 9.125182656814183e-06, "loss": 1.4715, "step": 33872 }, { "epoch": 2.67, "learning_rate": 9.120938004180772e-06, "loss": 1.4295, "step": 33873 }, { "epoch": 2.67, "learning_rate": 9.11669430803848e-06, "loss": 1.4895, "step": 33874 }, { "epoch": 2.67, "learning_rate": 9.112451568416085e-06, "loss": 1.4451, "step": 33875 }, { "epoch": 2.67, "learning_rate": 9.108209785342379e-06, "loss": 1.451, "step": 33876 }, { "epoch": 2.67, "learning_rate": 9.103968958846159e-06, "loss": 1.4425, "step": 33877 }, { "epoch": 2.67, "learning_rate": 9.09972908895628e-06, "loss": 1.465, "step": 33878 }, { "epoch": 2.67, "learning_rate": 9.095490175701475e-06, "loss": 1.382, "step": 33879 }, { "epoch": 2.67, "learning_rate": 9.091252219110535e-06, "loss": 1.5583, "step": 33880 }, { "epoch": 2.67, "learning_rate": 9.087015219212219e-06, "loss": 1.4632, "step": 33881 }, { "epoch": 2.67, "learning_rate": 9.08277917603532e-06, "loss": 1.4267, "step": 33882 }, { "epoch": 2.67, "learning_rate": 9.078544089608586e-06, "loss": 1.41, "step": 33883 }, { "epoch": 2.67, "learning_rate": 9.07430995996074e-06, "loss": 1.4478, "step": 33884 }, { "epoch": 2.67, "learning_rate": 9.070076787120595e-06, "loss": 1.4152, "step": 33885 }, { "epoch": 2.67, "learning_rate": 9.06584457111686e-06, "loss": 1.4351, "step": 33886 }, { "epoch": 2.67, "learning_rate": 9.061613311978244e-06, "loss": 1.4724, "step": 33887 }, { "epoch": 2.67, "learning_rate": 9.05738300973351e-06, "loss": 1.4401, "step": 33888 }, { "epoch": 2.67, "learning_rate": 9.053153664411366e-06, "loss": 1.454, "step": 33889 }, { "epoch": 2.67, "learning_rate": 9.048925276040508e-06, "loss": 1.4533, "step": 33890 }, { "epoch": 2.67, "learning_rate": 9.044697844649695e-06, "loss": 1.4112, "step": 33891 }, { "epoch": 2.67, "learning_rate": 9.040471370267571e-06, "loss": 1.429, "step": 33892 }, { "epoch": 2.67, "learning_rate": 9.03624585292288e-06, "loss": 1.4109, "step": 33893 }, { "epoch": 2.67, "learning_rate": 9.032021292644264e-06, "loss": 1.4272, "step": 33894 }, { "epoch": 2.67, "learning_rate": 9.027797689460454e-06, "loss": 1.4659, "step": 33895 }, { "epoch": 2.67, "learning_rate": 9.023575043400106e-06, "loss": 1.4599, "step": 33896 }, { "epoch": 2.67, "learning_rate": 9.019353354491881e-06, "loss": 1.4585, "step": 33897 }, { "epoch": 2.67, "learning_rate": 9.015132622764442e-06, "loss": 1.4837, "step": 33898 }, { "epoch": 2.67, "learning_rate": 9.010912848246449e-06, "loss": 1.4603, "step": 33899 }, { "epoch": 2.67, "learning_rate": 9.006694030966577e-06, "loss": 1.4824, "step": 33900 }, { "epoch": 2.67, "learning_rate": 9.002476170953404e-06, "loss": 1.4825, "step": 33901 }, { "epoch": 2.67, "learning_rate": 8.998259268235642e-06, "loss": 1.48, "step": 33902 }, { "epoch": 2.67, "learning_rate": 8.994043322841881e-06, "loss": 1.4388, "step": 33903 }, { "epoch": 2.67, "learning_rate": 8.989828334800736e-06, "loss": 1.4765, "step": 33904 }, { "epoch": 2.67, "learning_rate": 8.985614304140865e-06, "loss": 1.4564, "step": 33905 }, { "epoch": 2.67, "learning_rate": 8.981401230890844e-06, "loss": 1.4368, "step": 33906 }, { "epoch": 2.67, "learning_rate": 8.97718911507927e-06, "loss": 1.4014, "step": 33907 }, { "epoch": 2.67, "learning_rate": 8.972977956734767e-06, "loss": 1.4088, "step": 33908 }, { "epoch": 2.67, "learning_rate": 8.96876775588593e-06, "loss": 1.4411, "step": 33909 }, { "epoch": 2.67, "learning_rate": 8.964558512561338e-06, "loss": 1.4986, "step": 33910 }, { "epoch": 2.67, "learning_rate": 8.960350226789548e-06, "loss": 1.44, "step": 33911 }, { "epoch": 2.67, "learning_rate": 8.956142898599156e-06, "loss": 1.4265, "step": 33912 }, { "epoch": 2.67, "learning_rate": 8.951936528018721e-06, "loss": 1.4357, "step": 33913 }, { "epoch": 2.67, "learning_rate": 8.947731115076789e-06, "loss": 1.4194, "step": 33914 }, { "epoch": 2.67, "learning_rate": 8.943526659801936e-06, "loss": 1.4622, "step": 33915 }, { "epoch": 2.67, "learning_rate": 8.939323162222705e-06, "loss": 1.4341, "step": 33916 }, { "epoch": 2.67, "learning_rate": 8.935120622367626e-06, "loss": 1.4788, "step": 33917 }, { "epoch": 2.67, "learning_rate": 8.930919040265205e-06, "loss": 1.4557, "step": 33918 }, { "epoch": 2.67, "learning_rate": 8.926718415944022e-06, "loss": 1.4196, "step": 33919 }, { "epoch": 2.67, "learning_rate": 8.922518749432555e-06, "loss": 1.3886, "step": 33920 }, { "epoch": 2.67, "learning_rate": 8.91832004075933e-06, "loss": 1.4397, "step": 33921 }, { "epoch": 2.67, "learning_rate": 8.914122289952858e-06, "loss": 1.4943, "step": 33922 }, { "epoch": 2.67, "learning_rate": 8.909925497041631e-06, "loss": 1.4415, "step": 33923 }, { "epoch": 2.67, "learning_rate": 8.905729662054178e-06, "loss": 1.4001, "step": 33924 }, { "epoch": 2.67, "learning_rate": 8.901534785018927e-06, "loss": 1.4875, "step": 33925 }, { "epoch": 2.67, "learning_rate": 8.897340865964403e-06, "loss": 1.4702, "step": 33926 }, { "epoch": 2.67, "learning_rate": 8.893147904919084e-06, "loss": 1.4189, "step": 33927 }, { "epoch": 2.67, "learning_rate": 8.888955901911398e-06, "loss": 1.4648, "step": 33928 }, { "epoch": 2.67, "learning_rate": 8.88476485696984e-06, "loss": 1.4454, "step": 33929 }, { "epoch": 2.67, "learning_rate": 8.880574770122867e-06, "loss": 1.4124, "step": 33930 }, { "epoch": 2.67, "learning_rate": 8.876385641398875e-06, "loss": 1.4193, "step": 33931 }, { "epoch": 2.67, "learning_rate": 8.872197470826392e-06, "loss": 1.4452, "step": 33932 }, { "epoch": 2.67, "learning_rate": 8.868010258433794e-06, "loss": 1.4836, "step": 33933 }, { "epoch": 2.67, "learning_rate": 8.863824004249526e-06, "loss": 1.3934, "step": 33934 }, { "epoch": 2.67, "learning_rate": 8.859638708301981e-06, "loss": 1.3771, "step": 33935 }, { "epoch": 2.67, "learning_rate": 8.855454370619636e-06, "loss": 1.412, "step": 33936 }, { "epoch": 2.67, "learning_rate": 8.851270991230853e-06, "loss": 1.4869, "step": 33937 }, { "epoch": 2.67, "learning_rate": 8.847088570164024e-06, "loss": 1.4451, "step": 33938 }, { "epoch": 2.67, "learning_rate": 8.842907107447578e-06, "loss": 1.4405, "step": 33939 }, { "epoch": 2.67, "learning_rate": 8.838726603109908e-06, "loss": 1.4063, "step": 33940 }, { "epoch": 2.67, "learning_rate": 8.834547057179391e-06, "loss": 1.4162, "step": 33941 }, { "epoch": 2.67, "learning_rate": 8.83036846968439e-06, "loss": 1.3726, "step": 33942 }, { "epoch": 2.67, "learning_rate": 8.82619084065328e-06, "loss": 1.4444, "step": 33943 }, { "epoch": 2.67, "learning_rate": 8.82201417011444e-06, "loss": 1.477, "step": 33944 }, { "epoch": 2.67, "learning_rate": 8.817838458096193e-06, "loss": 1.3904, "step": 33945 }, { "epoch": 2.67, "learning_rate": 8.81366370462694e-06, "loss": 1.4208, "step": 33946 }, { "epoch": 2.67, "learning_rate": 8.809489909734984e-06, "loss": 1.4408, "step": 33947 }, { "epoch": 2.67, "learning_rate": 8.805317073448675e-06, "loss": 1.4483, "step": 33948 }, { "epoch": 2.67, "learning_rate": 8.801145195796356e-06, "loss": 1.4153, "step": 33949 }, { "epoch": 2.67, "learning_rate": 8.796974276806335e-06, "loss": 1.4301, "step": 33950 }, { "epoch": 2.67, "learning_rate": 8.79280431650694e-06, "loss": 1.4691, "step": 33951 }, { "epoch": 2.67, "learning_rate": 8.788635314926452e-06, "loss": 1.459, "step": 33952 }, { "epoch": 2.67, "learning_rate": 8.784467272093242e-06, "loss": 1.4416, "step": 33953 }, { "epoch": 2.67, "learning_rate": 8.78030018803556e-06, "loss": 1.4456, "step": 33954 }, { "epoch": 2.67, "learning_rate": 8.776134062781664e-06, "loss": 1.4754, "step": 33955 }, { "epoch": 2.67, "learning_rate": 8.771968896359915e-06, "loss": 1.443, "step": 33956 }, { "epoch": 2.67, "learning_rate": 8.767804688798574e-06, "loss": 1.5188, "step": 33957 }, { "epoch": 2.67, "learning_rate": 8.763641440125901e-06, "loss": 1.4193, "step": 33958 }, { "epoch": 2.67, "learning_rate": 8.759479150370141e-06, "loss": 1.4194, "step": 33959 }, { "epoch": 2.67, "learning_rate": 8.755317819559604e-06, "loss": 1.4766, "step": 33960 }, { "epoch": 2.67, "learning_rate": 8.751157447722501e-06, "loss": 1.454, "step": 33961 }, { "epoch": 2.67, "learning_rate": 8.746998034887075e-06, "loss": 1.4215, "step": 33962 }, { "epoch": 2.67, "learning_rate": 8.742839581081607e-06, "loss": 1.4162, "step": 33963 }, { "epoch": 2.67, "learning_rate": 8.738682086334303e-06, "loss": 1.4404, "step": 33964 }, { "epoch": 2.67, "learning_rate": 8.73452555067336e-06, "loss": 1.3757, "step": 33965 }, { "epoch": 2.67, "learning_rate": 8.730369974127072e-06, "loss": 1.4283, "step": 33966 }, { "epoch": 2.67, "learning_rate": 8.726215356723598e-06, "loss": 1.4638, "step": 33967 }, { "epoch": 2.67, "learning_rate": 8.72206169849115e-06, "loss": 1.4416, "step": 33968 }, { "epoch": 2.67, "learning_rate": 8.717908999457956e-06, "loss": 1.4336, "step": 33969 }, { "epoch": 2.67, "learning_rate": 8.713757259652194e-06, "loss": 1.4616, "step": 33970 }, { "epoch": 2.67, "learning_rate": 8.709606479102022e-06, "loss": 1.496, "step": 33971 }, { "epoch": 2.67, "learning_rate": 8.705456657835668e-06, "loss": 1.4507, "step": 33972 }, { "epoch": 2.67, "learning_rate": 8.701307795881297e-06, "loss": 1.4758, "step": 33973 }, { "epoch": 2.67, "learning_rate": 8.69715989326708e-06, "loss": 1.3982, "step": 33974 }, { "epoch": 2.67, "learning_rate": 8.693012950021167e-06, "loss": 1.4038, "step": 33975 }, { "epoch": 2.67, "learning_rate": 8.688866966171698e-06, "loss": 1.4439, "step": 33976 }, { "epoch": 2.67, "learning_rate": 8.68472194174687e-06, "loss": 1.4521, "step": 33977 }, { "epoch": 2.67, "learning_rate": 8.680577876774774e-06, "loss": 1.4018, "step": 33978 }, { "epoch": 2.67, "learning_rate": 8.676434771283558e-06, "loss": 1.4616, "step": 33979 }, { "epoch": 2.67, "learning_rate": 8.672292625301397e-06, "loss": 1.4713, "step": 33980 }, { "epoch": 2.67, "learning_rate": 8.668151438856353e-06, "loss": 1.4664, "step": 33981 }, { "epoch": 2.67, "learning_rate": 8.664011211976569e-06, "loss": 1.47, "step": 33982 }, { "epoch": 2.67, "learning_rate": 8.659871944690156e-06, "loss": 1.416, "step": 33983 }, { "epoch": 2.67, "learning_rate": 8.655733637025225e-06, "loss": 1.3994, "step": 33984 }, { "epoch": 2.67, "learning_rate": 8.651596289009838e-06, "loss": 1.3901, "step": 33985 }, { "epoch": 2.67, "learning_rate": 8.647459900672104e-06, "loss": 1.458, "step": 33986 }, { "epoch": 2.67, "learning_rate": 8.643324472040136e-06, "loss": 1.3999, "step": 33987 }, { "epoch": 2.67, "learning_rate": 8.639190003141994e-06, "loss": 1.4568, "step": 33988 }, { "epoch": 2.67, "learning_rate": 8.635056494005721e-06, "loss": 1.4179, "step": 33989 }, { "epoch": 2.67, "learning_rate": 8.630923944659412e-06, "loss": 1.4687, "step": 33990 }, { "epoch": 2.67, "learning_rate": 8.62679235513113e-06, "loss": 1.4466, "step": 33991 }, { "epoch": 2.67, "learning_rate": 8.622661725448899e-06, "loss": 1.4662, "step": 33992 }, { "epoch": 2.67, "learning_rate": 8.618532055640764e-06, "loss": 1.4327, "step": 33993 }, { "epoch": 2.67, "learning_rate": 8.614403345734788e-06, "loss": 1.4501, "step": 33994 }, { "epoch": 2.67, "learning_rate": 8.610275595758998e-06, "loss": 1.4784, "step": 33995 }, { "epoch": 2.67, "learning_rate": 8.606148805741402e-06, "loss": 1.4193, "step": 33996 }, { "epoch": 2.67, "learning_rate": 8.602022975710032e-06, "loss": 1.4649, "step": 33997 }, { "epoch": 2.68, "learning_rate": 8.597898105692897e-06, "loss": 1.3843, "step": 33998 }, { "epoch": 2.68, "learning_rate": 8.59377419571799e-06, "loss": 1.4417, "step": 33999 }, { "epoch": 2.68, "learning_rate": 8.58965124581334e-06, "loss": 1.4643, "step": 34000 }, { "epoch": 2.68, "learning_rate": 8.585529256006906e-06, "loss": 1.4465, "step": 34001 }, { "epoch": 2.68, "learning_rate": 8.581408226326686e-06, "loss": 1.4143, "step": 34002 }, { "epoch": 2.68, "learning_rate": 8.577288156800654e-06, "loss": 1.3868, "step": 34003 }, { "epoch": 2.68, "learning_rate": 8.573169047456823e-06, "loss": 1.4176, "step": 34004 }, { "epoch": 2.68, "learning_rate": 8.56905089832312e-06, "loss": 1.4961, "step": 34005 }, { "epoch": 2.68, "learning_rate": 8.56493370942749e-06, "loss": 1.4255, "step": 34006 }, { "epoch": 2.68, "learning_rate": 8.560817480797943e-06, "loss": 1.4462, "step": 34007 }, { "epoch": 2.68, "learning_rate": 8.556702212462375e-06, "loss": 1.4235, "step": 34008 }, { "epoch": 2.68, "learning_rate": 8.552587904448743e-06, "loss": 1.4221, "step": 34009 }, { "epoch": 2.68, "learning_rate": 8.548474556784995e-06, "loss": 1.407, "step": 34010 }, { "epoch": 2.68, "learning_rate": 8.544362169499042e-06, "loss": 1.4715, "step": 34011 }, { "epoch": 2.68, "learning_rate": 8.54025074261881e-06, "loss": 1.5173, "step": 34012 }, { "epoch": 2.68, "learning_rate": 8.536140276172176e-06, "loss": 1.3925, "step": 34013 }, { "epoch": 2.68, "learning_rate": 8.53203077018712e-06, "loss": 1.4299, "step": 34014 }, { "epoch": 2.68, "learning_rate": 8.527922224691519e-06, "loss": 1.4489, "step": 34015 }, { "epoch": 2.68, "learning_rate": 8.523814639713217e-06, "loss": 1.4843, "step": 34016 }, { "epoch": 2.68, "learning_rate": 8.519708015280159e-06, "loss": 1.4668, "step": 34017 }, { "epoch": 2.68, "learning_rate": 8.515602351420186e-06, "loss": 1.47, "step": 34018 }, { "epoch": 2.68, "learning_rate": 8.51149764816123e-06, "loss": 1.4599, "step": 34019 }, { "epoch": 2.68, "learning_rate": 8.507393905531101e-06, "loss": 1.452, "step": 34020 }, { "epoch": 2.68, "learning_rate": 8.50329112355771e-06, "loss": 1.4885, "step": 34021 }, { "epoch": 2.68, "learning_rate": 8.499189302268865e-06, "loss": 1.528, "step": 34022 }, { "epoch": 2.68, "learning_rate": 8.495088441692432e-06, "loss": 1.4708, "step": 34023 }, { "epoch": 2.68, "learning_rate": 8.490988541856286e-06, "loss": 1.4705, "step": 34024 }, { "epoch": 2.68, "learning_rate": 8.486889602788239e-06, "loss": 1.4567, "step": 34025 }, { "epoch": 2.68, "learning_rate": 8.482791624516082e-06, "loss": 1.4522, "step": 34026 }, { "epoch": 2.68, "learning_rate": 8.478694607067715e-06, "loss": 1.442, "step": 34027 }, { "epoch": 2.68, "learning_rate": 8.474598550470896e-06, "loss": 1.4949, "step": 34028 }, { "epoch": 2.68, "learning_rate": 8.47050345475347e-06, "loss": 1.4755, "step": 34029 }, { "epoch": 2.68, "learning_rate": 8.46640931994318e-06, "loss": 1.4165, "step": 34030 }, { "epoch": 2.68, "learning_rate": 8.462316146067905e-06, "loss": 1.46, "step": 34031 }, { "epoch": 2.68, "learning_rate": 8.458223933155389e-06, "loss": 1.4096, "step": 34032 }, { "epoch": 2.68, "learning_rate": 8.454132681233394e-06, "loss": 1.4248, "step": 34033 }, { "epoch": 2.68, "learning_rate": 8.450042390329747e-06, "loss": 1.4898, "step": 34034 }, { "epoch": 2.68, "learning_rate": 8.445953060472194e-06, "loss": 1.4305, "step": 34035 }, { "epoch": 2.68, "learning_rate": 8.441864691688527e-06, "loss": 1.4882, "step": 34036 }, { "epoch": 2.68, "learning_rate": 8.437777284006442e-06, "loss": 1.4272, "step": 34037 }, { "epoch": 2.68, "learning_rate": 8.433690837453766e-06, "loss": 1.4579, "step": 34038 }, { "epoch": 2.68, "learning_rate": 8.429605352058194e-06, "loss": 1.4212, "step": 34039 }, { "epoch": 2.68, "learning_rate": 8.42552082784747e-06, "loss": 1.4816, "step": 34040 }, { "epoch": 2.68, "learning_rate": 8.42143726484934e-06, "loss": 1.4427, "step": 34041 }, { "epoch": 2.68, "learning_rate": 8.417354663091531e-06, "loss": 1.4812, "step": 34042 }, { "epoch": 2.68, "learning_rate": 8.413273022601718e-06, "loss": 1.4712, "step": 34043 }, { "epoch": 2.68, "learning_rate": 8.409192343407667e-06, "loss": 1.4715, "step": 34044 }, { "epoch": 2.68, "learning_rate": 8.405112625537086e-06, "loss": 1.399, "step": 34045 }, { "epoch": 2.68, "learning_rate": 8.401033869017637e-06, "loss": 1.4944, "step": 34046 }, { "epoch": 2.68, "learning_rate": 8.396956073876998e-06, "loss": 1.4483, "step": 34047 }, { "epoch": 2.68, "learning_rate": 8.392879240142914e-06, "loss": 1.4219, "step": 34048 }, { "epoch": 2.68, "learning_rate": 8.38880336784301e-06, "loss": 1.4446, "step": 34049 }, { "epoch": 2.68, "learning_rate": 8.384728457005018e-06, "loss": 1.4339, "step": 34050 }, { "epoch": 2.68, "learning_rate": 8.38065450765653e-06, "loss": 1.3983, "step": 34051 }, { "epoch": 2.68, "learning_rate": 8.376581519825277e-06, "loss": 1.4326, "step": 34052 }, { "epoch": 2.68, "learning_rate": 8.372509493538881e-06, "loss": 1.4555, "step": 34053 }, { "epoch": 2.68, "learning_rate": 8.368438428824975e-06, "loss": 1.4382, "step": 34054 }, { "epoch": 2.68, "learning_rate": 8.364368325711219e-06, "loss": 1.3781, "step": 34055 }, { "epoch": 2.68, "learning_rate": 8.360299184225256e-06, "loss": 1.4488, "step": 34056 }, { "epoch": 2.68, "learning_rate": 8.356231004394664e-06, "loss": 1.4761, "step": 34057 }, { "epoch": 2.68, "learning_rate": 8.352163786247124e-06, "loss": 1.4228, "step": 34058 }, { "epoch": 2.68, "learning_rate": 8.348097529810227e-06, "loss": 1.4671, "step": 34059 }, { "epoch": 2.68, "learning_rate": 8.344032235111553e-06, "loss": 1.4559, "step": 34060 }, { "epoch": 2.68, "learning_rate": 8.339967902178763e-06, "loss": 1.391, "step": 34061 }, { "epoch": 2.68, "learning_rate": 8.3359045310394e-06, "loss": 1.3934, "step": 34062 }, { "epoch": 2.68, "learning_rate": 8.331842121721078e-06, "loss": 1.4494, "step": 34063 }, { "epoch": 2.68, "learning_rate": 8.327780674251339e-06, "loss": 1.4225, "step": 34064 }, { "epoch": 2.68, "learning_rate": 8.323720188657796e-06, "loss": 1.4551, "step": 34065 }, { "epoch": 2.68, "learning_rate": 8.319660664968025e-06, "loss": 1.3965, "step": 34066 }, { "epoch": 2.68, "learning_rate": 8.31560210320954e-06, "loss": 1.4747, "step": 34067 }, { "epoch": 2.68, "learning_rate": 8.311544503409967e-06, "loss": 1.4747, "step": 34068 }, { "epoch": 2.68, "learning_rate": 8.307487865596819e-06, "loss": 1.486, "step": 34069 }, { "epoch": 2.68, "learning_rate": 8.30343218979762e-06, "loss": 1.4131, "step": 34070 }, { "epoch": 2.68, "learning_rate": 8.29937747603992e-06, "loss": 1.4439, "step": 34071 }, { "epoch": 2.68, "learning_rate": 8.295323724351261e-06, "loss": 1.4243, "step": 34072 }, { "epoch": 2.68, "learning_rate": 8.291270934759153e-06, "loss": 1.4243, "step": 34073 }, { "epoch": 2.68, "learning_rate": 8.287219107291093e-06, "loss": 1.424, "step": 34074 }, { "epoch": 2.68, "learning_rate": 8.283168241974641e-06, "loss": 1.4826, "step": 34075 }, { "epoch": 2.68, "learning_rate": 8.27911833883726e-06, "loss": 1.4302, "step": 34076 }, { "epoch": 2.68, "learning_rate": 8.275069397906443e-06, "loss": 1.4314, "step": 34077 }, { "epoch": 2.68, "learning_rate": 8.271021419209716e-06, "loss": 1.4142, "step": 34078 }, { "epoch": 2.68, "learning_rate": 8.266974402774529e-06, "loss": 1.4427, "step": 34079 }, { "epoch": 2.68, "learning_rate": 8.262928348628373e-06, "loss": 1.4363, "step": 34080 }, { "epoch": 2.68, "learning_rate": 8.258883256798694e-06, "loss": 1.4826, "step": 34081 }, { "epoch": 2.68, "learning_rate": 8.254839127313017e-06, "loss": 1.4482, "step": 34082 }, { "epoch": 2.68, "learning_rate": 8.250795960198741e-06, "loss": 1.4958, "step": 34083 }, { "epoch": 2.68, "learning_rate": 8.246753755483326e-06, "loss": 1.4318, "step": 34084 }, { "epoch": 2.68, "learning_rate": 8.24271251319425e-06, "loss": 1.4146, "step": 34085 }, { "epoch": 2.68, "learning_rate": 8.238672233358939e-06, "loss": 1.4565, "step": 34086 }, { "epoch": 2.68, "learning_rate": 8.23463291600479e-06, "loss": 1.4341, "step": 34087 }, { "epoch": 2.68, "learning_rate": 8.230594561159249e-06, "loss": 1.4797, "step": 34088 }, { "epoch": 2.68, "learning_rate": 8.22655716884974e-06, "loss": 1.3939, "step": 34089 }, { "epoch": 2.68, "learning_rate": 8.222520739103693e-06, "loss": 1.4348, "step": 34090 }, { "epoch": 2.68, "learning_rate": 8.218485271948456e-06, "loss": 1.484, "step": 34091 }, { "epoch": 2.68, "learning_rate": 8.214450767411485e-06, "loss": 1.4366, "step": 34092 }, { "epoch": 2.68, "learning_rate": 8.210417225520144e-06, "loss": 1.4444, "step": 34093 }, { "epoch": 2.68, "learning_rate": 8.206384646301812e-06, "loss": 1.4534, "step": 34094 }, { "epoch": 2.68, "learning_rate": 8.202353029783899e-06, "loss": 1.4918, "step": 34095 }, { "epoch": 2.68, "learning_rate": 8.198322375993732e-06, "loss": 1.4767, "step": 34096 }, { "epoch": 2.68, "learning_rate": 8.194292684958726e-06, "loss": 1.4047, "step": 34097 }, { "epoch": 2.68, "learning_rate": 8.190263956706206e-06, "loss": 1.4581, "step": 34098 }, { "epoch": 2.68, "learning_rate": 8.186236191263551e-06, "loss": 1.4138, "step": 34099 }, { "epoch": 2.68, "learning_rate": 8.18220938865809e-06, "loss": 1.4026, "step": 34100 }, { "epoch": 2.68, "learning_rate": 8.17818354891715e-06, "loss": 1.4662, "step": 34101 }, { "epoch": 2.68, "learning_rate": 8.174158672068093e-06, "loss": 1.4885, "step": 34102 }, { "epoch": 2.68, "learning_rate": 8.17013475813823e-06, "loss": 1.4675, "step": 34103 }, { "epoch": 2.68, "learning_rate": 8.166111807154907e-06, "loss": 1.3854, "step": 34104 }, { "epoch": 2.68, "learning_rate": 8.162089819145368e-06, "loss": 1.4449, "step": 34105 }, { "epoch": 2.68, "learning_rate": 8.158068794137007e-06, "loss": 1.4797, "step": 34106 }, { "epoch": 2.68, "learning_rate": 8.15404873215707e-06, "loss": 1.4773, "step": 34107 }, { "epoch": 2.68, "learning_rate": 8.150029633232852e-06, "loss": 1.4847, "step": 34108 }, { "epoch": 2.68, "learning_rate": 8.146011497391663e-06, "loss": 1.4145, "step": 34109 }, { "epoch": 2.68, "learning_rate": 8.141994324660783e-06, "loss": 1.3793, "step": 34110 }, { "epoch": 2.68, "learning_rate": 8.137978115067456e-06, "loss": 1.4853, "step": 34111 }, { "epoch": 2.68, "learning_rate": 8.133962868638977e-06, "loss": 1.4135, "step": 34112 }, { "epoch": 2.68, "learning_rate": 8.129948585402623e-06, "loss": 1.4135, "step": 34113 }, { "epoch": 2.68, "learning_rate": 8.125935265385624e-06, "loss": 1.4674, "step": 34114 }, { "epoch": 2.68, "learning_rate": 8.121922908615208e-06, "loss": 1.4809, "step": 34115 }, { "epoch": 2.68, "learning_rate": 8.117911515118653e-06, "loss": 1.4769, "step": 34116 }, { "epoch": 2.68, "learning_rate": 8.113901084923203e-06, "loss": 1.4128, "step": 34117 }, { "epoch": 2.68, "learning_rate": 8.109891618056035e-06, "loss": 1.4467, "step": 34118 }, { "epoch": 2.68, "learning_rate": 8.105883114544414e-06, "loss": 1.4636, "step": 34119 }, { "epoch": 2.68, "learning_rate": 8.10187557441555e-06, "loss": 1.4629, "step": 34120 }, { "epoch": 2.68, "learning_rate": 8.097868997696622e-06, "loss": 1.4617, "step": 34121 }, { "epoch": 2.68, "learning_rate": 8.09386338441489e-06, "loss": 1.4305, "step": 34122 }, { "epoch": 2.68, "learning_rate": 8.089858734597498e-06, "loss": 1.4643, "step": 34123 }, { "epoch": 2.68, "learning_rate": 8.08585504827166e-06, "loss": 1.4319, "step": 34124 }, { "epoch": 2.68, "learning_rate": 8.081852325464522e-06, "loss": 1.4056, "step": 34125 }, { "epoch": 2.69, "learning_rate": 8.077850566203325e-06, "loss": 1.4447, "step": 34126 }, { "epoch": 2.69, "learning_rate": 8.0738497705152e-06, "loss": 1.4268, "step": 34127 }, { "epoch": 2.69, "learning_rate": 8.069849938427275e-06, "loss": 1.4066, "step": 34128 }, { "epoch": 2.69, "learning_rate": 8.06585106996676e-06, "loss": 1.3602, "step": 34129 }, { "epoch": 2.69, "learning_rate": 8.06185316516082e-06, "loss": 1.435, "step": 34130 }, { "epoch": 2.69, "learning_rate": 8.057856224036563e-06, "loss": 1.4544, "step": 34131 }, { "epoch": 2.69, "learning_rate": 8.053860246621101e-06, "loss": 1.4421, "step": 34132 }, { "epoch": 2.69, "learning_rate": 8.049865232941633e-06, "loss": 1.455, "step": 34133 }, { "epoch": 2.69, "learning_rate": 8.045871183025232e-06, "loss": 1.4632, "step": 34134 }, { "epoch": 2.69, "learning_rate": 8.041878096899012e-06, "loss": 1.4533, "step": 34135 }, { "epoch": 2.69, "learning_rate": 8.03788597459012e-06, "loss": 1.3713, "step": 34136 }, { "epoch": 2.69, "learning_rate": 8.033894816125646e-06, "loss": 1.4694, "step": 34137 }, { "epoch": 2.69, "learning_rate": 8.029904621532656e-06, "loss": 1.4352, "step": 34138 }, { "epoch": 2.69, "learning_rate": 8.025915390838295e-06, "loss": 1.479, "step": 34139 }, { "epoch": 2.69, "learning_rate": 8.021927124069621e-06, "loss": 1.4129, "step": 34140 }, { "epoch": 2.69, "learning_rate": 8.0179398212537e-06, "loss": 1.4279, "step": 34141 }, { "epoch": 2.69, "learning_rate": 8.013953482417606e-06, "loss": 1.4306, "step": 34142 }, { "epoch": 2.69, "learning_rate": 8.009968107588404e-06, "loss": 1.4482, "step": 34143 }, { "epoch": 2.69, "learning_rate": 8.005983696793188e-06, "loss": 1.5042, "step": 34144 }, { "epoch": 2.69, "learning_rate": 8.002000250058987e-06, "loss": 1.4825, "step": 34145 }, { "epoch": 2.69, "learning_rate": 7.99801776741283e-06, "loss": 1.4806, "step": 34146 }, { "epoch": 2.69, "learning_rate": 7.994036248881775e-06, "loss": 1.4511, "step": 34147 }, { "epoch": 2.69, "learning_rate": 7.990055694492852e-06, "loss": 1.4365, "step": 34148 }, { "epoch": 2.69, "learning_rate": 7.986076104273075e-06, "loss": 1.4353, "step": 34149 }, { "epoch": 2.69, "learning_rate": 7.982097478249472e-06, "loss": 1.4534, "step": 34150 }, { "epoch": 2.69, "learning_rate": 7.978119816449069e-06, "loss": 1.451, "step": 34151 }, { "epoch": 2.69, "learning_rate": 7.97414311889883e-06, "loss": 1.491, "step": 34152 }, { "epoch": 2.69, "learning_rate": 7.970167385625813e-06, "loss": 1.4862, "step": 34153 }, { "epoch": 2.69, "learning_rate": 7.966192616656968e-06, "loss": 1.4649, "step": 34154 }, { "epoch": 2.69, "learning_rate": 7.96221881201929e-06, "loss": 1.442, "step": 34155 }, { "epoch": 2.69, "learning_rate": 7.95824597173977e-06, "loss": 1.4696, "step": 34156 }, { "epoch": 2.69, "learning_rate": 7.954274095845386e-06, "loss": 1.4465, "step": 34157 }, { "epoch": 2.69, "learning_rate": 7.950303184363088e-06, "loss": 1.4526, "step": 34158 }, { "epoch": 2.69, "learning_rate": 7.946333237319801e-06, "loss": 1.4481, "step": 34159 }, { "epoch": 2.69, "learning_rate": 7.942364254742555e-06, "loss": 1.4288, "step": 34160 }, { "epoch": 2.69, "learning_rate": 7.938396236658262e-06, "loss": 1.4903, "step": 34161 }, { "epoch": 2.69, "learning_rate": 7.934429183093865e-06, "loss": 1.4646, "step": 34162 }, { "epoch": 2.69, "learning_rate": 7.930463094076279e-06, "loss": 1.4852, "step": 34163 }, { "epoch": 2.69, "learning_rate": 7.926497969632479e-06, "loss": 1.4487, "step": 34164 }, { "epoch": 2.69, "learning_rate": 7.922533809789328e-06, "loss": 1.4699, "step": 34165 }, { "epoch": 2.69, "learning_rate": 7.918570614573771e-06, "loss": 1.3873, "step": 34166 }, { "epoch": 2.69, "learning_rate": 7.914608384012721e-06, "loss": 1.4349, "step": 34167 }, { "epoch": 2.69, "learning_rate": 7.910647118133073e-06, "loss": 1.4452, "step": 34168 }, { "epoch": 2.69, "learning_rate": 7.906686816961706e-06, "loss": 1.4433, "step": 34169 }, { "epoch": 2.69, "learning_rate": 7.902727480525528e-06, "loss": 1.4549, "step": 34170 }, { "epoch": 2.69, "learning_rate": 7.898769108851421e-06, "loss": 1.4224, "step": 34171 }, { "epoch": 2.69, "learning_rate": 7.894811701966247e-06, "loss": 1.447, "step": 34172 }, { "epoch": 2.69, "learning_rate": 7.890855259896884e-06, "loss": 1.4588, "step": 34173 }, { "epoch": 2.69, "learning_rate": 7.886899782670208e-06, "loss": 1.4352, "step": 34174 }, { "epoch": 2.69, "learning_rate": 7.882945270313018e-06, "loss": 1.4507, "step": 34175 }, { "epoch": 2.69, "learning_rate": 7.878991722852207e-06, "loss": 1.4712, "step": 34176 }, { "epoch": 2.69, "learning_rate": 7.875039140314638e-06, "loss": 1.4248, "step": 34177 }, { "epoch": 2.69, "learning_rate": 7.871087522727138e-06, "loss": 1.4181, "step": 34178 }, { "epoch": 2.69, "learning_rate": 7.86713687011647e-06, "loss": 1.4847, "step": 34179 }, { "epoch": 2.69, "learning_rate": 7.863187182509544e-06, "loss": 1.4288, "step": 34180 }, { "epoch": 2.69, "learning_rate": 7.859238459933142e-06, "loss": 1.452, "step": 34181 }, { "epoch": 2.69, "learning_rate": 7.855290702414074e-06, "loss": 1.4422, "step": 34182 }, { "epoch": 2.69, "learning_rate": 7.851343909979118e-06, "loss": 1.4452, "step": 34183 }, { "epoch": 2.69, "learning_rate": 7.847398082655105e-06, "loss": 1.446, "step": 34184 }, { "epoch": 2.69, "learning_rate": 7.843453220468809e-06, "loss": 1.5013, "step": 34185 }, { "epoch": 2.69, "learning_rate": 7.839509323447013e-06, "loss": 1.4731, "step": 34186 }, { "epoch": 2.69, "learning_rate": 7.83556639161651e-06, "loss": 1.4183, "step": 34187 }, { "epoch": 2.69, "learning_rate": 7.831624425004047e-06, "loss": 1.494, "step": 34188 }, { "epoch": 2.69, "learning_rate": 7.8276834236364e-06, "loss": 1.4819, "step": 34189 }, { "epoch": 2.69, "learning_rate": 7.823743387540332e-06, "loss": 1.4632, "step": 34190 }, { "epoch": 2.69, "learning_rate": 7.819804316742574e-06, "loss": 1.4457, "step": 34191 }, { "epoch": 2.69, "learning_rate": 7.8158662112699e-06, "loss": 1.4844, "step": 34192 }, { "epoch": 2.69, "learning_rate": 7.811929071149009e-06, "loss": 1.4602, "step": 34193 }, { "epoch": 2.69, "learning_rate": 7.807992896406662e-06, "loss": 1.4196, "step": 34194 }, { "epoch": 2.69, "learning_rate": 7.804057687069604e-06, "loss": 1.4562, "step": 34195 }, { "epoch": 2.69, "learning_rate": 7.80012344316448e-06, "loss": 1.4388, "step": 34196 }, { "epoch": 2.69, "learning_rate": 7.79619016471807e-06, "loss": 1.4679, "step": 34197 }, { "epoch": 2.69, "learning_rate": 7.792257851757066e-06, "loss": 1.4233, "step": 34198 }, { "epoch": 2.69, "learning_rate": 7.788326504308134e-06, "loss": 1.4322, "step": 34199 }, { "epoch": 2.69, "learning_rate": 7.784396122397984e-06, "loss": 1.4592, "step": 34200 }, { "epoch": 2.69, "learning_rate": 7.780466706053312e-06, "loss": 1.4335, "step": 34201 }, { "epoch": 2.69, "learning_rate": 7.776538255300795e-06, "loss": 1.4456, "step": 34202 }, { "epoch": 2.69, "learning_rate": 7.772610770167082e-06, "loss": 1.4232, "step": 34203 }, { "epoch": 2.69, "learning_rate": 7.768684250678864e-06, "loss": 1.4889, "step": 34204 }, { "epoch": 2.69, "learning_rate": 7.764758696862805e-06, "loss": 1.4405, "step": 34205 }, { "epoch": 2.69, "learning_rate": 7.7608341087455e-06, "loss": 1.4552, "step": 34206 }, { "epoch": 2.69, "learning_rate": 7.756910486353663e-06, "loss": 1.4076, "step": 34207 }, { "epoch": 2.69, "learning_rate": 7.752987829713903e-06, "loss": 1.4256, "step": 34208 }, { "epoch": 2.69, "learning_rate": 7.749066138852883e-06, "loss": 1.4658, "step": 34209 }, { "epoch": 2.69, "learning_rate": 7.745145413797166e-06, "loss": 1.4429, "step": 34210 }, { "epoch": 2.69, "learning_rate": 7.74122565457343e-06, "loss": 1.4974, "step": 34211 }, { "epoch": 2.69, "learning_rate": 7.73730686120827e-06, "loss": 1.3935, "step": 34212 }, { "epoch": 2.69, "learning_rate": 7.733389033728265e-06, "loss": 1.4721, "step": 34213 }, { "epoch": 2.69, "learning_rate": 7.729472172160061e-06, "loss": 1.5133, "step": 34214 }, { "epoch": 2.69, "learning_rate": 7.725556276530237e-06, "loss": 1.467, "step": 34215 }, { "epoch": 2.69, "learning_rate": 7.721641346865353e-06, "loss": 1.4576, "step": 34216 }, { "epoch": 2.69, "learning_rate": 7.717727383192008e-06, "loss": 1.4077, "step": 34217 }, { "epoch": 2.69, "learning_rate": 7.713814385536792e-06, "loss": 1.4164, "step": 34218 }, { "epoch": 2.69, "learning_rate": 7.709902353926257e-06, "loss": 1.4104, "step": 34219 }, { "epoch": 2.69, "learning_rate": 7.705991288386942e-06, "loss": 1.4841, "step": 34220 }, { "epoch": 2.69, "learning_rate": 7.70208118894543e-06, "loss": 1.4827, "step": 34221 }, { "epoch": 2.69, "learning_rate": 7.698172055628249e-06, "loss": 1.5171, "step": 34222 }, { "epoch": 2.69, "learning_rate": 7.694263888461976e-06, "loss": 1.4176, "step": 34223 }, { "epoch": 2.69, "learning_rate": 7.690356687473092e-06, "loss": 1.4279, "step": 34224 }, { "epoch": 2.69, "learning_rate": 7.686450452688192e-06, "loss": 1.4202, "step": 34225 }, { "epoch": 2.69, "learning_rate": 7.682545184133737e-06, "loss": 1.3891, "step": 34226 }, { "epoch": 2.69, "learning_rate": 7.678640881836256e-06, "loss": 1.4172, "step": 34227 }, { "epoch": 2.69, "learning_rate": 7.674737545822279e-06, "loss": 1.4763, "step": 34228 }, { "epoch": 2.69, "learning_rate": 7.670835176118284e-06, "loss": 1.521, "step": 34229 }, { "epoch": 2.69, "learning_rate": 7.666933772750766e-06, "loss": 1.4635, "step": 34230 }, { "epoch": 2.69, "learning_rate": 7.663033335746238e-06, "loss": 1.4923, "step": 34231 }, { "epoch": 2.69, "learning_rate": 7.659133865131163e-06, "loss": 1.4208, "step": 34232 }, { "epoch": 2.69, "learning_rate": 7.655235360932e-06, "loss": 1.4379, "step": 34233 }, { "epoch": 2.69, "learning_rate": 7.651337823175263e-06, "loss": 1.4792, "step": 34234 }, { "epoch": 2.69, "learning_rate": 7.647441251887381e-06, "loss": 1.3961, "step": 34235 }, { "epoch": 2.69, "learning_rate": 7.643545647094817e-06, "loss": 1.4944, "step": 34236 }, { "epoch": 2.69, "learning_rate": 7.639651008824e-06, "loss": 1.4588, "step": 34237 }, { "epoch": 2.69, "learning_rate": 7.63575733710139e-06, "loss": 1.4158, "step": 34238 }, { "epoch": 2.69, "learning_rate": 7.631864631953449e-06, "loss": 1.4166, "step": 34239 }, { "epoch": 2.69, "learning_rate": 7.627972893406575e-06, "loss": 1.4654, "step": 34240 }, { "epoch": 2.69, "learning_rate": 7.624082121487196e-06, "loss": 1.3941, "step": 34241 }, { "epoch": 2.69, "learning_rate": 7.6201923162217236e-06, "loss": 1.4068, "step": 34242 }, { "epoch": 2.69, "learning_rate": 7.616303477636587e-06, "loss": 1.4086, "step": 34243 }, { "epoch": 2.69, "learning_rate": 7.6124156057581656e-06, "loss": 1.4634, "step": 34244 }, { "epoch": 2.69, "learning_rate": 7.60852870061287e-06, "loss": 1.5052, "step": 34245 }, { "epoch": 2.69, "learning_rate": 7.604642762227098e-06, "loss": 1.417, "step": 34246 }, { "epoch": 2.69, "learning_rate": 7.600757790627193e-06, "loss": 1.4182, "step": 34247 }, { "epoch": 2.69, "learning_rate": 7.596873785839586e-06, "loss": 1.4479, "step": 34248 }, { "epoch": 2.69, "learning_rate": 7.592990747890621e-06, "loss": 1.5166, "step": 34249 }, { "epoch": 2.69, "learning_rate": 7.5891086768066265e-06, "loss": 1.4651, "step": 34250 }, { "epoch": 2.69, "learning_rate": 7.585227572614033e-06, "loss": 1.3815, "step": 34251 }, { "epoch": 2.69, "learning_rate": 7.581347435339152e-06, "loss": 1.4222, "step": 34252 }, { "epoch": 2.7, "learning_rate": 7.57746826500833e-06, "loss": 1.5019, "step": 34253 }, { "epoch": 2.7, "learning_rate": 7.573590061647844e-06, "loss": 1.4448, "step": 34254 }, { "epoch": 2.7, "learning_rate": 7.569712825284141e-06, "loss": 1.4308, "step": 34255 }, { "epoch": 2.7, "learning_rate": 7.565836555943483e-06, "loss": 1.3866, "step": 34256 }, { "epoch": 2.7, "learning_rate": 7.561961253652199e-06, "loss": 1.4655, "step": 34257 }, { "epoch": 2.7, "learning_rate": 7.5580869184365674e-06, "loss": 1.4377, "step": 34258 }, { "epoch": 2.7, "learning_rate": 7.5542135503229515e-06, "loss": 1.4504, "step": 34259 }, { "epoch": 2.7, "learning_rate": 7.550341149337613e-06, "loss": 1.5038, "step": 34260 }, { "epoch": 2.7, "learning_rate": 7.5464697155068146e-06, "loss": 1.4515, "step": 34261 }, { "epoch": 2.7, "learning_rate": 7.542599248856917e-06, "loss": 1.4173, "step": 34262 }, { "epoch": 2.7, "learning_rate": 7.538729749414135e-06, "loss": 1.4746, "step": 34263 }, { "epoch": 2.7, "learning_rate": 7.534861217204746e-06, "loss": 1.4482, "step": 34264 }, { "epoch": 2.7, "learning_rate": 7.530993652255063e-06, "loss": 1.4818, "step": 34265 }, { "epoch": 2.7, "learning_rate": 7.527127054591298e-06, "loss": 1.4638, "step": 34266 }, { "epoch": 2.7, "learning_rate": 7.523261424239712e-06, "loss": 1.4167, "step": 34267 }, { "epoch": 2.7, "learning_rate": 7.519396761226554e-06, "loss": 1.461, "step": 34268 }, { "epoch": 2.7, "learning_rate": 7.515533065578066e-06, "loss": 1.4564, "step": 34269 }, { "epoch": 2.7, "learning_rate": 7.51167033732048e-06, "loss": 1.4128, "step": 34270 }, { "epoch": 2.7, "learning_rate": 7.507808576480023e-06, "loss": 1.4694, "step": 34271 }, { "epoch": 2.7, "learning_rate": 7.503947783082909e-06, "loss": 1.4849, "step": 34272 }, { "epoch": 2.7, "learning_rate": 7.500087957155365e-06, "loss": 1.4034, "step": 34273 }, { "epoch": 2.7, "learning_rate": 7.496229098723589e-06, "loss": 1.4389, "step": 34274 }, { "epoch": 2.7, "learning_rate": 7.492371207813758e-06, "loss": 1.4347, "step": 34275 }, { "epoch": 2.7, "learning_rate": 7.488514284452101e-06, "loss": 1.4382, "step": 34276 }, { "epoch": 2.7, "learning_rate": 7.484658328664783e-06, "loss": 1.4984, "step": 34277 }, { "epoch": 2.7, "learning_rate": 7.480803340477981e-06, "loss": 1.4236, "step": 34278 }, { "epoch": 2.7, "learning_rate": 7.476949319917874e-06, "loss": 1.4603, "step": 34279 }, { "epoch": 2.7, "learning_rate": 7.473096267010659e-06, "loss": 1.48, "step": 34280 }, { "epoch": 2.7, "learning_rate": 7.46924418178243e-06, "loss": 1.3811, "step": 34281 }, { "epoch": 2.7, "learning_rate": 7.4653930642594e-06, "loss": 1.4549, "step": 34282 }, { "epoch": 2.7, "learning_rate": 7.461542914467683e-06, "loss": 1.5273, "step": 34283 }, { "epoch": 2.7, "learning_rate": 7.457693732433423e-06, "loss": 1.4807, "step": 34284 }, { "epoch": 2.7, "learning_rate": 7.453845518182766e-06, "loss": 1.4382, "step": 34285 }, { "epoch": 2.7, "learning_rate": 7.449998271741842e-06, "loss": 1.4729, "step": 34286 }, { "epoch": 2.7, "learning_rate": 7.446151993136779e-06, "loss": 1.4708, "step": 34287 }, { "epoch": 2.7, "learning_rate": 7.442306682393639e-06, "loss": 1.4852, "step": 34288 }, { "epoch": 2.7, "learning_rate": 7.4384623395386036e-06, "loss": 1.428, "step": 34289 }, { "epoch": 2.7, "learning_rate": 7.434618964597733e-06, "loss": 1.4733, "step": 34290 }, { "epoch": 2.7, "learning_rate": 7.43077655759709e-06, "loss": 1.4596, "step": 34291 }, { "epoch": 2.7, "learning_rate": 7.426935118562838e-06, "loss": 1.4681, "step": 34292 }, { "epoch": 2.7, "learning_rate": 7.423094647521005e-06, "loss": 1.5197, "step": 34293 }, { "epoch": 2.7, "learning_rate": 7.419255144497688e-06, "loss": 1.4142, "step": 34294 }, { "epoch": 2.7, "learning_rate": 7.415416609518915e-06, "loss": 1.4315, "step": 34295 }, { "epoch": 2.7, "learning_rate": 7.411579042610799e-06, "loss": 1.4475, "step": 34296 }, { "epoch": 2.7, "learning_rate": 7.407742443799386e-06, "loss": 1.5093, "step": 34297 }, { "epoch": 2.7, "learning_rate": 7.403906813110688e-06, "loss": 1.4151, "step": 34298 }, { "epoch": 2.7, "learning_rate": 7.400072150570785e-06, "loss": 1.4439, "step": 34299 }, { "epoch": 2.7, "learning_rate": 7.3962384562057055e-06, "loss": 1.4239, "step": 34300 }, { "epoch": 2.7, "learning_rate": 7.392405730041462e-06, "loss": 1.458, "step": 34301 }, { "epoch": 2.7, "learning_rate": 7.388573972104067e-06, "loss": 1.4718, "step": 34302 }, { "epoch": 2.7, "learning_rate": 7.384743182419584e-06, "loss": 1.4661, "step": 34303 }, { "epoch": 2.7, "learning_rate": 7.38091336101399e-06, "loss": 1.4426, "step": 34304 }, { "epoch": 2.7, "learning_rate": 7.3770845079132835e-06, "loss": 1.4188, "step": 34305 }, { "epoch": 2.7, "learning_rate": 7.373256623143476e-06, "loss": 1.4922, "step": 34306 }, { "epoch": 2.7, "learning_rate": 7.369429706730545e-06, "loss": 1.4861, "step": 34307 }, { "epoch": 2.7, "learning_rate": 7.365603758700456e-06, "loss": 1.4668, "step": 34308 }, { "epoch": 2.7, "learning_rate": 7.361778779079236e-06, "loss": 1.4323, "step": 34309 }, { "epoch": 2.7, "learning_rate": 7.3579547678928155e-06, "loss": 1.4543, "step": 34310 }, { "epoch": 2.7, "learning_rate": 7.354131725167172e-06, "loss": 1.472, "step": 34311 }, { "epoch": 2.7, "learning_rate": 7.350309650928238e-06, "loss": 1.389, "step": 34312 }, { "epoch": 2.7, "learning_rate": 7.3464885452019896e-06, "loss": 1.3844, "step": 34313 }, { "epoch": 2.7, "learning_rate": 7.342668408014357e-06, "loss": 1.4205, "step": 34314 }, { "epoch": 2.7, "learning_rate": 7.33884923939127e-06, "loss": 1.4407, "step": 34315 }, { "epoch": 2.7, "learning_rate": 7.335031039358674e-06, "loss": 1.4669, "step": 34316 }, { "epoch": 2.7, "learning_rate": 7.331213807942499e-06, "loss": 1.4685, "step": 34317 }, { "epoch": 2.7, "learning_rate": 7.327397545168656e-06, "loss": 1.4783, "step": 34318 }, { "epoch": 2.7, "learning_rate": 7.323582251063043e-06, "loss": 1.4591, "step": 34319 }, { "epoch": 2.7, "learning_rate": 7.319767925651571e-06, "loss": 1.4139, "step": 34320 }, { "epoch": 2.7, "learning_rate": 7.315954568960153e-06, "loss": 1.4495, "step": 34321 }, { "epoch": 2.7, "learning_rate": 7.312142181014635e-06, "loss": 1.4645, "step": 34322 }, { "epoch": 2.7, "learning_rate": 7.308330761840947e-06, "loss": 1.434, "step": 34323 }, { "epoch": 2.7, "learning_rate": 7.3045203114649506e-06, "loss": 1.4141, "step": 34324 }, { "epoch": 2.7, "learning_rate": 7.300710829912493e-06, "loss": 1.4524, "step": 34325 }, { "epoch": 2.7, "learning_rate": 7.296902317209485e-06, "loss": 1.4236, "step": 34326 }, { "epoch": 2.7, "learning_rate": 7.293094773381775e-06, "loss": 1.4182, "step": 34327 }, { "epoch": 2.7, "learning_rate": 7.289288198455173e-06, "loss": 1.498, "step": 34328 }, { "epoch": 2.7, "learning_rate": 7.285482592455544e-06, "loss": 1.4143, "step": 34329 }, { "epoch": 2.7, "learning_rate": 7.281677955408749e-06, "loss": 1.4968, "step": 34330 }, { "epoch": 2.7, "learning_rate": 7.277874287340602e-06, "loss": 1.4415, "step": 34331 }, { "epoch": 2.7, "learning_rate": 7.274071588276897e-06, "loss": 1.4496, "step": 34332 }, { "epoch": 2.7, "learning_rate": 7.270269858243516e-06, "loss": 1.4497, "step": 34333 }, { "epoch": 2.7, "learning_rate": 7.266469097266237e-06, "loss": 1.424, "step": 34334 }, { "epoch": 2.7, "learning_rate": 7.2626693053708716e-06, "loss": 1.4196, "step": 34335 }, { "epoch": 2.7, "learning_rate": 7.258870482583184e-06, "loss": 1.421, "step": 34336 }, { "epoch": 2.7, "learning_rate": 7.25507262892902e-06, "loss": 1.4492, "step": 34337 }, { "epoch": 2.7, "learning_rate": 7.251275744434126e-06, "loss": 1.4419, "step": 34338 }, { "epoch": 2.7, "learning_rate": 7.247479829124297e-06, "loss": 1.4301, "step": 34339 }, { "epoch": 2.7, "learning_rate": 7.243684883025314e-06, "loss": 1.4191, "step": 34340 }, { "epoch": 2.7, "learning_rate": 7.239890906162921e-06, "loss": 1.4675, "step": 34341 }, { "epoch": 2.7, "learning_rate": 7.236097898562881e-06, "loss": 1.4513, "step": 34342 }, { "epoch": 2.7, "learning_rate": 7.232305860250959e-06, "loss": 1.4544, "step": 34343 }, { "epoch": 2.7, "learning_rate": 7.228514791252898e-06, "loss": 1.431, "step": 34344 }, { "epoch": 2.7, "learning_rate": 7.22472469159443e-06, "loss": 1.5101, "step": 34345 }, { "epoch": 2.7, "learning_rate": 7.2209355613013e-06, "loss": 1.4196, "step": 34346 }, { "epoch": 2.7, "learning_rate": 7.21714740039922e-06, "loss": 1.459, "step": 34347 }, { "epoch": 2.7, "learning_rate": 7.213360208913904e-06, "loss": 1.4564, "step": 34348 }, { "epoch": 2.7, "learning_rate": 7.209573986871065e-06, "loss": 1.4645, "step": 34349 }, { "epoch": 2.7, "learning_rate": 7.205788734296447e-06, "loss": 1.3994, "step": 34350 }, { "epoch": 2.7, "learning_rate": 7.202004451215732e-06, "loss": 1.4744, "step": 34351 }, { "epoch": 2.7, "learning_rate": 7.198221137654597e-06, "loss": 1.3785, "step": 34352 }, { "epoch": 2.7, "learning_rate": 7.194438793638707e-06, "loss": 1.4803, "step": 34353 }, { "epoch": 2.7, "learning_rate": 7.190657419193807e-06, "loss": 1.4479, "step": 34354 }, { "epoch": 2.7, "learning_rate": 7.186877014345526e-06, "loss": 1.462, "step": 34355 }, { "epoch": 2.7, "learning_rate": 7.183097579119513e-06, "loss": 1.4693, "step": 34356 }, { "epoch": 2.7, "learning_rate": 7.179319113541476e-06, "loss": 1.4424, "step": 34357 }, { "epoch": 2.7, "learning_rate": 7.175541617637065e-06, "loss": 1.4041, "step": 34358 }, { "epoch": 2.7, "learning_rate": 7.171765091431874e-06, "loss": 1.4635, "step": 34359 }, { "epoch": 2.7, "learning_rate": 7.167989534951601e-06, "loss": 1.4399, "step": 34360 }, { "epoch": 2.7, "learning_rate": 7.164214948221858e-06, "loss": 1.4221, "step": 34361 }, { "epoch": 2.7, "learning_rate": 7.160441331268257e-06, "loss": 1.4959, "step": 34362 }, { "epoch": 2.7, "learning_rate": 7.156668684116446e-06, "loss": 1.4332, "step": 34363 }, { "epoch": 2.7, "learning_rate": 7.152897006792002e-06, "loss": 1.4939, "step": 34364 }, { "epoch": 2.7, "learning_rate": 7.14912629932059e-06, "loss": 1.43, "step": 34365 }, { "epoch": 2.7, "learning_rate": 7.145356561727755e-06, "loss": 1.4311, "step": 34366 }, { "epoch": 2.7, "learning_rate": 7.141587794039144e-06, "loss": 1.4558, "step": 34367 }, { "epoch": 2.7, "learning_rate": 7.1378199962803025e-06, "loss": 1.5395, "step": 34368 }, { "epoch": 2.7, "learning_rate": 7.134053168476827e-06, "loss": 1.4752, "step": 34369 }, { "epoch": 2.7, "learning_rate": 7.130287310654281e-06, "loss": 1.4175, "step": 34370 }, { "epoch": 2.7, "learning_rate": 7.126522422838243e-06, "loss": 1.3812, "step": 34371 }, { "epoch": 2.7, "learning_rate": 7.1227585050542935e-06, "loss": 1.4671, "step": 34372 }, { "epoch": 2.7, "learning_rate": 7.118995557327945e-06, "loss": 1.4731, "step": 34373 }, { "epoch": 2.7, "learning_rate": 7.115233579684776e-06, "loss": 1.463, "step": 34374 }, { "epoch": 2.7, "learning_rate": 7.111472572150334e-06, "loss": 1.445, "step": 34375 }, { "epoch": 2.7, "learning_rate": 7.107712534750115e-06, "loss": 1.4187, "step": 34376 }, { "epoch": 2.7, "learning_rate": 7.103953467509682e-06, "loss": 1.5177, "step": 34377 }, { "epoch": 2.7, "learning_rate": 7.100195370454565e-06, "loss": 1.4026, "step": 34378 }, { "epoch": 2.7, "learning_rate": 7.096438243610242e-06, "loss": 1.4581, "step": 34379 }, { "epoch": 2.71, "learning_rate": 7.092682087002244e-06, "loss": 1.4267, "step": 34380 }, { "epoch": 2.71, "learning_rate": 7.0889269006560835e-06, "loss": 1.4425, "step": 34381 }, { "epoch": 2.71, "learning_rate": 7.08517268459724e-06, "loss": 1.4898, "step": 34382 }, { "epoch": 2.71, "learning_rate": 7.081419438851194e-06, "loss": 1.4447, "step": 34383 }, { "epoch": 2.71, "learning_rate": 7.077667163443457e-06, "loss": 1.4034, "step": 34384 }, { "epoch": 2.71, "learning_rate": 7.073915858399493e-06, "loss": 1.4366, "step": 34385 }, { "epoch": 2.71, "learning_rate": 7.070165523744747e-06, "loss": 1.4224, "step": 34386 }, { "epoch": 2.71, "learning_rate": 7.066416159504734e-06, "loss": 1.4556, "step": 34387 }, { "epoch": 2.71, "learning_rate": 7.062667765704866e-06, "loss": 1.4341, "step": 34388 }, { "epoch": 2.71, "learning_rate": 7.0589203423706055e-06, "loss": 1.4685, "step": 34389 }, { "epoch": 2.71, "learning_rate": 7.0551738895273655e-06, "loss": 1.4826, "step": 34390 }, { "epoch": 2.71, "learning_rate": 7.051428407200644e-06, "loss": 1.4417, "step": 34391 }, { "epoch": 2.71, "learning_rate": 7.047683895415835e-06, "loss": 1.4074, "step": 34392 }, { "epoch": 2.71, "learning_rate": 7.043940354198335e-06, "loss": 1.4879, "step": 34393 }, { "epoch": 2.71, "learning_rate": 7.040197783573626e-06, "loss": 1.4634, "step": 34394 }, { "epoch": 2.71, "learning_rate": 7.0364561835670516e-06, "loss": 1.4459, "step": 34395 }, { "epoch": 2.71, "learning_rate": 7.03271555420406e-06, "loss": 1.4032, "step": 34396 }, { "epoch": 2.71, "learning_rate": 7.028975895510031e-06, "loss": 1.3912, "step": 34397 }, { "epoch": 2.71, "learning_rate": 7.0252372075103594e-06, "loss": 1.4857, "step": 34398 }, { "epoch": 2.71, "learning_rate": 7.021499490230442e-06, "loss": 1.4302, "step": 34399 }, { "epoch": 2.71, "learning_rate": 7.017762743695627e-06, "loss": 1.4552, "step": 34400 }, { "epoch": 2.71, "learning_rate": 7.014026967931308e-06, "loss": 1.4508, "step": 34401 }, { "epoch": 2.71, "learning_rate": 7.010292162962833e-06, "loss": 1.3938, "step": 34402 }, { "epoch": 2.71, "learning_rate": 7.006558328815548e-06, "loss": 1.4704, "step": 34403 }, { "epoch": 2.71, "learning_rate": 7.00282546551485e-06, "loss": 1.4439, "step": 34404 }, { "epoch": 2.71, "learning_rate": 6.999093573086051e-06, "loss": 1.4194, "step": 34405 }, { "epoch": 2.71, "learning_rate": 6.995362651554498e-06, "loss": 1.4204, "step": 34406 }, { "epoch": 2.71, "learning_rate": 6.9916327009454875e-06, "loss": 1.4517, "step": 34407 }, { "epoch": 2.71, "learning_rate": 6.987903721284399e-06, "loss": 1.4524, "step": 34408 }, { "epoch": 2.71, "learning_rate": 6.984175712596513e-06, "loss": 1.4665, "step": 34409 }, { "epoch": 2.71, "learning_rate": 6.980448674907141e-06, "loss": 1.4458, "step": 34410 }, { "epoch": 2.71, "learning_rate": 6.976722608241597e-06, "loss": 1.4165, "step": 34411 }, { "epoch": 2.71, "learning_rate": 6.9729975126251944e-06, "loss": 1.4713, "step": 34412 }, { "epoch": 2.71, "learning_rate": 6.969273388083213e-06, "loss": 1.4509, "step": 34413 }, { "epoch": 2.71, "learning_rate": 6.9655502346409155e-06, "loss": 1.4205, "step": 34414 }, { "epoch": 2.71, "learning_rate": 6.9618280523236145e-06, "loss": 1.456, "step": 34415 }, { "epoch": 2.71, "learning_rate": 6.958106841156574e-06, "loss": 1.414, "step": 34416 }, { "epoch": 2.71, "learning_rate": 6.954386601165024e-06, "loss": 1.448, "step": 34417 }, { "epoch": 2.71, "learning_rate": 6.950667332374277e-06, "loss": 1.446, "step": 34418 }, { "epoch": 2.71, "learning_rate": 6.946949034809546e-06, "loss": 1.3927, "step": 34419 }, { "epoch": 2.71, "learning_rate": 6.943231708496078e-06, "loss": 1.3902, "step": 34420 }, { "epoch": 2.71, "learning_rate": 6.939515353459135e-06, "loss": 1.4326, "step": 34421 }, { "epoch": 2.71, "learning_rate": 6.935799969723949e-06, "loss": 1.4442, "step": 34422 }, { "epoch": 2.71, "learning_rate": 6.932085557315714e-06, "loss": 1.4567, "step": 34423 }, { "epoch": 2.71, "learning_rate": 6.928372116259662e-06, "loss": 1.4171, "step": 34424 }, { "epoch": 2.71, "learning_rate": 6.924659646581021e-06, "loss": 1.4447, "step": 34425 }, { "epoch": 2.71, "learning_rate": 6.920948148304972e-06, "loss": 1.4648, "step": 34426 }, { "epoch": 2.71, "learning_rate": 6.917237621456745e-06, "loss": 1.4578, "step": 34427 }, { "epoch": 2.71, "learning_rate": 6.913528066061485e-06, "loss": 1.4919, "step": 34428 }, { "epoch": 2.71, "learning_rate": 6.909819482144441e-06, "loss": 1.45, "step": 34429 }, { "epoch": 2.71, "learning_rate": 6.906111869730741e-06, "loss": 1.4477, "step": 34430 }, { "epoch": 2.71, "learning_rate": 6.902405228845581e-06, "loss": 1.4273, "step": 34431 }, { "epoch": 2.71, "learning_rate": 6.898699559514126e-06, "loss": 1.458, "step": 34432 }, { "epoch": 2.71, "learning_rate": 6.8949948617615215e-06, "loss": 1.4557, "step": 34433 }, { "epoch": 2.71, "learning_rate": 6.891291135612931e-06, "loss": 1.4482, "step": 34434 }, { "epoch": 2.71, "learning_rate": 6.8875883810935175e-06, "loss": 1.4131, "step": 34435 }, { "epoch": 2.71, "learning_rate": 6.883886598228394e-06, "loss": 1.4079, "step": 34436 }, { "epoch": 2.71, "learning_rate": 6.880185787042674e-06, "loss": 1.4545, "step": 34437 }, { "epoch": 2.71, "learning_rate": 6.876485947561555e-06, "loss": 1.4438, "step": 34438 }, { "epoch": 2.71, "learning_rate": 6.872787079810099e-06, "loss": 1.433, "step": 34439 }, { "epoch": 2.71, "learning_rate": 6.8690891838134365e-06, "loss": 1.3952, "step": 34440 }, { "epoch": 2.71, "learning_rate": 6.865392259596647e-06, "loss": 1.4215, "step": 34441 }, { "epoch": 2.71, "learning_rate": 6.861696307184878e-06, "loss": 1.4065, "step": 34442 }, { "epoch": 2.71, "learning_rate": 6.858001326603191e-06, "loss": 1.4092, "step": 34443 }, { "epoch": 2.71, "learning_rate": 6.854307317876684e-06, "loss": 1.4319, "step": 34444 }, { "epoch": 2.71, "learning_rate": 6.850614281030453e-06, "loss": 1.4358, "step": 34445 }, { "epoch": 2.71, "learning_rate": 6.8469222160895455e-06, "loss": 1.5018, "step": 34446 }, { "epoch": 2.71, "learning_rate": 6.84323112307904e-06, "loss": 1.4493, "step": 34447 }, { "epoch": 2.71, "learning_rate": 6.839541002023985e-06, "loss": 1.4906, "step": 34448 }, { "epoch": 2.71, "learning_rate": 6.835851852949459e-06, "loss": 1.4467, "step": 34449 }, { "epoch": 2.71, "learning_rate": 6.8321636758804925e-06, "loss": 1.4993, "step": 34450 }, { "epoch": 2.71, "learning_rate": 6.8284764708421146e-06, "loss": 1.4103, "step": 34451 }, { "epoch": 2.71, "learning_rate": 6.824790237859374e-06, "loss": 1.5089, "step": 34452 }, { "epoch": 2.71, "learning_rate": 6.821104976957314e-06, "loss": 1.4423, "step": 34453 }, { "epoch": 2.71, "learning_rate": 6.817420688160918e-06, "loss": 1.462, "step": 34454 }, { "epoch": 2.71, "learning_rate": 6.813737371495231e-06, "loss": 1.47, "step": 34455 }, { "epoch": 2.71, "learning_rate": 6.810055026985267e-06, "loss": 1.4149, "step": 34456 }, { "epoch": 2.71, "learning_rate": 6.806373654655972e-06, "loss": 1.4315, "step": 34457 }, { "epoch": 2.71, "learning_rate": 6.802693254532393e-06, "loss": 1.4478, "step": 34458 }, { "epoch": 2.71, "learning_rate": 6.79901382663951e-06, "loss": 1.3967, "step": 34459 }, { "epoch": 2.71, "learning_rate": 6.795335371002303e-06, "loss": 1.4379, "step": 34460 }, { "epoch": 2.71, "learning_rate": 6.791657887645735e-06, "loss": 1.3921, "step": 34461 }, { "epoch": 2.71, "learning_rate": 6.787981376594787e-06, "loss": 1.3803, "step": 34462 }, { "epoch": 2.71, "learning_rate": 6.784305837874421e-06, "loss": 1.4733, "step": 34463 }, { "epoch": 2.71, "learning_rate": 6.780631271509585e-06, "loss": 1.4698, "step": 34464 }, { "epoch": 2.71, "learning_rate": 6.776957677525208e-06, "loss": 1.407, "step": 34465 }, { "epoch": 2.71, "learning_rate": 6.77328505594627e-06, "loss": 1.4815, "step": 34466 }, { "epoch": 2.71, "learning_rate": 6.769613406797686e-06, "loss": 1.4782, "step": 34467 }, { "epoch": 2.71, "learning_rate": 6.765942730104368e-06, "loss": 1.442, "step": 34468 }, { "epoch": 2.71, "learning_rate": 6.76227302589128e-06, "loss": 1.4621, "step": 34469 }, { "epoch": 2.71, "learning_rate": 6.758604294183301e-06, "loss": 1.4372, "step": 34470 }, { "epoch": 2.71, "learning_rate": 6.754936535005328e-06, "loss": 1.4523, "step": 34471 }, { "epoch": 2.71, "learning_rate": 6.751269748382326e-06, "loss": 1.4718, "step": 34472 }, { "epoch": 2.71, "learning_rate": 6.747603934339141e-06, "loss": 1.4275, "step": 34473 }, { "epoch": 2.71, "learning_rate": 6.743939092900652e-06, "loss": 1.4685, "step": 34474 }, { "epoch": 2.71, "learning_rate": 6.740275224091773e-06, "loss": 1.4692, "step": 34475 }, { "epoch": 2.71, "learning_rate": 6.7366123279373685e-06, "loss": 1.4013, "step": 34476 }, { "epoch": 2.71, "learning_rate": 6.732950404462317e-06, "loss": 1.4614, "step": 34477 }, { "epoch": 2.71, "learning_rate": 6.72928945369145e-06, "loss": 1.4777, "step": 34478 }, { "epoch": 2.71, "learning_rate": 6.725629475649663e-06, "loss": 1.4759, "step": 34479 }, { "epoch": 2.71, "learning_rate": 6.721970470361787e-06, "loss": 1.4394, "step": 34480 }, { "epoch": 2.71, "learning_rate": 6.718312437852669e-06, "loss": 1.4292, "step": 34481 }, { "epoch": 2.71, "learning_rate": 6.714655378147121e-06, "loss": 1.443, "step": 34482 }, { "epoch": 2.71, "learning_rate": 6.7109992912700085e-06, "loss": 1.429, "step": 34483 }, { "epoch": 2.71, "learning_rate": 6.707344177246126e-06, "loss": 1.4948, "step": 34484 }, { "epoch": 2.71, "learning_rate": 6.70369003610029e-06, "loss": 1.5056, "step": 34485 }, { "epoch": 2.71, "learning_rate": 6.700036867857345e-06, "loss": 1.4856, "step": 34486 }, { "epoch": 2.71, "learning_rate": 6.696384672542071e-06, "loss": 1.4083, "step": 34487 }, { "epoch": 2.71, "learning_rate": 6.6927334501792325e-06, "loss": 1.4669, "step": 34488 }, { "epoch": 2.71, "learning_rate": 6.68908320079366e-06, "loss": 1.4412, "step": 34489 }, { "epoch": 2.71, "learning_rate": 6.68543392441015e-06, "loss": 1.4544, "step": 34490 }, { "epoch": 2.71, "learning_rate": 6.681785621053448e-06, "loss": 1.4418, "step": 34491 }, { "epoch": 2.71, "learning_rate": 6.678138290748319e-06, "loss": 1.5232, "step": 34492 }, { "epoch": 2.71, "learning_rate": 6.67449193351956e-06, "loss": 1.449, "step": 34493 }, { "epoch": 2.71, "learning_rate": 6.670846549391901e-06, "loss": 1.4011, "step": 34494 }, { "epoch": 2.71, "learning_rate": 6.667202138390071e-06, "loss": 1.4391, "step": 34495 }, { "epoch": 2.71, "learning_rate": 6.663558700538885e-06, "loss": 1.4542, "step": 34496 }, { "epoch": 2.71, "learning_rate": 6.6599162358630055e-06, "loss": 1.4304, "step": 34497 }, { "epoch": 2.71, "learning_rate": 6.6562747443871965e-06, "loss": 1.4697, "step": 34498 }, { "epoch": 2.71, "learning_rate": 6.652634226136188e-06, "loss": 1.4422, "step": 34499 }, { "epoch": 2.71, "learning_rate": 6.648994681134695e-06, "loss": 1.479, "step": 34500 }, { "epoch": 2.71, "learning_rate": 6.6453561094074125e-06, "loss": 1.4352, "step": 34501 }, { "epoch": 2.71, "learning_rate": 6.641718510979039e-06, "loss": 1.4644, "step": 34502 }, { "epoch": 2.71, "learning_rate": 6.638081885874303e-06, "loss": 1.4196, "step": 34503 }, { "epoch": 2.71, "learning_rate": 6.634446234117868e-06, "loss": 1.473, "step": 34504 }, { "epoch": 2.71, "learning_rate": 6.630811555734416e-06, "loss": 1.4579, "step": 34505 }, { "epoch": 2.71, "learning_rate": 6.627177850748644e-06, "loss": 1.4674, "step": 34506 }, { "epoch": 2.72, "learning_rate": 6.623545119185214e-06, "loss": 1.5135, "step": 34507 }, { "epoch": 2.72, "learning_rate": 6.6199133610688075e-06, "loss": 1.4784, "step": 34508 }, { "epoch": 2.72, "learning_rate": 6.6162825764240365e-06, "loss": 1.4553, "step": 34509 }, { "epoch": 2.72, "learning_rate": 6.612652765275617e-06, "loss": 1.4182, "step": 34510 }, { "epoch": 2.72, "learning_rate": 6.6090239276481435e-06, "loss": 1.4985, "step": 34511 }, { "epoch": 2.72, "learning_rate": 6.605396063566248e-06, "loss": 1.3949, "step": 34512 }, { "epoch": 2.72, "learning_rate": 6.601769173054611e-06, "loss": 1.4572, "step": 34513 }, { "epoch": 2.72, "learning_rate": 6.598143256137811e-06, "loss": 1.4106, "step": 34514 }, { "epoch": 2.72, "learning_rate": 6.59451831284048e-06, "loss": 1.4571, "step": 34515 }, { "epoch": 2.72, "learning_rate": 6.590894343187247e-06, "loss": 1.4878, "step": 34516 }, { "epoch": 2.72, "learning_rate": 6.587271347202694e-06, "loss": 1.4518, "step": 34517 }, { "epoch": 2.72, "learning_rate": 6.5836493249114334e-06, "loss": 1.4516, "step": 34518 }, { "epoch": 2.72, "learning_rate": 6.580028276338028e-06, "loss": 1.4121, "step": 34519 }, { "epoch": 2.72, "learning_rate": 6.576408201507111e-06, "loss": 1.4563, "step": 34520 }, { "epoch": 2.72, "learning_rate": 6.572789100443193e-06, "loss": 1.4205, "step": 34521 }, { "epoch": 2.72, "learning_rate": 6.56917097317094e-06, "loss": 1.4766, "step": 34522 }, { "epoch": 2.72, "learning_rate": 6.565553819714814e-06, "loss": 1.4556, "step": 34523 }, { "epoch": 2.72, "learning_rate": 6.561937640099463e-06, "loss": 1.4466, "step": 34524 }, { "epoch": 2.72, "learning_rate": 6.5583224343494005e-06, "loss": 1.389, "step": 34525 }, { "epoch": 2.72, "learning_rate": 6.5547082024891395e-06, "loss": 1.4704, "step": 34526 }, { "epoch": 2.72, "learning_rate": 6.551094944543278e-06, "loss": 1.4355, "step": 34527 }, { "epoch": 2.72, "learning_rate": 6.547482660536313e-06, "loss": 1.491, "step": 34528 }, { "epoch": 2.72, "learning_rate": 6.543871350492758e-06, "loss": 1.4542, "step": 34529 }, { "epoch": 2.72, "learning_rate": 6.540261014437176e-06, "loss": 1.4234, "step": 34530 }, { "epoch": 2.72, "learning_rate": 6.536651652394065e-06, "loss": 1.4619, "step": 34531 }, { "epoch": 2.72, "learning_rate": 6.533043264387888e-06, "loss": 1.448, "step": 34532 }, { "epoch": 2.72, "learning_rate": 6.529435850443193e-06, "loss": 1.4035, "step": 34533 }, { "epoch": 2.72, "learning_rate": 6.52582941058446e-06, "loss": 1.4432, "step": 34534 }, { "epoch": 2.72, "learning_rate": 6.522223944836152e-06, "loss": 1.4531, "step": 34535 }, { "epoch": 2.72, "learning_rate": 6.518619453222751e-06, "loss": 1.423, "step": 34536 }, { "epoch": 2.72, "learning_rate": 6.515015935768769e-06, "loss": 1.4347, "step": 34537 }, { "epoch": 2.72, "learning_rate": 6.5114133924986546e-06, "loss": 1.4056, "step": 34538 }, { "epoch": 2.72, "learning_rate": 6.507811823436854e-06, "loss": 1.4293, "step": 34539 }, { "epoch": 2.72, "learning_rate": 6.504211228607814e-06, "loss": 1.439, "step": 34540 }, { "epoch": 2.72, "learning_rate": 6.5006116080359996e-06, "loss": 1.4474, "step": 34541 }, { "epoch": 2.72, "learning_rate": 6.497012961745856e-06, "loss": 1.4485, "step": 34542 }, { "epoch": 2.72, "learning_rate": 6.493415289761783e-06, "loss": 1.3797, "step": 34543 }, { "epoch": 2.72, "learning_rate": 6.489818592108242e-06, "loss": 1.4351, "step": 34544 }, { "epoch": 2.72, "learning_rate": 6.4862228688096316e-06, "loss": 1.4193, "step": 34545 }, { "epoch": 2.72, "learning_rate": 6.482628119890348e-06, "loss": 1.4613, "step": 34546 }, { "epoch": 2.72, "learning_rate": 6.479034345374856e-06, "loss": 1.4267, "step": 34547 }, { "epoch": 2.72, "learning_rate": 6.475441545287502e-06, "loss": 1.4954, "step": 34548 }, { "epoch": 2.72, "learning_rate": 6.4718497196527e-06, "loss": 1.4752, "step": 34549 }, { "epoch": 2.72, "learning_rate": 6.46825886849483e-06, "loss": 1.4502, "step": 34550 }, { "epoch": 2.72, "learning_rate": 6.46466899183829e-06, "loss": 1.4597, "step": 34551 }, { "epoch": 2.72, "learning_rate": 6.46108008970741e-06, "loss": 1.4514, "step": 34552 }, { "epoch": 2.72, "learning_rate": 6.457492162126587e-06, "loss": 1.4957, "step": 34553 }, { "epoch": 2.72, "learning_rate": 6.453905209120186e-06, "loss": 1.4369, "step": 34554 }, { "epoch": 2.72, "learning_rate": 6.450319230712569e-06, "loss": 1.3752, "step": 34555 }, { "epoch": 2.72, "learning_rate": 6.446734226928052e-06, "loss": 1.4057, "step": 34556 }, { "epoch": 2.72, "learning_rate": 6.4431501977909975e-06, "loss": 1.376, "step": 34557 }, { "epoch": 2.72, "learning_rate": 6.439567143325736e-06, "loss": 1.4295, "step": 34558 }, { "epoch": 2.72, "learning_rate": 6.435985063556598e-06, "loss": 1.4269, "step": 34559 }, { "epoch": 2.72, "learning_rate": 6.432403958507865e-06, "loss": 1.4214, "step": 34560 }, { "epoch": 2.72, "learning_rate": 6.428823828203899e-06, "loss": 1.4885, "step": 34561 }, { "epoch": 2.72, "learning_rate": 6.4252446726689995e-06, "loss": 1.4656, "step": 34562 }, { "epoch": 2.72, "learning_rate": 6.421666491927446e-06, "loss": 1.4528, "step": 34563 }, { "epoch": 2.72, "learning_rate": 6.418089286003552e-06, "loss": 1.4326, "step": 34564 }, { "epoch": 2.72, "learning_rate": 6.414513054921583e-06, "loss": 1.4636, "step": 34565 }, { "epoch": 2.72, "learning_rate": 6.410937798705834e-06, "loss": 1.4155, "step": 34566 }, { "epoch": 2.72, "learning_rate": 6.407363517380587e-06, "loss": 1.4366, "step": 34567 }, { "epoch": 2.72, "learning_rate": 6.403790210970089e-06, "loss": 1.4454, "step": 34568 }, { "epoch": 2.72, "learning_rate": 6.400217879498637e-06, "loss": 1.4951, "step": 34569 }, { "epoch": 2.72, "learning_rate": 6.396646522990429e-06, "loss": 1.448, "step": 34570 }, { "epoch": 2.72, "learning_rate": 6.393076141469778e-06, "loss": 1.4209, "step": 34571 }, { "epoch": 2.72, "learning_rate": 6.389506734960881e-06, "loss": 1.4974, "step": 34572 }, { "epoch": 2.72, "learning_rate": 6.385938303487953e-06, "loss": 1.5042, "step": 34573 }, { "epoch": 2.72, "learning_rate": 6.382370847075291e-06, "loss": 1.427, "step": 34574 }, { "epoch": 2.72, "learning_rate": 6.378804365747059e-06, "loss": 1.4467, "step": 34575 }, { "epoch": 2.72, "learning_rate": 6.375238859527504e-06, "loss": 1.3962, "step": 34576 }, { "epoch": 2.72, "learning_rate": 6.37167432844079e-06, "loss": 1.4995, "step": 34577 }, { "epoch": 2.72, "learning_rate": 6.368110772511165e-06, "loss": 1.4292, "step": 34578 }, { "epoch": 2.72, "learning_rate": 6.364548191762808e-06, "loss": 1.4152, "step": 34579 }, { "epoch": 2.72, "learning_rate": 6.360986586219885e-06, "loss": 1.4164, "step": 34580 }, { "epoch": 2.72, "learning_rate": 6.357425955906609e-06, "loss": 1.4374, "step": 34581 }, { "epoch": 2.72, "learning_rate": 6.3538663008471435e-06, "loss": 1.3796, "step": 34582 }, { "epoch": 2.72, "learning_rate": 6.350307621065653e-06, "loss": 1.4724, "step": 34583 }, { "epoch": 2.72, "learning_rate": 6.346749916586286e-06, "loss": 1.4946, "step": 34584 }, { "epoch": 2.72, "learning_rate": 6.3431931874332375e-06, "loss": 1.4671, "step": 34585 }, { "epoch": 2.72, "learning_rate": 6.339637433630624e-06, "loss": 1.4402, "step": 34586 }, { "epoch": 2.72, "learning_rate": 6.3360826552025735e-06, "loss": 1.4166, "step": 34587 }, { "epoch": 2.72, "learning_rate": 6.332528852173269e-06, "loss": 1.4206, "step": 34588 }, { "epoch": 2.72, "learning_rate": 6.328976024566807e-06, "loss": 1.5192, "step": 34589 }, { "epoch": 2.72, "learning_rate": 6.3254241724073005e-06, "loss": 1.4109, "step": 34590 }, { "epoch": 2.72, "learning_rate": 6.321873295718899e-06, "loss": 1.4015, "step": 34591 }, { "epoch": 2.72, "learning_rate": 6.3183233945256814e-06, "loss": 1.465, "step": 34592 }, { "epoch": 2.72, "learning_rate": 6.314774468851763e-06, "loss": 1.4949, "step": 34593 }, { "epoch": 2.72, "learning_rate": 6.3112265187212076e-06, "loss": 1.3748, "step": 34594 }, { "epoch": 2.72, "learning_rate": 6.307679544158145e-06, "loss": 1.4338, "step": 34595 }, { "epoch": 2.72, "learning_rate": 6.304133545186657e-06, "loss": 1.4453, "step": 34596 }, { "epoch": 2.72, "learning_rate": 6.300588521830774e-06, "loss": 1.4318, "step": 34597 }, { "epoch": 2.72, "learning_rate": 6.297044474114627e-06, "loss": 1.4123, "step": 34598 }, { "epoch": 2.72, "learning_rate": 6.293501402062212e-06, "loss": 1.4461, "step": 34599 }, { "epoch": 2.72, "learning_rate": 6.289959305697645e-06, "loss": 1.4518, "step": 34600 }, { "epoch": 2.72, "learning_rate": 6.286418185044922e-06, "loss": 1.4492, "step": 34601 }, { "epoch": 2.72, "learning_rate": 6.282878040128142e-06, "loss": 1.4231, "step": 34602 }, { "epoch": 2.72, "learning_rate": 6.279338870971301e-06, "loss": 1.4173, "step": 34603 }, { "epoch": 2.72, "learning_rate": 6.27580067759843e-06, "loss": 1.4719, "step": 34604 }, { "epoch": 2.72, "learning_rate": 6.272263460033577e-06, "loss": 1.4081, "step": 34605 }, { "epoch": 2.72, "learning_rate": 6.268727218300723e-06, "loss": 1.4715, "step": 34606 }, { "epoch": 2.72, "learning_rate": 6.265191952423898e-06, "loss": 1.4307, "step": 34607 }, { "epoch": 2.72, "learning_rate": 6.2616576624271e-06, "loss": 1.376, "step": 34608 }, { "epoch": 2.72, "learning_rate": 6.258124348334326e-06, "loss": 1.5085, "step": 34609 }, { "epoch": 2.72, "learning_rate": 6.254592010169557e-06, "loss": 1.4376, "step": 34610 }, { "epoch": 2.72, "learning_rate": 6.251060647956807e-06, "loss": 1.448, "step": 34611 }, { "epoch": 2.72, "learning_rate": 6.247530261720007e-06, "loss": 1.4033, "step": 34612 }, { "epoch": 2.72, "learning_rate": 6.244000851483155e-06, "loss": 1.4589, "step": 34613 }, { "epoch": 2.72, "learning_rate": 6.2404724172701984e-06, "loss": 1.4309, "step": 34614 }, { "epoch": 2.72, "learning_rate": 6.236944959105083e-06, "loss": 1.4618, "step": 34615 }, { "epoch": 2.72, "learning_rate": 6.233418477011809e-06, "loss": 1.4296, "step": 34616 }, { "epoch": 2.72, "learning_rate": 6.229892971014289e-06, "loss": 1.4429, "step": 34617 }, { "epoch": 2.72, "learning_rate": 6.22636844113642e-06, "loss": 1.404, "step": 34618 }, { "epoch": 2.72, "learning_rate": 6.222844887402201e-06, "loss": 1.413, "step": 34619 }, { "epoch": 2.72, "learning_rate": 6.219322309835528e-06, "loss": 1.3976, "step": 34620 }, { "epoch": 2.72, "learning_rate": 6.215800708460283e-06, "loss": 1.3982, "step": 34621 }, { "epoch": 2.72, "learning_rate": 6.21228008330043e-06, "loss": 1.4972, "step": 34622 }, { "epoch": 2.72, "learning_rate": 6.208760434379833e-06, "loss": 1.4363, "step": 34623 }, { "epoch": 2.72, "learning_rate": 6.20524176172239e-06, "loss": 1.4251, "step": 34624 }, { "epoch": 2.72, "learning_rate": 6.201724065352032e-06, "loss": 1.4581, "step": 34625 }, { "epoch": 2.72, "learning_rate": 6.198207345292605e-06, "loss": 1.5041, "step": 34626 }, { "epoch": 2.72, "learning_rate": 6.194691601567975e-06, "loss": 1.4212, "step": 34627 }, { "epoch": 2.72, "learning_rate": 6.191176834202038e-06, "loss": 1.5071, "step": 34628 }, { "epoch": 2.72, "learning_rate": 6.187663043218677e-06, "loss": 1.3721, "step": 34629 }, { "epoch": 2.72, "learning_rate": 6.184150228641704e-06, "loss": 1.4427, "step": 34630 }, { "epoch": 2.72, "learning_rate": 6.180638390494952e-06, "loss": 1.4722, "step": 34631 }, { "epoch": 2.72, "learning_rate": 6.177127528802334e-06, "loss": 1.4459, "step": 34632 }, { "epoch": 2.72, "learning_rate": 6.173617643587647e-06, "loss": 1.4705, "step": 34633 }, { "epoch": 2.73, "learning_rate": 6.17010873487474e-06, "loss": 1.4464, "step": 34634 }, { "epoch": 2.73, "learning_rate": 6.166600802687394e-06, "loss": 1.4347, "step": 34635 }, { "epoch": 2.73, "learning_rate": 6.1630938470494715e-06, "loss": 1.4261, "step": 34636 }, { "epoch": 2.73, "learning_rate": 6.159587867984772e-06, "loss": 1.4194, "step": 34637 }, { "epoch": 2.73, "learning_rate": 6.156082865517076e-06, "loss": 1.417, "step": 34638 }, { "epoch": 2.73, "learning_rate": 6.152578839670213e-06, "loss": 1.3872, "step": 34639 }, { "epoch": 2.73, "learning_rate": 6.149075790467967e-06, "loss": 1.4896, "step": 34640 }, { "epoch": 2.73, "learning_rate": 6.145573717934083e-06, "loss": 1.4487, "step": 34641 }, { "epoch": 2.73, "learning_rate": 6.142072622092392e-06, "loss": 1.4166, "step": 34642 }, { "epoch": 2.73, "learning_rate": 6.138572502966643e-06, "loss": 1.4973, "step": 34643 }, { "epoch": 2.73, "learning_rate": 6.135073360580567e-06, "loss": 1.4507, "step": 34644 }, { "epoch": 2.73, "learning_rate": 6.131575194957978e-06, "loss": 1.4464, "step": 34645 }, { "epoch": 2.73, "learning_rate": 6.128078006122588e-06, "loss": 1.4802, "step": 34646 }, { "epoch": 2.73, "learning_rate": 6.124581794098166e-06, "loss": 1.4351, "step": 34647 }, { "epoch": 2.73, "learning_rate": 6.121086558908406e-06, "loss": 1.4304, "step": 34648 }, { "epoch": 2.73, "learning_rate": 6.1175923005771065e-06, "loss": 1.4809, "step": 34649 }, { "epoch": 2.73, "learning_rate": 6.114099019127949e-06, "loss": 1.4723, "step": 34650 }, { "epoch": 2.73, "learning_rate": 6.110606714584648e-06, "loss": 1.4188, "step": 34651 }, { "epoch": 2.73, "learning_rate": 6.1071153869709175e-06, "loss": 1.428, "step": 34652 }, { "epoch": 2.73, "learning_rate": 6.103625036310472e-06, "loss": 1.4695, "step": 34653 }, { "epoch": 2.73, "learning_rate": 6.10013566262701e-06, "loss": 1.5068, "step": 34654 }, { "epoch": 2.73, "learning_rate": 6.09664726594421e-06, "loss": 1.4356, "step": 34655 }, { "epoch": 2.73, "learning_rate": 6.093159846285756e-06, "loss": 1.4831, "step": 34656 }, { "epoch": 2.73, "learning_rate": 6.08967340367536e-06, "loss": 1.413, "step": 34657 }, { "epoch": 2.73, "learning_rate": 6.086187938136622e-06, "loss": 1.4548, "step": 34658 }, { "epoch": 2.73, "learning_rate": 6.082703449693288e-06, "loss": 1.4662, "step": 34659 }, { "epoch": 2.73, "learning_rate": 6.079219938368957e-06, "loss": 1.4181, "step": 34660 }, { "epoch": 2.73, "learning_rate": 6.0757374041872915e-06, "loss": 1.4275, "step": 34661 }, { "epoch": 2.73, "learning_rate": 6.072255847171959e-06, "loss": 1.4123, "step": 34662 }, { "epoch": 2.73, "learning_rate": 6.068775267346588e-06, "loss": 1.4265, "step": 34663 }, { "epoch": 2.73, "learning_rate": 6.065295664734809e-06, "loss": 1.4594, "step": 34664 }, { "epoch": 2.73, "learning_rate": 6.061817039360223e-06, "loss": 1.4461, "step": 34665 }, { "epoch": 2.73, "learning_rate": 6.058339391246475e-06, "loss": 1.4537, "step": 34666 }, { "epoch": 2.73, "learning_rate": 6.05486272041718e-06, "loss": 1.4141, "step": 34667 }, { "epoch": 2.73, "learning_rate": 6.051387026895921e-06, "loss": 1.4584, "step": 34668 }, { "epoch": 2.73, "learning_rate": 6.0479123107063096e-06, "loss": 1.4529, "step": 34669 }, { "epoch": 2.73, "learning_rate": 6.044438571871945e-06, "loss": 1.5105, "step": 34670 }, { "epoch": 2.73, "learning_rate": 6.040965810416393e-06, "loss": 1.4357, "step": 34671 }, { "epoch": 2.73, "learning_rate": 6.037494026363232e-06, "loss": 1.409, "step": 34672 }, { "epoch": 2.73, "learning_rate": 6.034023219736045e-06, "loss": 1.4056, "step": 34673 }, { "epoch": 2.73, "learning_rate": 6.0305533905584124e-06, "loss": 1.4688, "step": 34674 }, { "epoch": 2.73, "learning_rate": 6.027084538853833e-06, "loss": 1.4914, "step": 34675 }, { "epoch": 2.73, "learning_rate": 6.023616664645936e-06, "loss": 1.4147, "step": 34676 }, { "epoch": 2.73, "learning_rate": 6.020149767958221e-06, "loss": 1.4615, "step": 34677 }, { "epoch": 2.73, "learning_rate": 6.016683848814219e-06, "loss": 1.4636, "step": 34678 }, { "epoch": 2.73, "learning_rate": 6.013218907237477e-06, "loss": 1.4264, "step": 34679 }, { "epoch": 2.73, "learning_rate": 6.009754943251527e-06, "loss": 1.524, "step": 34680 }, { "epoch": 2.73, "learning_rate": 6.006291956879899e-06, "loss": 1.413, "step": 34681 }, { "epoch": 2.73, "learning_rate": 6.00282994814606e-06, "loss": 1.4792, "step": 34682 }, { "epoch": 2.73, "learning_rate": 5.999368917073555e-06, "loss": 1.4809, "step": 34683 }, { "epoch": 2.73, "learning_rate": 5.995908863685866e-06, "loss": 1.4773, "step": 34684 }, { "epoch": 2.73, "learning_rate": 5.992449788006476e-06, "loss": 1.4357, "step": 34685 }, { "epoch": 2.73, "learning_rate": 5.988991690058914e-06, "loss": 1.491, "step": 34686 }, { "epoch": 2.73, "learning_rate": 5.985534569866612e-06, "loss": 1.4455, "step": 34687 }, { "epoch": 2.73, "learning_rate": 5.982078427453052e-06, "loss": 1.3941, "step": 34688 }, { "epoch": 2.73, "learning_rate": 5.978623262841697e-06, "loss": 1.4772, "step": 34689 }, { "epoch": 2.73, "learning_rate": 5.9751690760560135e-06, "loss": 1.4068, "step": 34690 }, { "epoch": 2.73, "learning_rate": 5.971715867119465e-06, "loss": 1.4668, "step": 34691 }, { "epoch": 2.73, "learning_rate": 5.9682636360554645e-06, "loss": 1.4342, "step": 34692 }, { "epoch": 2.73, "learning_rate": 5.964812382887496e-06, "loss": 1.4365, "step": 34693 }, { "epoch": 2.73, "learning_rate": 5.96136210763894e-06, "loss": 1.4237, "step": 34694 }, { "epoch": 2.73, "learning_rate": 5.957912810333276e-06, "loss": 1.4434, "step": 34695 }, { "epoch": 2.73, "learning_rate": 5.954464490993871e-06, "loss": 1.4444, "step": 34696 }, { "epoch": 2.73, "learning_rate": 5.951017149644172e-06, "loss": 1.4151, "step": 34697 }, { "epoch": 2.73, "learning_rate": 5.9475707863075764e-06, "loss": 1.4465, "step": 34698 }, { "epoch": 2.73, "learning_rate": 5.9441254010074654e-06, "loss": 1.4463, "step": 34699 }, { "epoch": 2.73, "learning_rate": 5.940680993767272e-06, "loss": 1.4541, "step": 34700 }, { "epoch": 2.73, "learning_rate": 5.937237564610342e-06, "loss": 1.4691, "step": 34701 }, { "epoch": 2.73, "learning_rate": 5.933795113560058e-06, "loss": 1.4606, "step": 34702 }, { "epoch": 2.73, "learning_rate": 5.930353640639818e-06, "loss": 1.4659, "step": 34703 }, { "epoch": 2.73, "learning_rate": 5.926913145872969e-06, "loss": 1.4433, "step": 34704 }, { "epoch": 2.73, "learning_rate": 5.923473629282877e-06, "loss": 1.4543, "step": 34705 }, { "epoch": 2.73, "learning_rate": 5.920035090892872e-06, "loss": 1.4313, "step": 34706 }, { "epoch": 2.73, "learning_rate": 5.916597530726352e-06, "loss": 1.4593, "step": 34707 }, { "epoch": 2.73, "learning_rate": 5.9131609488066005e-06, "loss": 1.4669, "step": 34708 }, { "epoch": 2.73, "learning_rate": 5.909725345156946e-06, "loss": 1.3997, "step": 34709 }, { "epoch": 2.73, "learning_rate": 5.906290719800788e-06, "loss": 1.4443, "step": 34710 }, { "epoch": 2.73, "learning_rate": 5.902857072761374e-06, "loss": 1.4755, "step": 34711 }, { "epoch": 2.73, "learning_rate": 5.8994244040620695e-06, "loss": 1.429, "step": 34712 }, { "epoch": 2.73, "learning_rate": 5.8959927137261055e-06, "loss": 1.4384, "step": 34713 }, { "epoch": 2.73, "learning_rate": 5.892562001776863e-06, "loss": 1.4157, "step": 34714 }, { "epoch": 2.73, "learning_rate": 5.889132268237606e-06, "loss": 1.4963, "step": 34715 }, { "epoch": 2.73, "learning_rate": 5.885703513131585e-06, "loss": 1.457, "step": 34716 }, { "epoch": 2.73, "learning_rate": 5.882275736482128e-06, "loss": 1.432, "step": 34717 }, { "epoch": 2.73, "learning_rate": 5.878848938312486e-06, "loss": 1.4148, "step": 34718 }, { "epoch": 2.73, "learning_rate": 5.875423118645906e-06, "loss": 1.4379, "step": 34719 }, { "epoch": 2.73, "learning_rate": 5.871998277505685e-06, "loss": 1.4991, "step": 34720 }, { "epoch": 2.73, "learning_rate": 5.868574414915072e-06, "loss": 1.4457, "step": 34721 }, { "epoch": 2.73, "learning_rate": 5.865151530897283e-06, "loss": 1.4592, "step": 34722 }, { "epoch": 2.73, "learning_rate": 5.8617296254755805e-06, "loss": 1.4435, "step": 34723 }, { "epoch": 2.73, "learning_rate": 5.8583086986731975e-06, "loss": 1.4764, "step": 34724 }, { "epoch": 2.73, "learning_rate": 5.854888750513331e-06, "loss": 1.4419, "step": 34725 }, { "epoch": 2.73, "learning_rate": 5.85146978101923e-06, "loss": 1.4552, "step": 34726 }, { "epoch": 2.73, "learning_rate": 5.8480517902141255e-06, "loss": 1.5081, "step": 34727 }, { "epoch": 2.73, "learning_rate": 5.844634778121182e-06, "loss": 1.4227, "step": 34728 }, { "epoch": 2.73, "learning_rate": 5.841218744763632e-06, "loss": 1.4012, "step": 34729 }, { "epoch": 2.73, "learning_rate": 5.8378036901646385e-06, "loss": 1.4672, "step": 34730 }, { "epoch": 2.73, "learning_rate": 5.8343896143474015e-06, "loss": 1.4308, "step": 34731 }, { "epoch": 2.73, "learning_rate": 5.8309765173351176e-06, "loss": 1.4567, "step": 34732 }, { "epoch": 2.73, "learning_rate": 5.827564399150919e-06, "loss": 1.4159, "step": 34733 }, { "epoch": 2.73, "learning_rate": 5.82415325981802e-06, "loss": 1.4251, "step": 34734 }, { "epoch": 2.73, "learning_rate": 5.820743099359554e-06, "loss": 1.4696, "step": 34735 }, { "epoch": 2.73, "learning_rate": 5.817333917798667e-06, "loss": 1.4247, "step": 34736 }, { "epoch": 2.73, "learning_rate": 5.813925715158524e-06, "loss": 1.4106, "step": 34737 }, { "epoch": 2.73, "learning_rate": 5.810518491462257e-06, "loss": 1.4879, "step": 34738 }, { "epoch": 2.73, "learning_rate": 5.807112246732998e-06, "loss": 1.4542, "step": 34739 }, { "epoch": 2.73, "learning_rate": 5.8037069809938775e-06, "loss": 1.4501, "step": 34740 }, { "epoch": 2.73, "learning_rate": 5.8003026942679945e-06, "loss": 1.4346, "step": 34741 }, { "epoch": 2.73, "learning_rate": 5.796899386578496e-06, "loss": 1.4339, "step": 34742 }, { "epoch": 2.73, "learning_rate": 5.7934970579484655e-06, "loss": 1.4394, "step": 34743 }, { "epoch": 2.73, "learning_rate": 5.790095708401016e-06, "loss": 1.4495, "step": 34744 }, { "epoch": 2.73, "learning_rate": 5.7866953379592465e-06, "loss": 1.421, "step": 34745 }, { "epoch": 2.73, "learning_rate": 5.783295946646221e-06, "loss": 1.4389, "step": 34746 }, { "epoch": 2.73, "learning_rate": 5.779897534485023e-06, "loss": 1.4304, "step": 34747 }, { "epoch": 2.73, "learning_rate": 5.776500101498749e-06, "loss": 1.4462, "step": 34748 }, { "epoch": 2.73, "learning_rate": 5.773103647710447e-06, "loss": 1.3992, "step": 34749 }, { "epoch": 2.73, "learning_rate": 5.769708173143167e-06, "loss": 1.402, "step": 34750 }, { "epoch": 2.73, "learning_rate": 5.7663136778199894e-06, "loss": 1.4633, "step": 34751 }, { "epoch": 2.73, "learning_rate": 5.762920161763945e-06, "loss": 1.4519, "step": 34752 }, { "epoch": 2.73, "learning_rate": 5.759527624998067e-06, "loss": 1.5026, "step": 34753 }, { "epoch": 2.73, "learning_rate": 5.756136067545402e-06, "loss": 1.4644, "step": 34754 }, { "epoch": 2.73, "learning_rate": 5.752745489428983e-06, "loss": 1.4358, "step": 34755 }, { "epoch": 2.73, "learning_rate": 5.749355890671791e-06, "loss": 1.4519, "step": 34756 }, { "epoch": 2.73, "learning_rate": 5.745967271296892e-06, "loss": 1.4347, "step": 34757 }, { "epoch": 2.73, "learning_rate": 5.742579631327266e-06, "loss": 1.4307, "step": 34758 }, { "epoch": 2.73, "learning_rate": 5.739192970785928e-06, "loss": 1.4571, "step": 34759 }, { "epoch": 2.73, "learning_rate": 5.735807289695826e-06, "loss": 1.4613, "step": 34760 }, { "epoch": 2.74, "learning_rate": 5.7324225880800105e-06, "loss": 1.3896, "step": 34761 }, { "epoch": 2.74, "learning_rate": 5.729038865961444e-06, "loss": 1.4813, "step": 34762 }, { "epoch": 2.74, "learning_rate": 5.725656123363043e-06, "loss": 1.4754, "step": 34763 }, { "epoch": 2.74, "learning_rate": 5.7222743603078545e-06, "loss": 1.4646, "step": 34764 }, { "epoch": 2.74, "learning_rate": 5.7188935768188115e-06, "loss": 1.4941, "step": 34765 }, { "epoch": 2.74, "learning_rate": 5.7155137729188445e-06, "loss": 1.4469, "step": 34766 }, { "epoch": 2.74, "learning_rate": 5.712134948630903e-06, "loss": 1.4651, "step": 34767 }, { "epoch": 2.74, "learning_rate": 5.7087571039779675e-06, "loss": 1.4727, "step": 34768 }, { "epoch": 2.74, "learning_rate": 5.705380238982937e-06, "loss": 1.4164, "step": 34769 }, { "epoch": 2.74, "learning_rate": 5.702004353668726e-06, "loss": 1.448, "step": 34770 }, { "epoch": 2.74, "learning_rate": 5.6986294480583005e-06, "loss": 1.4283, "step": 34771 }, { "epoch": 2.74, "learning_rate": 5.695255522174524e-06, "loss": 1.4493, "step": 34772 }, { "epoch": 2.74, "learning_rate": 5.691882576040347e-06, "loss": 1.4129, "step": 34773 }, { "epoch": 2.74, "learning_rate": 5.6885106096786315e-06, "loss": 1.4091, "step": 34774 }, { "epoch": 2.74, "learning_rate": 5.685139623112312e-06, "loss": 1.4519, "step": 34775 }, { "epoch": 2.74, "learning_rate": 5.681769616364268e-06, "loss": 1.4464, "step": 34776 }, { "epoch": 2.74, "learning_rate": 5.678400589457333e-06, "loss": 1.4532, "step": 34777 }, { "epoch": 2.74, "learning_rate": 5.6750325424144375e-06, "loss": 1.4354, "step": 34778 }, { "epoch": 2.74, "learning_rate": 5.67166547525843e-06, "loss": 1.4808, "step": 34779 }, { "epoch": 2.74, "learning_rate": 5.668299388012143e-06, "loss": 1.4958, "step": 34780 }, { "epoch": 2.74, "learning_rate": 5.664934280698474e-06, "loss": 1.3468, "step": 34781 }, { "epoch": 2.74, "learning_rate": 5.661570153340239e-06, "loss": 1.5227, "step": 34782 }, { "epoch": 2.74, "learning_rate": 5.658207005960303e-06, "loss": 1.4577, "step": 34783 }, { "epoch": 2.74, "learning_rate": 5.6548448385814795e-06, "loss": 1.4201, "step": 34784 }, { "epoch": 2.74, "learning_rate": 5.651483651226602e-06, "loss": 1.4441, "step": 34785 }, { "epoch": 2.74, "learning_rate": 5.648123443918501e-06, "loss": 1.4428, "step": 34786 }, { "epoch": 2.74, "learning_rate": 5.644764216679959e-06, "loss": 1.4092, "step": 34787 }, { "epoch": 2.74, "learning_rate": 5.641405969533808e-06, "loss": 1.3982, "step": 34788 }, { "epoch": 2.74, "learning_rate": 5.638048702502878e-06, "loss": 1.4666, "step": 34789 }, { "epoch": 2.74, "learning_rate": 5.63469241560992e-06, "loss": 1.4631, "step": 34790 }, { "epoch": 2.74, "learning_rate": 5.631337108877715e-06, "loss": 1.4875, "step": 34791 }, { "epoch": 2.74, "learning_rate": 5.627982782329077e-06, "loss": 1.4776, "step": 34792 }, { "epoch": 2.74, "learning_rate": 5.624629435986772e-06, "loss": 1.3966, "step": 34793 }, { "epoch": 2.74, "learning_rate": 5.621277069873531e-06, "loss": 1.4083, "step": 34794 }, { "epoch": 2.74, "learning_rate": 5.61792568401217e-06, "loss": 1.4382, "step": 34795 }, { "epoch": 2.74, "learning_rate": 5.6145752784254205e-06, "loss": 1.4499, "step": 34796 }, { "epoch": 2.74, "learning_rate": 5.611225853135997e-06, "loss": 1.4093, "step": 34797 }, { "epoch": 2.74, "learning_rate": 5.6078774081667e-06, "loss": 1.5057, "step": 34798 }, { "epoch": 2.74, "learning_rate": 5.604529943540226e-06, "loss": 1.4566, "step": 34799 }, { "epoch": 2.74, "learning_rate": 5.601183459279307e-06, "loss": 1.4316, "step": 34800 }, { "epoch": 2.74, "learning_rate": 5.5978379554066585e-06, "loss": 1.4668, "step": 34801 }, { "epoch": 2.74, "learning_rate": 5.594493431945013e-06, "loss": 1.4145, "step": 34802 }, { "epoch": 2.74, "learning_rate": 5.5911498889170684e-06, "loss": 1.4624, "step": 34803 }, { "epoch": 2.74, "learning_rate": 5.587807326345506e-06, "loss": 1.4611, "step": 34804 }, { "epoch": 2.74, "learning_rate": 5.584465744253042e-06, "loss": 1.4106, "step": 34805 }, { "epoch": 2.74, "learning_rate": 5.581125142662374e-06, "loss": 1.4765, "step": 34806 }, { "epoch": 2.74, "learning_rate": 5.577785521596184e-06, "loss": 1.4254, "step": 34807 }, { "epoch": 2.74, "learning_rate": 5.574446881077105e-06, "loss": 1.4649, "step": 34808 }, { "epoch": 2.74, "learning_rate": 5.5711092211278344e-06, "loss": 1.4482, "step": 34809 }, { "epoch": 2.74, "learning_rate": 5.567772541771038e-06, "loss": 1.3694, "step": 34810 }, { "epoch": 2.74, "learning_rate": 5.564436843029363e-06, "loss": 1.4689, "step": 34811 }, { "epoch": 2.74, "learning_rate": 5.5611021249254424e-06, "loss": 1.5131, "step": 34812 }, { "epoch": 2.74, "learning_rate": 5.557768387481959e-06, "loss": 1.4212, "step": 34813 }, { "epoch": 2.74, "learning_rate": 5.554435630721477e-06, "loss": 1.4685, "step": 34814 }, { "epoch": 2.74, "learning_rate": 5.5511038546666944e-06, "loss": 1.4932, "step": 34815 }, { "epoch": 2.74, "learning_rate": 5.54777305934021e-06, "loss": 1.4464, "step": 34816 }, { "epoch": 2.74, "learning_rate": 5.544443244764624e-06, "loss": 1.4362, "step": 34817 }, { "epoch": 2.74, "learning_rate": 5.541114410962532e-06, "loss": 1.397, "step": 34818 }, { "epoch": 2.74, "learning_rate": 5.537786557956553e-06, "loss": 1.4679, "step": 34819 }, { "epoch": 2.74, "learning_rate": 5.534459685769299e-06, "loss": 1.4773, "step": 34820 }, { "epoch": 2.74, "learning_rate": 5.531133794423337e-06, "loss": 1.4196, "step": 34821 }, { "epoch": 2.74, "learning_rate": 5.527808883941248e-06, "loss": 1.4762, "step": 34822 }, { "epoch": 2.74, "learning_rate": 5.5244849543456314e-06, "loss": 1.4208, "step": 34823 }, { "epoch": 2.74, "learning_rate": 5.521162005659019e-06, "loss": 1.4657, "step": 34824 }, { "epoch": 2.74, "learning_rate": 5.517840037903976e-06, "loss": 1.4029, "step": 34825 }, { "epoch": 2.74, "learning_rate": 5.514519051103083e-06, "loss": 1.4072, "step": 34826 }, { "epoch": 2.74, "learning_rate": 5.511199045278874e-06, "loss": 1.4236, "step": 34827 }, { "epoch": 2.74, "learning_rate": 5.507880020453864e-06, "loss": 1.4357, "step": 34828 }, { "epoch": 2.74, "learning_rate": 5.504561976650635e-06, "loss": 1.4772, "step": 34829 }, { "epoch": 2.74, "learning_rate": 5.501244913891684e-06, "loss": 1.4668, "step": 34830 }, { "epoch": 2.74, "learning_rate": 5.497928832199528e-06, "loss": 1.4294, "step": 34831 }, { "epoch": 2.74, "learning_rate": 5.494613731596714e-06, "loss": 1.4217, "step": 34832 }, { "epoch": 2.74, "learning_rate": 5.491299612105726e-06, "loss": 1.499, "step": 34833 }, { "epoch": 2.74, "learning_rate": 5.487986473749045e-06, "loss": 1.4605, "step": 34834 }, { "epoch": 2.74, "learning_rate": 5.484674316549187e-06, "loss": 1.4791, "step": 34835 }, { "epoch": 2.74, "learning_rate": 5.48136314052865e-06, "loss": 1.4768, "step": 34836 }, { "epoch": 2.74, "learning_rate": 5.478052945709915e-06, "loss": 1.4306, "step": 34837 }, { "epoch": 2.74, "learning_rate": 5.474743732115433e-06, "loss": 1.4141, "step": 34838 }, { "epoch": 2.74, "learning_rate": 5.4714354997677015e-06, "loss": 1.4827, "step": 34839 }, { "epoch": 2.74, "learning_rate": 5.468128248689169e-06, "loss": 1.4549, "step": 34840 }, { "epoch": 2.74, "learning_rate": 5.464821978902268e-06, "loss": 1.53, "step": 34841 }, { "epoch": 2.74, "learning_rate": 5.461516690429463e-06, "loss": 1.4069, "step": 34842 }, { "epoch": 2.74, "learning_rate": 5.45821238329322e-06, "loss": 1.4868, "step": 34843 }, { "epoch": 2.74, "learning_rate": 5.454909057515938e-06, "loss": 1.4606, "step": 34844 }, { "epoch": 2.74, "learning_rate": 5.451606713120033e-06, "loss": 1.4468, "step": 34845 }, { "epoch": 2.74, "learning_rate": 5.448305350127985e-06, "loss": 1.4511, "step": 34846 }, { "epoch": 2.74, "learning_rate": 5.445004968562161e-06, "loss": 1.4547, "step": 34847 }, { "epoch": 2.74, "learning_rate": 5.441705568444976e-06, "loss": 1.4895, "step": 34848 }, { "epoch": 2.74, "learning_rate": 5.438407149798846e-06, "loss": 1.4391, "step": 34849 }, { "epoch": 2.74, "learning_rate": 5.435109712646152e-06, "loss": 1.4631, "step": 34850 }, { "epoch": 2.74, "learning_rate": 5.431813257009276e-06, "loss": 1.443, "step": 34851 }, { "epoch": 2.74, "learning_rate": 5.428517782910602e-06, "loss": 1.4593, "step": 34852 }, { "epoch": 2.74, "learning_rate": 5.4252232903725265e-06, "loss": 1.4219, "step": 34853 }, { "epoch": 2.74, "learning_rate": 5.4219297794174e-06, "loss": 1.4237, "step": 34854 }, { "epoch": 2.74, "learning_rate": 5.418637250067587e-06, "loss": 1.4354, "step": 34855 }, { "epoch": 2.74, "learning_rate": 5.415345702345436e-06, "loss": 1.4987, "step": 34856 }, { "epoch": 2.74, "learning_rate": 5.412055136273313e-06, "loss": 1.4171, "step": 34857 }, { "epoch": 2.74, "learning_rate": 5.408765551873534e-06, "loss": 1.4567, "step": 34858 }, { "epoch": 2.74, "learning_rate": 5.405476949168447e-06, "loss": 1.4582, "step": 34859 }, { "epoch": 2.74, "learning_rate": 5.402189328180384e-06, "loss": 1.4475, "step": 34860 }, { "epoch": 2.74, "learning_rate": 5.3989026889316444e-06, "loss": 1.4296, "step": 34861 }, { "epoch": 2.74, "learning_rate": 5.39561703144456e-06, "loss": 1.4946, "step": 34862 }, { "epoch": 2.74, "learning_rate": 5.392332355741447e-06, "loss": 1.4535, "step": 34863 }, { "epoch": 2.74, "learning_rate": 5.389048661844603e-06, "loss": 1.4576, "step": 34864 }, { "epoch": 2.74, "learning_rate": 5.385765949776294e-06, "loss": 1.4212, "step": 34865 }, { "epoch": 2.74, "learning_rate": 5.382484219558819e-06, "loss": 1.462, "step": 34866 }, { "epoch": 2.74, "learning_rate": 5.379203471214511e-06, "loss": 1.4893, "step": 34867 }, { "epoch": 2.74, "learning_rate": 5.375923704765583e-06, "loss": 1.4573, "step": 34868 }, { "epoch": 2.74, "learning_rate": 5.372644920234303e-06, "loss": 1.4168, "step": 34869 }, { "epoch": 2.74, "learning_rate": 5.369367117642987e-06, "loss": 1.4126, "step": 34870 }, { "epoch": 2.74, "learning_rate": 5.366090297013847e-06, "loss": 1.4308, "step": 34871 }, { "epoch": 2.74, "learning_rate": 5.3628144583691194e-06, "loss": 1.51, "step": 34872 }, { "epoch": 2.74, "learning_rate": 5.3595396017310835e-06, "loss": 1.4978, "step": 34873 }, { "epoch": 2.74, "learning_rate": 5.356265727121939e-06, "loss": 1.4141, "step": 34874 }, { "epoch": 2.74, "learning_rate": 5.352992834563935e-06, "loss": 1.4328, "step": 34875 }, { "epoch": 2.74, "learning_rate": 5.349720924079287e-06, "loss": 1.479, "step": 34876 }, { "epoch": 2.74, "learning_rate": 5.346449995690227e-06, "loss": 1.4441, "step": 34877 }, { "epoch": 2.74, "learning_rate": 5.343180049418921e-06, "loss": 1.428, "step": 34878 }, { "epoch": 2.74, "learning_rate": 5.339911085287601e-06, "loss": 1.4387, "step": 34879 }, { "epoch": 2.74, "learning_rate": 5.33664310331845e-06, "loss": 1.3907, "step": 34880 }, { "epoch": 2.74, "learning_rate": 5.333376103533682e-06, "loss": 1.5017, "step": 34881 }, { "epoch": 2.74, "learning_rate": 5.33011008595543e-06, "loss": 1.422, "step": 34882 }, { "epoch": 2.74, "learning_rate": 5.326845050605894e-06, "loss": 1.4208, "step": 34883 }, { "epoch": 2.74, "learning_rate": 5.323580997507254e-06, "loss": 1.4244, "step": 34884 }, { "epoch": 2.74, "learning_rate": 5.3203179266816774e-06, "loss": 1.426, "step": 34885 }, { "epoch": 2.74, "learning_rate": 5.317055838151263e-06, "loss": 1.4364, "step": 34886 }, { "epoch": 2.74, "learning_rate": 5.313794731938226e-06, "loss": 1.4413, "step": 34887 }, { "epoch": 2.75, "learning_rate": 5.3105346080646815e-06, "loss": 1.4424, "step": 34888 }, { "epoch": 2.75, "learning_rate": 5.307275466552729e-06, "loss": 1.3684, "step": 34889 }, { "epoch": 2.75, "learning_rate": 5.304017307424552e-06, "loss": 1.3863, "step": 34890 }, { "epoch": 2.75, "learning_rate": 5.300760130702264e-06, "loss": 1.4282, "step": 34891 }, { "epoch": 2.75, "learning_rate": 5.297503936407932e-06, "loss": 1.4289, "step": 34892 }, { "epoch": 2.75, "learning_rate": 5.294248724563704e-06, "loss": 1.4357, "step": 34893 }, { "epoch": 2.75, "learning_rate": 5.290994495191681e-06, "loss": 1.4456, "step": 34894 }, { "epoch": 2.75, "learning_rate": 5.2877412483139425e-06, "loss": 1.4801, "step": 34895 }, { "epoch": 2.75, "learning_rate": 5.284488983952573e-06, "loss": 1.4056, "step": 34896 }, { "epoch": 2.75, "learning_rate": 5.281237702129687e-06, "loss": 1.4391, "step": 34897 }, { "epoch": 2.75, "learning_rate": 5.277987402867301e-06, "loss": 1.4854, "step": 34898 }, { "epoch": 2.75, "learning_rate": 5.274738086187547e-06, "loss": 1.4115, "step": 34899 }, { "epoch": 2.75, "learning_rate": 5.271489752112424e-06, "loss": 1.4364, "step": 34900 }, { "epoch": 2.75, "learning_rate": 5.268242400664047e-06, "loss": 1.4662, "step": 34901 }, { "epoch": 2.75, "learning_rate": 5.264996031864433e-06, "loss": 1.3979, "step": 34902 }, { "epoch": 2.75, "learning_rate": 5.261750645735596e-06, "loss": 1.4424, "step": 34903 }, { "epoch": 2.75, "learning_rate": 5.25850624229962e-06, "loss": 1.4104, "step": 34904 }, { "epoch": 2.75, "learning_rate": 5.255262821578521e-06, "loss": 1.4358, "step": 34905 }, { "epoch": 2.75, "learning_rate": 5.25202038359428e-06, "loss": 1.4187, "step": 34906 }, { "epoch": 2.75, "learning_rate": 5.24877892836898e-06, "loss": 1.4196, "step": 34907 }, { "epoch": 2.75, "learning_rate": 5.24553845592457e-06, "loss": 1.3993, "step": 34908 }, { "epoch": 2.75, "learning_rate": 5.242298966283065e-06, "loss": 1.4153, "step": 34909 }, { "epoch": 2.75, "learning_rate": 5.239060459466482e-06, "loss": 1.4481, "step": 34910 }, { "epoch": 2.75, "learning_rate": 5.235822935496786e-06, "loss": 1.4117, "step": 34911 }, { "epoch": 2.75, "learning_rate": 5.232586394395977e-06, "loss": 1.463, "step": 34912 }, { "epoch": 2.75, "learning_rate": 5.229350836185986e-06, "loss": 1.4742, "step": 34913 }, { "epoch": 2.75, "learning_rate": 5.22611626088883e-06, "loss": 1.4211, "step": 34914 }, { "epoch": 2.75, "learning_rate": 5.222882668526457e-06, "loss": 1.431, "step": 34915 }, { "epoch": 2.75, "learning_rate": 5.219650059120817e-06, "loss": 1.4606, "step": 34916 }, { "epoch": 2.75, "learning_rate": 5.216418432693842e-06, "loss": 1.4266, "step": 34917 }, { "epoch": 2.75, "learning_rate": 5.213187789267498e-06, "loss": 1.4623, "step": 34918 }, { "epoch": 2.75, "learning_rate": 5.209958128863717e-06, "loss": 1.3893, "step": 34919 }, { "epoch": 2.75, "learning_rate": 5.206729451504399e-06, "loss": 1.4387, "step": 34920 }, { "epoch": 2.75, "learning_rate": 5.203501757211492e-06, "loss": 1.4419, "step": 34921 }, { "epoch": 2.75, "learning_rate": 5.200275046006913e-06, "loss": 1.4679, "step": 34922 }, { "epoch": 2.75, "learning_rate": 5.197049317912544e-06, "loss": 1.4526, "step": 34923 }, { "epoch": 2.75, "learning_rate": 5.193824572950317e-06, "loss": 1.4531, "step": 34924 }, { "epoch": 2.75, "learning_rate": 5.190600811142099e-06, "loss": 1.4287, "step": 34925 }, { "epoch": 2.75, "learning_rate": 5.187378032509787e-06, "loss": 1.4201, "step": 34926 }, { "epoch": 2.75, "learning_rate": 5.1841562370752655e-06, "loss": 1.4664, "step": 34927 }, { "epoch": 2.75, "learning_rate": 5.1809354248604326e-06, "loss": 1.4379, "step": 34928 }, { "epoch": 2.75, "learning_rate": 5.177715595887089e-06, "loss": 1.4655, "step": 34929 }, { "epoch": 2.75, "learning_rate": 5.174496750177148e-06, "loss": 1.4871, "step": 34930 }, { "epoch": 2.75, "learning_rate": 5.171278887752461e-06, "loss": 1.4357, "step": 34931 }, { "epoch": 2.75, "learning_rate": 5.1680620086348766e-06, "loss": 1.3697, "step": 34932 }, { "epoch": 2.75, "learning_rate": 5.16484611284621e-06, "loss": 1.493, "step": 34933 }, { "epoch": 2.75, "learning_rate": 5.161631200408328e-06, "loss": 1.4477, "step": 34934 }, { "epoch": 2.75, "learning_rate": 5.15841727134303e-06, "loss": 1.4422, "step": 34935 }, { "epoch": 2.75, "learning_rate": 5.1552043256721635e-06, "loss": 1.4278, "step": 34936 }, { "epoch": 2.75, "learning_rate": 5.151992363417495e-06, "loss": 1.517, "step": 34937 }, { "epoch": 2.75, "learning_rate": 5.148781384600892e-06, "loss": 1.4254, "step": 34938 }, { "epoch": 2.75, "learning_rate": 5.145571389244135e-06, "loss": 1.459, "step": 34939 }, { "epoch": 2.75, "learning_rate": 5.142362377368992e-06, "loss": 1.4698, "step": 34940 }, { "epoch": 2.75, "learning_rate": 5.139154348997276e-06, "loss": 1.4389, "step": 34941 }, { "epoch": 2.75, "learning_rate": 5.135947304150756e-06, "loss": 1.4791, "step": 34942 }, { "epoch": 2.75, "learning_rate": 5.1327412428512125e-06, "loss": 1.4416, "step": 34943 }, { "epoch": 2.75, "learning_rate": 5.129536165120413e-06, "loss": 1.4153, "step": 34944 }, { "epoch": 2.75, "learning_rate": 5.126332070980104e-06, "loss": 1.4871, "step": 34945 }, { "epoch": 2.75, "learning_rate": 5.123128960452089e-06, "loss": 1.4345, "step": 34946 }, { "epoch": 2.75, "learning_rate": 5.1199268335580305e-06, "loss": 1.4412, "step": 34947 }, { "epoch": 2.75, "learning_rate": 5.116725690319762e-06, "loss": 1.4751, "step": 34948 }, { "epoch": 2.75, "learning_rate": 5.1135255307589495e-06, "loss": 1.3945, "step": 34949 }, { "epoch": 2.75, "learning_rate": 5.110326354897343e-06, "loss": 1.4443, "step": 34950 }, { "epoch": 2.75, "learning_rate": 5.107128162756674e-06, "loss": 1.4051, "step": 34951 }, { "epoch": 2.75, "learning_rate": 5.103930954358643e-06, "loss": 1.4833, "step": 34952 }, { "epoch": 2.75, "learning_rate": 5.100734729724965e-06, "loss": 1.388, "step": 34953 }, { "epoch": 2.75, "learning_rate": 5.097539488877323e-06, "loss": 1.4639, "step": 34954 }, { "epoch": 2.75, "learning_rate": 5.094345231837433e-06, "loss": 1.4264, "step": 34955 }, { "epoch": 2.75, "learning_rate": 5.091151958626976e-06, "loss": 1.4926, "step": 34956 }, { "epoch": 2.75, "learning_rate": 5.087959669267605e-06, "loss": 1.3806, "step": 34957 }, { "epoch": 2.75, "learning_rate": 5.08476836378105e-06, "loss": 1.4331, "step": 34958 }, { "epoch": 2.75, "learning_rate": 5.081578042188944e-06, "loss": 1.4647, "step": 34959 }, { "epoch": 2.75, "learning_rate": 5.078388704512937e-06, "loss": 1.3969, "step": 34960 }, { "epoch": 2.75, "learning_rate": 5.075200350774678e-06, "loss": 1.4883, "step": 34961 }, { "epoch": 2.75, "learning_rate": 5.072012980995865e-06, "loss": 1.4357, "step": 34962 }, { "epoch": 2.75, "learning_rate": 5.0688265951981e-06, "loss": 1.4924, "step": 34963 }, { "epoch": 2.75, "learning_rate": 5.065641193403014e-06, "loss": 1.4575, "step": 34964 }, { "epoch": 2.75, "learning_rate": 5.0624567756322566e-06, "loss": 1.458, "step": 34965 }, { "epoch": 2.75, "learning_rate": 5.059273341907427e-06, "loss": 1.4502, "step": 34966 }, { "epoch": 2.75, "learning_rate": 5.056090892250142e-06, "loss": 1.4397, "step": 34967 }, { "epoch": 2.75, "learning_rate": 5.052909426682017e-06, "loss": 1.3788, "step": 34968 }, { "epoch": 2.75, "learning_rate": 5.049728945224651e-06, "loss": 1.4377, "step": 34969 }, { "epoch": 2.75, "learning_rate": 5.046549447899645e-06, "loss": 1.4248, "step": 34970 }, { "epoch": 2.75, "learning_rate": 5.043370934728547e-06, "loss": 1.473, "step": 34971 }, { "epoch": 2.75, "learning_rate": 5.0401934057329894e-06, "loss": 1.4095, "step": 34972 }, { "epoch": 2.75, "learning_rate": 5.037016860934523e-06, "loss": 1.4463, "step": 34973 }, { "epoch": 2.75, "learning_rate": 5.033841300354713e-06, "loss": 1.4691, "step": 34974 }, { "epoch": 2.75, "learning_rate": 5.0306667240151254e-06, "loss": 1.4583, "step": 34975 }, { "epoch": 2.75, "learning_rate": 5.027493131937277e-06, "loss": 1.4089, "step": 34976 }, { "epoch": 2.75, "learning_rate": 5.024320524142783e-06, "loss": 1.402, "step": 34977 }, { "epoch": 2.75, "learning_rate": 5.021148900653127e-06, "loss": 1.4364, "step": 34978 }, { "epoch": 2.75, "learning_rate": 5.0179782614898915e-06, "loss": 1.3802, "step": 34979 }, { "epoch": 2.75, "learning_rate": 5.014808606674558e-06, "loss": 1.4355, "step": 34980 }, { "epoch": 2.75, "learning_rate": 5.011639936228662e-06, "loss": 1.4801, "step": 34981 }, { "epoch": 2.75, "learning_rate": 5.0084722501737336e-06, "loss": 1.4501, "step": 34982 }, { "epoch": 2.75, "learning_rate": 5.005305548531258e-06, "loss": 1.4759, "step": 34983 }, { "epoch": 2.75, "learning_rate": 5.002139831322732e-06, "loss": 1.4356, "step": 34984 }, { "epoch": 2.75, "learning_rate": 4.9989750985696745e-06, "loss": 1.4908, "step": 34985 }, { "epoch": 2.75, "learning_rate": 4.995811350293566e-06, "loss": 1.4146, "step": 34986 }, { "epoch": 2.75, "learning_rate": 4.992648586515858e-06, "loss": 1.4271, "step": 34987 }, { "epoch": 2.75, "learning_rate": 4.989486807258047e-06, "loss": 1.4495, "step": 34988 }, { "epoch": 2.75, "learning_rate": 4.986326012541619e-06, "loss": 1.4764, "step": 34989 }, { "epoch": 2.75, "learning_rate": 4.983166202387989e-06, "loss": 1.4544, "step": 34990 }, { "epoch": 2.75, "learning_rate": 4.98000737681864e-06, "loss": 1.4828, "step": 34991 }, { "epoch": 2.75, "learning_rate": 4.9768495358550045e-06, "loss": 1.484, "step": 34992 }, { "epoch": 2.75, "learning_rate": 4.973692679518531e-06, "loss": 1.4629, "step": 34993 }, { "epoch": 2.75, "learning_rate": 4.970536807830672e-06, "loss": 1.4906, "step": 34994 }, { "epoch": 2.75, "learning_rate": 4.9673819208128074e-06, "loss": 1.4332, "step": 34995 }, { "epoch": 2.75, "learning_rate": 4.964228018486405e-06, "loss": 1.4624, "step": 34996 }, { "epoch": 2.75, "learning_rate": 4.961075100872863e-06, "loss": 1.4591, "step": 34997 }, { "epoch": 2.75, "learning_rate": 4.95792316799355e-06, "loss": 1.4727, "step": 34998 }, { "epoch": 2.75, "learning_rate": 4.954772219869929e-06, "loss": 1.4573, "step": 34999 }, { "epoch": 2.75, "learning_rate": 4.9516222565233524e-06, "loss": 1.464, "step": 35000 }, { "epoch": 2.75, "learning_rate": 4.948473277975201e-06, "loss": 1.4448, "step": 35001 }, { "epoch": 2.75, "learning_rate": 4.945325284246893e-06, "loss": 1.4957, "step": 35002 }, { "epoch": 2.75, "learning_rate": 4.942178275359776e-06, "loss": 1.4507, "step": 35003 }, { "epoch": 2.75, "learning_rate": 4.939032251335201e-06, "loss": 1.4536, "step": 35004 }, { "epoch": 2.75, "learning_rate": 4.93588721219455e-06, "loss": 1.4368, "step": 35005 }, { "epoch": 2.75, "learning_rate": 4.93274315795919e-06, "loss": 1.4719, "step": 35006 }, { "epoch": 2.75, "learning_rate": 4.929600088650437e-06, "loss": 1.4995, "step": 35007 }, { "epoch": 2.75, "learning_rate": 4.926458004289624e-06, "loss": 1.4657, "step": 35008 }, { "epoch": 2.75, "learning_rate": 4.923316904898134e-06, "loss": 1.4102, "step": 35009 }, { "epoch": 2.75, "learning_rate": 4.920176790497249e-06, "loss": 1.4652, "step": 35010 }, { "epoch": 2.75, "learning_rate": 4.917037661108303e-06, "loss": 1.4345, "step": 35011 }, { "epoch": 2.75, "learning_rate": 4.913899516752612e-06, "loss": 1.4197, "step": 35012 }, { "epoch": 2.75, "learning_rate": 4.9107623574514755e-06, "loss": 1.4759, "step": 35013 }, { "epoch": 2.75, "learning_rate": 4.907626183226193e-06, "loss": 1.456, "step": 35014 }, { "epoch": 2.76, "learning_rate": 4.904490994098048e-06, "loss": 1.4515, "step": 35015 }, { "epoch": 2.76, "learning_rate": 4.901356790088373e-06, "loss": 1.4879, "step": 35016 }, { "epoch": 2.76, "learning_rate": 4.898223571218385e-06, "loss": 1.506, "step": 35017 }, { "epoch": 2.76, "learning_rate": 4.895091337509383e-06, "loss": 1.4294, "step": 35018 }, { "epoch": 2.76, "learning_rate": 4.891960088982666e-06, "loss": 1.4331, "step": 35019 }, { "epoch": 2.76, "learning_rate": 4.888829825659435e-06, "loss": 1.4016, "step": 35020 }, { "epoch": 2.76, "learning_rate": 4.885700547560972e-06, "loss": 1.4037, "step": 35021 }, { "epoch": 2.76, "learning_rate": 4.882572254708528e-06, "loss": 1.4014, "step": 35022 }, { "epoch": 2.76, "learning_rate": 4.879444947123351e-06, "loss": 1.4214, "step": 35023 }, { "epoch": 2.76, "learning_rate": 4.876318624826625e-06, "loss": 1.4799, "step": 35024 }, { "epoch": 2.76, "learning_rate": 4.873193287839616e-06, "loss": 1.4605, "step": 35025 }, { "epoch": 2.76, "learning_rate": 4.870068936183557e-06, "loss": 1.4593, "step": 35026 }, { "epoch": 2.76, "learning_rate": 4.866945569879632e-06, "loss": 1.4454, "step": 35027 }, { "epoch": 2.76, "learning_rate": 4.863823188949073e-06, "loss": 1.4454, "step": 35028 }, { "epoch": 2.76, "learning_rate": 4.86070179341303e-06, "loss": 1.4513, "step": 35029 }, { "epoch": 2.76, "learning_rate": 4.857581383292752e-06, "loss": 1.5065, "step": 35030 }, { "epoch": 2.76, "learning_rate": 4.85446195860939e-06, "loss": 1.4448, "step": 35031 }, { "epoch": 2.76, "learning_rate": 4.8513435193841265e-06, "loss": 1.4156, "step": 35032 }, { "epoch": 2.76, "learning_rate": 4.848226065638144e-06, "loss": 1.4363, "step": 35033 }, { "epoch": 2.76, "learning_rate": 4.8451095973926264e-06, "loss": 1.4308, "step": 35034 }, { "epoch": 2.76, "learning_rate": 4.841994114668673e-06, "loss": 1.4464, "step": 35035 }, { "epoch": 2.76, "learning_rate": 4.838879617487501e-06, "loss": 1.4103, "step": 35036 }, { "epoch": 2.76, "learning_rate": 4.835766105870242e-06, "loss": 1.4273, "step": 35037 }, { "epoch": 2.76, "learning_rate": 4.832653579837997e-06, "loss": 1.4555, "step": 35038 }, { "epoch": 2.76, "learning_rate": 4.829542039411915e-06, "loss": 1.4021, "step": 35039 }, { "epoch": 2.76, "learning_rate": 4.826431484613147e-06, "loss": 1.4491, "step": 35040 }, { "epoch": 2.76, "learning_rate": 4.823321915462808e-06, "loss": 1.4618, "step": 35041 }, { "epoch": 2.76, "learning_rate": 4.820213331981982e-06, "loss": 1.4623, "step": 35042 }, { "epoch": 2.76, "learning_rate": 4.8171057341918e-06, "loss": 1.3892, "step": 35043 }, { "epoch": 2.76, "learning_rate": 4.813999122113349e-06, "loss": 1.4924, "step": 35044 }, { "epoch": 2.76, "learning_rate": 4.810893495767709e-06, "loss": 1.4131, "step": 35045 }, { "epoch": 2.76, "learning_rate": 4.807788855176015e-06, "loss": 1.4506, "step": 35046 }, { "epoch": 2.76, "learning_rate": 4.804685200359281e-06, "loss": 1.4123, "step": 35047 }, { "epoch": 2.76, "learning_rate": 4.801582531338627e-06, "loss": 1.4399, "step": 35048 }, { "epoch": 2.76, "learning_rate": 4.798480848135083e-06, "loss": 1.3856, "step": 35049 }, { "epoch": 2.76, "learning_rate": 4.7953801507697345e-06, "loss": 1.4363, "step": 35050 }, { "epoch": 2.76, "learning_rate": 4.792280439263629e-06, "loss": 1.4439, "step": 35051 }, { "epoch": 2.76, "learning_rate": 4.789181713637802e-06, "loss": 1.462, "step": 35052 }, { "epoch": 2.76, "learning_rate": 4.786083973913301e-06, "loss": 1.3979, "step": 35053 }, { "epoch": 2.76, "learning_rate": 4.7829872201111455e-06, "loss": 1.4136, "step": 35054 }, { "epoch": 2.76, "learning_rate": 4.7798914522523655e-06, "loss": 1.3698, "step": 35055 }, { "epoch": 2.76, "learning_rate": 4.7767966703579796e-06, "loss": 1.4085, "step": 35056 }, { "epoch": 2.76, "learning_rate": 4.77370287444902e-06, "loss": 1.4949, "step": 35057 }, { "epoch": 2.76, "learning_rate": 4.770610064546488e-06, "loss": 1.4243, "step": 35058 }, { "epoch": 2.76, "learning_rate": 4.767518240671331e-06, "loss": 1.4586, "step": 35059 }, { "epoch": 2.76, "learning_rate": 4.764427402844617e-06, "loss": 1.3752, "step": 35060 }, { "epoch": 2.76, "learning_rate": 4.76133755108728e-06, "loss": 1.4561, "step": 35061 }, { "epoch": 2.76, "learning_rate": 4.758248685420285e-06, "loss": 1.4496, "step": 35062 }, { "epoch": 2.76, "learning_rate": 4.755160805864666e-06, "loss": 1.4359, "step": 35063 }, { "epoch": 2.76, "learning_rate": 4.75207391244134e-06, "loss": 1.4188, "step": 35064 }, { "epoch": 2.76, "learning_rate": 4.748988005171289e-06, "loss": 1.4639, "step": 35065 }, { "epoch": 2.76, "learning_rate": 4.745903084075431e-06, "loss": 1.4312, "step": 35066 }, { "epoch": 2.76, "learning_rate": 4.7428191491747484e-06, "loss": 1.4261, "step": 35067 }, { "epoch": 2.76, "learning_rate": 4.739736200490174e-06, "loss": 1.4644, "step": 35068 }, { "epoch": 2.76, "learning_rate": 4.7366542380426084e-06, "loss": 1.4927, "step": 35069 }, { "epoch": 2.76, "learning_rate": 4.733573261853002e-06, "loss": 1.4402, "step": 35070 }, { "epoch": 2.76, "learning_rate": 4.7304932719422705e-06, "loss": 1.3981, "step": 35071 }, { "epoch": 2.76, "learning_rate": 4.727414268331331e-06, "loss": 1.4064, "step": 35072 }, { "epoch": 2.76, "learning_rate": 4.72433625104105e-06, "loss": 1.4092, "step": 35073 }, { "epoch": 2.76, "learning_rate": 4.721259220092393e-06, "loss": 1.4602, "step": 35074 }, { "epoch": 2.76, "learning_rate": 4.718183175506213e-06, "loss": 1.4315, "step": 35075 }, { "epoch": 2.76, "learning_rate": 4.715108117303373e-06, "loss": 1.42, "step": 35076 }, { "epoch": 2.76, "learning_rate": 4.712034045504792e-06, "loss": 1.4471, "step": 35077 }, { "epoch": 2.76, "learning_rate": 4.70896096013132e-06, "loss": 1.4481, "step": 35078 }, { "epoch": 2.76, "learning_rate": 4.705888861203805e-06, "loss": 1.4099, "step": 35079 }, { "epoch": 2.76, "learning_rate": 4.702817748743148e-06, "loss": 1.4489, "step": 35080 }, { "epoch": 2.76, "learning_rate": 4.699747622770184e-06, "loss": 1.4969, "step": 35081 }, { "epoch": 2.76, "learning_rate": 4.696678483305744e-06, "loss": 1.4803, "step": 35082 }, { "epoch": 2.76, "learning_rate": 4.693610330370645e-06, "loss": 1.4614, "step": 35083 }, { "epoch": 2.76, "learning_rate": 4.690543163985771e-06, "loss": 1.476, "step": 35084 }, { "epoch": 2.76, "learning_rate": 4.687476984171923e-06, "loss": 1.4294, "step": 35085 }, { "epoch": 2.76, "learning_rate": 4.6844117909498824e-06, "loss": 1.4672, "step": 35086 }, { "epoch": 2.76, "learning_rate": 4.681347584340517e-06, "loss": 1.4778, "step": 35087 }, { "epoch": 2.76, "learning_rate": 4.678284364364626e-06, "loss": 1.4248, "step": 35088 }, { "epoch": 2.76, "learning_rate": 4.675222131042977e-06, "loss": 1.3874, "step": 35089 }, { "epoch": 2.76, "learning_rate": 4.672160884396353e-06, "loss": 1.4223, "step": 35090 }, { "epoch": 2.76, "learning_rate": 4.669100624445587e-06, "loss": 1.4324, "step": 35091 }, { "epoch": 2.76, "learning_rate": 4.666041351211414e-06, "loss": 1.4208, "step": 35092 }, { "epoch": 2.76, "learning_rate": 4.662983064714615e-06, "loss": 1.4666, "step": 35093 }, { "epoch": 2.76, "learning_rate": 4.659925764975958e-06, "loss": 1.416, "step": 35094 }, { "epoch": 2.76, "learning_rate": 4.65686945201621e-06, "loss": 1.4267, "step": 35095 }, { "epoch": 2.76, "learning_rate": 4.6538141258561035e-06, "loss": 1.4632, "step": 35096 }, { "epoch": 2.76, "learning_rate": 4.6507597865163894e-06, "loss": 1.5155, "step": 35097 }, { "epoch": 2.76, "learning_rate": 4.647706434017817e-06, "loss": 1.4903, "step": 35098 }, { "epoch": 2.76, "learning_rate": 4.644654068381087e-06, "loss": 1.4696, "step": 35099 }, { "epoch": 2.76, "learning_rate": 4.641602689626967e-06, "loss": 1.4391, "step": 35100 }, { "epoch": 2.76, "learning_rate": 4.638552297776138e-06, "loss": 1.4072, "step": 35101 }, { "epoch": 2.76, "learning_rate": 4.635502892849302e-06, "loss": 1.4402, "step": 35102 }, { "epoch": 2.76, "learning_rate": 4.632454474867192e-06, "loss": 1.4596, "step": 35103 }, { "epoch": 2.76, "learning_rate": 4.629407043850508e-06, "loss": 1.4686, "step": 35104 }, { "epoch": 2.76, "learning_rate": 4.626360599819934e-06, "loss": 1.49, "step": 35105 }, { "epoch": 2.76, "learning_rate": 4.623315142796136e-06, "loss": 1.4739, "step": 35106 }, { "epoch": 2.76, "learning_rate": 4.620270672799797e-06, "loss": 1.4302, "step": 35107 }, { "epoch": 2.76, "learning_rate": 4.6172271898516026e-06, "loss": 1.4283, "step": 35108 }, { "epoch": 2.76, "learning_rate": 4.614184693972201e-06, "loss": 1.4658, "step": 35109 }, { "epoch": 2.76, "learning_rate": 4.611143185182259e-06, "loss": 1.4765, "step": 35110 }, { "epoch": 2.76, "learning_rate": 4.608102663502428e-06, "loss": 1.4416, "step": 35111 }, { "epoch": 2.76, "learning_rate": 4.60506312895334e-06, "loss": 1.4199, "step": 35112 }, { "epoch": 2.76, "learning_rate": 4.60202458155563e-06, "loss": 1.4327, "step": 35113 }, { "epoch": 2.76, "learning_rate": 4.598987021329947e-06, "loss": 1.4719, "step": 35114 }, { "epoch": 2.76, "learning_rate": 4.595950448296892e-06, "loss": 1.4706, "step": 35115 }, { "epoch": 2.76, "learning_rate": 4.5929148624770985e-06, "loss": 1.4523, "step": 35116 }, { "epoch": 2.76, "learning_rate": 4.589880263891166e-06, "loss": 1.4241, "step": 35117 }, { "epoch": 2.76, "learning_rate": 4.586846652559711e-06, "loss": 1.4578, "step": 35118 }, { "epoch": 2.76, "learning_rate": 4.5838140285033185e-06, "loss": 1.4388, "step": 35119 }, { "epoch": 2.76, "learning_rate": 4.580782391742571e-06, "loss": 1.4147, "step": 35120 }, { "epoch": 2.76, "learning_rate": 4.577751742298086e-06, "loss": 1.4014, "step": 35121 }, { "epoch": 2.76, "learning_rate": 4.574722080190396e-06, "loss": 1.4347, "step": 35122 }, { "epoch": 2.76, "learning_rate": 4.5716934054401025e-06, "loss": 1.4247, "step": 35123 }, { "epoch": 2.76, "learning_rate": 4.5686657180677545e-06, "loss": 1.451, "step": 35124 }, { "epoch": 2.76, "learning_rate": 4.565639018093903e-06, "loss": 1.3938, "step": 35125 }, { "epoch": 2.76, "learning_rate": 4.562613305539115e-06, "loss": 1.4639, "step": 35126 }, { "epoch": 2.76, "learning_rate": 4.559588580423923e-06, "loss": 1.4901, "step": 35127 }, { "epoch": 2.76, "learning_rate": 4.556564842768862e-06, "loss": 1.4157, "step": 35128 }, { "epoch": 2.76, "learning_rate": 4.553542092594464e-06, "loss": 1.4231, "step": 35129 }, { "epoch": 2.76, "learning_rate": 4.550520329921231e-06, "loss": 1.4005, "step": 35130 }, { "epoch": 2.76, "learning_rate": 4.547499554769729e-06, "loss": 1.4106, "step": 35131 }, { "epoch": 2.76, "learning_rate": 4.544479767160425e-06, "loss": 1.4889, "step": 35132 }, { "epoch": 2.76, "learning_rate": 4.541460967113836e-06, "loss": 1.4651, "step": 35133 }, { "epoch": 2.76, "learning_rate": 4.538443154650445e-06, "loss": 1.4403, "step": 35134 }, { "epoch": 2.76, "learning_rate": 4.53542632979077e-06, "loss": 1.4588, "step": 35135 }, { "epoch": 2.76, "learning_rate": 4.532410492555277e-06, "loss": 1.4161, "step": 35136 }, { "epoch": 2.76, "learning_rate": 4.529395642964418e-06, "loss": 1.4273, "step": 35137 }, { "epoch": 2.76, "learning_rate": 4.526381781038707e-06, "loss": 1.4638, "step": 35138 }, { "epoch": 2.76, "learning_rate": 4.52336890679858e-06, "loss": 1.4432, "step": 35139 }, { "epoch": 2.76, "learning_rate": 4.520357020264486e-06, "loss": 1.4147, "step": 35140 }, { "epoch": 2.76, "learning_rate": 4.517346121456894e-06, "loss": 1.4028, "step": 35141 }, { "epoch": 2.77, "learning_rate": 4.514336210396252e-06, "loss": 1.4689, "step": 35142 }, { "epoch": 2.77, "learning_rate": 4.511327287102978e-06, "loss": 1.4253, "step": 35143 }, { "epoch": 2.77, "learning_rate": 4.5083193515974895e-06, "loss": 1.4373, "step": 35144 }, { "epoch": 2.77, "learning_rate": 4.505312403900235e-06, "loss": 1.447, "step": 35145 }, { "epoch": 2.77, "learning_rate": 4.502306444031617e-06, "loss": 1.4317, "step": 35146 }, { "epoch": 2.77, "learning_rate": 4.499301472012018e-06, "loss": 1.3922, "step": 35147 }, { "epoch": 2.77, "learning_rate": 4.4962974878619055e-06, "loss": 1.4731, "step": 35148 }, { "epoch": 2.77, "learning_rate": 4.493294491601612e-06, "loss": 1.4594, "step": 35149 }, { "epoch": 2.77, "learning_rate": 4.490292483251573e-06, "loss": 1.3961, "step": 35150 }, { "epoch": 2.77, "learning_rate": 4.487291462832121e-06, "loss": 1.437, "step": 35151 }, { "epoch": 2.77, "learning_rate": 4.48429143036369e-06, "loss": 1.4451, "step": 35152 }, { "epoch": 2.77, "learning_rate": 4.481292385866614e-06, "loss": 1.4503, "step": 35153 }, { "epoch": 2.77, "learning_rate": 4.478294329361243e-06, "loss": 1.4412, "step": 35154 }, { "epoch": 2.77, "learning_rate": 4.4752972608679606e-06, "loss": 1.4706, "step": 35155 }, { "epoch": 2.77, "learning_rate": 4.472301180407101e-06, "loss": 1.4395, "step": 35156 }, { "epoch": 2.77, "learning_rate": 4.469306087998997e-06, "loss": 1.4771, "step": 35157 }, { "epoch": 2.77, "learning_rate": 4.466311983664001e-06, "loss": 1.4231, "step": 35158 }, { "epoch": 2.77, "learning_rate": 4.463318867422444e-06, "loss": 1.5165, "step": 35159 }, { "epoch": 2.77, "learning_rate": 4.4603267392946455e-06, "loss": 1.4307, "step": 35160 }, { "epoch": 2.77, "learning_rate": 4.457335599300871e-06, "loss": 1.4555, "step": 35161 }, { "epoch": 2.77, "learning_rate": 4.454345447461505e-06, "loss": 1.4331, "step": 35162 }, { "epoch": 2.77, "learning_rate": 4.451356283796814e-06, "loss": 1.4756, "step": 35163 }, { "epoch": 2.77, "learning_rate": 4.448368108327083e-06, "loss": 1.4215, "step": 35164 }, { "epoch": 2.77, "learning_rate": 4.4453809210725945e-06, "loss": 1.4393, "step": 35165 }, { "epoch": 2.77, "learning_rate": 4.442394722053666e-06, "loss": 1.4305, "step": 35166 }, { "epoch": 2.77, "learning_rate": 4.439409511290565e-06, "loss": 1.4451, "step": 35167 }, { "epoch": 2.77, "learning_rate": 4.436425288803525e-06, "loss": 1.4537, "step": 35168 }, { "epoch": 2.77, "learning_rate": 4.433442054612829e-06, "loss": 1.3891, "step": 35169 }, { "epoch": 2.77, "learning_rate": 4.430459808738746e-06, "loss": 1.4806, "step": 35170 }, { "epoch": 2.77, "learning_rate": 4.427478551201491e-06, "loss": 1.4261, "step": 35171 }, { "epoch": 2.77, "learning_rate": 4.4244982820213495e-06, "loss": 1.4613, "step": 35172 }, { "epoch": 2.77, "learning_rate": 4.421519001218521e-06, "loss": 1.4794, "step": 35173 }, { "epoch": 2.77, "learning_rate": 4.418540708813223e-06, "loss": 1.4131, "step": 35174 }, { "epoch": 2.77, "learning_rate": 4.415563404825706e-06, "loss": 1.3854, "step": 35175 }, { "epoch": 2.77, "learning_rate": 4.412587089276171e-06, "loss": 1.4473, "step": 35176 }, { "epoch": 2.77, "learning_rate": 4.409611762184834e-06, "loss": 1.4137, "step": 35177 }, { "epoch": 2.77, "learning_rate": 4.40663742357188e-06, "loss": 1.469, "step": 35178 }, { "epoch": 2.77, "learning_rate": 4.403664073457524e-06, "loss": 1.4058, "step": 35179 }, { "epoch": 2.77, "learning_rate": 4.400691711861954e-06, "loss": 1.4721, "step": 35180 }, { "epoch": 2.77, "learning_rate": 4.3977203388053e-06, "loss": 1.4746, "step": 35181 }, { "epoch": 2.77, "learning_rate": 4.394749954307797e-06, "loss": 1.4668, "step": 35182 }, { "epoch": 2.77, "learning_rate": 4.391780558389596e-06, "loss": 1.4026, "step": 35183 }, { "epoch": 2.77, "learning_rate": 4.3888121510708475e-06, "loss": 1.5041, "step": 35184 }, { "epoch": 2.77, "learning_rate": 4.385844732371685e-06, "loss": 1.4289, "step": 35185 }, { "epoch": 2.77, "learning_rate": 4.382878302312309e-06, "loss": 1.4476, "step": 35186 }, { "epoch": 2.77, "learning_rate": 4.379912860912838e-06, "loss": 1.4494, "step": 35187 }, { "epoch": 2.77, "learning_rate": 4.376948408193371e-06, "loss": 1.4311, "step": 35188 }, { "epoch": 2.77, "learning_rate": 4.373984944174091e-06, "loss": 1.4693, "step": 35189 }, { "epoch": 2.77, "learning_rate": 4.371022468875085e-06, "loss": 1.3864, "step": 35190 }, { "epoch": 2.77, "learning_rate": 4.368060982316451e-06, "loss": 1.4643, "step": 35191 }, { "epoch": 2.77, "learning_rate": 4.3651004845183244e-06, "loss": 1.4575, "step": 35192 }, { "epoch": 2.77, "learning_rate": 4.362140975500822e-06, "loss": 1.3845, "step": 35193 }, { "epoch": 2.77, "learning_rate": 4.359182455283994e-06, "loss": 1.4897, "step": 35194 }, { "epoch": 2.77, "learning_rate": 4.356224923887941e-06, "loss": 1.4027, "step": 35195 }, { "epoch": 2.77, "learning_rate": 4.3532683813327305e-06, "loss": 1.506, "step": 35196 }, { "epoch": 2.77, "learning_rate": 4.3503128276384804e-06, "loss": 1.4674, "step": 35197 }, { "epoch": 2.77, "learning_rate": 4.347358262825223e-06, "loss": 1.4486, "step": 35198 }, { "epoch": 2.77, "learning_rate": 4.3444046869130275e-06, "loss": 1.4728, "step": 35199 }, { "epoch": 2.77, "learning_rate": 4.3414520999219435e-06, "loss": 1.4037, "step": 35200 }, { "epoch": 2.77, "learning_rate": 4.338500501872022e-06, "loss": 1.3636, "step": 35201 }, { "epoch": 2.77, "learning_rate": 4.335549892783297e-06, "loss": 1.4461, "step": 35202 }, { "epoch": 2.77, "learning_rate": 4.332600272675801e-06, "loss": 1.4669, "step": 35203 }, { "epoch": 2.77, "learning_rate": 4.32965164156957e-06, "loss": 1.4734, "step": 35204 }, { "epoch": 2.77, "learning_rate": 4.326703999484604e-06, "loss": 1.4295, "step": 35205 }, { "epoch": 2.77, "learning_rate": 4.3237573464409536e-06, "loss": 1.4229, "step": 35206 }, { "epoch": 2.77, "learning_rate": 4.320811682458586e-06, "loss": 1.4859, "step": 35207 }, { "epoch": 2.77, "learning_rate": 4.317867007557502e-06, "loss": 1.4641, "step": 35208 }, { "epoch": 2.77, "learning_rate": 4.314923321757719e-06, "loss": 1.4502, "step": 35209 }, { "epoch": 2.77, "learning_rate": 4.31198062507922e-06, "loss": 1.4262, "step": 35210 }, { "epoch": 2.77, "learning_rate": 4.30903891754194e-06, "loss": 1.4308, "step": 35211 }, { "epoch": 2.77, "learning_rate": 4.3060981991659135e-06, "loss": 1.4327, "step": 35212 }, { "epoch": 2.77, "learning_rate": 4.303158469971074e-06, "loss": 1.4354, "step": 35213 }, { "epoch": 2.77, "learning_rate": 4.3002197299774055e-06, "loss": 1.4522, "step": 35214 }, { "epoch": 2.77, "learning_rate": 4.297281979204809e-06, "loss": 1.4596, "step": 35215 }, { "epoch": 2.77, "learning_rate": 4.294345217673284e-06, "loss": 1.4272, "step": 35216 }, { "epoch": 2.77, "learning_rate": 4.291409445402749e-06, "loss": 1.4739, "step": 35217 }, { "epoch": 2.77, "learning_rate": 4.288474662413138e-06, "loss": 1.4205, "step": 35218 }, { "epoch": 2.77, "learning_rate": 4.285540868724352e-06, "loss": 1.4266, "step": 35219 }, { "epoch": 2.77, "learning_rate": 4.282608064356341e-06, "loss": 1.514, "step": 35220 }, { "epoch": 2.77, "learning_rate": 4.279676249329023e-06, "loss": 1.4319, "step": 35221 }, { "epoch": 2.77, "learning_rate": 4.276745423662265e-06, "loss": 1.4459, "step": 35222 }, { "epoch": 2.77, "learning_rate": 4.273815587376001e-06, "loss": 1.4331, "step": 35223 }, { "epoch": 2.77, "learning_rate": 4.270886740490115e-06, "loss": 1.4522, "step": 35224 }, { "epoch": 2.77, "learning_rate": 4.267958883024475e-06, "loss": 1.4326, "step": 35225 }, { "epoch": 2.77, "learning_rate": 4.265032014998998e-06, "loss": 1.4736, "step": 35226 }, { "epoch": 2.77, "learning_rate": 4.262106136433519e-06, "loss": 1.4757, "step": 35227 }, { "epoch": 2.77, "learning_rate": 4.259181247347887e-06, "loss": 1.4309, "step": 35228 }, { "epoch": 2.77, "learning_rate": 4.256257347762004e-06, "loss": 1.4826, "step": 35229 }, { "epoch": 2.77, "learning_rate": 4.253334437695721e-06, "loss": 1.4155, "step": 35230 }, { "epoch": 2.77, "learning_rate": 4.2504125171688556e-06, "loss": 1.4297, "step": 35231 }, { "epoch": 2.77, "learning_rate": 4.247491586201257e-06, "loss": 1.4243, "step": 35232 }, { "epoch": 2.77, "learning_rate": 4.244571644812761e-06, "loss": 1.4873, "step": 35233 }, { "epoch": 2.77, "learning_rate": 4.241652693023201e-06, "loss": 1.4362, "step": 35234 }, { "epoch": 2.77, "learning_rate": 4.238734730852361e-06, "loss": 1.4569, "step": 35235 }, { "epoch": 2.77, "learning_rate": 4.2358177583200755e-06, "loss": 1.4099, "step": 35236 }, { "epoch": 2.77, "learning_rate": 4.232901775446163e-06, "loss": 1.4314, "step": 35237 }, { "epoch": 2.77, "learning_rate": 4.229986782250405e-06, "loss": 1.5123, "step": 35238 }, { "epoch": 2.77, "learning_rate": 4.227072778752588e-06, "loss": 1.4638, "step": 35239 }, { "epoch": 2.77, "learning_rate": 4.224159764972513e-06, "loss": 1.4933, "step": 35240 }, { "epoch": 2.77, "learning_rate": 4.221247740929945e-06, "loss": 1.411, "step": 35241 }, { "epoch": 2.77, "learning_rate": 4.218336706644637e-06, "loss": 1.4525, "step": 35242 }, { "epoch": 2.77, "learning_rate": 4.21542666213639e-06, "loss": 1.4294, "step": 35243 }, { "epoch": 2.77, "learning_rate": 4.212517607424937e-06, "loss": 1.4184, "step": 35244 }, { "epoch": 2.77, "learning_rate": 4.209609542530046e-06, "loss": 1.4468, "step": 35245 }, { "epoch": 2.77, "learning_rate": 4.2067024674714344e-06, "loss": 1.4709, "step": 35246 }, { "epoch": 2.77, "learning_rate": 4.203796382268887e-06, "loss": 1.4268, "step": 35247 }, { "epoch": 2.77, "learning_rate": 4.200891286942088e-06, "loss": 1.4533, "step": 35248 }, { "epoch": 2.77, "learning_rate": 4.1979871815107705e-06, "loss": 1.4634, "step": 35249 }, { "epoch": 2.77, "learning_rate": 4.195084065994686e-06, "loss": 1.4288, "step": 35250 }, { "epoch": 2.77, "learning_rate": 4.192181940413502e-06, "loss": 1.4233, "step": 35251 }, { "epoch": 2.77, "learning_rate": 4.189280804786938e-06, "loss": 1.4698, "step": 35252 }, { "epoch": 2.77, "learning_rate": 4.1863806591346915e-06, "loss": 1.4468, "step": 35253 }, { "epoch": 2.77, "learning_rate": 4.1834815034764655e-06, "loss": 1.4568, "step": 35254 }, { "epoch": 2.77, "learning_rate": 4.180583337831927e-06, "loss": 1.4442, "step": 35255 }, { "epoch": 2.77, "learning_rate": 4.177686162220745e-06, "loss": 1.4096, "step": 35256 }, { "epoch": 2.77, "learning_rate": 4.174789976662618e-06, "loss": 1.4515, "step": 35257 }, { "epoch": 2.77, "learning_rate": 4.171894781177199e-06, "loss": 1.4657, "step": 35258 }, { "epoch": 2.77, "learning_rate": 4.169000575784121e-06, "loss": 1.382, "step": 35259 }, { "epoch": 2.77, "learning_rate": 4.166107360503051e-06, "loss": 1.4543, "step": 35260 }, { "epoch": 2.77, "learning_rate": 4.163215135353643e-06, "loss": 1.4276, "step": 35261 }, { "epoch": 2.77, "learning_rate": 4.160323900355544e-06, "loss": 1.466, "step": 35262 }, { "epoch": 2.77, "learning_rate": 4.157433655528325e-06, "loss": 1.4403, "step": 35263 }, { "epoch": 2.77, "learning_rate": 4.154544400891685e-06, "loss": 1.4689, "step": 35264 }, { "epoch": 2.77, "learning_rate": 4.151656136465193e-06, "loss": 1.461, "step": 35265 }, { "epoch": 2.77, "learning_rate": 4.1487688622684645e-06, "loss": 1.4356, "step": 35266 }, { "epoch": 2.77, "learning_rate": 4.145882578321102e-06, "loss": 1.4375, "step": 35267 }, { "epoch": 2.77, "learning_rate": 4.142997284642724e-06, "loss": 1.4275, "step": 35268 }, { "epoch": 2.78, "learning_rate": 4.140112981252897e-06, "loss": 1.4017, "step": 35269 }, { "epoch": 2.78, "learning_rate": 4.1372296681712044e-06, "loss": 1.4839, "step": 35270 }, { "epoch": 2.78, "learning_rate": 4.134347345417249e-06, "loss": 1.444, "step": 35271 }, { "epoch": 2.78, "learning_rate": 4.131466013010565e-06, "loss": 1.5185, "step": 35272 }, { "epoch": 2.78, "learning_rate": 4.128585670970719e-06, "loss": 1.4192, "step": 35273 }, { "epoch": 2.78, "learning_rate": 4.125706319317296e-06, "loss": 1.4414, "step": 35274 }, { "epoch": 2.78, "learning_rate": 4.122827958069813e-06, "loss": 1.4458, "step": 35275 }, { "epoch": 2.78, "learning_rate": 4.119950587247839e-06, "loss": 1.4336, "step": 35276 }, { "epoch": 2.78, "learning_rate": 4.117074206870874e-06, "loss": 1.4559, "step": 35277 }, { "epoch": 2.78, "learning_rate": 4.114198816958503e-06, "loss": 1.4833, "step": 35278 }, { "epoch": 2.78, "learning_rate": 4.1113244175302095e-06, "loss": 1.4507, "step": 35279 }, { "epoch": 2.78, "learning_rate": 4.1084510086054954e-06, "loss": 1.3741, "step": 35280 }, { "epoch": 2.78, "learning_rate": 4.105578590203895e-06, "loss": 1.4592, "step": 35281 }, { "epoch": 2.78, "learning_rate": 4.102707162344926e-06, "loss": 1.4258, "step": 35282 }, { "epoch": 2.78, "learning_rate": 4.099836725048039e-06, "loss": 1.4286, "step": 35283 }, { "epoch": 2.78, "learning_rate": 4.096967278332753e-06, "loss": 1.4437, "step": 35284 }, { "epoch": 2.78, "learning_rate": 4.09409882221855e-06, "loss": 1.4644, "step": 35285 }, { "epoch": 2.78, "learning_rate": 4.091231356724884e-06, "loss": 1.4196, "step": 35286 }, { "epoch": 2.78, "learning_rate": 4.0883648818712535e-06, "loss": 1.4674, "step": 35287 }, { "epoch": 2.78, "learning_rate": 4.085499397677095e-06, "loss": 1.4844, "step": 35288 }, { "epoch": 2.78, "learning_rate": 4.082634904161891e-06, "loss": 1.4409, "step": 35289 }, { "epoch": 2.78, "learning_rate": 4.079771401345044e-06, "loss": 1.4794, "step": 35290 }, { "epoch": 2.78, "learning_rate": 4.076908889246022e-06, "loss": 1.431, "step": 35291 }, { "epoch": 2.78, "learning_rate": 4.074047367884292e-06, "loss": 1.488, "step": 35292 }, { "epoch": 2.78, "learning_rate": 4.0711868372792385e-06, "loss": 1.4693, "step": 35293 }, { "epoch": 2.78, "learning_rate": 4.06832729745028e-06, "loss": 1.4093, "step": 35294 }, { "epoch": 2.78, "learning_rate": 4.065468748416867e-06, "loss": 1.4553, "step": 35295 }, { "epoch": 2.78, "learning_rate": 4.062611190198384e-06, "loss": 1.4587, "step": 35296 }, { "epoch": 2.78, "learning_rate": 4.059754622814232e-06, "loss": 1.3302, "step": 35297 }, { "epoch": 2.78, "learning_rate": 4.056899046283812e-06, "loss": 1.4627, "step": 35298 }, { "epoch": 2.78, "learning_rate": 4.05404446062651e-06, "loss": 1.4454, "step": 35299 }, { "epoch": 2.78, "learning_rate": 4.051190865861709e-06, "loss": 1.4605, "step": 35300 }, { "epoch": 2.78, "learning_rate": 4.048338262008777e-06, "loss": 1.4146, "step": 35301 }, { "epoch": 2.78, "learning_rate": 4.0454866490870985e-06, "loss": 1.422, "step": 35302 }, { "epoch": 2.78, "learning_rate": 4.042636027115992e-06, "loss": 1.4842, "step": 35303 }, { "epoch": 2.78, "learning_rate": 4.039786396114858e-06, "loss": 1.4749, "step": 35304 }, { "epoch": 2.78, "learning_rate": 4.036937756103031e-06, "loss": 1.4306, "step": 35305 }, { "epoch": 2.78, "learning_rate": 4.034090107099846e-06, "loss": 1.4484, "step": 35306 }, { "epoch": 2.78, "learning_rate": 4.031243449124621e-06, "loss": 1.4923, "step": 35307 }, { "epoch": 2.78, "learning_rate": 4.028397782196724e-06, "loss": 1.4409, "step": 35308 }, { "epoch": 2.78, "learning_rate": 4.025553106335439e-06, "loss": 1.3835, "step": 35309 }, { "epoch": 2.78, "learning_rate": 4.0227094215600995e-06, "loss": 1.4481, "step": 35310 }, { "epoch": 2.78, "learning_rate": 4.019866727890008e-06, "loss": 1.4478, "step": 35311 }, { "epoch": 2.78, "learning_rate": 4.0170250253444666e-06, "loss": 1.4629, "step": 35312 }, { "epoch": 2.78, "learning_rate": 4.0141843139427585e-06, "loss": 1.4391, "step": 35313 }, { "epoch": 2.78, "learning_rate": 4.0113445937041685e-06, "loss": 1.4384, "step": 35314 }, { "epoch": 2.78, "learning_rate": 4.008505864647999e-06, "loss": 1.4805, "step": 35315 }, { "epoch": 2.78, "learning_rate": 4.005668126793515e-06, "loss": 1.452, "step": 35316 }, { "epoch": 2.78, "learning_rate": 4.0028313801599545e-06, "loss": 1.4622, "step": 35317 }, { "epoch": 2.78, "learning_rate": 3.9999956247666165e-06, "loss": 1.4371, "step": 35318 }, { "epoch": 2.78, "learning_rate": 3.9971608606327365e-06, "loss": 1.3884, "step": 35319 }, { "epoch": 2.78, "learning_rate": 3.994327087777566e-06, "loss": 1.4693, "step": 35320 }, { "epoch": 2.78, "learning_rate": 3.991494306220339e-06, "loss": 1.4531, "step": 35321 }, { "epoch": 2.78, "learning_rate": 3.988662515980273e-06, "loss": 1.3954, "step": 35322 }, { "epoch": 2.78, "learning_rate": 3.985831717076638e-06, "loss": 1.3814, "step": 35323 }, { "epoch": 2.78, "learning_rate": 3.983001909528616e-06, "loss": 1.4154, "step": 35324 }, { "epoch": 2.78, "learning_rate": 3.980173093355443e-06, "loss": 1.4453, "step": 35325 }, { "epoch": 2.78, "learning_rate": 3.977345268576321e-06, "loss": 1.4274, "step": 35326 }, { "epoch": 2.78, "learning_rate": 3.974518435210416e-06, "loss": 1.4703, "step": 35327 }, { "epoch": 2.78, "learning_rate": 3.971692593276965e-06, "loss": 1.4521, "step": 35328 }, { "epoch": 2.78, "learning_rate": 3.968867742795151e-06, "loss": 1.4033, "step": 35329 }, { "epoch": 2.78, "learning_rate": 3.966043883784125e-06, "loss": 1.4444, "step": 35330 }, { "epoch": 2.78, "learning_rate": 3.9632210162630575e-06, "loss": 1.5305, "step": 35331 }, { "epoch": 2.78, "learning_rate": 3.960399140251147e-06, "loss": 1.436, "step": 35332 }, { "epoch": 2.78, "learning_rate": 3.957578255767529e-06, "loss": 1.4533, "step": 35333 }, { "epoch": 2.78, "learning_rate": 3.954758362831356e-06, "loss": 1.4468, "step": 35334 }, { "epoch": 2.78, "learning_rate": 3.951939461461778e-06, "loss": 1.4637, "step": 35335 }, { "epoch": 2.78, "learning_rate": 3.949121551677964e-06, "loss": 1.4667, "step": 35336 }, { "epoch": 2.78, "learning_rate": 3.946304633498981e-06, "loss": 1.3603, "step": 35337 }, { "epoch": 2.78, "learning_rate": 3.943488706943998e-06, "loss": 1.4235, "step": 35338 }, { "epoch": 2.78, "learning_rate": 3.940673772032133e-06, "loss": 1.458, "step": 35339 }, { "epoch": 2.78, "learning_rate": 3.937859828782486e-06, "loss": 1.4726, "step": 35340 }, { "epoch": 2.78, "learning_rate": 3.935046877214177e-06, "loss": 1.4611, "step": 35341 }, { "epoch": 2.78, "learning_rate": 3.932234917346289e-06, "loss": 1.4795, "step": 35342 }, { "epoch": 2.78, "learning_rate": 3.929423949197924e-06, "loss": 1.4456, "step": 35343 }, { "epoch": 2.78, "learning_rate": 3.926613972788151e-06, "loss": 1.4485, "step": 35344 }, { "epoch": 2.78, "learning_rate": 3.92380498813607e-06, "loss": 1.4668, "step": 35345 }, { "epoch": 2.78, "learning_rate": 3.920996995260733e-06, "loss": 1.4359, "step": 35346 }, { "epoch": 2.78, "learning_rate": 3.918189994181225e-06, "loss": 1.4831, "step": 35347 }, { "epoch": 2.78, "learning_rate": 3.915383984916581e-06, "loss": 1.4411, "step": 35348 }, { "epoch": 2.78, "learning_rate": 3.912578967485868e-06, "loss": 1.4106, "step": 35349 }, { "epoch": 2.78, "learning_rate": 3.9097749419081225e-06, "loss": 1.4501, "step": 35350 }, { "epoch": 2.78, "learning_rate": 3.9069719082023775e-06, "loss": 1.4337, "step": 35351 }, { "epoch": 2.78, "learning_rate": 3.904169866387702e-06, "loss": 1.3529, "step": 35352 }, { "epoch": 2.78, "learning_rate": 3.901368816483081e-06, "loss": 1.4215, "step": 35353 }, { "epoch": 2.78, "learning_rate": 3.898568758507514e-06, "loss": 1.4204, "step": 35354 }, { "epoch": 2.78, "learning_rate": 3.895769692480055e-06, "loss": 1.4569, "step": 35355 }, { "epoch": 2.78, "learning_rate": 3.892971618419705e-06, "loss": 1.4193, "step": 35356 }, { "epoch": 2.78, "learning_rate": 3.890174536345431e-06, "loss": 1.4501, "step": 35357 }, { "epoch": 2.78, "learning_rate": 3.8873784462762515e-06, "loss": 1.4317, "step": 35358 }, { "epoch": 2.78, "learning_rate": 3.884583348231135e-06, "loss": 1.4536, "step": 35359 }, { "epoch": 2.78, "learning_rate": 3.881789242229083e-06, "loss": 1.398, "step": 35360 }, { "epoch": 2.78, "learning_rate": 3.8789961282890305e-06, "loss": 1.4447, "step": 35361 }, { "epoch": 2.78, "learning_rate": 3.876204006429961e-06, "loss": 1.4218, "step": 35362 }, { "epoch": 2.78, "learning_rate": 3.873412876670829e-06, "loss": 1.4988, "step": 35363 }, { "epoch": 2.78, "learning_rate": 3.870622739030582e-06, "loss": 1.3944, "step": 35364 }, { "epoch": 2.78, "learning_rate": 3.867833593528175e-06, "loss": 1.4752, "step": 35365 }, { "epoch": 2.78, "learning_rate": 3.865045440182541e-06, "loss": 1.4212, "step": 35366 }, { "epoch": 2.78, "learning_rate": 3.862258279012598e-06, "loss": 1.4688, "step": 35367 }, { "epoch": 2.78, "learning_rate": 3.859472110037248e-06, "loss": 1.4593, "step": 35368 }, { "epoch": 2.78, "learning_rate": 3.85668693327546e-06, "loss": 1.4367, "step": 35369 }, { "epoch": 2.78, "learning_rate": 3.853902748746118e-06, "loss": 1.4922, "step": 35370 }, { "epoch": 2.78, "learning_rate": 3.851119556468124e-06, "loss": 1.4057, "step": 35371 }, { "epoch": 2.78, "learning_rate": 3.848337356460379e-06, "loss": 1.447, "step": 35372 }, { "epoch": 2.78, "learning_rate": 3.845556148741769e-06, "loss": 1.4835, "step": 35373 }, { "epoch": 2.78, "learning_rate": 3.842775933331177e-06, "loss": 1.4592, "step": 35374 }, { "epoch": 2.78, "learning_rate": 3.839996710247472e-06, "loss": 1.3919, "step": 35375 }, { "epoch": 2.78, "learning_rate": 3.837218479509557e-06, "loss": 1.4306, "step": 35376 }, { "epoch": 2.78, "learning_rate": 3.834441241136249e-06, "loss": 1.427, "step": 35377 }, { "epoch": 2.78, "learning_rate": 3.831664995146416e-06, "loss": 1.4808, "step": 35378 }, { "epoch": 2.78, "learning_rate": 3.828889741558943e-06, "loss": 1.4155, "step": 35379 }, { "epoch": 2.78, "learning_rate": 3.826115480392633e-06, "loss": 1.4656, "step": 35380 }, { "epoch": 2.78, "learning_rate": 3.8233422116663195e-06, "loss": 1.4294, "step": 35381 }, { "epoch": 2.78, "learning_rate": 3.820569935398854e-06, "loss": 1.4498, "step": 35382 }, { "epoch": 2.78, "learning_rate": 3.817798651609055e-06, "loss": 1.415, "step": 35383 }, { "epoch": 2.78, "learning_rate": 3.815028360315742e-06, "loss": 1.4537, "step": 35384 }, { "epoch": 2.78, "learning_rate": 3.8122590615376812e-06, "loss": 1.4619, "step": 35385 }, { "epoch": 2.78, "learning_rate": 3.8094907552937258e-06, "loss": 1.4378, "step": 35386 }, { "epoch": 2.78, "learning_rate": 3.806723441602677e-06, "loss": 1.4295, "step": 35387 }, { "epoch": 2.78, "learning_rate": 3.8039571204832863e-06, "loss": 1.4377, "step": 35388 }, { "epoch": 2.78, "learning_rate": 3.801191791954322e-06, "loss": 1.4095, "step": 35389 }, { "epoch": 2.78, "learning_rate": 3.7984274560346195e-06, "loss": 1.4402, "step": 35390 }, { "epoch": 2.78, "learning_rate": 3.7956641127429133e-06, "loss": 1.4837, "step": 35391 }, { "epoch": 2.78, "learning_rate": 3.7929017620979386e-06, "loss": 1.4806, "step": 35392 }, { "epoch": 2.78, "learning_rate": 3.790140404118497e-06, "loss": 1.452, "step": 35393 }, { "epoch": 2.78, "learning_rate": 3.7873800388233234e-06, "loss": 1.4479, "step": 35394 }, { "epoch": 2.78, "learning_rate": 3.7846206662311197e-06, "loss": 1.4576, "step": 35395 }, { "epoch": 2.79, "learning_rate": 3.7818622863606873e-06, "loss": 1.4284, "step": 35396 }, { "epoch": 2.79, "learning_rate": 3.7791048992307115e-06, "loss": 1.3846, "step": 35397 }, { "epoch": 2.79, "learning_rate": 3.7763485048599107e-06, "loss": 1.5076, "step": 35398 }, { "epoch": 2.79, "learning_rate": 3.7735931032670198e-06, "loss": 1.4451, "step": 35399 }, { "epoch": 2.79, "learning_rate": 3.77083869447074e-06, "loss": 1.399, "step": 35400 }, { "epoch": 2.79, "learning_rate": 3.7680852784897576e-06, "loss": 1.4201, "step": 35401 }, { "epoch": 2.79, "learning_rate": 3.7653328553427896e-06, "loss": 1.4616, "step": 35402 }, { "epoch": 2.79, "learning_rate": 3.7625814250485054e-06, "loss": 1.4512, "step": 35403 }, { "epoch": 2.79, "learning_rate": 3.759830987625606e-06, "loss": 1.5024, "step": 35404 }, { "epoch": 2.79, "learning_rate": 3.757081543092744e-06, "loss": 1.495, "step": 35405 }, { "epoch": 2.79, "learning_rate": 3.7543330914685863e-06, "loss": 1.4088, "step": 35406 }, { "epoch": 2.79, "learning_rate": 3.7515856327718196e-06, "loss": 1.4468, "step": 35407 }, { "epoch": 2.79, "learning_rate": 3.7488391670210783e-06, "loss": 1.4425, "step": 35408 }, { "epoch": 2.79, "learning_rate": 3.7460936942349972e-06, "loss": 1.4294, "step": 35409 }, { "epoch": 2.79, "learning_rate": 3.7433492144322284e-06, "loss": 1.4543, "step": 35410 }, { "epoch": 2.79, "learning_rate": 3.740605727631424e-06, "loss": 1.4631, "step": 35411 }, { "epoch": 2.79, "learning_rate": 3.737863233851185e-06, "loss": 1.4503, "step": 35412 }, { "epoch": 2.79, "learning_rate": 3.735121733110147e-06, "loss": 1.4378, "step": 35413 }, { "epoch": 2.79, "learning_rate": 3.7323812254269114e-06, "loss": 1.3899, "step": 35414 }, { "epoch": 2.79, "learning_rate": 3.7296417108200805e-06, "loss": 1.4473, "step": 35415 }, { "epoch": 2.79, "learning_rate": 3.726903189308256e-06, "loss": 1.4132, "step": 35416 }, { "epoch": 2.79, "learning_rate": 3.7241656609100723e-06, "loss": 1.4576, "step": 35417 }, { "epoch": 2.79, "learning_rate": 3.7214291256440654e-06, "loss": 1.4936, "step": 35418 }, { "epoch": 2.79, "learning_rate": 3.7186935835288202e-06, "loss": 1.4425, "step": 35419 }, { "epoch": 2.79, "learning_rate": 3.715959034582938e-06, "loss": 1.4067, "step": 35420 }, { "epoch": 2.79, "learning_rate": 3.7132254788249717e-06, "loss": 1.4426, "step": 35421 }, { "epoch": 2.79, "learning_rate": 3.7104929162734553e-06, "loss": 1.3846, "step": 35422 }, { "epoch": 2.79, "learning_rate": 3.707761346946975e-06, "loss": 1.4264, "step": 35423 }, { "epoch": 2.79, "learning_rate": 3.7050307708640648e-06, "loss": 1.4555, "step": 35424 }, { "epoch": 2.79, "learning_rate": 3.7023011880432772e-06, "loss": 1.4204, "step": 35425 }, { "epoch": 2.79, "learning_rate": 3.699572598503098e-06, "loss": 1.453, "step": 35426 }, { "epoch": 2.79, "learning_rate": 3.696845002262111e-06, "loss": 1.4485, "step": 35427 }, { "epoch": 2.79, "learning_rate": 3.6941183993388024e-06, "loss": 1.4647, "step": 35428 }, { "epoch": 2.79, "learning_rate": 3.6913927897516904e-06, "loss": 1.4167, "step": 35429 }, { "epoch": 2.79, "learning_rate": 3.688668173519277e-06, "loss": 1.4243, "step": 35430 }, { "epoch": 2.79, "learning_rate": 3.6859445506600803e-06, "loss": 1.4485, "step": 35431 }, { "epoch": 2.79, "learning_rate": 3.683221921192553e-06, "loss": 1.4742, "step": 35432 }, { "epoch": 2.79, "learning_rate": 3.680500285135213e-06, "loss": 1.3931, "step": 35433 }, { "epoch": 2.79, "learning_rate": 3.6777796425065454e-06, "loss": 1.4493, "step": 35434 }, { "epoch": 2.79, "learning_rate": 3.6750599933250025e-06, "loss": 1.4198, "step": 35435 }, { "epoch": 2.79, "learning_rate": 3.672341337609036e-06, "loss": 1.4799, "step": 35436 }, { "epoch": 2.79, "learning_rate": 3.6696236753771478e-06, "loss": 1.4829, "step": 35437 }, { "epoch": 2.79, "learning_rate": 3.666907006647757e-06, "loss": 1.4959, "step": 35438 }, { "epoch": 2.79, "learning_rate": 3.664191331439298e-06, "loss": 1.4664, "step": 35439 }, { "epoch": 2.79, "learning_rate": 3.6614766497702396e-06, "loss": 1.4402, "step": 35440 }, { "epoch": 2.79, "learning_rate": 3.6587629616589842e-06, "loss": 1.4098, "step": 35441 }, { "epoch": 2.79, "learning_rate": 3.6560502671239833e-06, "loss": 1.4622, "step": 35442 }, { "epoch": 2.79, "learning_rate": 3.653338566183639e-06, "loss": 1.4612, "step": 35443 }, { "epoch": 2.79, "learning_rate": 3.6506278588563697e-06, "loss": 1.4858, "step": 35444 }, { "epoch": 2.79, "learning_rate": 3.647918145160578e-06, "loss": 1.4623, "step": 35445 }, { "epoch": 2.79, "learning_rate": 3.645209425114631e-06, "loss": 1.4113, "step": 35446 }, { "epoch": 2.79, "learning_rate": 3.642501698736966e-06, "loss": 1.4673, "step": 35447 }, { "epoch": 2.79, "learning_rate": 3.6397949660459503e-06, "loss": 1.3848, "step": 35448 }, { "epoch": 2.79, "learning_rate": 3.637089227059953e-06, "loss": 1.4274, "step": 35449 }, { "epoch": 2.79, "learning_rate": 3.6343844817973424e-06, "loss": 1.4311, "step": 35450 }, { "epoch": 2.79, "learning_rate": 3.631680730276504e-06, "loss": 1.491, "step": 35451 }, { "epoch": 2.79, "learning_rate": 3.6289779725157897e-06, "loss": 1.4357, "step": 35452 }, { "epoch": 2.79, "learning_rate": 3.6262762085335185e-06, "loss": 1.4191, "step": 35453 }, { "epoch": 2.79, "learning_rate": 3.6235754383480585e-06, "loss": 1.4054, "step": 35454 }, { "epoch": 2.79, "learning_rate": 3.6208756619777624e-06, "loss": 1.4516, "step": 35455 }, { "epoch": 2.79, "learning_rate": 3.618176879440915e-06, "loss": 1.4047, "step": 35456 }, { "epoch": 2.79, "learning_rate": 3.6154790907559016e-06, "loss": 1.4276, "step": 35457 }, { "epoch": 2.79, "learning_rate": 3.6127822959409746e-06, "loss": 1.4718, "step": 35458 }, { "epoch": 2.79, "learning_rate": 3.6100864950145027e-06, "loss": 1.4214, "step": 35459 }, { "epoch": 2.79, "learning_rate": 3.6073916879947208e-06, "loss": 1.4807, "step": 35460 }, { "epoch": 2.79, "learning_rate": 3.604697874899981e-06, "loss": 1.4816, "step": 35461 }, { "epoch": 2.79, "learning_rate": 3.602005055748569e-06, "loss": 1.4393, "step": 35462 }, { "epoch": 2.79, "learning_rate": 3.5993132305587202e-06, "loss": 1.424, "step": 35463 }, { "epoch": 2.79, "learning_rate": 3.596622399348753e-06, "loss": 1.4717, "step": 35464 }, { "epoch": 2.79, "learning_rate": 3.593932562136953e-06, "loss": 1.483, "step": 35465 }, { "epoch": 2.79, "learning_rate": 3.591243718941539e-06, "loss": 1.447, "step": 35466 }, { "epoch": 2.79, "learning_rate": 3.5885558697807795e-06, "loss": 1.4389, "step": 35467 }, { "epoch": 2.79, "learning_rate": 3.585869014672943e-06, "loss": 1.4093, "step": 35468 }, { "epoch": 2.79, "learning_rate": 3.5831831536362654e-06, "loss": 1.4178, "step": 35469 }, { "epoch": 2.79, "learning_rate": 3.580498286688949e-06, "loss": 1.4337, "step": 35470 }, { "epoch": 2.79, "learning_rate": 3.5778144138492614e-06, "loss": 1.453, "step": 35471 }, { "epoch": 2.79, "learning_rate": 3.575131535135423e-06, "loss": 1.4568, "step": 35472 }, { "epoch": 2.79, "learning_rate": 3.5724496505656175e-06, "loss": 1.4691, "step": 35473 }, { "epoch": 2.79, "learning_rate": 3.5697687601580816e-06, "loss": 1.4596, "step": 35474 }, { "epoch": 2.79, "learning_rate": 3.5670888639310167e-06, "loss": 1.447, "step": 35475 }, { "epoch": 2.79, "learning_rate": 3.564409961902592e-06, "loss": 1.4439, "step": 35476 }, { "epoch": 2.79, "learning_rate": 3.5617320540910266e-06, "loss": 1.4527, "step": 35477 }, { "epoch": 2.79, "learning_rate": 3.5590551405144885e-06, "loss": 1.4279, "step": 35478 }, { "epoch": 2.79, "learning_rate": 3.556379221191147e-06, "loss": 1.4577, "step": 35479 }, { "epoch": 2.79, "learning_rate": 3.5537042961391703e-06, "loss": 1.4514, "step": 35480 }, { "epoch": 2.79, "learning_rate": 3.5510303653767445e-06, "loss": 1.4293, "step": 35481 }, { "epoch": 2.79, "learning_rate": 3.548357428922005e-06, "loss": 1.3958, "step": 35482 }, { "epoch": 2.79, "learning_rate": 3.5456854867930874e-06, "loss": 1.4455, "step": 35483 }, { "epoch": 2.79, "learning_rate": 3.543014539008143e-06, "loss": 1.5019, "step": 35484 }, { "epoch": 2.79, "learning_rate": 3.5403445855853252e-06, "loss": 1.4469, "step": 35485 }, { "epoch": 2.79, "learning_rate": 3.5376756265427354e-06, "loss": 1.4395, "step": 35486 }, { "epoch": 2.79, "learning_rate": 3.5350076618984925e-06, "loss": 1.4067, "step": 35487 }, { "epoch": 2.79, "learning_rate": 3.532340691670732e-06, "loss": 1.4167, "step": 35488 }, { "epoch": 2.79, "learning_rate": 3.5296747158775563e-06, "loss": 1.4505, "step": 35489 }, { "epoch": 2.79, "learning_rate": 3.527009734537051e-06, "loss": 1.4427, "step": 35490 }, { "epoch": 2.79, "learning_rate": 3.5243457476673174e-06, "loss": 1.4468, "step": 35491 }, { "epoch": 2.79, "learning_rate": 3.5216827552864592e-06, "loss": 1.436, "step": 35492 }, { "epoch": 2.79, "learning_rate": 3.5190207574125274e-06, "loss": 1.392, "step": 35493 }, { "epoch": 2.79, "learning_rate": 3.5163597540636078e-06, "loss": 1.4102, "step": 35494 }, { "epoch": 2.79, "learning_rate": 3.5136997452577696e-06, "loss": 1.4672, "step": 35495 }, { "epoch": 2.79, "learning_rate": 3.5110407310130816e-06, "loss": 1.4687, "step": 35496 }, { "epoch": 2.79, "learning_rate": 3.5083827113475793e-06, "loss": 1.4028, "step": 35497 }, { "epoch": 2.79, "learning_rate": 3.5057256862793315e-06, "loss": 1.3887, "step": 35498 }, { "epoch": 2.79, "learning_rate": 3.503069655826357e-06, "loss": 1.4524, "step": 35499 }, { "epoch": 2.79, "learning_rate": 3.5004146200066916e-06, "loss": 1.4184, "step": 35500 }, { "epoch": 2.79, "learning_rate": 3.4977605788383713e-06, "loss": 1.3881, "step": 35501 }, { "epoch": 2.79, "learning_rate": 3.4951075323393972e-06, "loss": 1.4031, "step": 35502 }, { "epoch": 2.79, "learning_rate": 3.4924554805278225e-06, "loss": 1.4654, "step": 35503 }, { "epoch": 2.79, "learning_rate": 3.4898044234215993e-06, "loss": 1.4497, "step": 35504 }, { "epoch": 2.79, "learning_rate": 3.487154361038763e-06, "loss": 1.506, "step": 35505 }, { "epoch": 2.79, "learning_rate": 3.4845052933972994e-06, "loss": 1.4859, "step": 35506 }, { "epoch": 2.79, "learning_rate": 3.481857220515177e-06, "loss": 1.447, "step": 35507 }, { "epoch": 2.79, "learning_rate": 3.479210142410399e-06, "loss": 1.4727, "step": 35508 }, { "epoch": 2.79, "learning_rate": 3.4765640591009338e-06, "loss": 1.407, "step": 35509 }, { "epoch": 2.79, "learning_rate": 3.4739189706047166e-06, "loss": 1.3684, "step": 35510 }, { "epoch": 2.79, "learning_rate": 3.4712748769397335e-06, "loss": 1.46, "step": 35511 }, { "epoch": 2.79, "learning_rate": 3.4686317781239535e-06, "loss": 1.4737, "step": 35512 }, { "epoch": 2.79, "learning_rate": 3.4659896741752955e-06, "loss": 1.4056, "step": 35513 }, { "epoch": 2.79, "learning_rate": 3.4633485651116955e-06, "loss": 1.4674, "step": 35514 }, { "epoch": 2.79, "learning_rate": 3.460708450951105e-06, "loss": 1.4681, "step": 35515 }, { "epoch": 2.79, "learning_rate": 3.458069331711427e-06, "loss": 1.4654, "step": 35516 }, { "epoch": 2.79, "learning_rate": 3.4554312074105804e-06, "loss": 1.4281, "step": 35517 }, { "epoch": 2.79, "learning_rate": 3.4527940780665007e-06, "loss": 1.4346, "step": 35518 }, { "epoch": 2.79, "learning_rate": 3.4501579436970904e-06, "loss": 1.5012, "step": 35519 }, { "epoch": 2.79, "learning_rate": 3.4475228043202184e-06, "loss": 1.4602, "step": 35520 }, { "epoch": 2.79, "learning_rate": 3.4448886599537874e-06, "loss": 1.4221, "step": 35521 }, { "epoch": 2.79, "learning_rate": 3.442255510615699e-06, "loss": 1.4892, "step": 35522 }, { "epoch": 2.79, "learning_rate": 3.439623356323823e-06, "loss": 1.4641, "step": 35523 }, { "epoch": 2.8, "learning_rate": 3.4369921970959945e-06, "loss": 1.4374, "step": 35524 }, { "epoch": 2.8, "learning_rate": 3.434362032950133e-06, "loss": 1.4771, "step": 35525 }, { "epoch": 2.8, "learning_rate": 3.4317328639040743e-06, "loss": 1.4734, "step": 35526 }, { "epoch": 2.8, "learning_rate": 3.4291046899756535e-06, "loss": 1.4268, "step": 35527 }, { "epoch": 2.8, "learning_rate": 3.4264775111827236e-06, "loss": 1.3813, "step": 35528 }, { "epoch": 2.8, "learning_rate": 3.4238513275431367e-06, "loss": 1.4224, "step": 35529 }, { "epoch": 2.8, "learning_rate": 3.4212261390747286e-06, "loss": 1.4098, "step": 35530 }, { "epoch": 2.8, "learning_rate": 3.4186019457952686e-06, "loss": 1.4177, "step": 35531 }, { "epoch": 2.8, "learning_rate": 3.415978747722642e-06, "loss": 1.4471, "step": 35532 }, { "epoch": 2.8, "learning_rate": 3.413356544874618e-06, "loss": 1.4356, "step": 35533 }, { "epoch": 2.8, "learning_rate": 3.4107353372689994e-06, "loss": 1.4282, "step": 35534 }, { "epoch": 2.8, "learning_rate": 3.408115124923605e-06, "loss": 1.4964, "step": 35535 }, { "epoch": 2.8, "learning_rate": 3.4054959078562206e-06, "loss": 1.368, "step": 35536 }, { "epoch": 2.8, "learning_rate": 3.402877686084615e-06, "loss": 1.4923, "step": 35537 }, { "epoch": 2.8, "learning_rate": 3.400260459626558e-06, "loss": 1.4674, "step": 35538 }, { "epoch": 2.8, "learning_rate": 3.3976442284998352e-06, "loss": 1.4572, "step": 35539 }, { "epoch": 2.8, "learning_rate": 3.3950289927222318e-06, "loss": 1.4164, "step": 35540 }, { "epoch": 2.8, "learning_rate": 3.392414752311434e-06, "loss": 1.4658, "step": 35541 }, { "epoch": 2.8, "learning_rate": 3.3898015072852614e-06, "loss": 1.4854, "step": 35542 }, { "epoch": 2.8, "learning_rate": 3.387189257661432e-06, "loss": 1.4042, "step": 35543 }, { "epoch": 2.8, "learning_rate": 3.384578003457683e-06, "loss": 1.5157, "step": 35544 }, { "epoch": 2.8, "learning_rate": 3.3819677446917158e-06, "loss": 1.44, "step": 35545 }, { "epoch": 2.8, "learning_rate": 3.3793584813813e-06, "loss": 1.4259, "step": 35546 }, { "epoch": 2.8, "learning_rate": 3.3767502135441383e-06, "loss": 1.4246, "step": 35547 }, { "epoch": 2.8, "learning_rate": 3.3741429411978993e-06, "loss": 1.4684, "step": 35548 }, { "epoch": 2.8, "learning_rate": 3.3715366643603357e-06, "loss": 1.4825, "step": 35549 }, { "epoch": 2.8, "learning_rate": 3.368931383049117e-06, "loss": 1.4811, "step": 35550 }, { "epoch": 2.8, "learning_rate": 3.3663270972819288e-06, "loss": 1.4549, "step": 35551 }, { "epoch": 2.8, "learning_rate": 3.3637238070764737e-06, "loss": 1.4062, "step": 35552 }, { "epoch": 2.8, "learning_rate": 3.3611215124504043e-06, "loss": 1.3899, "step": 35553 }, { "epoch": 2.8, "learning_rate": 3.358520213421406e-06, "loss": 1.4569, "step": 35554 }, { "epoch": 2.8, "learning_rate": 3.355919910007132e-06, "loss": 1.477, "step": 35555 }, { "epoch": 2.8, "learning_rate": 3.3533206022252347e-06, "loss": 1.442, "step": 35556 }, { "epoch": 2.8, "learning_rate": 3.350722290093366e-06, "loss": 1.4638, "step": 35557 }, { "epoch": 2.8, "learning_rate": 3.348124973629146e-06, "loss": 1.4855, "step": 35558 }, { "epoch": 2.8, "learning_rate": 3.345528652850227e-06, "loss": 1.425, "step": 35559 }, { "epoch": 2.8, "learning_rate": 3.342933327774261e-06, "loss": 1.5128, "step": 35560 }, { "epoch": 2.8, "learning_rate": 3.3403389984188513e-06, "loss": 1.4442, "step": 35561 }, { "epoch": 2.8, "learning_rate": 3.337745664801583e-06, "loss": 1.388, "step": 35562 }, { "epoch": 2.8, "learning_rate": 3.3351533269400932e-06, "loss": 1.4693, "step": 35563 }, { "epoch": 2.8, "learning_rate": 3.3325619848519837e-06, "loss": 1.4039, "step": 35564 }, { "epoch": 2.8, "learning_rate": 3.3299716385548236e-06, "loss": 1.4623, "step": 35565 }, { "epoch": 2.8, "learning_rate": 3.3273822880662327e-06, "loss": 1.4101, "step": 35566 }, { "epoch": 2.8, "learning_rate": 3.32479393340378e-06, "loss": 1.4102, "step": 35567 }, { "epoch": 2.8, "learning_rate": 3.3222065745850178e-06, "loss": 1.4044, "step": 35568 }, { "epoch": 2.8, "learning_rate": 3.3196202116275494e-06, "loss": 1.419, "step": 35569 }, { "epoch": 2.8, "learning_rate": 3.3170348445489103e-06, "loss": 1.4357, "step": 35570 }, { "epoch": 2.8, "learning_rate": 3.3144504733666535e-06, "loss": 1.427, "step": 35571 }, { "epoch": 2.8, "learning_rate": 3.311867098098314e-06, "loss": 1.4598, "step": 35572 }, { "epoch": 2.8, "learning_rate": 3.3092847187614624e-06, "loss": 1.4593, "step": 35573 }, { "epoch": 2.8, "learning_rate": 3.3067033353736173e-06, "loss": 1.4847, "step": 35574 }, { "epoch": 2.8, "learning_rate": 3.304122947952281e-06, "loss": 1.4485, "step": 35575 }, { "epoch": 2.8, "learning_rate": 3.301543556515024e-06, "loss": 1.4702, "step": 35576 }, { "epoch": 2.8, "learning_rate": 3.2989651610793312e-06, "loss": 1.4532, "step": 35577 }, { "epoch": 2.8, "learning_rate": 3.2963877616627223e-06, "loss": 1.4439, "step": 35578 }, { "epoch": 2.8, "learning_rate": 3.29381135828265e-06, "loss": 1.4389, "step": 35579 }, { "epoch": 2.8, "learning_rate": 3.29123595095665e-06, "loss": 1.4283, "step": 35580 }, { "epoch": 2.8, "learning_rate": 3.288661539702209e-06, "loss": 1.4541, "step": 35581 }, { "epoch": 2.8, "learning_rate": 3.2860881245367786e-06, "loss": 1.4287, "step": 35582 }, { "epoch": 2.8, "learning_rate": 3.2835157054778626e-06, "loss": 1.4198, "step": 35583 }, { "epoch": 2.8, "learning_rate": 3.2809442825428966e-06, "loss": 1.3919, "step": 35584 }, { "epoch": 2.8, "learning_rate": 3.27837385574935e-06, "loss": 1.4265, "step": 35585 }, { "epoch": 2.8, "learning_rate": 3.275804425114692e-06, "loss": 1.4625, "step": 35586 }, { "epoch": 2.8, "learning_rate": 3.273235990656359e-06, "loss": 1.3746, "step": 35587 }, { "epoch": 2.8, "learning_rate": 3.270668552391753e-06, "loss": 1.4535, "step": 35588 }, { "epoch": 2.8, "learning_rate": 3.2681021103383443e-06, "loss": 1.4702, "step": 35589 }, { "epoch": 2.8, "learning_rate": 3.2655366645135683e-06, "loss": 1.4497, "step": 35590 }, { "epoch": 2.8, "learning_rate": 3.2629722149348115e-06, "loss": 1.3907, "step": 35591 }, { "epoch": 2.8, "learning_rate": 3.260408761619493e-06, "loss": 1.4592, "step": 35592 }, { "epoch": 2.8, "learning_rate": 3.2578463045850323e-06, "loss": 1.4195, "step": 35593 }, { "epoch": 2.8, "learning_rate": 3.2552848438488157e-06, "loss": 1.4304, "step": 35594 }, { "epoch": 2.8, "learning_rate": 3.2527243794282288e-06, "loss": 1.4431, "step": 35595 }, { "epoch": 2.8, "learning_rate": 3.250164911340658e-06, "loss": 1.4603, "step": 35596 }, { "epoch": 2.8, "learning_rate": 3.2476064396034896e-06, "loss": 1.4143, "step": 35597 }, { "epoch": 2.8, "learning_rate": 3.245048964234093e-06, "loss": 1.4442, "step": 35598 }, { "epoch": 2.8, "learning_rate": 3.2424924852498036e-06, "loss": 1.4784, "step": 35599 }, { "epoch": 2.8, "learning_rate": 3.239937002668025e-06, "loss": 1.4354, "step": 35600 }, { "epoch": 2.8, "learning_rate": 3.237382516506093e-06, "loss": 1.4101, "step": 35601 }, { "epoch": 2.8, "learning_rate": 3.234829026781327e-06, "loss": 1.4248, "step": 35602 }, { "epoch": 2.8, "learning_rate": 3.23227653351108e-06, "loss": 1.4231, "step": 35603 }, { "epoch": 2.8, "learning_rate": 3.229725036712688e-06, "loss": 1.4337, "step": 35604 }, { "epoch": 2.8, "learning_rate": 3.2271745364034708e-06, "loss": 1.5154, "step": 35605 }, { "epoch": 2.8, "learning_rate": 3.2246250326007308e-06, "loss": 1.4506, "step": 35606 }, { "epoch": 2.8, "learning_rate": 3.222076525321804e-06, "loss": 1.4947, "step": 35607 }, { "epoch": 2.8, "learning_rate": 3.219529014583977e-06, "loss": 1.4476, "step": 35608 }, { "epoch": 2.8, "learning_rate": 3.216982500404519e-06, "loss": 1.4545, "step": 35609 }, { "epoch": 2.8, "learning_rate": 3.214436982800783e-06, "loss": 1.4069, "step": 35610 }, { "epoch": 2.8, "learning_rate": 3.2118924617900223e-06, "loss": 1.4365, "step": 35611 }, { "epoch": 2.8, "learning_rate": 3.209348937389489e-06, "loss": 1.4104, "step": 35612 }, { "epoch": 2.8, "learning_rate": 3.206806409616469e-06, "loss": 1.428, "step": 35613 }, { "epoch": 2.8, "learning_rate": 3.204264878488233e-06, "loss": 1.4228, "step": 35614 }, { "epoch": 2.8, "learning_rate": 3.201724344022033e-06, "loss": 1.4552, "step": 35615 }, { "epoch": 2.8, "learning_rate": 3.1991848062351054e-06, "loss": 1.4273, "step": 35616 }, { "epoch": 2.8, "learning_rate": 3.1966462651447033e-06, "loss": 1.4539, "step": 35617 }, { "epoch": 2.8, "learning_rate": 3.1941087207680627e-06, "loss": 1.457, "step": 35618 }, { "epoch": 2.8, "learning_rate": 3.1915721731224033e-06, "loss": 1.4061, "step": 35619 }, { "epoch": 2.8, "learning_rate": 3.189036622224961e-06, "loss": 1.4182, "step": 35620 }, { "epoch": 2.8, "learning_rate": 3.1865020680929388e-06, "loss": 1.4244, "step": 35621 }, { "epoch": 2.8, "learning_rate": 3.1839685107435563e-06, "loss": 1.459, "step": 35622 }, { "epoch": 2.8, "learning_rate": 3.181435950194e-06, "loss": 1.4321, "step": 35623 }, { "epoch": 2.8, "learning_rate": 3.1789043864614726e-06, "loss": 1.4667, "step": 35624 }, { "epoch": 2.8, "learning_rate": 3.176373819563177e-06, "loss": 1.454, "step": 35625 }, { "epoch": 2.8, "learning_rate": 3.1738442495162495e-06, "loss": 1.4229, "step": 35626 }, { "epoch": 2.8, "learning_rate": 3.1713156763379265e-06, "loss": 1.4645, "step": 35627 }, { "epoch": 2.8, "learning_rate": 3.1687881000453274e-06, "loss": 1.4167, "step": 35628 }, { "epoch": 2.8, "learning_rate": 3.166261520655622e-06, "loss": 1.4863, "step": 35629 }, { "epoch": 2.8, "learning_rate": 3.1637359381859797e-06, "loss": 1.4171, "step": 35630 }, { "epoch": 2.8, "learning_rate": 3.1612113526535533e-06, "loss": 1.4358, "step": 35631 }, { "epoch": 2.8, "learning_rate": 3.158687764075446e-06, "loss": 1.4027, "step": 35632 }, { "epoch": 2.8, "learning_rate": 3.1561651724688275e-06, "loss": 1.4684, "step": 35633 }, { "epoch": 2.8, "learning_rate": 3.1536435778508172e-06, "loss": 1.3878, "step": 35634 }, { "epoch": 2.8, "learning_rate": 3.1511229802385187e-06, "loss": 1.4342, "step": 35635 }, { "epoch": 2.8, "learning_rate": 3.1486033796490507e-06, "loss": 1.4259, "step": 35636 }, { "epoch": 2.8, "learning_rate": 3.1460847760995332e-06, "loss": 1.4397, "step": 35637 }, { "epoch": 2.8, "learning_rate": 3.14356716960707e-06, "loss": 1.462, "step": 35638 }, { "epoch": 2.8, "learning_rate": 3.141050560188729e-06, "loss": 1.4155, "step": 35639 }, { "epoch": 2.8, "learning_rate": 3.138534947861615e-06, "loss": 1.4556, "step": 35640 }, { "epoch": 2.8, "learning_rate": 3.1360203326428135e-06, "loss": 1.4242, "step": 35641 }, { "epoch": 2.8, "learning_rate": 3.133506714549394e-06, "loss": 1.4189, "step": 35642 }, { "epoch": 2.8, "learning_rate": 3.1309940935983934e-06, "loss": 1.4375, "step": 35643 }, { "epoch": 2.8, "learning_rate": 3.1284824698069145e-06, "loss": 1.4714, "step": 35644 }, { "epoch": 2.8, "learning_rate": 3.125971843191977e-06, "loss": 1.4474, "step": 35645 }, { "epoch": 2.8, "learning_rate": 3.1234622137706334e-06, "loss": 1.471, "step": 35646 }, { "epoch": 2.8, "learning_rate": 3.1209535815599374e-06, "loss": 1.4229, "step": 35647 }, { "epoch": 2.8, "learning_rate": 3.1184459465769252e-06, "loss": 1.4617, "step": 35648 }, { "epoch": 2.8, "learning_rate": 3.1159393088386e-06, "loss": 1.4604, "step": 35649 }, { "epoch": 2.8, "learning_rate": 3.113433668361964e-06, "loss": 1.4609, "step": 35650 }, { "epoch": 2.81, "learning_rate": 3.1109290251640884e-06, "loss": 1.4717, "step": 35651 }, { "epoch": 2.81, "learning_rate": 3.108425379261925e-06, "loss": 1.4312, "step": 35652 }, { "epoch": 2.81, "learning_rate": 3.1059227306724945e-06, "loss": 1.3954, "step": 35653 }, { "epoch": 2.81, "learning_rate": 3.103421079412782e-06, "loss": 1.4364, "step": 35654 }, { "epoch": 2.81, "learning_rate": 3.1009204254997923e-06, "loss": 1.4972, "step": 35655 }, { "epoch": 2.81, "learning_rate": 3.098420768950477e-06, "loss": 1.4414, "step": 35656 }, { "epoch": 2.81, "learning_rate": 3.0959221097818067e-06, "loss": 1.4682, "step": 35657 }, { "epoch": 2.81, "learning_rate": 3.093424448010784e-06, "loss": 1.4345, "step": 35658 }, { "epoch": 2.81, "learning_rate": 3.0909277836543287e-06, "loss": 1.3734, "step": 35659 }, { "epoch": 2.81, "learning_rate": 3.088432116729378e-06, "loss": 1.4344, "step": 35660 }, { "epoch": 2.81, "learning_rate": 3.085937447252934e-06, "loss": 1.4683, "step": 35661 }, { "epoch": 2.81, "learning_rate": 3.0834437752419004e-06, "loss": 1.4874, "step": 35662 }, { "epoch": 2.81, "learning_rate": 3.0809511007131804e-06, "loss": 1.4447, "step": 35663 }, { "epoch": 2.81, "learning_rate": 3.0784594236837433e-06, "loss": 1.515, "step": 35664 }, { "epoch": 2.81, "learning_rate": 3.075968744170493e-06, "loss": 1.4554, "step": 35665 }, { "epoch": 2.81, "learning_rate": 3.0734790621903316e-06, "loss": 1.4186, "step": 35666 }, { "epoch": 2.81, "learning_rate": 3.070990377760163e-06, "loss": 1.4049, "step": 35667 }, { "epoch": 2.81, "learning_rate": 3.0685026908968734e-06, "loss": 1.4511, "step": 35668 }, { "epoch": 2.81, "learning_rate": 3.0660160016173996e-06, "loss": 1.455, "step": 35669 }, { "epoch": 2.81, "learning_rate": 3.063530309938578e-06, "loss": 1.4154, "step": 35670 }, { "epoch": 2.81, "learning_rate": 3.061045615877278e-06, "loss": 1.4347, "step": 35671 }, { "epoch": 2.81, "learning_rate": 3.0585619194504198e-06, "loss": 1.4335, "step": 35672 }, { "epoch": 2.81, "learning_rate": 3.056079220674823e-06, "loss": 1.4401, "step": 35673 }, { "epoch": 2.81, "learning_rate": 3.0535975195673578e-06, "loss": 1.4232, "step": 35674 }, { "epoch": 2.81, "learning_rate": 3.0511168161448773e-06, "loss": 1.4437, "step": 35675 }, { "epoch": 2.81, "learning_rate": 3.048637110424235e-06, "loss": 1.4215, "step": 35676 }, { "epoch": 2.81, "learning_rate": 3.046158402422233e-06, "loss": 1.4716, "step": 35677 }, { "epoch": 2.81, "learning_rate": 3.0436806921557253e-06, "loss": 1.4299, "step": 35678 }, { "epoch": 2.81, "learning_rate": 3.041203979641532e-06, "loss": 1.4278, "step": 35679 }, { "epoch": 2.81, "learning_rate": 3.0387282648964563e-06, "loss": 1.5027, "step": 35680 }, { "epoch": 2.81, "learning_rate": 3.0362535479373175e-06, "loss": 1.3878, "step": 35681 }, { "epoch": 2.81, "learning_rate": 3.033779828780919e-06, "loss": 1.444, "step": 35682 }, { "epoch": 2.81, "learning_rate": 3.0313071074440474e-06, "loss": 1.3747, "step": 35683 }, { "epoch": 2.81, "learning_rate": 3.02883538394349e-06, "loss": 1.4741, "step": 35684 }, { "epoch": 2.81, "learning_rate": 3.0263646582960654e-06, "loss": 1.458, "step": 35685 }, { "epoch": 2.81, "learning_rate": 3.0238949305184947e-06, "loss": 1.4509, "step": 35686 }, { "epoch": 2.81, "learning_rate": 3.0214262006275635e-06, "loss": 1.4226, "step": 35687 }, { "epoch": 2.81, "learning_rate": 3.018958468640059e-06, "loss": 1.4658, "step": 35688 }, { "epoch": 2.81, "learning_rate": 3.016491734572718e-06, "loss": 1.4165, "step": 35689 }, { "epoch": 2.81, "learning_rate": 3.0140259984422765e-06, "loss": 1.4648, "step": 35690 }, { "epoch": 2.81, "learning_rate": 3.0115612602654713e-06, "loss": 1.4587, "step": 35691 }, { "epoch": 2.81, "learning_rate": 3.009097520059056e-06, "loss": 1.4193, "step": 35692 }, { "epoch": 2.81, "learning_rate": 3.006634777839767e-06, "loss": 1.4173, "step": 35693 }, { "epoch": 2.81, "learning_rate": 3.0041730336242907e-06, "loss": 1.4751, "step": 35694 }, { "epoch": 2.81, "learning_rate": 3.0017122874293807e-06, "loss": 1.4234, "step": 35695 }, { "epoch": 2.81, "learning_rate": 2.9992525392717236e-06, "loss": 1.4817, "step": 35696 }, { "epoch": 2.81, "learning_rate": 2.9967937891679896e-06, "loss": 1.468, "step": 35697 }, { "epoch": 2.81, "learning_rate": 2.994336037134931e-06, "loss": 1.4497, "step": 35698 }, { "epoch": 2.81, "learning_rate": 2.9918792831891857e-06, "loss": 1.4541, "step": 35699 }, { "epoch": 2.81, "learning_rate": 2.9894235273474733e-06, "loss": 1.4398, "step": 35700 }, { "epoch": 2.81, "learning_rate": 2.98696876962643e-06, "loss": 1.4494, "step": 35701 }, { "epoch": 2.81, "learning_rate": 2.9845150100427595e-06, "loss": 1.4467, "step": 35702 }, { "epoch": 2.81, "learning_rate": 2.9820622486130986e-06, "loss": 1.4552, "step": 35703 }, { "epoch": 2.81, "learning_rate": 2.9796104853541005e-06, "loss": 1.4641, "step": 35704 }, { "epoch": 2.81, "learning_rate": 2.977159720282418e-06, "loss": 1.4978, "step": 35705 }, { "epoch": 2.81, "learning_rate": 2.9747099534146888e-06, "loss": 1.4344, "step": 35706 }, { "epoch": 2.81, "learning_rate": 2.9722611847675327e-06, "loss": 1.4304, "step": 35707 }, { "epoch": 2.81, "learning_rate": 2.9698134143575856e-06, "loss": 1.3818, "step": 35708 }, { "epoch": 2.81, "learning_rate": 2.967366642201485e-06, "loss": 1.4496, "step": 35709 }, { "epoch": 2.81, "learning_rate": 2.9649208683158176e-06, "loss": 1.4816, "step": 35710 }, { "epoch": 2.81, "learning_rate": 2.9624760927171863e-06, "loss": 1.4421, "step": 35711 }, { "epoch": 2.81, "learning_rate": 2.9600323154222117e-06, "loss": 1.4651, "step": 35712 }, { "epoch": 2.81, "learning_rate": 2.95758953644748e-06, "loss": 1.46, "step": 35713 }, { "epoch": 2.81, "learning_rate": 2.955147755809545e-06, "loss": 1.425, "step": 35714 }, { "epoch": 2.81, "learning_rate": 2.9527069735250096e-06, "loss": 1.4258, "step": 35715 }, { "epoch": 2.81, "learning_rate": 2.950267189610478e-06, "loss": 1.4444, "step": 35716 }, { "epoch": 2.81, "learning_rate": 2.9478284040824698e-06, "loss": 1.4184, "step": 35717 }, { "epoch": 2.81, "learning_rate": 2.9453906169575547e-06, "loss": 1.4582, "step": 35718 }, { "epoch": 2.81, "learning_rate": 2.942953828252287e-06, "loss": 1.5014, "step": 35719 }, { "epoch": 2.81, "learning_rate": 2.9405180379832195e-06, "loss": 1.4772, "step": 35720 }, { "epoch": 2.81, "learning_rate": 2.9380832461668556e-06, "loss": 1.4196, "step": 35721 }, { "epoch": 2.81, "learning_rate": 2.9356494528197662e-06, "loss": 1.4301, "step": 35722 }, { "epoch": 2.81, "learning_rate": 2.93321665795847e-06, "loss": 1.4728, "step": 35723 }, { "epoch": 2.81, "learning_rate": 2.9307848615994723e-06, "loss": 1.4364, "step": 35724 }, { "epoch": 2.81, "learning_rate": 2.9283540637592584e-06, "loss": 1.452, "step": 35725 }, { "epoch": 2.81, "learning_rate": 2.925924264454399e-06, "loss": 1.4334, "step": 35726 }, { "epoch": 2.81, "learning_rate": 2.9234954637013308e-06, "loss": 1.4608, "step": 35727 }, { "epoch": 2.81, "learning_rate": 2.9210676615165573e-06, "loss": 1.4682, "step": 35728 }, { "epoch": 2.81, "learning_rate": 2.918640857916582e-06, "loss": 1.4638, "step": 35729 }, { "epoch": 2.81, "learning_rate": 2.916215052917875e-06, "loss": 1.4224, "step": 35730 }, { "epoch": 2.81, "learning_rate": 2.9137902465368736e-06, "loss": 1.3743, "step": 35731 }, { "epoch": 2.81, "learning_rate": 2.9113664387900804e-06, "loss": 1.4028, "step": 35732 }, { "epoch": 2.81, "learning_rate": 2.9089436296939495e-06, "loss": 1.4703, "step": 35733 }, { "epoch": 2.81, "learning_rate": 2.9065218192649177e-06, "loss": 1.4724, "step": 35734 }, { "epoch": 2.81, "learning_rate": 2.9041010075194216e-06, "loss": 1.4706, "step": 35735 }, { "epoch": 2.81, "learning_rate": 2.901681194473915e-06, "loss": 1.4374, "step": 35736 }, { "epoch": 2.81, "learning_rate": 2.899262380144818e-06, "loss": 1.4243, "step": 35737 }, { "epoch": 2.81, "learning_rate": 2.8968445645485337e-06, "loss": 1.4396, "step": 35738 }, { "epoch": 2.81, "learning_rate": 2.8944277477015166e-06, "loss": 1.4796, "step": 35739 }, { "epoch": 2.81, "learning_rate": 2.8920119296201526e-06, "loss": 1.4343, "step": 35740 }, { "epoch": 2.81, "learning_rate": 2.889597110320829e-06, "loss": 1.456, "step": 35741 }, { "epoch": 2.81, "learning_rate": 2.8871832898199833e-06, "loss": 1.4594, "step": 35742 }, { "epoch": 2.81, "learning_rate": 2.884770468133968e-06, "loss": 1.4516, "step": 35743 }, { "epoch": 2.81, "learning_rate": 2.88235864527917e-06, "loss": 1.446, "step": 35744 }, { "epoch": 2.81, "learning_rate": 2.8799478212719775e-06, "loss": 1.4451, "step": 35745 }, { "epoch": 2.81, "learning_rate": 2.8775379961287593e-06, "loss": 1.4458, "step": 35746 }, { "epoch": 2.81, "learning_rate": 2.875129169865853e-06, "loss": 1.5022, "step": 35747 }, { "epoch": 2.81, "learning_rate": 2.8727213424996454e-06, "loss": 1.4472, "step": 35748 }, { "epoch": 2.81, "learning_rate": 2.87031451404644e-06, "loss": 1.4768, "step": 35749 }, { "epoch": 2.81, "learning_rate": 2.8679086845226408e-06, "loss": 1.4345, "step": 35750 }, { "epoch": 2.81, "learning_rate": 2.865503853944534e-06, "loss": 1.4278, "step": 35751 }, { "epoch": 2.81, "learning_rate": 2.8631000223284574e-06, "loss": 1.4369, "step": 35752 }, { "epoch": 2.81, "learning_rate": 2.8606971896907307e-06, "loss": 1.4417, "step": 35753 }, { "epoch": 2.81, "learning_rate": 2.858295356047691e-06, "loss": 1.4711, "step": 35754 }, { "epoch": 2.81, "learning_rate": 2.855894521415608e-06, "loss": 1.4887, "step": 35755 }, { "epoch": 2.81, "learning_rate": 2.853494685810803e-06, "loss": 1.4198, "step": 35756 }, { "epoch": 2.81, "learning_rate": 2.8510958492495793e-06, "loss": 1.4211, "step": 35757 }, { "epoch": 2.81, "learning_rate": 2.8486980117481906e-06, "loss": 1.439, "step": 35758 }, { "epoch": 2.81, "learning_rate": 2.846301173322957e-06, "loss": 1.4217, "step": 35759 }, { "epoch": 2.81, "learning_rate": 2.8439053339901317e-06, "loss": 1.4588, "step": 35760 }, { "epoch": 2.81, "learning_rate": 2.8415104937659694e-06, "loss": 1.4407, "step": 35761 }, { "epoch": 2.81, "learning_rate": 2.8391166526667398e-06, "loss": 1.5068, "step": 35762 }, { "epoch": 2.81, "learning_rate": 2.8367238107086964e-06, "loss": 1.4668, "step": 35763 }, { "epoch": 2.81, "learning_rate": 2.83433196790811e-06, "loss": 1.4301, "step": 35764 }, { "epoch": 2.81, "learning_rate": 2.831941124281184e-06, "loss": 1.4512, "step": 35765 }, { "epoch": 2.81, "learning_rate": 2.8295512798441555e-06, "loss": 1.4769, "step": 35766 }, { "epoch": 2.81, "learning_rate": 2.8271624346132617e-06, "loss": 1.4374, "step": 35767 }, { "epoch": 2.81, "learning_rate": 2.824774588604739e-06, "loss": 1.3901, "step": 35768 }, { "epoch": 2.81, "learning_rate": 2.822387741834742e-06, "loss": 1.4775, "step": 35769 }, { "epoch": 2.81, "learning_rate": 2.82000189431954e-06, "loss": 1.4219, "step": 35770 }, { "epoch": 2.81, "learning_rate": 2.8176170460753043e-06, "loss": 1.4614, "step": 35771 }, { "epoch": 2.81, "learning_rate": 2.8152331971182053e-06, "loss": 1.4604, "step": 35772 }, { "epoch": 2.81, "learning_rate": 2.812850347464479e-06, "loss": 1.4832, "step": 35773 }, { "epoch": 2.81, "learning_rate": 2.810468497130264e-06, "loss": 1.4651, "step": 35774 }, { "epoch": 2.81, "learning_rate": 2.808087646131729e-06, "loss": 1.4437, "step": 35775 }, { "epoch": 2.81, "learning_rate": 2.8057077944850625e-06, "loss": 1.5062, "step": 35776 }, { "epoch": 2.81, "learning_rate": 2.8033289422064178e-06, "loss": 1.4525, "step": 35777 }, { "epoch": 2.82, "learning_rate": 2.8009510893119147e-06, "loss": 1.4407, "step": 35778 }, { "epoch": 2.82, "learning_rate": 2.798574235817741e-06, "loss": 1.4049, "step": 35779 }, { "epoch": 2.82, "learning_rate": 2.796198381740017e-06, "loss": 1.4252, "step": 35780 }, { "epoch": 2.82, "learning_rate": 2.7938235270948628e-06, "loss": 1.4932, "step": 35781 }, { "epoch": 2.82, "learning_rate": 2.7914496718984325e-06, "loss": 1.3952, "step": 35782 }, { "epoch": 2.82, "learning_rate": 2.7890768161667963e-06, "loss": 1.3963, "step": 35783 }, { "epoch": 2.82, "learning_rate": 2.7867049599161083e-06, "loss": 1.4542, "step": 35784 }, { "epoch": 2.82, "learning_rate": 2.7843341031624557e-06, "loss": 1.415, "step": 35785 }, { "epoch": 2.82, "learning_rate": 2.781964245921908e-06, "loss": 1.4934, "step": 35786 }, { "epoch": 2.82, "learning_rate": 2.7795953882106036e-06, "loss": 1.4374, "step": 35787 }, { "epoch": 2.82, "learning_rate": 2.7772275300446124e-06, "loss": 1.4074, "step": 35788 }, { "epoch": 2.82, "learning_rate": 2.774860671439988e-06, "loss": 1.4223, "step": 35789 }, { "epoch": 2.82, "learning_rate": 2.7724948124128176e-06, "loss": 1.4578, "step": 35790 }, { "epoch": 2.82, "learning_rate": 2.7701299529791555e-06, "loss": 1.4752, "step": 35791 }, { "epoch": 2.82, "learning_rate": 2.7677660931550715e-06, "loss": 1.4514, "step": 35792 }, { "epoch": 2.82, "learning_rate": 2.7654032329566035e-06, "loss": 1.4021, "step": 35793 }, { "epoch": 2.82, "learning_rate": 2.763041372399788e-06, "loss": 1.4377, "step": 35794 }, { "epoch": 2.82, "learning_rate": 2.7606805115006793e-06, "loss": 1.4436, "step": 35795 }, { "epoch": 2.82, "learning_rate": 2.7583206502752807e-06, "loss": 1.4738, "step": 35796 }, { "epoch": 2.82, "learning_rate": 2.755961788739647e-06, "loss": 1.4619, "step": 35797 }, { "epoch": 2.82, "learning_rate": 2.753603926909781e-06, "loss": 1.4472, "step": 35798 }, { "epoch": 2.82, "learning_rate": 2.7512470648016706e-06, "loss": 1.4583, "step": 35799 }, { "epoch": 2.82, "learning_rate": 2.7488912024313525e-06, "loss": 1.4174, "step": 35800 }, { "epoch": 2.82, "learning_rate": 2.7465363398147975e-06, "loss": 1.4953, "step": 35801 }, { "epoch": 2.82, "learning_rate": 2.7441824769679934e-06, "loss": 1.4544, "step": 35802 }, { "epoch": 2.82, "learning_rate": 2.741829613906926e-06, "loss": 1.4273, "step": 35803 }, { "epoch": 2.82, "learning_rate": 2.7394777506475674e-06, "loss": 1.4055, "step": 35804 }, { "epoch": 2.82, "learning_rate": 2.737126887205904e-06, "loss": 1.3954, "step": 35805 }, { "epoch": 2.82, "learning_rate": 2.734777023597873e-06, "loss": 1.4289, "step": 35806 }, { "epoch": 2.82, "learning_rate": 2.732428159839445e-06, "loss": 1.4603, "step": 35807 }, { "epoch": 2.82, "learning_rate": 2.7300802959465573e-06, "loss": 1.4302, "step": 35808 }, { "epoch": 2.82, "learning_rate": 2.7277334319351472e-06, "loss": 1.4464, "step": 35809 }, { "epoch": 2.82, "learning_rate": 2.7253875678211524e-06, "loss": 1.4844, "step": 35810 }, { "epoch": 2.82, "learning_rate": 2.723042703620526e-06, "loss": 1.4448, "step": 35811 }, { "epoch": 2.82, "learning_rate": 2.7206988393491556e-06, "loss": 1.4443, "step": 35812 }, { "epoch": 2.82, "learning_rate": 2.7183559750229624e-06, "loss": 1.4192, "step": 35813 }, { "epoch": 2.82, "learning_rate": 2.716014110657849e-06, "loss": 1.4307, "step": 35814 }, { "epoch": 2.82, "learning_rate": 2.7136732462697373e-06, "loss": 1.4802, "step": 35815 }, { "epoch": 2.82, "learning_rate": 2.711333381874481e-06, "loss": 1.4182, "step": 35816 }, { "epoch": 2.82, "learning_rate": 2.708994517488017e-06, "loss": 1.4669, "step": 35817 }, { "epoch": 2.82, "learning_rate": 2.7066566531261826e-06, "loss": 1.4396, "step": 35818 }, { "epoch": 2.82, "learning_rate": 2.704319788804882e-06, "loss": 1.4328, "step": 35819 }, { "epoch": 2.82, "learning_rate": 2.7019839245399355e-06, "loss": 1.423, "step": 35820 }, { "epoch": 2.82, "learning_rate": 2.699649060347264e-06, "loss": 1.4635, "step": 35821 }, { "epoch": 2.82, "learning_rate": 2.697315196242672e-06, "loss": 1.4354, "step": 35822 }, { "epoch": 2.82, "learning_rate": 2.6949823322420294e-06, "loss": 1.4404, "step": 35823 }, { "epoch": 2.82, "learning_rate": 2.692650468361157e-06, "loss": 1.4484, "step": 35824 }, { "epoch": 2.82, "learning_rate": 2.6903196046158928e-06, "loss": 1.4396, "step": 35825 }, { "epoch": 2.82, "learning_rate": 2.6879897410220897e-06, "loss": 1.4022, "step": 35826 }, { "epoch": 2.82, "learning_rate": 2.685660877595519e-06, "loss": 1.437, "step": 35827 }, { "epoch": 2.82, "learning_rate": 2.6833330143520183e-06, "loss": 1.4389, "step": 35828 }, { "epoch": 2.82, "learning_rate": 2.6810061513074075e-06, "loss": 1.4363, "step": 35829 }, { "epoch": 2.82, "learning_rate": 2.6786802884774584e-06, "loss": 1.4343, "step": 35830 }, { "epoch": 2.82, "learning_rate": 2.676355425877974e-06, "loss": 1.4749, "step": 35831 }, { "epoch": 2.82, "learning_rate": 2.6740315635247255e-06, "loss": 1.4379, "step": 35832 }, { "epoch": 2.82, "learning_rate": 2.6717087014335003e-06, "loss": 1.446, "step": 35833 }, { "epoch": 2.82, "learning_rate": 2.6693868396200857e-06, "loss": 1.4906, "step": 35834 }, { "epoch": 2.82, "learning_rate": 2.6670659781002356e-06, "loss": 1.4636, "step": 35835 }, { "epoch": 2.82, "learning_rate": 2.664746116889688e-06, "loss": 1.4384, "step": 35836 }, { "epoch": 2.82, "learning_rate": 2.6624272560042126e-06, "loss": 1.4627, "step": 35837 }, { "epoch": 2.82, "learning_rate": 2.6601093954595476e-06, "loss": 1.4444, "step": 35838 }, { "epoch": 2.82, "learning_rate": 2.6577925352714303e-06, "loss": 1.421, "step": 35839 }, { "epoch": 2.82, "learning_rate": 2.6554766754555813e-06, "loss": 1.3944, "step": 35840 }, { "epoch": 2.82, "learning_rate": 2.653161816027738e-06, "loss": 1.4377, "step": 35841 }, { "epoch": 2.82, "learning_rate": 2.650847957003638e-06, "loss": 1.4325, "step": 35842 }, { "epoch": 2.82, "learning_rate": 2.648535098398952e-06, "loss": 1.4216, "step": 35843 }, { "epoch": 2.82, "learning_rate": 2.6462232402293835e-06, "loss": 1.4625, "step": 35844 }, { "epoch": 2.82, "learning_rate": 2.6439123825106546e-06, "loss": 1.4115, "step": 35845 }, { "epoch": 2.82, "learning_rate": 2.6416025252584518e-06, "loss": 1.4407, "step": 35846 }, { "epoch": 2.82, "learning_rate": 2.639293668488429e-06, "loss": 1.452, "step": 35847 }, { "epoch": 2.82, "learning_rate": 2.6369858122162912e-06, "loss": 1.4252, "step": 35848 }, { "epoch": 2.82, "learning_rate": 2.634678956457692e-06, "loss": 1.4136, "step": 35849 }, { "epoch": 2.82, "learning_rate": 2.632373101228302e-06, "loss": 1.5095, "step": 35850 }, { "epoch": 2.82, "learning_rate": 2.630068246543793e-06, "loss": 1.4292, "step": 35851 }, { "epoch": 2.82, "learning_rate": 2.6277643924197845e-06, "loss": 1.4229, "step": 35852 }, { "epoch": 2.82, "learning_rate": 2.6254615388719147e-06, "loss": 1.4179, "step": 35853 }, { "epoch": 2.82, "learning_rate": 2.6231596859158378e-06, "loss": 1.4983, "step": 35854 }, { "epoch": 2.82, "learning_rate": 2.620858833567191e-06, "loss": 1.4428, "step": 35855 }, { "epoch": 2.82, "learning_rate": 2.6185589818415785e-06, "loss": 1.4596, "step": 35856 }, { "epoch": 2.82, "learning_rate": 2.6162601307545885e-06, "loss": 1.4305, "step": 35857 }, { "epoch": 2.82, "learning_rate": 2.6139622803218906e-06, "loss": 1.4508, "step": 35858 }, { "epoch": 2.82, "learning_rate": 2.6116654305590567e-06, "loss": 1.419, "step": 35859 }, { "epoch": 2.82, "learning_rate": 2.609369581481674e-06, "loss": 1.4244, "step": 35860 }, { "epoch": 2.82, "learning_rate": 2.60707473310533e-06, "loss": 1.3975, "step": 35861 }, { "epoch": 2.82, "learning_rate": 2.6047808854456122e-06, "loss": 1.4292, "step": 35862 }, { "epoch": 2.82, "learning_rate": 2.602488038518091e-06, "loss": 1.4561, "step": 35863 }, { "epoch": 2.82, "learning_rate": 2.6001961923383387e-06, "loss": 1.5049, "step": 35864 }, { "epoch": 2.82, "learning_rate": 2.597905346921908e-06, "loss": 1.4621, "step": 35865 }, { "epoch": 2.82, "learning_rate": 2.5956155022843704e-06, "loss": 1.4605, "step": 35866 }, { "epoch": 2.82, "learning_rate": 2.593326658441247e-06, "loss": 1.4716, "step": 35867 }, { "epoch": 2.82, "learning_rate": 2.5910388154080917e-06, "loss": 1.4791, "step": 35868 }, { "epoch": 2.82, "learning_rate": 2.5887519732004426e-06, "loss": 1.4292, "step": 35869 }, { "epoch": 2.82, "learning_rate": 2.5864661318338033e-06, "loss": 1.4489, "step": 35870 }, { "epoch": 2.82, "learning_rate": 2.5841812913237116e-06, "loss": 1.4837, "step": 35871 }, { "epoch": 2.82, "learning_rate": 2.5818974516856884e-06, "loss": 1.3893, "step": 35872 }, { "epoch": 2.82, "learning_rate": 2.5796146129352213e-06, "loss": 1.4156, "step": 35873 }, { "epoch": 2.82, "learning_rate": 2.5773327750878147e-06, "loss": 1.4513, "step": 35874 }, { "epoch": 2.82, "learning_rate": 2.575051938158973e-06, "loss": 1.4256, "step": 35875 }, { "epoch": 2.82, "learning_rate": 2.5727721021641833e-06, "loss": 1.4218, "step": 35876 }, { "epoch": 2.82, "learning_rate": 2.5704932671189006e-06, "loss": 1.45, "step": 35877 }, { "epoch": 2.82, "learning_rate": 2.568215433038612e-06, "loss": 1.3913, "step": 35878 }, { "epoch": 2.82, "learning_rate": 2.5659385999387715e-06, "loss": 1.4402, "step": 35879 }, { "epoch": 2.82, "learning_rate": 2.5636627678348677e-06, "loss": 1.4463, "step": 35880 }, { "epoch": 2.82, "learning_rate": 2.5613879367423206e-06, "loss": 1.4057, "step": 35881 }, { "epoch": 2.82, "learning_rate": 2.5591141066765853e-06, "loss": 1.42, "step": 35882 }, { "epoch": 2.82, "learning_rate": 2.5568412776530988e-06, "loss": 1.4613, "step": 35883 }, { "epoch": 2.82, "learning_rate": 2.554569449687299e-06, "loss": 1.4777, "step": 35884 }, { "epoch": 2.82, "learning_rate": 2.5522986227946075e-06, "loss": 1.4289, "step": 35885 }, { "epoch": 2.82, "learning_rate": 2.5500287969904276e-06, "loss": 1.4597, "step": 35886 }, { "epoch": 2.82, "learning_rate": 2.547759972290181e-06, "loss": 1.4743, "step": 35887 }, { "epoch": 2.82, "learning_rate": 2.5454921487092884e-06, "loss": 1.4097, "step": 35888 }, { "epoch": 2.82, "learning_rate": 2.543225326263121e-06, "loss": 1.42, "step": 35889 }, { "epoch": 2.82, "learning_rate": 2.5409595049670994e-06, "loss": 1.4327, "step": 35890 }, { "epoch": 2.82, "learning_rate": 2.538694684836562e-06, "loss": 1.4414, "step": 35891 }, { "epoch": 2.82, "learning_rate": 2.536430865886929e-06, "loss": 1.4623, "step": 35892 }, { "epoch": 2.82, "learning_rate": 2.534168048133556e-06, "loss": 1.5071, "step": 35893 }, { "epoch": 2.82, "learning_rate": 2.5319062315917793e-06, "loss": 1.4622, "step": 35894 }, { "epoch": 2.82, "learning_rate": 2.5296454162770042e-06, "loss": 1.4249, "step": 35895 }, { "epoch": 2.82, "learning_rate": 2.5273856022045515e-06, "loss": 1.4253, "step": 35896 }, { "epoch": 2.82, "learning_rate": 2.525126789389775e-06, "loss": 1.4454, "step": 35897 }, { "epoch": 2.82, "learning_rate": 2.5228689778479804e-06, "loss": 1.4433, "step": 35898 }, { "epoch": 2.82, "learning_rate": 2.5206121675945378e-06, "loss": 1.4455, "step": 35899 }, { "epoch": 2.82, "learning_rate": 2.518356358644752e-06, "loss": 1.4578, "step": 35900 }, { "epoch": 2.82, "learning_rate": 2.516101551013927e-06, "loss": 1.449, "step": 35901 }, { "epoch": 2.82, "learning_rate": 2.513847744717401e-06, "loss": 1.4961, "step": 35902 }, { "epoch": 2.82, "learning_rate": 2.5115949397704614e-06, "loss": 1.4693, "step": 35903 }, { "epoch": 2.82, "learning_rate": 2.5093431361883797e-06, "loss": 1.4214, "step": 35904 }, { "epoch": 2.83, "learning_rate": 2.5070923339864767e-06, "loss": 1.4456, "step": 35905 }, { "epoch": 2.83, "learning_rate": 2.504842533180024e-06, "loss": 1.5058, "step": 35906 }, { "epoch": 2.83, "learning_rate": 2.5025937337843085e-06, "loss": 1.4129, "step": 35907 }, { "epoch": 2.83, "learning_rate": 2.5003459358145517e-06, "loss": 1.4116, "step": 35908 }, { "epoch": 2.83, "learning_rate": 2.498099139286075e-06, "loss": 1.4525, "step": 35909 }, { "epoch": 2.83, "learning_rate": 2.495853344214116e-06, "loss": 1.4445, "step": 35910 }, { "epoch": 2.83, "learning_rate": 2.493608550613896e-06, "loss": 1.4339, "step": 35911 }, { "epoch": 2.83, "learning_rate": 2.4913647585006857e-06, "loss": 1.4544, "step": 35912 }, { "epoch": 2.83, "learning_rate": 2.48912196788969e-06, "loss": 1.4528, "step": 35913 }, { "epoch": 2.83, "learning_rate": 2.4868801787961802e-06, "loss": 1.4964, "step": 35914 }, { "epoch": 2.83, "learning_rate": 2.48463939123531e-06, "loss": 1.5202, "step": 35915 }, { "epoch": 2.83, "learning_rate": 2.482399605222368e-06, "loss": 1.5168, "step": 35916 }, { "epoch": 2.83, "learning_rate": 2.4801608207725086e-06, "loss": 1.4345, "step": 35917 }, { "epoch": 2.83, "learning_rate": 2.477923037900953e-06, "loss": 1.4546, "step": 35918 }, { "epoch": 2.83, "learning_rate": 2.475686256622872e-06, "loss": 1.4554, "step": 35919 }, { "epoch": 2.83, "learning_rate": 2.4734504769535033e-06, "loss": 1.4875, "step": 35920 }, { "epoch": 2.83, "learning_rate": 2.471215698907969e-06, "loss": 1.4198, "step": 35921 }, { "epoch": 2.83, "learning_rate": 2.468981922501473e-06, "loss": 1.4785, "step": 35922 }, { "epoch": 2.83, "learning_rate": 2.4667491477491864e-06, "loss": 1.4867, "step": 35923 }, { "epoch": 2.83, "learning_rate": 2.4645173746662473e-06, "loss": 1.4406, "step": 35924 }, { "epoch": 2.83, "learning_rate": 2.4622866032678266e-06, "loss": 1.4343, "step": 35925 }, { "epoch": 2.83, "learning_rate": 2.460056833569063e-06, "loss": 1.4186, "step": 35926 }, { "epoch": 2.83, "learning_rate": 2.4578280655850766e-06, "loss": 1.4089, "step": 35927 }, { "epoch": 2.83, "learning_rate": 2.455600299331023e-06, "loss": 1.4236, "step": 35928 }, { "epoch": 2.83, "learning_rate": 2.4533735348220396e-06, "loss": 1.4368, "step": 35929 }, { "epoch": 2.83, "learning_rate": 2.4511477720732143e-06, "loss": 1.4439, "step": 35930 }, { "epoch": 2.83, "learning_rate": 2.448923011099685e-06, "loss": 1.3632, "step": 35931 }, { "epoch": 2.83, "learning_rate": 2.4466992519165063e-06, "loss": 1.4245, "step": 35932 }, { "epoch": 2.83, "learning_rate": 2.4444764945388495e-06, "loss": 1.4731, "step": 35933 }, { "epoch": 2.83, "learning_rate": 2.4422547389817525e-06, "loss": 1.3963, "step": 35934 }, { "epoch": 2.83, "learning_rate": 2.44003398526032e-06, "loss": 1.3863, "step": 35935 }, { "epoch": 2.83, "learning_rate": 2.4378142333896233e-06, "loss": 1.4285, "step": 35936 }, { "epoch": 2.83, "learning_rate": 2.4355954833847336e-06, "loss": 1.4591, "step": 35937 }, { "epoch": 2.83, "learning_rate": 2.433377735260739e-06, "loss": 1.4571, "step": 35938 }, { "epoch": 2.83, "learning_rate": 2.4311609890326433e-06, "loss": 1.428, "step": 35939 }, { "epoch": 2.83, "learning_rate": 2.4289452447155522e-06, "loss": 1.4361, "step": 35940 }, { "epoch": 2.83, "learning_rate": 2.4267305023244864e-06, "loss": 1.4408, "step": 35941 }, { "epoch": 2.83, "learning_rate": 2.4245167618744675e-06, "loss": 1.4737, "step": 35942 }, { "epoch": 2.83, "learning_rate": 2.4223040233805668e-06, "loss": 1.4527, "step": 35943 }, { "epoch": 2.83, "learning_rate": 2.4200922868577556e-06, "loss": 1.45, "step": 35944 }, { "epoch": 2.83, "learning_rate": 2.4178815523210883e-06, "loss": 1.4791, "step": 35945 }, { "epoch": 2.83, "learning_rate": 2.4156718197855697e-06, "loss": 1.4374, "step": 35946 }, { "epoch": 2.83, "learning_rate": 2.413463089266188e-06, "loss": 1.4857, "step": 35947 }, { "epoch": 2.83, "learning_rate": 2.411255360777947e-06, "loss": 1.4409, "step": 35948 }, { "epoch": 2.83, "learning_rate": 2.4090486343358195e-06, "loss": 1.4046, "step": 35949 }, { "epoch": 2.83, "learning_rate": 2.406842909954826e-06, "loss": 1.4256, "step": 35950 }, { "epoch": 2.83, "learning_rate": 2.404638187649904e-06, "loss": 1.4786, "step": 35951 }, { "epoch": 2.83, "learning_rate": 2.402434467436043e-06, "loss": 1.4312, "step": 35952 }, { "epoch": 2.83, "learning_rate": 2.400231749328213e-06, "loss": 1.4021, "step": 35953 }, { "epoch": 2.83, "learning_rate": 2.3980300333413527e-06, "loss": 1.4695, "step": 35954 }, { "epoch": 2.83, "learning_rate": 2.3958293194904166e-06, "loss": 1.444, "step": 35955 }, { "epoch": 2.83, "learning_rate": 2.393629607790343e-06, "loss": 1.4152, "step": 35956 }, { "epoch": 2.83, "learning_rate": 2.3914308982560692e-06, "loss": 1.4394, "step": 35957 }, { "epoch": 2.83, "learning_rate": 2.3892331909025177e-06, "loss": 1.4043, "step": 35958 }, { "epoch": 2.83, "learning_rate": 2.3870364857446087e-06, "loss": 1.4304, "step": 35959 }, { "epoch": 2.83, "learning_rate": 2.3848407827972816e-06, "loss": 1.4368, "step": 35960 }, { "epoch": 2.83, "learning_rate": 2.3826460820754236e-06, "loss": 1.4228, "step": 35961 }, { "epoch": 2.83, "learning_rate": 2.380452383593906e-06, "loss": 1.4524, "step": 35962 }, { "epoch": 2.83, "learning_rate": 2.378259687367684e-06, "loss": 1.4204, "step": 35963 }, { "epoch": 2.83, "learning_rate": 2.376067993411612e-06, "loss": 1.4261, "step": 35964 }, { "epoch": 2.83, "learning_rate": 2.373877301740562e-06, "loss": 1.4464, "step": 35965 }, { "epoch": 2.83, "learning_rate": 2.3716876123694216e-06, "loss": 1.4364, "step": 35966 }, { "epoch": 2.83, "learning_rate": 2.3694989253130457e-06, "loss": 1.4396, "step": 35967 }, { "epoch": 2.83, "learning_rate": 2.3673112405863224e-06, "loss": 1.4785, "step": 35968 }, { "epoch": 2.83, "learning_rate": 2.365124558204057e-06, "loss": 1.4564, "step": 35969 }, { "epoch": 2.83, "learning_rate": 2.3629388781811533e-06, "loss": 1.4089, "step": 35970 }, { "epoch": 2.83, "learning_rate": 2.3607542005324163e-06, "loss": 1.4844, "step": 35971 }, { "epoch": 2.83, "learning_rate": 2.3585705252726682e-06, "loss": 1.4882, "step": 35972 }, { "epoch": 2.83, "learning_rate": 2.3563878524167635e-06, "loss": 1.4419, "step": 35973 }, { "epoch": 2.83, "learning_rate": 2.3542061819795065e-06, "loss": 1.43, "step": 35974 }, { "epoch": 2.83, "learning_rate": 2.3520255139757195e-06, "loss": 1.3838, "step": 35975 }, { "epoch": 2.83, "learning_rate": 2.349845848420173e-06, "loss": 1.4351, "step": 35976 }, { "epoch": 2.83, "learning_rate": 2.347667185327723e-06, "loss": 1.479, "step": 35977 }, { "epoch": 2.83, "learning_rate": 2.3454895247131233e-06, "loss": 1.4297, "step": 35978 }, { "epoch": 2.83, "learning_rate": 2.343312866591163e-06, "loss": 1.4158, "step": 35979 }, { "epoch": 2.83, "learning_rate": 2.341137210976629e-06, "loss": 1.4395, "step": 35980 }, { "epoch": 2.83, "learning_rate": 2.338962557884294e-06, "loss": 1.4364, "step": 35981 }, { "epoch": 2.83, "learning_rate": 2.336788907328896e-06, "loss": 1.4143, "step": 35982 }, { "epoch": 2.83, "learning_rate": 2.334616259325223e-06, "loss": 1.4416, "step": 35983 }, { "epoch": 2.83, "learning_rate": 2.332444613888029e-06, "loss": 1.4229, "step": 35984 }, { "epoch": 2.83, "learning_rate": 2.3302739710320374e-06, "loss": 1.4644, "step": 35985 }, { "epoch": 2.83, "learning_rate": 2.328104330771985e-06, "loss": 1.4392, "step": 35986 }, { "epoch": 2.83, "learning_rate": 2.325935693122627e-06, "loss": 1.4603, "step": 35987 }, { "epoch": 2.83, "learning_rate": 2.3237680580986684e-06, "loss": 1.404, "step": 35988 }, { "epoch": 2.83, "learning_rate": 2.3216014257148474e-06, "loss": 1.4135, "step": 35989 }, { "epoch": 2.83, "learning_rate": 2.319435795985819e-06, "loss": 1.4603, "step": 35990 }, { "epoch": 2.83, "learning_rate": 2.3172711689263545e-06, "loss": 1.4619, "step": 35991 }, { "epoch": 2.83, "learning_rate": 2.315107544551109e-06, "loss": 1.4443, "step": 35992 }, { "epoch": 2.83, "learning_rate": 2.3129449228747877e-06, "loss": 1.3894, "step": 35993 }, { "epoch": 2.83, "learning_rate": 2.3107833039120784e-06, "loss": 1.437, "step": 35994 }, { "epoch": 2.83, "learning_rate": 2.3086226876776357e-06, "loss": 1.4323, "step": 35995 }, { "epoch": 2.83, "learning_rate": 2.3064630741861325e-06, "loss": 1.4352, "step": 35996 }, { "epoch": 2.83, "learning_rate": 2.3043044634522558e-06, "loss": 1.4723, "step": 35997 }, { "epoch": 2.83, "learning_rate": 2.302146855490644e-06, "loss": 1.5074, "step": 35998 }, { "epoch": 2.83, "learning_rate": 2.299990250315953e-06, "loss": 1.4462, "step": 35999 }, { "epoch": 2.83, "learning_rate": 2.2978346479428034e-06, "loss": 1.4468, "step": 36000 }, { "epoch": 2.83, "learning_rate": 2.295680048385867e-06, "loss": 1.4438, "step": 36001 }, { "epoch": 2.83, "learning_rate": 2.2935264516597663e-06, "loss": 1.4519, "step": 36002 }, { "epoch": 2.83, "learning_rate": 2.291373857779072e-06, "loss": 1.438, "step": 36003 }, { "epoch": 2.83, "learning_rate": 2.289222266758456e-06, "loss": 1.3825, "step": 36004 }, { "epoch": 2.83, "learning_rate": 2.287071678612523e-06, "loss": 1.4723, "step": 36005 }, { "epoch": 2.83, "learning_rate": 2.2849220933558287e-06, "loss": 1.5298, "step": 36006 }, { "epoch": 2.83, "learning_rate": 2.282773511003011e-06, "loss": 1.3931, "step": 36007 }, { "epoch": 2.83, "learning_rate": 2.280625931568658e-06, "loss": 1.4528, "step": 36008 }, { "epoch": 2.83, "learning_rate": 2.278479355067325e-06, "loss": 1.3999, "step": 36009 }, { "epoch": 2.83, "learning_rate": 2.276333781513584e-06, "loss": 1.4344, "step": 36010 }, { "epoch": 2.83, "learning_rate": 2.2741892109220396e-06, "loss": 1.4821, "step": 36011 }, { "epoch": 2.83, "learning_rate": 2.272045643307213e-06, "loss": 1.4228, "step": 36012 }, { "epoch": 2.83, "learning_rate": 2.2699030786836767e-06, "loss": 1.4509, "step": 36013 }, { "epoch": 2.83, "learning_rate": 2.2677615170659692e-06, "loss": 1.4725, "step": 36014 }, { "epoch": 2.83, "learning_rate": 2.2656209584686447e-06, "loss": 1.4702, "step": 36015 }, { "epoch": 2.83, "learning_rate": 2.2634814029062254e-06, "loss": 1.4991, "step": 36016 }, { "epoch": 2.83, "learning_rate": 2.261342850393233e-06, "loss": 1.457, "step": 36017 }, { "epoch": 2.83, "learning_rate": 2.259205300944206e-06, "loss": 1.4626, "step": 36018 }, { "epoch": 2.83, "learning_rate": 2.2570687545736322e-06, "loss": 1.4564, "step": 36019 }, { "epoch": 2.83, "learning_rate": 2.254933211296034e-06, "loss": 1.459, "step": 36020 }, { "epoch": 2.83, "learning_rate": 2.252798671125916e-06, "loss": 1.4527, "step": 36021 }, { "epoch": 2.83, "learning_rate": 2.2506651340777503e-06, "loss": 1.4065, "step": 36022 }, { "epoch": 2.83, "learning_rate": 2.2485326001660255e-06, "loss": 1.4233, "step": 36023 }, { "epoch": 2.83, "learning_rate": 2.2464010694052457e-06, "loss": 1.4698, "step": 36024 }, { "epoch": 2.83, "learning_rate": 2.2442705418098673e-06, "loss": 1.4683, "step": 36025 }, { "epoch": 2.83, "learning_rate": 2.2421410173943444e-06, "loss": 1.4361, "step": 36026 }, { "epoch": 2.83, "learning_rate": 2.240012496173149e-06, "loss": 1.4528, "step": 36027 }, { "epoch": 2.83, "learning_rate": 2.23788497816072e-06, "loss": 1.4583, "step": 36028 }, { "epoch": 2.83, "learning_rate": 2.235758463371512e-06, "loss": 1.4288, "step": 36029 }, { "epoch": 2.83, "learning_rate": 2.2336329518199638e-06, "loss": 1.3762, "step": 36030 }, { "epoch": 2.83, "learning_rate": 2.2315084435204966e-06, "loss": 1.4363, "step": 36031 }, { "epoch": 2.84, "learning_rate": 2.229384938487566e-06, "loss": 1.4854, "step": 36032 }, { "epoch": 2.84, "learning_rate": 2.227262436735544e-06, "loss": 1.4992, "step": 36033 }, { "epoch": 2.84, "learning_rate": 2.225140938278869e-06, "loss": 1.424, "step": 36034 }, { "epoch": 2.84, "learning_rate": 2.2230204431319286e-06, "loss": 1.461, "step": 36035 }, { "epoch": 2.84, "learning_rate": 2.220900951309146e-06, "loss": 1.4455, "step": 36036 }, { "epoch": 2.84, "learning_rate": 2.218782462824875e-06, "loss": 1.4251, "step": 36037 }, { "epoch": 2.84, "learning_rate": 2.2166649776935385e-06, "loss": 1.4622, "step": 36038 }, { "epoch": 2.84, "learning_rate": 2.2145484959294746e-06, "loss": 1.5024, "step": 36039 }, { "epoch": 2.84, "learning_rate": 2.2124330175470884e-06, "loss": 1.4884, "step": 36040 }, { "epoch": 2.84, "learning_rate": 2.2103185425607184e-06, "loss": 1.4514, "step": 36041 }, { "epoch": 2.84, "learning_rate": 2.2082050709847197e-06, "loss": 1.4482, "step": 36042 }, { "epoch": 2.84, "learning_rate": 2.2060926028334647e-06, "loss": 1.5003, "step": 36043 }, { "epoch": 2.84, "learning_rate": 2.2039811381212748e-06, "loss": 1.4254, "step": 36044 }, { "epoch": 2.84, "learning_rate": 2.2018706768624883e-06, "loss": 1.421, "step": 36045 }, { "epoch": 2.84, "learning_rate": 2.1997612190714444e-06, "loss": 1.4428, "step": 36046 }, { "epoch": 2.84, "learning_rate": 2.1976527647624642e-06, "loss": 1.4491, "step": 36047 }, { "epoch": 2.84, "learning_rate": 2.195545313949837e-06, "loss": 1.428, "step": 36048 }, { "epoch": 2.84, "learning_rate": 2.1934388666479173e-06, "loss": 1.4235, "step": 36049 }, { "epoch": 2.84, "learning_rate": 2.1913334228709777e-06, "loss": 1.4054, "step": 36050 }, { "epoch": 2.84, "learning_rate": 2.1892289826332897e-06, "loss": 1.4957, "step": 36051 }, { "epoch": 2.84, "learning_rate": 2.187125545949192e-06, "loss": 1.4121, "step": 36052 }, { "epoch": 2.84, "learning_rate": 2.18502311283294e-06, "loss": 1.4319, "step": 36053 }, { "epoch": 2.84, "learning_rate": 2.182921683298805e-06, "loss": 1.4312, "step": 36054 }, { "epoch": 2.84, "learning_rate": 2.1808212573610595e-06, "loss": 1.4293, "step": 36055 }, { "epoch": 2.84, "learning_rate": 2.1787218350339754e-06, "loss": 1.3971, "step": 36056 }, { "epoch": 2.84, "learning_rate": 2.176623416331774e-06, "loss": 1.482, "step": 36057 }, { "epoch": 2.84, "learning_rate": 2.174526001268745e-06, "loss": 1.5202, "step": 36058 }, { "epoch": 2.84, "learning_rate": 2.1724295898591093e-06, "loss": 1.4907, "step": 36059 }, { "epoch": 2.84, "learning_rate": 2.1703341821170726e-06, "loss": 1.4252, "step": 36060 }, { "epoch": 2.84, "learning_rate": 2.168239778056907e-06, "loss": 1.448, "step": 36061 }, { "epoch": 2.84, "learning_rate": 2.1661463776928013e-06, "loss": 1.4549, "step": 36062 }, { "epoch": 2.84, "learning_rate": 2.1640539810389936e-06, "loss": 1.4036, "step": 36063 }, { "epoch": 2.84, "learning_rate": 2.1619625881096726e-06, "loss": 1.4447, "step": 36064 }, { "epoch": 2.84, "learning_rate": 2.159872198919044e-06, "loss": 1.4295, "step": 36065 }, { "epoch": 2.84, "learning_rate": 2.1577828134812957e-06, "loss": 1.4406, "step": 36066 }, { "epoch": 2.84, "learning_rate": 2.1556944318106175e-06, "loss": 1.4121, "step": 36067 }, { "epoch": 2.84, "learning_rate": 2.15360705392118e-06, "loss": 1.4007, "step": 36068 }, { "epoch": 2.84, "learning_rate": 2.1515206798271732e-06, "loss": 1.4793, "step": 36069 }, { "epoch": 2.84, "learning_rate": 2.149435309542752e-06, "loss": 1.4679, "step": 36070 }, { "epoch": 2.84, "learning_rate": 2.1473509430820546e-06, "loss": 1.4241, "step": 36071 }, { "epoch": 2.84, "learning_rate": 2.14526758045927e-06, "loss": 1.4263, "step": 36072 }, { "epoch": 2.84, "learning_rate": 2.143185221688537e-06, "loss": 1.4763, "step": 36073 }, { "epoch": 2.84, "learning_rate": 2.141103866783944e-06, "loss": 1.4787, "step": 36074 }, { "epoch": 2.84, "learning_rate": 2.1390235157596967e-06, "loss": 1.4598, "step": 36075 }, { "epoch": 2.84, "learning_rate": 2.136944168629867e-06, "loss": 1.4347, "step": 36076 }, { "epoch": 2.84, "learning_rate": 2.1348658254085936e-06, "loss": 1.4159, "step": 36077 }, { "epoch": 2.84, "learning_rate": 2.1327884861099653e-06, "loss": 1.4343, "step": 36078 }, { "epoch": 2.84, "learning_rate": 2.1307121507481207e-06, "loss": 1.4114, "step": 36079 }, { "epoch": 2.84, "learning_rate": 2.1286368193371484e-06, "loss": 1.4162, "step": 36080 }, { "epoch": 2.84, "learning_rate": 2.1265624918911037e-06, "loss": 1.415, "step": 36081 }, { "epoch": 2.84, "learning_rate": 2.124489168424126e-06, "loss": 1.4567, "step": 36082 }, { "epoch": 2.84, "learning_rate": 2.122416848950237e-06, "loss": 1.4852, "step": 36083 }, { "epoch": 2.84, "learning_rate": 2.1203455334835586e-06, "loss": 1.4287, "step": 36084 }, { "epoch": 2.84, "learning_rate": 2.118275222038096e-06, "loss": 1.4391, "step": 36085 }, { "epoch": 2.84, "learning_rate": 2.1162059146279553e-06, "loss": 1.4492, "step": 36086 }, { "epoch": 2.84, "learning_rate": 2.114137611267175e-06, "loss": 1.3952, "step": 36087 }, { "epoch": 2.84, "learning_rate": 2.112070311969777e-06, "loss": 1.4616, "step": 36088 }, { "epoch": 2.84, "learning_rate": 2.1100040167498167e-06, "loss": 1.4454, "step": 36089 }, { "epoch": 2.84, "learning_rate": 2.1079387256213164e-06, "loss": 1.4619, "step": 36090 }, { "epoch": 2.84, "learning_rate": 2.1058744385982817e-06, "loss": 1.459, "step": 36091 }, { "epoch": 2.84, "learning_rate": 2.1038111556947512e-06, "loss": 1.4874, "step": 36092 }, { "epoch": 2.84, "learning_rate": 2.1017488769247304e-06, "loss": 1.4513, "step": 36093 }, { "epoch": 2.84, "learning_rate": 2.099687602302225e-06, "loss": 1.4259, "step": 36094 }, { "epoch": 2.84, "learning_rate": 2.097627331841223e-06, "loss": 1.4343, "step": 36095 }, { "epoch": 2.84, "learning_rate": 2.0955680655556972e-06, "loss": 1.4278, "step": 36096 }, { "epoch": 2.84, "learning_rate": 2.09350980345967e-06, "loss": 1.4489, "step": 36097 }, { "epoch": 2.84, "learning_rate": 2.0914525455670626e-06, "loss": 1.5032, "step": 36098 }, { "epoch": 2.84, "learning_rate": 2.0893962918918817e-06, "loss": 1.4358, "step": 36099 }, { "epoch": 2.84, "learning_rate": 2.087341042448082e-06, "loss": 1.3875, "step": 36100 }, { "epoch": 2.84, "learning_rate": 2.085286797249619e-06, "loss": 1.4965, "step": 36101 }, { "epoch": 2.84, "learning_rate": 2.0832335563103986e-06, "loss": 1.4633, "step": 36102 }, { "epoch": 2.84, "learning_rate": 2.081181319644426e-06, "loss": 1.4734, "step": 36103 }, { "epoch": 2.84, "learning_rate": 2.0791300872655903e-06, "loss": 1.422, "step": 36104 }, { "epoch": 2.84, "learning_rate": 2.0770798591878303e-06, "loss": 1.4316, "step": 36105 }, { "epoch": 2.84, "learning_rate": 2.0750306354250846e-06, "loss": 1.4552, "step": 36106 }, { "epoch": 2.84, "learning_rate": 2.072982415991242e-06, "loss": 1.4015, "step": 36107 }, { "epoch": 2.84, "learning_rate": 2.0709352009001925e-06, "loss": 1.3916, "step": 36108 }, { "epoch": 2.84, "learning_rate": 2.0688889901658735e-06, "loss": 1.4962, "step": 36109 }, { "epoch": 2.84, "learning_rate": 2.0668437838021745e-06, "loss": 1.4066, "step": 36110 }, { "epoch": 2.84, "learning_rate": 2.064799581822968e-06, "loss": 1.4065, "step": 36111 }, { "epoch": 2.84, "learning_rate": 2.0627563842421093e-06, "loss": 1.4507, "step": 36112 }, { "epoch": 2.84, "learning_rate": 2.0607141910735203e-06, "loss": 1.4771, "step": 36113 }, { "epoch": 2.84, "learning_rate": 2.0586730023310404e-06, "loss": 1.4195, "step": 36114 }, { "epoch": 2.84, "learning_rate": 2.0566328180285253e-06, "loss": 1.4306, "step": 36115 }, { "epoch": 2.84, "learning_rate": 2.0545936381798465e-06, "loss": 1.4711, "step": 36116 }, { "epoch": 2.84, "learning_rate": 2.052555462798827e-06, "loss": 1.441, "step": 36117 }, { "epoch": 2.84, "learning_rate": 2.050518291899289e-06, "loss": 1.4199, "step": 36118 }, { "epoch": 2.84, "learning_rate": 2.0484821254951045e-06, "loss": 1.4745, "step": 36119 }, { "epoch": 2.84, "learning_rate": 2.046446963600096e-06, "loss": 1.4642, "step": 36120 }, { "epoch": 2.84, "learning_rate": 2.0444128062280517e-06, "loss": 1.442, "step": 36121 }, { "epoch": 2.84, "learning_rate": 2.0423796533927784e-06, "loss": 1.4696, "step": 36122 }, { "epoch": 2.84, "learning_rate": 2.040347505108114e-06, "loss": 1.4393, "step": 36123 }, { "epoch": 2.84, "learning_rate": 2.038316361387832e-06, "loss": 1.4199, "step": 36124 }, { "epoch": 2.84, "learning_rate": 2.0362862222457366e-06, "loss": 1.436, "step": 36125 }, { "epoch": 2.84, "learning_rate": 2.034257087695601e-06, "loss": 1.4161, "step": 36126 }, { "epoch": 2.84, "learning_rate": 2.0322289577511976e-06, "loss": 1.4652, "step": 36127 }, { "epoch": 2.84, "learning_rate": 2.0302018324263146e-06, "loss": 1.4142, "step": 36128 }, { "epoch": 2.84, "learning_rate": 2.0281757117347088e-06, "loss": 1.4512, "step": 36129 }, { "epoch": 2.84, "learning_rate": 2.0261505956901347e-06, "loss": 1.4426, "step": 36130 }, { "epoch": 2.84, "learning_rate": 2.024126484306332e-06, "loss": 1.4396, "step": 36131 }, { "epoch": 2.84, "learning_rate": 2.0221033775970396e-06, "loss": 1.4523, "step": 36132 }, { "epoch": 2.84, "learning_rate": 2.020081275576013e-06, "loss": 1.4389, "step": 36133 }, { "epoch": 2.84, "learning_rate": 2.018060178256975e-06, "loss": 1.4533, "step": 36134 }, { "epoch": 2.84, "learning_rate": 2.0160400856536476e-06, "loss": 1.4051, "step": 36135 }, { "epoch": 2.84, "learning_rate": 2.014020997779736e-06, "loss": 1.4227, "step": 36136 }, { "epoch": 2.84, "learning_rate": 2.0120029146489638e-06, "loss": 1.4308, "step": 36137 }, { "epoch": 2.84, "learning_rate": 2.0099858362750355e-06, "loss": 1.4208, "step": 36138 }, { "epoch": 2.84, "learning_rate": 2.0079697626716072e-06, "loss": 1.4397, "step": 36139 }, { "epoch": 2.84, "learning_rate": 2.0059546938524186e-06, "loss": 1.4958, "step": 36140 }, { "epoch": 2.84, "learning_rate": 2.0039406298311243e-06, "loss": 1.4053, "step": 36141 }, { "epoch": 2.84, "learning_rate": 2.001927570621398e-06, "loss": 1.4782, "step": 36142 }, { "epoch": 2.84, "learning_rate": 1.999915516236894e-06, "loss": 1.4585, "step": 36143 }, { "epoch": 2.84, "learning_rate": 1.997904466691319e-06, "loss": 1.4054, "step": 36144 }, { "epoch": 2.84, "learning_rate": 1.9958944219982955e-06, "loss": 1.434, "step": 36145 }, { "epoch": 2.84, "learning_rate": 1.993885382171445e-06, "loss": 1.4571, "step": 36146 }, { "epoch": 2.84, "learning_rate": 1.9918773472244743e-06, "loss": 1.4481, "step": 36147 }, { "epoch": 2.84, "learning_rate": 1.989870317170955e-06, "loss": 1.438, "step": 36148 }, { "epoch": 2.84, "learning_rate": 1.9878642920245438e-06, "loss": 1.469, "step": 36149 }, { "epoch": 2.84, "learning_rate": 1.985859271798862e-06, "loss": 1.4887, "step": 36150 }, { "epoch": 2.84, "learning_rate": 1.9838552565074994e-06, "loss": 1.4183, "step": 36151 }, { "epoch": 2.84, "learning_rate": 1.9818522461640786e-06, "loss": 1.4191, "step": 36152 }, { "epoch": 2.84, "learning_rate": 1.9798502407822047e-06, "loss": 1.4386, "step": 36153 }, { "epoch": 2.84, "learning_rate": 1.9778492403754675e-06, "loss": 1.423, "step": 36154 }, { "epoch": 2.84, "learning_rate": 1.975849244957439e-06, "loss": 1.4449, "step": 36155 }, { "epoch": 2.84, "learning_rate": 1.973850254541709e-06, "loss": 1.4356, "step": 36156 }, { "epoch": 2.84, "learning_rate": 1.9718522691418493e-06, "loss": 1.4791, "step": 36157 }, { "epoch": 2.84, "learning_rate": 1.9698552887714327e-06, "loss": 1.4509, "step": 36158 }, { "epoch": 2.85, "learning_rate": 1.967859313443998e-06, "loss": 1.481, "step": 36159 }, { "epoch": 2.85, "learning_rate": 1.965864343173118e-06, "loss": 1.4153, "step": 36160 }, { "epoch": 2.85, "learning_rate": 1.963870377972332e-06, "loss": 1.3959, "step": 36161 }, { "epoch": 2.85, "learning_rate": 1.9618774178551623e-06, "loss": 1.4241, "step": 36162 }, { "epoch": 2.85, "learning_rate": 1.959885462835148e-06, "loss": 1.4258, "step": 36163 }, { "epoch": 2.85, "learning_rate": 1.9578945129258116e-06, "loss": 1.4487, "step": 36164 }, { "epoch": 2.85, "learning_rate": 1.9559045681406924e-06, "loss": 1.5016, "step": 36165 }, { "epoch": 2.85, "learning_rate": 1.9539156284932633e-06, "loss": 1.431, "step": 36166 }, { "epoch": 2.85, "learning_rate": 1.951927693997063e-06, "loss": 1.4341, "step": 36167 }, { "epoch": 2.85, "learning_rate": 1.9499407646655805e-06, "loss": 1.4003, "step": 36168 }, { "epoch": 2.85, "learning_rate": 1.9479548405122723e-06, "loss": 1.4129, "step": 36169 }, { "epoch": 2.85, "learning_rate": 1.9459699215506774e-06, "loss": 1.4256, "step": 36170 }, { "epoch": 2.85, "learning_rate": 1.943986007794218e-06, "loss": 1.4828, "step": 36171 }, { "epoch": 2.85, "learning_rate": 1.942003099256401e-06, "loss": 1.4404, "step": 36172 }, { "epoch": 2.85, "learning_rate": 1.9400211959506805e-06, "loss": 1.5148, "step": 36173 }, { "epoch": 2.85, "learning_rate": 1.938040297890514e-06, "loss": 1.4478, "step": 36174 }, { "epoch": 2.85, "learning_rate": 1.93606040508934e-06, "loss": 1.4284, "step": 36175 }, { "epoch": 2.85, "learning_rate": 1.934081517560615e-06, "loss": 1.4619, "step": 36176 }, { "epoch": 2.85, "learning_rate": 1.932103635317761e-06, "loss": 1.4533, "step": 36177 }, { "epoch": 2.85, "learning_rate": 1.9301267583742173e-06, "loss": 1.4283, "step": 36178 }, { "epoch": 2.85, "learning_rate": 1.9281508867433904e-06, "loss": 1.4567, "step": 36179 }, { "epoch": 2.85, "learning_rate": 1.9261760204387187e-06, "loss": 1.4847, "step": 36180 }, { "epoch": 2.85, "learning_rate": 1.9242021594735922e-06, "loss": 1.4592, "step": 36181 }, { "epoch": 2.85, "learning_rate": 1.9222293038614165e-06, "loss": 1.4522, "step": 36182 }, { "epoch": 2.85, "learning_rate": 1.9202574536155814e-06, "loss": 1.4631, "step": 36183 }, { "epoch": 2.85, "learning_rate": 1.918286608749492e-06, "loss": 1.4201, "step": 36184 }, { "epoch": 2.85, "learning_rate": 1.9163167692765215e-06, "loss": 1.3976, "step": 36185 }, { "epoch": 2.85, "learning_rate": 1.9143479352100256e-06, "loss": 1.4559, "step": 36186 }, { "epoch": 2.85, "learning_rate": 1.9123801065633935e-06, "loss": 1.4512, "step": 36187 }, { "epoch": 2.85, "learning_rate": 1.9104132833499817e-06, "loss": 1.4829, "step": 36188 }, { "epoch": 2.85, "learning_rate": 1.908447465583146e-06, "loss": 1.4351, "step": 36189 }, { "epoch": 2.85, "learning_rate": 1.906482653276209e-06, "loss": 1.4476, "step": 36190 }, { "epoch": 2.85, "learning_rate": 1.9045188464425598e-06, "loss": 1.4752, "step": 36191 }, { "epoch": 2.85, "learning_rate": 1.902556045095488e-06, "loss": 1.4222, "step": 36192 }, { "epoch": 2.85, "learning_rate": 1.9005942492483162e-06, "loss": 1.4864, "step": 36193 }, { "epoch": 2.85, "learning_rate": 1.8986334589144004e-06, "loss": 1.4642, "step": 36194 }, { "epoch": 2.85, "learning_rate": 1.8966736741070298e-06, "loss": 1.4577, "step": 36195 }, { "epoch": 2.85, "learning_rate": 1.8947148948395275e-06, "loss": 1.5067, "step": 36196 }, { "epoch": 2.85, "learning_rate": 1.8927571211251657e-06, "loss": 1.4875, "step": 36197 }, { "epoch": 2.85, "learning_rate": 1.8908003529772509e-06, "loss": 1.4402, "step": 36198 }, { "epoch": 2.85, "learning_rate": 1.888844590409072e-06, "loss": 1.4748, "step": 36199 }, { "epoch": 2.85, "learning_rate": 1.8868898334339021e-06, "loss": 1.4312, "step": 36200 }, { "epoch": 2.85, "learning_rate": 1.884936082065014e-06, "loss": 1.4433, "step": 36201 }, { "epoch": 2.85, "learning_rate": 1.8829833363156633e-06, "loss": 1.4393, "step": 36202 }, { "epoch": 2.85, "learning_rate": 1.8810315961991395e-06, "loss": 1.4231, "step": 36203 }, { "epoch": 2.85, "learning_rate": 1.879080861728649e-06, "loss": 1.4374, "step": 36204 }, { "epoch": 2.85, "learning_rate": 1.877131132917481e-06, "loss": 1.4501, "step": 36205 }, { "epoch": 2.85, "learning_rate": 1.8751824097788414e-06, "loss": 1.4568, "step": 36206 }, { "epoch": 2.85, "learning_rate": 1.87323469232597e-06, "loss": 1.4235, "step": 36207 }, { "epoch": 2.85, "learning_rate": 1.8712879805720892e-06, "loss": 1.4482, "step": 36208 }, { "epoch": 2.85, "learning_rate": 1.8693422745304388e-06, "loss": 1.4424, "step": 36209 }, { "epoch": 2.85, "learning_rate": 1.8673975742141911e-06, "loss": 1.4277, "step": 36210 }, { "epoch": 2.85, "learning_rate": 1.8654538796365692e-06, "loss": 1.4493, "step": 36211 }, { "epoch": 2.85, "learning_rate": 1.863511190810779e-06, "loss": 1.4324, "step": 36212 }, { "epoch": 2.85, "learning_rate": 1.8615695077499936e-06, "loss": 1.4882, "step": 36213 }, { "epoch": 2.85, "learning_rate": 1.8596288304673857e-06, "loss": 1.4453, "step": 36214 }, { "epoch": 2.85, "learning_rate": 1.857689158976161e-06, "loss": 1.4439, "step": 36215 }, { "epoch": 2.85, "learning_rate": 1.8557504932894762e-06, "loss": 1.453, "step": 36216 }, { "epoch": 2.85, "learning_rate": 1.853812833420487e-06, "loss": 1.4722, "step": 36217 }, { "epoch": 2.85, "learning_rate": 1.85187617938235e-06, "loss": 1.4649, "step": 36218 }, { "epoch": 2.85, "learning_rate": 1.8499405311882376e-06, "loss": 1.4762, "step": 36219 }, { "epoch": 2.85, "learning_rate": 1.8480058888512561e-06, "loss": 1.4191, "step": 36220 }, { "epoch": 2.85, "learning_rate": 1.8460722523845618e-06, "loss": 1.4485, "step": 36221 }, { "epoch": 2.85, "learning_rate": 1.844139621801294e-06, "loss": 1.4483, "step": 36222 }, { "epoch": 2.85, "learning_rate": 1.842207997114542e-06, "loss": 1.4777, "step": 36223 }, { "epoch": 2.85, "learning_rate": 1.8402773783374292e-06, "loss": 1.431, "step": 36224 }, { "epoch": 2.85, "learning_rate": 1.8383477654830946e-06, "loss": 1.428, "step": 36225 }, { "epoch": 2.85, "learning_rate": 1.8364191585646116e-06, "loss": 1.4206, "step": 36226 }, { "epoch": 2.85, "learning_rate": 1.8344915575950692e-06, "loss": 1.4828, "step": 36227 }, { "epoch": 2.85, "learning_rate": 1.8325649625875738e-06, "loss": 1.4249, "step": 36228 }, { "epoch": 2.85, "learning_rate": 1.8306393735551817e-06, "loss": 1.4746, "step": 36229 }, { "epoch": 2.85, "learning_rate": 1.828714790510999e-06, "loss": 1.4162, "step": 36230 }, { "epoch": 2.85, "learning_rate": 1.8267912134680651e-06, "loss": 1.4459, "step": 36231 }, { "epoch": 2.85, "learning_rate": 1.8248686424394532e-06, "loss": 1.3936, "step": 36232 }, { "epoch": 2.85, "learning_rate": 1.8229470774382194e-06, "loss": 1.423, "step": 36233 }, { "epoch": 2.85, "learning_rate": 1.8210265184773864e-06, "loss": 1.4493, "step": 36234 }, { "epoch": 2.85, "learning_rate": 1.8191069655700274e-06, "loss": 1.4564, "step": 36235 }, { "epoch": 2.85, "learning_rate": 1.8171884187291485e-06, "loss": 1.4448, "step": 36236 }, { "epoch": 2.85, "learning_rate": 1.815270877967806e-06, "loss": 1.4887, "step": 36237 }, { "epoch": 2.85, "learning_rate": 1.8133543432989727e-06, "loss": 1.4617, "step": 36238 }, { "epoch": 2.85, "learning_rate": 1.811438814735705e-06, "loss": 1.4424, "step": 36239 }, { "epoch": 2.85, "learning_rate": 1.8095242922909925e-06, "loss": 1.3788, "step": 36240 }, { "epoch": 2.85, "learning_rate": 1.807610775977808e-06, "loss": 1.4387, "step": 36241 }, { "epoch": 2.85, "learning_rate": 1.8056982658091912e-06, "loss": 1.4305, "step": 36242 }, { "epoch": 2.85, "learning_rate": 1.8037867617980983e-06, "loss": 1.3969, "step": 36243 }, { "epoch": 2.85, "learning_rate": 1.8018762639575024e-06, "loss": 1.4413, "step": 36244 }, { "epoch": 2.85, "learning_rate": 1.799966772300393e-06, "loss": 1.4131, "step": 36245 }, { "epoch": 2.85, "learning_rate": 1.7980582868397265e-06, "loss": 1.4884, "step": 36246 }, { "epoch": 2.85, "learning_rate": 1.796150807588459e-06, "loss": 1.4372, "step": 36247 }, { "epoch": 2.85, "learning_rate": 1.794244334559547e-06, "loss": 1.4093, "step": 36248 }, { "epoch": 2.85, "learning_rate": 1.7923388677659135e-06, "loss": 1.4238, "step": 36249 }, { "epoch": 2.85, "learning_rate": 1.7904344072205145e-06, "loss": 1.441, "step": 36250 }, { "epoch": 2.85, "learning_rate": 1.7885309529362735e-06, "loss": 1.4193, "step": 36251 }, { "epoch": 2.85, "learning_rate": 1.7866285049261298e-06, "loss": 1.4382, "step": 36252 }, { "epoch": 2.85, "learning_rate": 1.7847270632029898e-06, "loss": 1.4151, "step": 36253 }, { "epoch": 2.85, "learning_rate": 1.7828266277797597e-06, "loss": 1.4499, "step": 36254 }, { "epoch": 2.85, "learning_rate": 1.7809271986693296e-06, "loss": 1.4616, "step": 36255 }, { "epoch": 2.85, "learning_rate": 1.7790287758846223e-06, "loss": 1.4244, "step": 36256 }, { "epoch": 2.85, "learning_rate": 1.7771313594385272e-06, "loss": 1.4414, "step": 36257 }, { "epoch": 2.85, "learning_rate": 1.7752349493438844e-06, "loss": 1.4493, "step": 36258 }, { "epoch": 2.85, "learning_rate": 1.7733395456136167e-06, "loss": 1.4658, "step": 36259 }, { "epoch": 2.85, "learning_rate": 1.7714451482605808e-06, "loss": 1.4165, "step": 36260 }, { "epoch": 2.85, "learning_rate": 1.7695517572976158e-06, "loss": 1.4293, "step": 36261 }, { "epoch": 2.85, "learning_rate": 1.767659372737612e-06, "loss": 1.4755, "step": 36262 }, { "epoch": 2.85, "learning_rate": 1.7657679945933922e-06, "loss": 1.404, "step": 36263 }, { "epoch": 2.85, "learning_rate": 1.7638776228777962e-06, "loss": 1.4193, "step": 36264 }, { "epoch": 2.85, "learning_rate": 1.7619882576036638e-06, "loss": 1.4477, "step": 36265 }, { "epoch": 2.85, "learning_rate": 1.7600998987838345e-06, "loss": 1.472, "step": 36266 }, { "epoch": 2.85, "learning_rate": 1.7582125464311314e-06, "loss": 1.4645, "step": 36267 }, { "epoch": 2.85, "learning_rate": 1.7563262005583444e-06, "loss": 1.4309, "step": 36268 }, { "epoch": 2.85, "learning_rate": 1.7544408611783133e-06, "loss": 1.4263, "step": 36269 }, { "epoch": 2.85, "learning_rate": 1.7525565283038113e-06, "loss": 1.448, "step": 36270 }, { "epoch": 2.85, "learning_rate": 1.7506732019476278e-06, "loss": 1.45, "step": 36271 }, { "epoch": 2.85, "learning_rate": 1.7487908821225693e-06, "loss": 1.439, "step": 36272 }, { "epoch": 2.85, "learning_rate": 1.746909568841426e-06, "loss": 1.4209, "step": 36273 }, { "epoch": 2.85, "learning_rate": 1.745029262116937e-06, "loss": 1.4746, "step": 36274 }, { "epoch": 2.85, "learning_rate": 1.7431499619618927e-06, "loss": 1.4234, "step": 36275 }, { "epoch": 2.85, "learning_rate": 1.7412716683890326e-06, "loss": 1.4847, "step": 36276 }, { "epoch": 2.85, "learning_rate": 1.7393943814111467e-06, "loss": 1.4237, "step": 36277 }, { "epoch": 2.85, "learning_rate": 1.7375181010409244e-06, "loss": 1.4755, "step": 36278 }, { "epoch": 2.85, "learning_rate": 1.735642827291156e-06, "loss": 1.4816, "step": 36279 }, { "epoch": 2.85, "learning_rate": 1.7337685601745478e-06, "loss": 1.5291, "step": 36280 }, { "epoch": 2.85, "learning_rate": 1.7318952997038394e-06, "loss": 1.4367, "step": 36281 }, { "epoch": 2.85, "learning_rate": 1.7300230458917207e-06, "loss": 1.4734, "step": 36282 }, { "epoch": 2.85, "learning_rate": 1.7281517987509486e-06, "loss": 1.4532, "step": 36283 }, { "epoch": 2.85, "learning_rate": 1.7262815582941791e-06, "loss": 1.3819, "step": 36284 }, { "epoch": 2.85, "learning_rate": 1.7244123245341523e-06, "loss": 1.4545, "step": 36285 }, { "epoch": 2.86, "learning_rate": 1.7225440974835247e-06, "loss": 1.4163, "step": 36286 }, { "epoch": 2.86, "learning_rate": 1.7206768771550195e-06, "loss": 1.409, "step": 36287 }, { "epoch": 2.86, "learning_rate": 1.7188106635612597e-06, "loss": 1.4301, "step": 36288 }, { "epoch": 2.86, "learning_rate": 1.7169454567149688e-06, "loss": 1.4147, "step": 36289 }, { "epoch": 2.86, "learning_rate": 1.7150812566287863e-06, "loss": 1.4397, "step": 36290 }, { "epoch": 2.86, "learning_rate": 1.7132180633153859e-06, "loss": 1.4084, "step": 36291 }, { "epoch": 2.86, "learning_rate": 1.7113558767873735e-06, "loss": 1.4295, "step": 36292 }, { "epoch": 2.86, "learning_rate": 1.7094946970574397e-06, "loss": 1.4847, "step": 36293 }, { "epoch": 2.86, "learning_rate": 1.7076345241382072e-06, "loss": 1.4469, "step": 36294 }, { "epoch": 2.86, "learning_rate": 1.7057753580422828e-06, "loss": 1.4233, "step": 36295 }, { "epoch": 2.86, "learning_rate": 1.703917198782323e-06, "loss": 1.4349, "step": 36296 }, { "epoch": 2.86, "learning_rate": 1.7020600463709177e-06, "loss": 1.424, "step": 36297 }, { "epoch": 2.86, "learning_rate": 1.700203900820707e-06, "loss": 1.5193, "step": 36298 }, { "epoch": 2.86, "learning_rate": 1.6983487621442471e-06, "loss": 1.4529, "step": 36299 }, { "epoch": 2.86, "learning_rate": 1.6964946303541781e-06, "loss": 1.4614, "step": 36300 }, { "epoch": 2.86, "learning_rate": 1.6946415054630735e-06, "loss": 1.4557, "step": 36301 }, { "epoch": 2.86, "learning_rate": 1.6927893874835064e-06, "loss": 1.5279, "step": 36302 }, { "epoch": 2.86, "learning_rate": 1.69093827642805e-06, "loss": 1.4201, "step": 36303 }, { "epoch": 2.86, "learning_rate": 1.6890881723092942e-06, "loss": 1.4633, "step": 36304 }, { "epoch": 2.86, "learning_rate": 1.6872390751397624e-06, "loss": 1.4341, "step": 36305 }, { "epoch": 2.86, "learning_rate": 1.6853909849320447e-06, "loss": 1.5004, "step": 36306 }, { "epoch": 2.86, "learning_rate": 1.6835439016986806e-06, "loss": 1.3987, "step": 36307 }, { "epoch": 2.86, "learning_rate": 1.681697825452194e-06, "loss": 1.435, "step": 36308 }, { "epoch": 2.86, "learning_rate": 1.6798527562051244e-06, "loss": 1.4309, "step": 36309 }, { "epoch": 2.86, "learning_rate": 1.6780086939700289e-06, "loss": 1.4849, "step": 36310 }, { "epoch": 2.86, "learning_rate": 1.6761656387593968e-06, "loss": 1.4571, "step": 36311 }, { "epoch": 2.86, "learning_rate": 1.6743235905857356e-06, "loss": 1.5078, "step": 36312 }, { "epoch": 2.86, "learning_rate": 1.6724825494615512e-06, "loss": 1.4416, "step": 36313 }, { "epoch": 2.86, "learning_rate": 1.6706425153993842e-06, "loss": 1.4097, "step": 36314 }, { "epoch": 2.86, "learning_rate": 1.6688034884116908e-06, "loss": 1.4359, "step": 36315 }, { "epoch": 2.86, "learning_rate": 1.6669654685109612e-06, "loss": 1.4894, "step": 36316 }, { "epoch": 2.86, "learning_rate": 1.6651284557096856e-06, "loss": 1.4722, "step": 36317 }, { "epoch": 2.86, "learning_rate": 1.663292450020337e-06, "loss": 1.3667, "step": 36318 }, { "epoch": 2.86, "learning_rate": 1.6614574514553558e-06, "loss": 1.4589, "step": 36319 }, { "epoch": 2.86, "learning_rate": 1.6596234600272318e-06, "loss": 1.4863, "step": 36320 }, { "epoch": 2.86, "learning_rate": 1.6577904757484052e-06, "loss": 1.4397, "step": 36321 }, { "epoch": 2.86, "learning_rate": 1.655958498631299e-06, "loss": 1.3791, "step": 36322 }, { "epoch": 2.86, "learning_rate": 1.6541275286883872e-06, "loss": 1.4358, "step": 36323 }, { "epoch": 2.86, "learning_rate": 1.6522975659320924e-06, "loss": 1.45, "step": 36324 }, { "epoch": 2.86, "learning_rate": 1.6504686103748222e-06, "loss": 1.4369, "step": 36325 }, { "epoch": 2.86, "learning_rate": 1.6486406620289993e-06, "loss": 1.4315, "step": 36326 }, { "epoch": 2.86, "learning_rate": 1.6468137209070476e-06, "loss": 1.4162, "step": 36327 }, { "epoch": 2.86, "learning_rate": 1.6449877870213569e-06, "loss": 1.4438, "step": 36328 }, { "epoch": 2.86, "learning_rate": 1.643162860384334e-06, "loss": 1.4743, "step": 36329 }, { "epoch": 2.86, "learning_rate": 1.6413389410083689e-06, "loss": 1.4419, "step": 36330 }, { "epoch": 2.86, "learning_rate": 1.639516028905835e-06, "loss": 1.4428, "step": 36331 }, { "epoch": 2.86, "learning_rate": 1.6376941240891228e-06, "loss": 1.4706, "step": 36332 }, { "epoch": 2.86, "learning_rate": 1.6358732265705721e-06, "loss": 1.4187, "step": 36333 }, { "epoch": 2.86, "learning_rate": 1.6340533363625897e-06, "loss": 1.3821, "step": 36334 }, { "epoch": 2.86, "learning_rate": 1.6322344534775156e-06, "loss": 1.3741, "step": 36335 }, { "epoch": 2.86, "learning_rate": 1.6304165779276734e-06, "loss": 1.4301, "step": 36336 }, { "epoch": 2.86, "learning_rate": 1.6285997097254366e-06, "loss": 1.4467, "step": 36337 }, { "epoch": 2.86, "learning_rate": 1.6267838488831287e-06, "loss": 1.4267, "step": 36338 }, { "epoch": 2.86, "learning_rate": 1.624968995413073e-06, "loss": 1.4933, "step": 36339 }, { "epoch": 2.86, "learning_rate": 1.6231551493276095e-06, "loss": 1.4811, "step": 36340 }, { "epoch": 2.86, "learning_rate": 1.6213423106390455e-06, "loss": 1.4187, "step": 36341 }, { "epoch": 2.86, "learning_rate": 1.6195304793596708e-06, "loss": 1.4301, "step": 36342 }, { "epoch": 2.86, "learning_rate": 1.617719655501809e-06, "loss": 1.428, "step": 36343 }, { "epoch": 2.86, "learning_rate": 1.6159098390777336e-06, "loss": 1.4303, "step": 36344 }, { "epoch": 2.86, "learning_rate": 1.6141010300997515e-06, "loss": 1.4593, "step": 36345 }, { "epoch": 2.86, "learning_rate": 1.612293228580136e-06, "loss": 1.4583, "step": 36346 }, { "epoch": 2.86, "learning_rate": 1.6104864345311773e-06, "loss": 1.4452, "step": 36347 }, { "epoch": 2.86, "learning_rate": 1.608680647965116e-06, "loss": 1.4969, "step": 36348 }, { "epoch": 2.86, "learning_rate": 1.6068758688942251e-06, "loss": 1.4095, "step": 36349 }, { "epoch": 2.86, "learning_rate": 1.6050720973307617e-06, "loss": 1.4479, "step": 36350 }, { "epoch": 2.86, "learning_rate": 1.603269333286966e-06, "loss": 1.4696, "step": 36351 }, { "epoch": 2.86, "learning_rate": 1.6014675767750785e-06, "loss": 1.4378, "step": 36352 }, { "epoch": 2.86, "learning_rate": 1.599666827807322e-06, "loss": 1.4399, "step": 36353 }, { "epoch": 2.86, "learning_rate": 1.5978670863959543e-06, "loss": 1.4323, "step": 36354 }, { "epoch": 2.86, "learning_rate": 1.5960683525531648e-06, "loss": 1.3648, "step": 36355 }, { "epoch": 2.86, "learning_rate": 1.594270626291161e-06, "loss": 1.469, "step": 36356 }, { "epoch": 2.86, "learning_rate": 1.5924739076221827e-06, "loss": 1.3986, "step": 36357 }, { "epoch": 2.86, "learning_rate": 1.5906781965584037e-06, "loss": 1.4699, "step": 36358 }, { "epoch": 2.86, "learning_rate": 1.5888834931119975e-06, "loss": 1.4816, "step": 36359 }, { "epoch": 2.86, "learning_rate": 1.587089797295188e-06, "loss": 1.4079, "step": 36360 }, { "epoch": 2.86, "learning_rate": 1.5852971091201483e-06, "loss": 1.4502, "step": 36361 }, { "epoch": 2.86, "learning_rate": 1.5835054285990356e-06, "loss": 1.478, "step": 36362 }, { "epoch": 2.86, "learning_rate": 1.581714755744007e-06, "loss": 1.4589, "step": 36363 }, { "epoch": 2.86, "learning_rate": 1.5799250905672523e-06, "loss": 1.4265, "step": 36364 }, { "epoch": 2.86, "learning_rate": 1.5781364330808788e-06, "loss": 1.4601, "step": 36365 }, { "epoch": 2.86, "learning_rate": 1.5763487832970768e-06, "loss": 1.4293, "step": 36366 }, { "epoch": 2.86, "learning_rate": 1.5745621412279363e-06, "loss": 1.4079, "step": 36367 }, { "epoch": 2.86, "learning_rate": 1.5727765068856146e-06, "loss": 1.4394, "step": 36368 }, { "epoch": 2.86, "learning_rate": 1.5709918802822518e-06, "loss": 1.4806, "step": 36369 }, { "epoch": 2.86, "learning_rate": 1.5692082614299217e-06, "loss": 1.4364, "step": 36370 }, { "epoch": 2.86, "learning_rate": 1.5674256503407644e-06, "loss": 1.4376, "step": 36371 }, { "epoch": 2.86, "learning_rate": 1.5656440470268873e-06, "loss": 1.43, "step": 36372 }, { "epoch": 2.86, "learning_rate": 1.5638634515003467e-06, "loss": 1.4799, "step": 36373 }, { "epoch": 2.86, "learning_rate": 1.5620838637732835e-06, "loss": 1.4708, "step": 36374 }, { "epoch": 2.86, "learning_rate": 1.5603052838577379e-06, "loss": 1.4148, "step": 36375 }, { "epoch": 2.86, "learning_rate": 1.558527711765817e-06, "loss": 1.4476, "step": 36376 }, { "epoch": 2.86, "learning_rate": 1.5567511475095606e-06, "loss": 1.4067, "step": 36377 }, { "epoch": 2.86, "learning_rate": 1.5549755911010597e-06, "loss": 1.4552, "step": 36378 }, { "epoch": 2.86, "learning_rate": 1.5532010425523544e-06, "loss": 1.4145, "step": 36379 }, { "epoch": 2.86, "learning_rate": 1.5514275018755017e-06, "loss": 1.4129, "step": 36380 }, { "epoch": 2.86, "learning_rate": 1.5496549690825256e-06, "loss": 1.4115, "step": 36381 }, { "epoch": 2.86, "learning_rate": 1.547883444185466e-06, "loss": 1.5016, "step": 36382 }, { "epoch": 2.86, "learning_rate": 1.5461129271963635e-06, "loss": 1.4242, "step": 36383 }, { "epoch": 2.86, "learning_rate": 1.5443434181272251e-06, "loss": 1.4274, "step": 36384 }, { "epoch": 2.86, "learning_rate": 1.5425749169900914e-06, "loss": 1.4275, "step": 36385 }, { "epoch": 2.86, "learning_rate": 1.5408074237969192e-06, "loss": 1.4266, "step": 36386 }, { "epoch": 2.86, "learning_rate": 1.539040938559749e-06, "loss": 1.447, "step": 36387 }, { "epoch": 2.86, "learning_rate": 1.5372754612905714e-06, "loss": 1.3724, "step": 36388 }, { "epoch": 2.86, "learning_rate": 1.5355109920013597e-06, "loss": 1.412, "step": 36389 }, { "epoch": 2.86, "learning_rate": 1.5337475307040882e-06, "loss": 1.4743, "step": 36390 }, { "epoch": 2.86, "learning_rate": 1.5319850774107467e-06, "loss": 1.5154, "step": 36391 }, { "epoch": 2.86, "learning_rate": 1.5302236321332929e-06, "loss": 1.4373, "step": 36392 }, { "epoch": 2.86, "learning_rate": 1.5284631948837001e-06, "loss": 1.4627, "step": 36393 }, { "epoch": 2.86, "learning_rate": 1.5267037656738924e-06, "loss": 1.4341, "step": 36394 }, { "epoch": 2.86, "learning_rate": 1.5249453445158432e-06, "loss": 1.4582, "step": 36395 }, { "epoch": 2.86, "learning_rate": 1.5231879314214934e-06, "loss": 1.4172, "step": 36396 }, { "epoch": 2.86, "learning_rate": 1.5214315264027332e-06, "loss": 1.4559, "step": 36397 }, { "epoch": 2.86, "learning_rate": 1.5196761294715364e-06, "loss": 1.4677, "step": 36398 }, { "epoch": 2.86, "learning_rate": 1.5179217406397936e-06, "loss": 1.439, "step": 36399 }, { "epoch": 2.86, "learning_rate": 1.5161683599194118e-06, "loss": 1.4213, "step": 36400 }, { "epoch": 2.86, "learning_rate": 1.514415987322315e-06, "loss": 1.4819, "step": 36401 }, { "epoch": 2.86, "learning_rate": 1.5126646228603933e-06, "loss": 1.4029, "step": 36402 }, { "epoch": 2.86, "learning_rate": 1.5109142665455543e-06, "loss": 1.4603, "step": 36403 }, { "epoch": 2.86, "learning_rate": 1.5091649183896382e-06, "loss": 1.4387, "step": 36404 }, { "epoch": 2.86, "learning_rate": 1.5074165784045522e-06, "loss": 1.4392, "step": 36405 }, { "epoch": 2.86, "learning_rate": 1.5056692466021702e-06, "loss": 1.3748, "step": 36406 }, { "epoch": 2.86, "learning_rate": 1.5039229229943494e-06, "loss": 1.462, "step": 36407 }, { "epoch": 2.86, "learning_rate": 1.5021776075929304e-06, "loss": 1.4178, "step": 36408 }, { "epoch": 2.86, "learning_rate": 1.5004333004097869e-06, "loss": 1.4744, "step": 36409 }, { "epoch": 2.86, "learning_rate": 1.4986900014567593e-06, "loss": 1.4534, "step": 36410 }, { "epoch": 2.86, "learning_rate": 1.4969477107456718e-06, "loss": 1.478, "step": 36411 }, { "epoch": 2.86, "learning_rate": 1.4952064282883647e-06, "loss": 1.4646, "step": 36412 }, { "epoch": 2.87, "learning_rate": 1.4934661540966452e-06, "loss": 1.4699, "step": 36413 }, { "epoch": 2.87, "learning_rate": 1.4917268881823374e-06, "loss": 1.4567, "step": 36414 }, { "epoch": 2.87, "learning_rate": 1.4899886305572483e-06, "loss": 1.4923, "step": 36415 }, { "epoch": 2.87, "learning_rate": 1.488251381233202e-06, "loss": 1.4158, "step": 36416 }, { "epoch": 2.87, "learning_rate": 1.4865151402219389e-06, "loss": 1.429, "step": 36417 }, { "epoch": 2.87, "learning_rate": 1.4847799075353162e-06, "loss": 1.413, "step": 36418 }, { "epoch": 2.87, "learning_rate": 1.483045683185058e-06, "loss": 1.4554, "step": 36419 }, { "epoch": 2.87, "learning_rate": 1.4813124671829713e-06, "loss": 1.4608, "step": 36420 }, { "epoch": 2.87, "learning_rate": 1.4795802595408134e-06, "loss": 1.4499, "step": 36421 }, { "epoch": 2.87, "learning_rate": 1.477849060270342e-06, "loss": 1.4658, "step": 36422 }, { "epoch": 2.87, "learning_rate": 1.4761188693833136e-06, "loss": 1.4534, "step": 36423 }, { "epoch": 2.87, "learning_rate": 1.4743896868914694e-06, "loss": 1.473, "step": 36424 }, { "epoch": 2.87, "learning_rate": 1.4726615128065666e-06, "loss": 1.4523, "step": 36425 }, { "epoch": 2.87, "learning_rate": 1.470934347140329e-06, "loss": 1.4234, "step": 36426 }, { "epoch": 2.87, "learning_rate": 1.4692081899044804e-06, "loss": 1.4255, "step": 36427 }, { "epoch": 2.87, "learning_rate": 1.4674830411107285e-06, "loss": 1.3814, "step": 36428 }, { "epoch": 2.87, "learning_rate": 1.4657589007708137e-06, "loss": 1.4703, "step": 36429 }, { "epoch": 2.87, "learning_rate": 1.4640357688964266e-06, "loss": 1.4267, "step": 36430 }, { "epoch": 2.87, "learning_rate": 1.462313645499258e-06, "loss": 1.4399, "step": 36431 }, { "epoch": 2.87, "learning_rate": 1.4605925305910315e-06, "loss": 1.4463, "step": 36432 }, { "epoch": 2.87, "learning_rate": 1.4588724241833882e-06, "loss": 1.4795, "step": 36433 }, { "epoch": 2.87, "learning_rate": 1.4571533262880353e-06, "loss": 1.4899, "step": 36434 }, { "epoch": 2.87, "learning_rate": 1.4554352369166466e-06, "loss": 1.4357, "step": 36435 }, { "epoch": 2.87, "learning_rate": 1.4537181560808797e-06, "loss": 1.4459, "step": 36436 }, { "epoch": 2.87, "learning_rate": 1.4520020837923753e-06, "loss": 1.4449, "step": 36437 }, { "epoch": 2.87, "learning_rate": 1.450287020062807e-06, "loss": 1.4104, "step": 36438 }, { "epoch": 2.87, "learning_rate": 1.4485729649038324e-06, "loss": 1.4178, "step": 36439 }, { "epoch": 2.87, "learning_rate": 1.446859918327059e-06, "loss": 1.4225, "step": 36440 }, { "epoch": 2.87, "learning_rate": 1.4451478803441107e-06, "loss": 1.4749, "step": 36441 }, { "epoch": 2.87, "learning_rate": 1.4434368509666449e-06, "loss": 1.4201, "step": 36442 }, { "epoch": 2.87, "learning_rate": 1.441726830206269e-06, "loss": 1.4132, "step": 36443 }, { "epoch": 2.87, "learning_rate": 1.4400178180745902e-06, "loss": 1.4294, "step": 36444 }, { "epoch": 2.87, "learning_rate": 1.438309814583183e-06, "loss": 1.438, "step": 36445 }, { "epoch": 2.87, "learning_rate": 1.4366028197436874e-06, "loss": 1.4759, "step": 36446 }, { "epoch": 2.87, "learning_rate": 1.434896833567678e-06, "loss": 1.4343, "step": 36447 }, { "epoch": 2.87, "learning_rate": 1.433191856066712e-06, "loss": 1.4634, "step": 36448 }, { "epoch": 2.87, "learning_rate": 1.4314878872524139e-06, "loss": 1.4435, "step": 36449 }, { "epoch": 2.87, "learning_rate": 1.4297849271363072e-06, "loss": 1.4412, "step": 36450 }, { "epoch": 2.87, "learning_rate": 1.4280829757299828e-06, "loss": 1.4143, "step": 36451 }, { "epoch": 2.87, "learning_rate": 1.4263820330449816e-06, "loss": 1.4675, "step": 36452 }, { "epoch": 2.87, "learning_rate": 1.424682099092861e-06, "loss": 1.4579, "step": 36453 }, { "epoch": 2.87, "learning_rate": 1.422983173885145e-06, "loss": 1.4756, "step": 36454 }, { "epoch": 2.87, "learning_rate": 1.421285257433391e-06, "loss": 1.4642, "step": 36455 }, { "epoch": 2.87, "learning_rate": 1.4195883497491235e-06, "loss": 1.4418, "step": 36456 }, { "epoch": 2.87, "learning_rate": 1.417892450843866e-06, "loss": 1.4621, "step": 36457 }, { "epoch": 2.87, "learning_rate": 1.4161975607290933e-06, "loss": 1.468, "step": 36458 }, { "epoch": 2.87, "learning_rate": 1.4145036794163623e-06, "loss": 1.4481, "step": 36459 }, { "epoch": 2.87, "learning_rate": 1.412810806917164e-06, "loss": 1.4426, "step": 36460 }, { "epoch": 2.87, "learning_rate": 1.4111189432429726e-06, "loss": 1.4334, "step": 36461 }, { "epoch": 2.87, "learning_rate": 1.4094280884052788e-06, "loss": 1.4744, "step": 36462 }, { "epoch": 2.87, "learning_rate": 1.4077382424155903e-06, "loss": 1.4123, "step": 36463 }, { "epoch": 2.87, "learning_rate": 1.4060494052853478e-06, "loss": 1.44, "step": 36464 }, { "epoch": 2.87, "learning_rate": 1.4043615770260252e-06, "loss": 1.3995, "step": 36465 }, { "epoch": 2.87, "learning_rate": 1.4026747576490804e-06, "loss": 1.4779, "step": 36466 }, { "epoch": 2.87, "learning_rate": 1.4009889471659874e-06, "loss": 1.4325, "step": 36467 }, { "epoch": 2.87, "learning_rate": 1.3993041455881538e-06, "loss": 1.4678, "step": 36468 }, { "epoch": 2.87, "learning_rate": 1.3976203529270535e-06, "loss": 1.4454, "step": 36469 }, { "epoch": 2.87, "learning_rate": 1.395937569194111e-06, "loss": 1.4275, "step": 36470 }, { "epoch": 2.87, "learning_rate": 1.3942557944007504e-06, "loss": 1.4899, "step": 36471 }, { "epoch": 2.87, "learning_rate": 1.3925750285583625e-06, "loss": 1.378, "step": 36472 }, { "epoch": 2.87, "learning_rate": 1.390895271678405e-06, "loss": 1.431, "step": 36473 }, { "epoch": 2.87, "learning_rate": 1.3892165237722519e-06, "loss": 1.4228, "step": 36474 }, { "epoch": 2.87, "learning_rate": 1.3875387848512943e-06, "loss": 1.4907, "step": 36475 }, { "epoch": 2.87, "learning_rate": 1.3858620549269562e-06, "loss": 1.4481, "step": 36476 }, { "epoch": 2.87, "learning_rate": 1.3841863340105951e-06, "loss": 1.4131, "step": 36477 }, { "epoch": 2.87, "learning_rate": 1.3825116221136023e-06, "loss": 1.5033, "step": 36478 }, { "epoch": 2.87, "learning_rate": 1.3808379192473184e-06, "loss": 1.4476, "step": 36479 }, { "epoch": 2.87, "learning_rate": 1.3791652254231512e-06, "loss": 1.4202, "step": 36480 }, { "epoch": 2.87, "learning_rate": 1.3774935406524411e-06, "loss": 1.4443, "step": 36481 }, { "epoch": 2.87, "learning_rate": 1.3758228649465131e-06, "loss": 1.4166, "step": 36482 }, { "epoch": 2.87, "learning_rate": 1.374153198316741e-06, "loss": 1.5018, "step": 36483 }, { "epoch": 2.87, "learning_rate": 1.3724845407744488e-06, "loss": 1.4402, "step": 36484 }, { "epoch": 2.87, "learning_rate": 1.370816892330978e-06, "loss": 1.424, "step": 36485 }, { "epoch": 2.87, "learning_rate": 1.3691502529976194e-06, "loss": 1.4568, "step": 36486 }, { "epoch": 2.87, "learning_rate": 1.3674846227857138e-06, "loss": 1.4576, "step": 36487 }, { "epoch": 2.87, "learning_rate": 1.3658200017065857e-06, "loss": 1.4719, "step": 36488 }, { "epoch": 2.87, "learning_rate": 1.3641563897714925e-06, "loss": 1.4155, "step": 36489 }, { "epoch": 2.87, "learning_rate": 1.3624937869917752e-06, "loss": 1.4525, "step": 36490 }, { "epoch": 2.87, "learning_rate": 1.3608321933786914e-06, "loss": 1.4168, "step": 36491 }, { "epoch": 2.87, "learning_rate": 1.3591716089435157e-06, "loss": 1.423, "step": 36492 }, { "epoch": 2.87, "learning_rate": 1.3575120336975554e-06, "loss": 1.5003, "step": 36493 }, { "epoch": 2.87, "learning_rate": 1.3558534676520683e-06, "loss": 1.4285, "step": 36494 }, { "epoch": 2.87, "learning_rate": 1.3541959108182788e-06, "loss": 1.4302, "step": 36495 }, { "epoch": 2.87, "learning_rate": 1.3525393632074944e-06, "loss": 1.4639, "step": 36496 }, { "epoch": 2.87, "learning_rate": 1.3508838248309228e-06, "loss": 1.4402, "step": 36497 }, { "epoch": 2.87, "learning_rate": 1.3492292956998385e-06, "loss": 1.3622, "step": 36498 }, { "epoch": 2.87, "learning_rate": 1.3475757758254325e-06, "loss": 1.4587, "step": 36499 }, { "epoch": 2.87, "learning_rate": 1.3459232652189622e-06, "loss": 1.411, "step": 36500 }, { "epoch": 2.87, "learning_rate": 1.3442717638916355e-06, "loss": 1.4611, "step": 36501 }, { "epoch": 2.87, "learning_rate": 1.342621271854677e-06, "loss": 1.4305, "step": 36502 }, { "epoch": 2.87, "learning_rate": 1.3409717891192773e-06, "loss": 1.3999, "step": 36503 }, { "epoch": 2.87, "learning_rate": 1.3393233156966444e-06, "loss": 1.4591, "step": 36504 }, { "epoch": 2.87, "learning_rate": 1.3376758515979691e-06, "loss": 1.4597, "step": 36505 }, { "epoch": 2.87, "learning_rate": 1.336029396834426e-06, "loss": 1.4325, "step": 36506 }, { "epoch": 2.87, "learning_rate": 1.3343839514172228e-06, "loss": 1.4522, "step": 36507 }, { "epoch": 2.87, "learning_rate": 1.3327395153575005e-06, "loss": 1.4381, "step": 36508 }, { "epoch": 2.87, "learning_rate": 1.3310960886664335e-06, "loss": 1.4327, "step": 36509 }, { "epoch": 2.87, "learning_rate": 1.3294536713551962e-06, "loss": 1.4612, "step": 36510 }, { "epoch": 2.87, "learning_rate": 1.327812263434913e-06, "loss": 1.4769, "step": 36511 }, { "epoch": 2.87, "learning_rate": 1.326171864916742e-06, "loss": 1.4654, "step": 36512 }, { "epoch": 2.87, "learning_rate": 1.3245324758118236e-06, "loss": 1.4161, "step": 36513 }, { "epoch": 2.87, "learning_rate": 1.3228940961312827e-06, "loss": 1.4068, "step": 36514 }, { "epoch": 2.87, "learning_rate": 1.3212567258862438e-06, "loss": 1.488, "step": 36515 }, { "epoch": 2.87, "learning_rate": 1.3196203650878146e-06, "loss": 1.4424, "step": 36516 }, { "epoch": 2.87, "learning_rate": 1.3179850137471193e-06, "loss": 1.4277, "step": 36517 }, { "epoch": 2.87, "learning_rate": 1.3163506718752492e-06, "loss": 1.4345, "step": 36518 }, { "epoch": 2.87, "learning_rate": 1.3147173394833288e-06, "loss": 1.4366, "step": 36519 }, { "epoch": 2.87, "learning_rate": 1.3130850165823991e-06, "loss": 1.4001, "step": 36520 }, { "epoch": 2.87, "learning_rate": 1.3114537031836015e-06, "loss": 1.4681, "step": 36521 }, { "epoch": 2.87, "learning_rate": 1.3098233992979602e-06, "loss": 1.4829, "step": 36522 }, { "epoch": 2.87, "learning_rate": 1.3081941049365663e-06, "loss": 1.4249, "step": 36523 }, { "epoch": 2.87, "learning_rate": 1.3065658201104779e-06, "loss": 1.4428, "step": 36524 }, { "epoch": 2.87, "learning_rate": 1.3049385448307526e-06, "loss": 1.4442, "step": 36525 }, { "epoch": 2.87, "learning_rate": 1.3033122791084317e-06, "loss": 1.5126, "step": 36526 }, { "epoch": 2.87, "learning_rate": 1.3016870229545728e-06, "loss": 1.4425, "step": 36527 }, { "epoch": 2.87, "learning_rate": 1.3000627763802173e-06, "loss": 1.4276, "step": 36528 }, { "epoch": 2.87, "learning_rate": 1.2984395393963397e-06, "loss": 1.4558, "step": 36529 }, { "epoch": 2.87, "learning_rate": 1.2968173120140147e-06, "loss": 1.4693, "step": 36530 }, { "epoch": 2.87, "learning_rate": 1.2951960942442497e-06, "loss": 1.4569, "step": 36531 }, { "epoch": 2.87, "learning_rate": 1.2935758860980195e-06, "loss": 1.4216, "step": 36532 }, { "epoch": 2.87, "learning_rate": 1.2919566875863486e-06, "loss": 1.4793, "step": 36533 }, { "epoch": 2.87, "learning_rate": 1.2903384987202447e-06, "loss": 1.3861, "step": 36534 }, { "epoch": 2.87, "learning_rate": 1.2887213195106827e-06, "loss": 1.464, "step": 36535 }, { "epoch": 2.87, "learning_rate": 1.2871051499686036e-06, "loss": 1.4309, "step": 36536 }, { "epoch": 2.87, "learning_rate": 1.2854899901050485e-06, "loss": 1.4537, "step": 36537 }, { "epoch": 2.87, "learning_rate": 1.2838758399309257e-06, "loss": 1.4238, "step": 36538 }, { "epoch": 2.87, "learning_rate": 1.2822626994572427e-06, "loss": 1.4128, "step": 36539 }, { "epoch": 2.88, "learning_rate": 1.2806505686949076e-06, "loss": 1.4385, "step": 36540 }, { "epoch": 2.88, "learning_rate": 1.2790394476548782e-06, "loss": 1.4462, "step": 36541 }, { "epoch": 2.88, "learning_rate": 1.2774293363481125e-06, "loss": 1.5027, "step": 36542 }, { "epoch": 2.88, "learning_rate": 1.275820234785535e-06, "loss": 1.4297, "step": 36543 }, { "epoch": 2.88, "learning_rate": 1.274212142978054e-06, "loss": 1.4697, "step": 36544 }, { "epoch": 2.88, "learning_rate": 1.2726050609366101e-06, "loss": 1.4746, "step": 36545 }, { "epoch": 2.88, "learning_rate": 1.2709989886720784e-06, "loss": 1.4367, "step": 36546 }, { "epoch": 2.88, "learning_rate": 1.2693939261954167e-06, "loss": 1.4092, "step": 36547 }, { "epoch": 2.88, "learning_rate": 1.2677898735174664e-06, "loss": 1.415, "step": 36548 }, { "epoch": 2.88, "learning_rate": 1.2661868306491685e-06, "loss": 1.4516, "step": 36549 }, { "epoch": 2.88, "learning_rate": 1.2645847976013813e-06, "loss": 1.415, "step": 36550 }, { "epoch": 2.88, "learning_rate": 1.262983774384979e-06, "loss": 1.3904, "step": 36551 }, { "epoch": 2.88, "learning_rate": 1.261383761010837e-06, "loss": 1.4682, "step": 36552 }, { "epoch": 2.88, "learning_rate": 1.2597847574898123e-06, "loss": 1.4747, "step": 36553 }, { "epoch": 2.88, "learning_rate": 1.2581867638327804e-06, "loss": 1.442, "step": 36554 }, { "epoch": 2.88, "learning_rate": 1.256589780050582e-06, "loss": 1.4414, "step": 36555 }, { "epoch": 2.88, "learning_rate": 1.254993806154042e-06, "loss": 1.4537, "step": 36556 }, { "epoch": 2.88, "learning_rate": 1.253398842154002e-06, "loss": 1.4154, "step": 36557 }, { "epoch": 2.88, "learning_rate": 1.2518048880613196e-06, "loss": 1.4058, "step": 36558 }, { "epoch": 2.88, "learning_rate": 1.2502119438867865e-06, "loss": 1.4026, "step": 36559 }, { "epoch": 2.88, "learning_rate": 1.2486200096412269e-06, "loss": 1.4336, "step": 36560 }, { "epoch": 2.88, "learning_rate": 1.2470290853354492e-06, "loss": 1.4583, "step": 36561 }, { "epoch": 2.88, "learning_rate": 1.2454391709802615e-06, "loss": 1.4053, "step": 36562 }, { "epoch": 2.88, "learning_rate": 1.243850266586438e-06, "loss": 1.4573, "step": 36563 }, { "epoch": 2.88, "learning_rate": 1.2422623721647873e-06, "loss": 1.4514, "step": 36564 }, { "epoch": 2.88, "learning_rate": 1.2406754877260838e-06, "loss": 1.4112, "step": 36565 }, { "epoch": 2.88, "learning_rate": 1.239089613281119e-06, "loss": 1.4238, "step": 36566 }, { "epoch": 2.88, "learning_rate": 1.2375047488406176e-06, "loss": 1.4175, "step": 36567 }, { "epoch": 2.88, "learning_rate": 1.2359208944153709e-06, "loss": 1.4508, "step": 36568 }, { "epoch": 2.88, "learning_rate": 1.234338050016137e-06, "loss": 1.4457, "step": 36569 }, { "epoch": 2.88, "learning_rate": 1.2327562156536409e-06, "loss": 1.4846, "step": 36570 }, { "epoch": 2.88, "learning_rate": 1.2311753913386401e-06, "loss": 1.4281, "step": 36571 }, { "epoch": 2.88, "learning_rate": 1.22959557708186e-06, "loss": 1.4397, "step": 36572 }, { "epoch": 2.88, "learning_rate": 1.2280167728940416e-06, "loss": 1.4979, "step": 36573 }, { "epoch": 2.88, "learning_rate": 1.2264389787858598e-06, "loss": 1.4454, "step": 36574 }, { "epoch": 2.88, "learning_rate": 1.2248621947680725e-06, "loss": 1.482, "step": 36575 }, { "epoch": 2.88, "learning_rate": 1.2232864208513715e-06, "loss": 1.4611, "step": 36576 }, { "epoch": 2.88, "learning_rate": 1.221711657046448e-06, "loss": 1.5196, "step": 36577 }, { "epoch": 2.88, "learning_rate": 1.2201379033640102e-06, "loss": 1.4448, "step": 36578 }, { "epoch": 2.88, "learning_rate": 1.2185651598147328e-06, "loss": 1.4151, "step": 36579 }, { "epoch": 2.88, "learning_rate": 1.2169934264092906e-06, "loss": 1.4508, "step": 36580 }, { "epoch": 2.88, "learning_rate": 1.215422703158342e-06, "loss": 1.3989, "step": 36581 }, { "epoch": 2.88, "learning_rate": 1.2138529900725779e-06, "loss": 1.4368, "step": 36582 }, { "epoch": 2.88, "learning_rate": 1.212284287162657e-06, "loss": 1.4275, "step": 36583 }, { "epoch": 2.88, "learning_rate": 1.210716594439204e-06, "loss": 1.4138, "step": 36584 }, { "epoch": 2.88, "learning_rate": 1.2091499119128767e-06, "loss": 1.4497, "step": 36585 }, { "epoch": 2.88, "learning_rate": 1.2075842395943168e-06, "loss": 1.4197, "step": 36586 }, { "epoch": 2.88, "learning_rate": 1.2060195774941494e-06, "loss": 1.4663, "step": 36587 }, { "epoch": 2.88, "learning_rate": 1.204455925622999e-06, "loss": 1.4412, "step": 36588 }, { "epoch": 2.88, "learning_rate": 1.202893283991474e-06, "loss": 1.4147, "step": 36589 }, { "epoch": 2.88, "learning_rate": 1.201331652610199e-06, "loss": 1.38, "step": 36590 }, { "epoch": 2.88, "learning_rate": 1.1997710314897657e-06, "loss": 1.4096, "step": 36591 }, { "epoch": 2.88, "learning_rate": 1.1982114206407823e-06, "loss": 1.4167, "step": 36592 }, { "epoch": 2.88, "learning_rate": 1.1966528200738067e-06, "loss": 1.4138, "step": 36593 }, { "epoch": 2.88, "learning_rate": 1.1950952297994476e-06, "loss": 1.4196, "step": 36594 }, { "epoch": 2.88, "learning_rate": 1.1935386498282794e-06, "loss": 1.4381, "step": 36595 }, { "epoch": 2.88, "learning_rate": 1.1919830801708607e-06, "loss": 1.4401, "step": 36596 }, { "epoch": 2.88, "learning_rate": 1.1904285208377662e-06, "loss": 1.4233, "step": 36597 }, { "epoch": 2.88, "learning_rate": 1.1888749718395375e-06, "loss": 1.4679, "step": 36598 }, { "epoch": 2.88, "learning_rate": 1.1873224331867327e-06, "loss": 1.3882, "step": 36599 }, { "epoch": 2.88, "learning_rate": 1.1857709048898768e-06, "loss": 1.4781, "step": 36600 }, { "epoch": 2.88, "learning_rate": 1.1842203869595114e-06, "loss": 1.4177, "step": 36601 }, { "epoch": 2.88, "learning_rate": 1.182670879406178e-06, "loss": 1.4748, "step": 36602 }, { "epoch": 2.88, "learning_rate": 1.1811223822403849e-06, "loss": 1.4257, "step": 36603 }, { "epoch": 2.88, "learning_rate": 1.1795748954726404e-06, "loss": 1.4191, "step": 36604 }, { "epoch": 2.88, "learning_rate": 1.1780284191134525e-06, "loss": 1.4672, "step": 36605 }, { "epoch": 2.88, "learning_rate": 1.1764829531733465e-06, "loss": 1.4876, "step": 36606 }, { "epoch": 2.88, "learning_rate": 1.174938497662764e-06, "loss": 1.4132, "step": 36607 }, { "epoch": 2.88, "learning_rate": 1.1733950525922297e-06, "loss": 1.4898, "step": 36608 }, { "epoch": 2.88, "learning_rate": 1.1718526179722353e-06, "loss": 1.4402, "step": 36609 }, { "epoch": 2.88, "learning_rate": 1.170311193813206e-06, "loss": 1.397, "step": 36610 }, { "epoch": 2.88, "learning_rate": 1.168770780125633e-06, "loss": 1.4317, "step": 36611 }, { "epoch": 2.88, "learning_rate": 1.1672313769199914e-06, "loss": 1.4652, "step": 36612 }, { "epoch": 2.88, "learning_rate": 1.1656929842067064e-06, "loss": 1.4422, "step": 36613 }, { "epoch": 2.88, "learning_rate": 1.164155601996236e-06, "loss": 1.4581, "step": 36614 }, { "epoch": 2.88, "learning_rate": 1.1626192302990056e-06, "loss": 1.4156, "step": 36615 }, { "epoch": 2.88, "learning_rate": 1.1610838691254564e-06, "loss": 1.3751, "step": 36616 }, { "epoch": 2.88, "learning_rate": 1.1595495184860304e-06, "loss": 1.451, "step": 36617 }, { "epoch": 2.88, "learning_rate": 1.1580161783911024e-06, "loss": 1.4441, "step": 36618 }, { "epoch": 2.88, "learning_rate": 1.156483848851114e-06, "loss": 1.4606, "step": 36619 }, { "epoch": 2.88, "learning_rate": 1.154952529876474e-06, "loss": 1.4659, "step": 36620 }, { "epoch": 2.88, "learning_rate": 1.1534222214775568e-06, "loss": 1.4198, "step": 36621 }, { "epoch": 2.88, "learning_rate": 1.1518929236647544e-06, "loss": 1.4322, "step": 36622 }, { "epoch": 2.88, "learning_rate": 1.1503646364484752e-06, "loss": 1.4173, "step": 36623 }, { "epoch": 2.88, "learning_rate": 1.148837359839061e-06, "loss": 1.4833, "step": 36624 }, { "epoch": 2.88, "learning_rate": 1.1473110938469033e-06, "loss": 1.4982, "step": 36625 }, { "epoch": 2.88, "learning_rate": 1.145785838482377e-06, "loss": 1.4901, "step": 36626 }, { "epoch": 2.88, "learning_rate": 1.1442615937557909e-06, "loss": 1.4147, "step": 36627 }, { "epoch": 2.88, "learning_rate": 1.1427383596775364e-06, "loss": 1.4073, "step": 36628 }, { "epoch": 2.88, "learning_rate": 1.1412161362579553e-06, "loss": 1.4571, "step": 36629 }, { "epoch": 2.88, "learning_rate": 1.139694923507356e-06, "loss": 1.4776, "step": 36630 }, { "epoch": 2.88, "learning_rate": 1.1381747214360804e-06, "loss": 1.4478, "step": 36631 }, { "epoch": 2.88, "learning_rate": 1.1366555300544533e-06, "loss": 1.4468, "step": 36632 }, { "epoch": 2.88, "learning_rate": 1.1351373493727832e-06, "loss": 1.4383, "step": 36633 }, { "epoch": 2.88, "learning_rate": 1.133620179401379e-06, "loss": 1.426, "step": 36634 }, { "epoch": 2.88, "learning_rate": 1.1321040201505481e-06, "loss": 1.4182, "step": 36635 }, { "epoch": 2.88, "learning_rate": 1.1305888716305667e-06, "loss": 1.45, "step": 36636 }, { "epoch": 2.88, "learning_rate": 1.1290747338517592e-06, "loss": 1.4293, "step": 36637 }, { "epoch": 2.88, "learning_rate": 1.127561606824351e-06, "loss": 1.463, "step": 36638 }, { "epoch": 2.88, "learning_rate": 1.126049490558667e-06, "loss": 1.4318, "step": 36639 }, { "epoch": 2.88, "learning_rate": 1.1245383850649325e-06, "loss": 1.4306, "step": 36640 }, { "epoch": 2.88, "learning_rate": 1.1230282903534393e-06, "loss": 1.4695, "step": 36641 }, { "epoch": 2.88, "learning_rate": 1.1215192064344125e-06, "loss": 1.4935, "step": 36642 }, { "epoch": 2.88, "learning_rate": 1.1200111333181273e-06, "loss": 1.4824, "step": 36643 }, { "epoch": 2.88, "learning_rate": 1.1185040710148085e-06, "loss": 1.4059, "step": 36644 }, { "epoch": 2.88, "learning_rate": 1.1169980195346817e-06, "loss": 1.4584, "step": 36645 }, { "epoch": 2.88, "learning_rate": 1.1154929788879718e-06, "loss": 1.4565, "step": 36646 }, { "epoch": 2.88, "learning_rate": 1.1139889490849209e-06, "loss": 1.4142, "step": 36647 }, { "epoch": 2.88, "learning_rate": 1.1124859301357037e-06, "loss": 1.4342, "step": 36648 }, { "epoch": 2.88, "learning_rate": 1.1109839220505623e-06, "loss": 1.4585, "step": 36649 }, { "epoch": 2.88, "learning_rate": 1.109482924839672e-06, "loss": 1.4308, "step": 36650 }, { "epoch": 2.88, "learning_rate": 1.1079829385132244e-06, "loss": 1.4774, "step": 36651 }, { "epoch": 2.88, "learning_rate": 1.1064839630813949e-06, "loss": 1.4729, "step": 36652 }, { "epoch": 2.88, "learning_rate": 1.1049859985543918e-06, "loss": 1.4593, "step": 36653 }, { "epoch": 2.88, "learning_rate": 1.1034890449423572e-06, "loss": 1.3945, "step": 36654 }, { "epoch": 2.88, "learning_rate": 1.1019931022554662e-06, "loss": 1.3559, "step": 36655 }, { "epoch": 2.88, "learning_rate": 1.1004981705038773e-06, "loss": 1.4884, "step": 36656 }, { "epoch": 2.88, "learning_rate": 1.0990042496977324e-06, "loss": 1.444, "step": 36657 }, { "epoch": 2.88, "learning_rate": 1.0975113398471736e-06, "loss": 1.4596, "step": 36658 }, { "epoch": 2.88, "learning_rate": 1.0960194409623257e-06, "loss": 1.4266, "step": 36659 }, { "epoch": 2.88, "learning_rate": 1.0945285530533643e-06, "loss": 1.4565, "step": 36660 }, { "epoch": 2.88, "learning_rate": 1.093038676130381e-06, "loss": 1.4324, "step": 36661 }, { "epoch": 2.88, "learning_rate": 1.091549810203468e-06, "loss": 1.4009, "step": 36662 }, { "epoch": 2.88, "learning_rate": 1.0900619552827672e-06, "loss": 1.4349, "step": 36663 }, { "epoch": 2.88, "learning_rate": 1.0885751113783868e-06, "loss": 1.4464, "step": 36664 }, { "epoch": 2.88, "learning_rate": 1.087089278500386e-06, "loss": 1.4086, "step": 36665 }, { "epoch": 2.88, "learning_rate": 1.085604456658873e-06, "loss": 1.4903, "step": 36666 }, { "epoch": 2.89, "learning_rate": 1.0841206458639395e-06, "loss": 1.4455, "step": 36667 }, { "epoch": 2.89, "learning_rate": 1.0826378461256447e-06, "loss": 1.3962, "step": 36668 }, { "epoch": 2.89, "learning_rate": 1.0811560574540468e-06, "loss": 1.4642, "step": 36669 }, { "epoch": 2.89, "learning_rate": 1.0796752798592379e-06, "loss": 1.4282, "step": 36670 }, { "epoch": 2.89, "learning_rate": 1.0781955133512432e-06, "loss": 1.414, "step": 36671 }, { "epoch": 2.89, "learning_rate": 1.0767167579401216e-06, "loss": 1.4488, "step": 36672 }, { "epoch": 2.89, "learning_rate": 1.0752390136359145e-06, "loss": 1.488, "step": 36673 }, { "epoch": 2.89, "learning_rate": 1.0737622804486312e-06, "loss": 1.4373, "step": 36674 }, { "epoch": 2.89, "learning_rate": 1.07228655838833e-06, "loss": 1.4037, "step": 36675 }, { "epoch": 2.89, "learning_rate": 1.0708118474650197e-06, "loss": 1.4188, "step": 36676 }, { "epoch": 2.89, "learning_rate": 1.0693381476887086e-06, "loss": 1.4803, "step": 36677 }, { "epoch": 2.89, "learning_rate": 1.0678654590694225e-06, "loss": 1.4286, "step": 36678 }, { "epoch": 2.89, "learning_rate": 1.0663937816171197e-06, "loss": 1.4687, "step": 36679 }, { "epoch": 2.89, "learning_rate": 1.064923115341826e-06, "loss": 1.4522, "step": 36680 }, { "epoch": 2.89, "learning_rate": 1.0634534602535161e-06, "loss": 1.45, "step": 36681 }, { "epoch": 2.89, "learning_rate": 1.061984816362149e-06, "loss": 1.4348, "step": 36682 }, { "epoch": 2.89, "learning_rate": 1.0605171836777337e-06, "loss": 1.4528, "step": 36683 }, { "epoch": 2.89, "learning_rate": 1.059050562210212e-06, "loss": 1.3836, "step": 36684 }, { "epoch": 2.89, "learning_rate": 1.0575849519695423e-06, "loss": 1.4761, "step": 36685 }, { "epoch": 2.89, "learning_rate": 1.056120352965667e-06, "loss": 1.4299, "step": 36686 }, { "epoch": 2.89, "learning_rate": 1.0546567652085613e-06, "loss": 1.373, "step": 36687 }, { "epoch": 2.89, "learning_rate": 1.0531941887081342e-06, "loss": 1.465, "step": 36688 }, { "epoch": 2.89, "learning_rate": 1.0517326234743106e-06, "loss": 1.4236, "step": 36689 }, { "epoch": 2.89, "learning_rate": 1.050272069517033e-06, "loss": 1.4431, "step": 36690 }, { "epoch": 2.89, "learning_rate": 1.04881252684621e-06, "loss": 1.4493, "step": 36691 }, { "epoch": 2.89, "learning_rate": 1.0473539954717669e-06, "loss": 1.4171, "step": 36692 }, { "epoch": 2.89, "learning_rate": 1.0458964754035625e-06, "loss": 1.5293, "step": 36693 }, { "epoch": 2.89, "learning_rate": 1.044439966651539e-06, "loss": 1.4191, "step": 36694 }, { "epoch": 2.89, "learning_rate": 1.0429844692255718e-06, "loss": 1.3975, "step": 36695 }, { "epoch": 2.89, "learning_rate": 1.0415299831355362e-06, "loss": 1.4383, "step": 36696 }, { "epoch": 2.89, "learning_rate": 1.0400765083913075e-06, "loss": 1.5011, "step": 36697 }, { "epoch": 2.89, "learning_rate": 1.0386240450027617e-06, "loss": 1.4612, "step": 36698 }, { "epoch": 2.89, "learning_rate": 1.0371725929797402e-06, "loss": 1.4919, "step": 36699 }, { "epoch": 2.89, "learning_rate": 1.035722152332119e-06, "loss": 1.4415, "step": 36700 }, { "epoch": 2.89, "learning_rate": 1.03427272306974e-06, "loss": 1.4066, "step": 36701 }, { "epoch": 2.89, "learning_rate": 1.0328243052024454e-06, "loss": 1.4009, "step": 36702 }, { "epoch": 2.89, "learning_rate": 1.0313768987400606e-06, "loss": 1.4629, "step": 36703 }, { "epoch": 2.89, "learning_rate": 1.0299305036924277e-06, "loss": 1.4597, "step": 36704 }, { "epoch": 2.89, "learning_rate": 1.0284851200693555e-06, "loss": 1.4309, "step": 36705 }, { "epoch": 2.89, "learning_rate": 1.0270407478806531e-06, "loss": 1.5032, "step": 36706 }, { "epoch": 2.89, "learning_rate": 1.0255973871361456e-06, "loss": 1.4995, "step": 36707 }, { "epoch": 2.89, "learning_rate": 1.0241550378456088e-06, "loss": 1.471, "step": 36708 }, { "epoch": 2.89, "learning_rate": 1.022713700018868e-06, "loss": 1.4373, "step": 36709 }, { "epoch": 2.89, "learning_rate": 1.0212733736656653e-06, "loss": 1.4792, "step": 36710 }, { "epoch": 2.89, "learning_rate": 1.0198340587958097e-06, "loss": 1.4583, "step": 36711 }, { "epoch": 2.89, "learning_rate": 1.018395755419077e-06, "loss": 1.4329, "step": 36712 }, { "epoch": 2.89, "learning_rate": 1.0169584635452088e-06, "loss": 1.424, "step": 36713 }, { "epoch": 2.89, "learning_rate": 1.0155221831839977e-06, "loss": 1.4166, "step": 36714 }, { "epoch": 2.89, "learning_rate": 1.0140869143451525e-06, "loss": 1.457, "step": 36715 }, { "epoch": 2.89, "learning_rate": 1.0126526570384485e-06, "loss": 1.4592, "step": 36716 }, { "epoch": 2.89, "learning_rate": 1.0112194112736117e-06, "loss": 1.4987, "step": 36717 }, { "epoch": 2.89, "learning_rate": 1.0097871770603837e-06, "loss": 1.4565, "step": 36718 }, { "epoch": 2.89, "learning_rate": 1.008355954408474e-06, "loss": 1.4349, "step": 36719 }, { "epoch": 2.89, "learning_rate": 1.006925743327608e-06, "loss": 1.4715, "step": 36720 }, { "epoch": 2.89, "learning_rate": 1.0054965438274942e-06, "loss": 1.4715, "step": 36721 }, { "epoch": 2.89, "learning_rate": 1.0040683559178419e-06, "loss": 1.4779, "step": 36722 }, { "epoch": 2.89, "learning_rate": 1.0026411796083267e-06, "loss": 1.3755, "step": 36723 }, { "epoch": 2.89, "learning_rate": 1.001215014908674e-06, "loss": 1.4465, "step": 36724 }, { "epoch": 2.89, "learning_rate": 9.997898618285428e-07, "loss": 1.4279, "step": 36725 }, { "epoch": 2.89, "learning_rate": 9.983657203776086e-07, "loss": 1.4483, "step": 36726 }, { "epoch": 2.89, "learning_rate": 9.96942590565547e-07, "loss": 1.4329, "step": 36727 }, { "epoch": 2.89, "learning_rate": 9.955204724020338e-07, "loss": 1.448, "step": 36728 }, { "epoch": 2.89, "learning_rate": 9.940993658966946e-07, "loss": 1.4756, "step": 36729 }, { "epoch": 2.89, "learning_rate": 9.92679271059188e-07, "loss": 1.4544, "step": 36730 }, { "epoch": 2.89, "learning_rate": 9.912601878991566e-07, "loss": 1.4018, "step": 36731 }, { "epoch": 2.89, "learning_rate": 9.898421164262593e-07, "loss": 1.4392, "step": 36732 }, { "epoch": 2.89, "learning_rate": 9.884250566500717e-07, "loss": 1.4442, "step": 36733 }, { "epoch": 2.89, "learning_rate": 9.870090085802696e-07, "loss": 1.4486, "step": 36734 }, { "epoch": 2.89, "learning_rate": 9.85593972226445e-07, "loss": 1.4303, "step": 36735 }, { "epoch": 2.89, "learning_rate": 9.841799475981904e-07, "loss": 1.4295, "step": 36736 }, { "epoch": 2.89, "learning_rate": 9.827669347051315e-07, "loss": 1.4399, "step": 36737 }, { "epoch": 2.89, "learning_rate": 9.813549335568438e-07, "loss": 1.4358, "step": 36738 }, { "epoch": 2.89, "learning_rate": 9.799439441629364e-07, "loss": 1.4309, "step": 36739 }, { "epoch": 2.89, "learning_rate": 9.785339665329516e-07, "loss": 1.4284, "step": 36740 }, { "epoch": 2.89, "learning_rate": 9.771250006764985e-07, "loss": 1.4651, "step": 36741 }, { "epoch": 2.89, "learning_rate": 9.757170466031362e-07, "loss": 1.4251, "step": 36742 }, { "epoch": 2.89, "learning_rate": 9.743101043224067e-07, "loss": 1.4815, "step": 36743 }, { "epoch": 2.89, "learning_rate": 9.72904173843869e-07, "loss": 1.462, "step": 36744 }, { "epoch": 2.89, "learning_rate": 9.71499255177083e-07, "loss": 1.4258, "step": 36745 }, { "epoch": 2.89, "learning_rate": 9.700953483315565e-07, "loss": 1.4804, "step": 36746 }, { "epoch": 2.89, "learning_rate": 9.686924533168494e-07, "loss": 1.4091, "step": 36747 }, { "epoch": 2.89, "learning_rate": 9.672905701424872e-07, "loss": 1.3791, "step": 36748 }, { "epoch": 2.89, "learning_rate": 9.658896988179787e-07, "loss": 1.4598, "step": 36749 }, { "epoch": 2.89, "learning_rate": 9.644898393528334e-07, "loss": 1.3885, "step": 36750 }, { "epoch": 2.89, "learning_rate": 9.630909917565433e-07, "loss": 1.4198, "step": 36751 }, { "epoch": 2.89, "learning_rate": 9.616931560386342e-07, "loss": 1.4385, "step": 36752 }, { "epoch": 2.89, "learning_rate": 9.602963322085823e-07, "loss": 1.4324, "step": 36753 }, { "epoch": 2.89, "learning_rate": 9.589005202758626e-07, "loss": 1.4083, "step": 36754 }, { "epoch": 2.89, "learning_rate": 9.57505720249968e-07, "loss": 1.4269, "step": 36755 }, { "epoch": 2.89, "learning_rate": 9.561119321403577e-07, "loss": 1.4055, "step": 36756 }, { "epoch": 2.89, "learning_rate": 9.547191559565072e-07, "loss": 1.4298, "step": 36757 }, { "epoch": 2.89, "learning_rate": 9.533273917078587e-07, "loss": 1.4286, "step": 36758 }, { "epoch": 2.89, "learning_rate": 9.519366394038552e-07, "loss": 1.4261, "step": 36759 }, { "epoch": 2.89, "learning_rate": 9.505468990539555e-07, "loss": 1.4461, "step": 36760 }, { "epoch": 2.89, "learning_rate": 9.491581706676021e-07, "loss": 1.4905, "step": 36761 }, { "epoch": 2.89, "learning_rate": 9.477704542542041e-07, "loss": 1.406, "step": 36762 }, { "epoch": 2.89, "learning_rate": 9.463837498231875e-07, "loss": 1.4494, "step": 36763 }, { "epoch": 2.89, "learning_rate": 9.449980573839777e-07, "loss": 1.3875, "step": 36764 }, { "epoch": 2.89, "learning_rate": 9.436133769459675e-07, "loss": 1.4798, "step": 36765 }, { "epoch": 2.89, "learning_rate": 9.422297085185826e-07, "loss": 1.4566, "step": 36766 }, { "epoch": 2.89, "learning_rate": 9.408470521111821e-07, "loss": 1.4719, "step": 36767 }, { "epoch": 2.89, "learning_rate": 9.394654077331754e-07, "loss": 1.4101, "step": 36768 }, { "epoch": 2.89, "learning_rate": 9.38084775393938e-07, "loss": 1.4155, "step": 36769 }, { "epoch": 2.89, "learning_rate": 9.367051551028625e-07, "loss": 1.4821, "step": 36770 }, { "epoch": 2.89, "learning_rate": 9.35326546869275e-07, "loss": 1.4473, "step": 36771 }, { "epoch": 2.89, "learning_rate": 9.339489507025844e-07, "loss": 1.3944, "step": 36772 }, { "epoch": 2.89, "learning_rate": 9.325723666120999e-07, "loss": 1.4771, "step": 36773 }, { "epoch": 2.89, "learning_rate": 9.311967946071975e-07, "loss": 1.4555, "step": 36774 }, { "epoch": 2.89, "learning_rate": 9.298222346972028e-07, "loss": 1.4744, "step": 36775 }, { "epoch": 2.89, "learning_rate": 9.284486868914586e-07, "loss": 1.4322, "step": 36776 }, { "epoch": 2.89, "learning_rate": 9.270761511992741e-07, "loss": 1.4206, "step": 36777 }, { "epoch": 2.89, "learning_rate": 9.257046276299751e-07, "loss": 1.4453, "step": 36778 }, { "epoch": 2.89, "learning_rate": 9.243341161928875e-07, "loss": 1.4159, "step": 36779 }, { "epoch": 2.89, "learning_rate": 9.229646168972871e-07, "loss": 1.4307, "step": 36780 }, { "epoch": 2.89, "learning_rate": 9.215961297524999e-07, "loss": 1.4268, "step": 36781 }, { "epoch": 2.89, "learning_rate": 9.202286547678018e-07, "loss": 1.4703, "step": 36782 }, { "epoch": 2.89, "learning_rate": 9.188621919525019e-07, "loss": 1.5082, "step": 36783 }, { "epoch": 2.89, "learning_rate": 9.174967413158263e-07, "loss": 1.4668, "step": 36784 }, { "epoch": 2.89, "learning_rate": 9.161323028671008e-07, "loss": 1.5056, "step": 36785 }, { "epoch": 2.89, "learning_rate": 9.147688766155514e-07, "loss": 1.4519, "step": 36786 }, { "epoch": 2.89, "learning_rate": 9.134064625704707e-07, "loss": 1.4866, "step": 36787 }, { "epoch": 2.89, "learning_rate": 9.120450607410678e-07, "loss": 1.48, "step": 36788 }, { "epoch": 2.89, "learning_rate": 9.106846711366023e-07, "loss": 1.4205, "step": 36789 }, { "epoch": 2.89, "learning_rate": 9.093252937663331e-07, "loss": 1.4374, "step": 36790 }, { "epoch": 2.89, "learning_rate": 9.07966928639453e-07, "loss": 1.4691, "step": 36791 }, { "epoch": 2.89, "learning_rate": 9.066095757652047e-07, "loss": 1.473, "step": 36792 }, { "epoch": 2.89, "learning_rate": 9.052532351528141e-07, "loss": 1.4161, "step": 36793 }, { "epoch": 2.89, "learning_rate": 9.038979068114571e-07, "loss": 1.4353, "step": 36794 }, { "epoch": 2.9, "learning_rate": 9.025435907503598e-07, "loss": 1.4545, "step": 36795 }, { "epoch": 2.9, "learning_rate": 9.011902869787313e-07, "loss": 1.4339, "step": 36796 }, { "epoch": 2.9, "learning_rate": 8.998379955057145e-07, "loss": 1.3829, "step": 36797 }, { "epoch": 2.9, "learning_rate": 8.984867163405351e-07, "loss": 1.4288, "step": 36798 }, { "epoch": 2.9, "learning_rate": 8.971364494923361e-07, "loss": 1.4383, "step": 36799 }, { "epoch": 2.9, "learning_rate": 8.957871949703099e-07, "loss": 1.4305, "step": 36800 }, { "epoch": 2.9, "learning_rate": 8.94438952783616e-07, "loss": 1.4174, "step": 36801 }, { "epoch": 2.9, "learning_rate": 8.930917229413804e-07, "loss": 1.4243, "step": 36802 }, { "epoch": 2.9, "learning_rate": 8.917455054527789e-07, "loss": 1.4925, "step": 36803 }, { "epoch": 2.9, "learning_rate": 8.904003003269378e-07, "loss": 1.4232, "step": 36804 }, { "epoch": 2.9, "learning_rate": 8.89056107572983e-07, "loss": 1.4419, "step": 36805 }, { "epoch": 2.9, "learning_rate": 8.877129272000572e-07, "loss": 1.4546, "step": 36806 }, { "epoch": 2.9, "learning_rate": 8.863707592172864e-07, "loss": 1.4317, "step": 36807 }, { "epoch": 2.9, "learning_rate": 8.850296036337468e-07, "loss": 1.4779, "step": 36808 }, { "epoch": 2.9, "learning_rate": 8.836894604585809e-07, "loss": 1.4406, "step": 36809 }, { "epoch": 2.9, "learning_rate": 8.823503297008816e-07, "loss": 1.4496, "step": 36810 }, { "epoch": 2.9, "learning_rate": 8.810122113697249e-07, "loss": 1.4371, "step": 36811 }, { "epoch": 2.9, "learning_rate": 8.796751054742035e-07, "loss": 1.4483, "step": 36812 }, { "epoch": 2.9, "learning_rate": 8.783390120233935e-07, "loss": 1.4917, "step": 36813 }, { "epoch": 2.9, "learning_rate": 8.77003931026371e-07, "loss": 1.4738, "step": 36814 }, { "epoch": 2.9, "learning_rate": 8.756698624922121e-07, "loss": 1.4496, "step": 36815 }, { "epoch": 2.9, "learning_rate": 8.743368064299427e-07, "loss": 1.4569, "step": 36816 }, { "epoch": 2.9, "learning_rate": 8.730047628486558e-07, "loss": 1.467, "step": 36817 }, { "epoch": 2.9, "learning_rate": 8.716737317573441e-07, "loss": 1.4317, "step": 36818 }, { "epoch": 2.9, "learning_rate": 8.703437131650837e-07, "loss": 1.4536, "step": 36819 }, { "epoch": 2.9, "learning_rate": 8.690147070809006e-07, "loss": 1.4503, "step": 36820 }, { "epoch": 2.9, "learning_rate": 8.676867135138044e-07, "loss": 1.4201, "step": 36821 }, { "epoch": 2.9, "learning_rate": 8.663597324728211e-07, "loss": 1.4595, "step": 36822 }, { "epoch": 2.9, "learning_rate": 8.650337639669435e-07, "loss": 1.4182, "step": 36823 }, { "epoch": 2.9, "learning_rate": 8.637088080051979e-07, "loss": 1.4295, "step": 36824 }, { "epoch": 2.9, "learning_rate": 8.62384864596577e-07, "loss": 1.4627, "step": 36825 }, { "epoch": 2.9, "learning_rate": 8.610619337500401e-07, "loss": 1.4787, "step": 36826 }, { "epoch": 2.9, "learning_rate": 8.597400154746137e-07, "loss": 1.4371, "step": 36827 }, { "epoch": 2.9, "learning_rate": 8.584191097792403e-07, "loss": 1.4336, "step": 36828 }, { "epoch": 2.9, "learning_rate": 8.570992166728962e-07, "loss": 1.4044, "step": 36829 }, { "epoch": 2.9, "learning_rate": 8.55780336164541e-07, "loss": 1.4833, "step": 36830 }, { "epoch": 2.9, "learning_rate": 8.54462468263134e-07, "loss": 1.4611, "step": 36831 }, { "epoch": 2.9, "learning_rate": 8.531456129776182e-07, "loss": 1.4883, "step": 36832 }, { "epoch": 2.9, "learning_rate": 8.51829770316953e-07, "loss": 1.4774, "step": 36833 }, { "epoch": 2.9, "learning_rate": 8.505149402900479e-07, "loss": 1.4102, "step": 36834 }, { "epoch": 2.9, "learning_rate": 8.492011229058293e-07, "loss": 1.4633, "step": 36835 }, { "epoch": 2.9, "learning_rate": 8.478883181732399e-07, "loss": 1.4597, "step": 36836 }, { "epoch": 2.9, "learning_rate": 8.465765261011891e-07, "loss": 1.4763, "step": 36837 }, { "epoch": 2.9, "learning_rate": 8.452657466985535e-07, "loss": 1.4285, "step": 36838 }, { "epoch": 2.9, "learning_rate": 8.439559799742591e-07, "loss": 1.4604, "step": 36839 }, { "epoch": 2.9, "learning_rate": 8.426472259371985e-07, "loss": 1.4118, "step": 36840 }, { "epoch": 2.9, "learning_rate": 8.413394845962485e-07, "loss": 1.3908, "step": 36841 }, { "epoch": 2.9, "learning_rate": 8.400327559602849e-07, "loss": 1.512, "step": 36842 }, { "epoch": 2.9, "learning_rate": 8.387270400382007e-07, "loss": 1.4486, "step": 36843 }, { "epoch": 2.9, "learning_rate": 8.374223368388389e-07, "loss": 1.4087, "step": 36844 }, { "epoch": 2.9, "learning_rate": 8.36118646371059e-07, "loss": 1.4465, "step": 36845 }, { "epoch": 2.9, "learning_rate": 8.348159686437206e-07, "loss": 1.4804, "step": 36846 }, { "epoch": 2.9, "learning_rate": 8.335143036656666e-07, "loss": 1.4543, "step": 36847 }, { "epoch": 2.9, "learning_rate": 8.322136514457234e-07, "loss": 1.4045, "step": 36848 }, { "epoch": 2.9, "learning_rate": 8.309140119927504e-07, "loss": 1.4349, "step": 36849 }, { "epoch": 2.9, "learning_rate": 8.296153853155407e-07, "loss": 1.4338, "step": 36850 }, { "epoch": 2.9, "learning_rate": 8.283177714229205e-07, "loss": 1.4786, "step": 36851 }, { "epoch": 2.9, "learning_rate": 8.270211703237162e-07, "loss": 1.4776, "step": 36852 }, { "epoch": 2.9, "learning_rate": 8.257255820267039e-07, "loss": 1.4271, "step": 36853 }, { "epoch": 2.9, "learning_rate": 8.244310065407101e-07, "loss": 1.4431, "step": 36854 }, { "epoch": 2.9, "learning_rate": 8.231374438744942e-07, "loss": 1.4675, "step": 36855 }, { "epoch": 2.9, "learning_rate": 8.218448940368493e-07, "loss": 1.4414, "step": 36856 }, { "epoch": 2.9, "learning_rate": 8.205533570365686e-07, "loss": 1.4399, "step": 36857 }, { "epoch": 2.9, "learning_rate": 8.192628328823947e-07, "loss": 1.411, "step": 36858 }, { "epoch": 2.9, "learning_rate": 8.179733215831041e-07, "loss": 1.4438, "step": 36859 }, { "epoch": 2.9, "learning_rate": 8.166848231474565e-07, "loss": 1.4106, "step": 36860 }, { "epoch": 2.9, "learning_rate": 8.153973375841948e-07, "loss": 1.4417, "step": 36861 }, { "epoch": 2.9, "learning_rate": 8.141108649020456e-07, "loss": 1.3859, "step": 36862 }, { "epoch": 2.9, "learning_rate": 8.128254051097516e-07, "loss": 1.4707, "step": 36863 }, { "epoch": 2.9, "learning_rate": 8.115409582160559e-07, "loss": 1.4687, "step": 36864 }, { "epoch": 2.9, "learning_rate": 8.102575242296683e-07, "loss": 1.4719, "step": 36865 }, { "epoch": 2.9, "learning_rate": 8.089751031592983e-07, "loss": 1.4368, "step": 36866 }, { "epoch": 2.9, "learning_rate": 8.076936950136725e-07, "loss": 1.4644, "step": 36867 }, { "epoch": 2.9, "learning_rate": 8.064132998014505e-07, "loss": 1.472, "step": 36868 }, { "epoch": 2.9, "learning_rate": 8.051339175313587e-07, "loss": 1.4269, "step": 36869 }, { "epoch": 2.9, "learning_rate": 8.038555482120901e-07, "loss": 1.4376, "step": 36870 }, { "epoch": 2.9, "learning_rate": 8.025781918523044e-07, "loss": 1.4279, "step": 36871 }, { "epoch": 2.9, "learning_rate": 8.013018484606615e-07, "loss": 1.4369, "step": 36872 }, { "epoch": 2.9, "learning_rate": 8.000265180458543e-07, "loss": 1.4687, "step": 36873 }, { "epoch": 2.9, "learning_rate": 7.987522006165426e-07, "loss": 1.4208, "step": 36874 }, { "epoch": 2.9, "learning_rate": 7.974788961813527e-07, "loss": 1.4543, "step": 36875 }, { "epoch": 2.9, "learning_rate": 7.962066047489446e-07, "loss": 1.4494, "step": 36876 }, { "epoch": 2.9, "learning_rate": 7.949353263279612e-07, "loss": 1.5095, "step": 36877 }, { "epoch": 2.9, "learning_rate": 7.93665060927029e-07, "loss": 1.4007, "step": 36878 }, { "epoch": 2.9, "learning_rate": 7.923958085547744e-07, "loss": 1.4134, "step": 36879 }, { "epoch": 2.9, "learning_rate": 7.911275692198072e-07, "loss": 1.4718, "step": 36880 }, { "epoch": 2.9, "learning_rate": 7.89860342930737e-07, "loss": 1.4417, "step": 36881 }, { "epoch": 2.9, "learning_rate": 7.885941296961906e-07, "loss": 1.4486, "step": 36882 }, { "epoch": 2.9, "learning_rate": 7.873289295247442e-07, "loss": 1.4678, "step": 36883 }, { "epoch": 2.9, "learning_rate": 7.86064742424991e-07, "loss": 1.4465, "step": 36884 }, { "epoch": 2.9, "learning_rate": 7.848015684055076e-07, "loss": 1.4401, "step": 36885 }, { "epoch": 2.9, "learning_rate": 7.835394074748869e-07, "loss": 1.4901, "step": 36886 }, { "epoch": 2.9, "learning_rate": 7.822782596416722e-07, "loss": 1.3786, "step": 36887 }, { "epoch": 2.9, "learning_rate": 7.810181249144731e-07, "loss": 1.4659, "step": 36888 }, { "epoch": 2.9, "learning_rate": 7.797590033017831e-07, "loss": 1.4323, "step": 36889 }, { "epoch": 2.9, "learning_rate": 7.785008948121951e-07, "loss": 1.4284, "step": 36890 }, { "epoch": 2.9, "learning_rate": 7.772437994542524e-07, "loss": 1.4289, "step": 36891 }, { "epoch": 2.9, "learning_rate": 7.759877172364648e-07, "loss": 1.4805, "step": 36892 }, { "epoch": 2.9, "learning_rate": 7.747326481673754e-07, "loss": 1.4839, "step": 36893 }, { "epoch": 2.9, "learning_rate": 7.734785922554943e-07, "loss": 1.4513, "step": 36894 }, { "epoch": 2.9, "learning_rate": 7.722255495093477e-07, "loss": 1.4257, "step": 36895 }, { "epoch": 2.9, "learning_rate": 7.709735199374456e-07, "loss": 1.4602, "step": 36896 }, { "epoch": 2.9, "learning_rate": 7.697225035482646e-07, "loss": 1.3968, "step": 36897 }, { "epoch": 2.9, "learning_rate": 7.684725003503311e-07, "loss": 1.4574, "step": 36898 }, { "epoch": 2.9, "learning_rate": 7.672235103521219e-07, "loss": 1.4218, "step": 36899 }, { "epoch": 2.9, "learning_rate": 7.659755335620965e-07, "loss": 1.4461, "step": 36900 }, { "epoch": 2.9, "learning_rate": 7.647285699887484e-07, "loss": 1.4395, "step": 36901 }, { "epoch": 2.9, "learning_rate": 7.634826196405375e-07, "loss": 1.4446, "step": 36902 }, { "epoch": 2.9, "learning_rate": 7.622376825259236e-07, "loss": 1.4395, "step": 36903 }, { "epoch": 2.9, "learning_rate": 7.609937586533665e-07, "loss": 1.4515, "step": 36904 }, { "epoch": 2.9, "learning_rate": 7.59750848031293e-07, "loss": 1.4409, "step": 36905 }, { "epoch": 2.9, "learning_rate": 7.58508950668163e-07, "loss": 1.5041, "step": 36906 }, { "epoch": 2.9, "learning_rate": 7.572680665724029e-07, "loss": 1.4339, "step": 36907 }, { "epoch": 2.9, "learning_rate": 7.560281957524228e-07, "loss": 1.4288, "step": 36908 }, { "epoch": 2.9, "learning_rate": 7.547893382166659e-07, "loss": 1.4165, "step": 36909 }, { "epoch": 2.9, "learning_rate": 7.535514939735088e-07, "loss": 1.4252, "step": 36910 }, { "epoch": 2.9, "learning_rate": 7.523146630313781e-07, "loss": 1.443, "step": 36911 }, { "epoch": 2.9, "learning_rate": 7.510788453986838e-07, "loss": 1.4384, "step": 36912 }, { "epoch": 2.9, "learning_rate": 7.498440410837858e-07, "loss": 1.4766, "step": 36913 }, { "epoch": 2.9, "learning_rate": 7.486102500950941e-07, "loss": 1.4864, "step": 36914 }, { "epoch": 2.9, "learning_rate": 7.473774724409853e-07, "loss": 1.3953, "step": 36915 }, { "epoch": 2.9, "learning_rate": 7.461457081298028e-07, "loss": 1.4346, "step": 36916 }, { "epoch": 2.9, "learning_rate": 7.449149571699398e-07, "loss": 1.4958, "step": 36917 }, { "epoch": 2.9, "learning_rate": 7.43685219569723e-07, "loss": 1.4667, "step": 36918 }, { "epoch": 2.9, "learning_rate": 7.424564953375289e-07, "loss": 1.4699, "step": 36919 }, { "epoch": 2.9, "learning_rate": 7.412287844816845e-07, "loss": 1.4384, "step": 36920 }, { "epoch": 2.9, "learning_rate": 7.400020870105328e-07, "loss": 1.4445, "step": 36921 }, { "epoch": 2.91, "learning_rate": 7.38776402932384e-07, "loss": 1.4782, "step": 36922 }, { "epoch": 2.91, "learning_rate": 7.375517322555813e-07, "loss": 1.4647, "step": 36923 }, { "epoch": 2.91, "learning_rate": 7.363280749884349e-07, "loss": 1.4121, "step": 36924 }, { "epoch": 2.91, "learning_rate": 7.351054311392546e-07, "loss": 1.4147, "step": 36925 }, { "epoch": 2.91, "learning_rate": 7.338838007163339e-07, "loss": 1.4592, "step": 36926 }, { "epoch": 2.91, "learning_rate": 7.326631837279662e-07, "loss": 1.3914, "step": 36927 }, { "epoch": 2.91, "learning_rate": 7.314435801824448e-07, "loss": 1.468, "step": 36928 }, { "epoch": 2.91, "learning_rate": 7.302249900880464e-07, "loss": 1.3865, "step": 36929 }, { "epoch": 2.91, "learning_rate": 7.290074134530477e-07, "loss": 1.4552, "step": 36930 }, { "epoch": 2.91, "learning_rate": 7.277908502857255e-07, "loss": 1.5316, "step": 36931 }, { "epoch": 2.91, "learning_rate": 7.265753005943231e-07, "loss": 1.4628, "step": 36932 }, { "epoch": 2.91, "learning_rate": 7.25360764387084e-07, "loss": 1.4555, "step": 36933 }, { "epoch": 2.91, "learning_rate": 7.241472416722849e-07, "loss": 1.4146, "step": 36934 }, { "epoch": 2.91, "learning_rate": 7.229347324581359e-07, "loss": 1.3827, "step": 36935 }, { "epoch": 2.91, "learning_rate": 7.217232367528969e-07, "loss": 1.4071, "step": 36936 }, { "epoch": 2.91, "learning_rate": 7.205127545647616e-07, "loss": 1.4072, "step": 36937 }, { "epoch": 2.91, "learning_rate": 7.193032859019732e-07, "loss": 1.4261, "step": 36938 }, { "epoch": 2.91, "learning_rate": 7.180948307727418e-07, "loss": 1.4052, "step": 36939 }, { "epoch": 2.91, "learning_rate": 7.168873891852611e-07, "loss": 1.3951, "step": 36940 }, { "epoch": 2.91, "learning_rate": 7.156809611477243e-07, "loss": 1.4757, "step": 36941 }, { "epoch": 2.91, "learning_rate": 7.144755466683416e-07, "loss": 1.4627, "step": 36942 }, { "epoch": 2.91, "learning_rate": 7.132711457552898e-07, "loss": 1.4686, "step": 36943 }, { "epoch": 2.91, "learning_rate": 7.120677584167456e-07, "loss": 1.4515, "step": 36944 }, { "epoch": 2.91, "learning_rate": 7.108653846608691e-07, "loss": 1.4504, "step": 36945 }, { "epoch": 2.91, "learning_rate": 7.096640244958374e-07, "loss": 1.4431, "step": 36946 }, { "epoch": 2.91, "learning_rate": 7.084636779297936e-07, "loss": 1.4493, "step": 36947 }, { "epoch": 2.91, "learning_rate": 7.072643449709148e-07, "loss": 1.4502, "step": 36948 }, { "epoch": 2.91, "learning_rate": 7.060660256273109e-07, "loss": 1.4397, "step": 36949 }, { "epoch": 2.91, "learning_rate": 7.048687199071424e-07, "loss": 1.428, "step": 36950 }, { "epoch": 2.91, "learning_rate": 7.036724278185024e-07, "loss": 1.4253, "step": 36951 }, { "epoch": 2.91, "learning_rate": 7.024771493695513e-07, "loss": 1.4567, "step": 36952 }, { "epoch": 2.91, "learning_rate": 7.012828845683994e-07, "loss": 1.4094, "step": 36953 }, { "epoch": 2.91, "learning_rate": 7.000896334231398e-07, "loss": 1.4429, "step": 36954 }, { "epoch": 2.91, "learning_rate": 6.988973959418831e-07, "loss": 1.4407, "step": 36955 }, { "epoch": 2.91, "learning_rate": 6.977061721327226e-07, "loss": 1.4305, "step": 36956 }, { "epoch": 2.91, "learning_rate": 6.965159620037353e-07, "loss": 1.4901, "step": 36957 }, { "epoch": 2.91, "learning_rate": 6.953267655630146e-07, "loss": 1.4433, "step": 36958 }, { "epoch": 2.91, "learning_rate": 6.941385828186541e-07, "loss": 1.4541, "step": 36959 }, { "epoch": 2.91, "learning_rate": 6.929514137786807e-07, "loss": 1.4108, "step": 36960 }, { "epoch": 2.91, "learning_rate": 6.917652584511712e-07, "loss": 1.4201, "step": 36961 }, { "epoch": 2.91, "learning_rate": 6.90580116844186e-07, "loss": 1.4823, "step": 36962 }, { "epoch": 2.91, "learning_rate": 6.893959889657685e-07, "loss": 1.4335, "step": 36963 }, { "epoch": 2.91, "learning_rate": 6.882128748239457e-07, "loss": 1.4228, "step": 36964 }, { "epoch": 2.91, "learning_rate": 6.870307744267611e-07, "loss": 1.4465, "step": 36965 }, { "epoch": 2.91, "learning_rate": 6.858496877822417e-07, "loss": 1.427, "step": 36966 }, { "epoch": 2.91, "learning_rate": 6.846696148984144e-07, "loss": 1.492, "step": 36967 }, { "epoch": 2.91, "learning_rate": 6.834905557832726e-07, "loss": 1.4458, "step": 36968 }, { "epoch": 2.91, "learning_rate": 6.823125104448268e-07, "loss": 1.4367, "step": 36969 }, { "epoch": 2.91, "learning_rate": 6.811354788910872e-07, "loss": 1.4353, "step": 36970 }, { "epoch": 2.91, "learning_rate": 6.799594611300307e-07, "loss": 1.4756, "step": 36971 }, { "epoch": 2.91, "learning_rate": 6.78784457169651e-07, "loss": 1.464, "step": 36972 }, { "epoch": 2.91, "learning_rate": 6.77610467017925e-07, "loss": 1.4305, "step": 36973 }, { "epoch": 2.91, "learning_rate": 6.76437490682813e-07, "loss": 1.409, "step": 36974 }, { "epoch": 2.91, "learning_rate": 6.752655281722918e-07, "loss": 1.4564, "step": 36975 }, { "epoch": 2.91, "learning_rate": 6.74094579494322e-07, "loss": 1.466, "step": 36976 }, { "epoch": 2.91, "learning_rate": 6.729246446568304e-07, "loss": 1.4559, "step": 36977 }, { "epoch": 2.91, "learning_rate": 6.717557236677773e-07, "loss": 1.3857, "step": 36978 }, { "epoch": 2.91, "learning_rate": 6.705878165351064e-07, "loss": 1.4436, "step": 36979 }, { "epoch": 2.91, "learning_rate": 6.694209232667446e-07, "loss": 1.4477, "step": 36980 }, { "epoch": 2.91, "learning_rate": 6.682550438705859e-07, "loss": 1.4855, "step": 36981 }, { "epoch": 2.91, "learning_rate": 6.670901783545735e-07, "loss": 1.4737, "step": 36982 }, { "epoch": 2.91, "learning_rate": 6.659263267266179e-07, "loss": 1.433, "step": 36983 }, { "epoch": 2.91, "learning_rate": 6.647634889945963e-07, "loss": 1.4108, "step": 36984 }, { "epoch": 2.91, "learning_rate": 6.636016651664355e-07, "loss": 1.4063, "step": 36985 }, { "epoch": 2.91, "learning_rate": 6.624408552500127e-07, "loss": 1.4891, "step": 36986 }, { "epoch": 2.91, "learning_rate": 6.612810592532048e-07, "loss": 1.482, "step": 36987 }, { "epoch": 2.91, "learning_rate": 6.601222771838721e-07, "loss": 1.4881, "step": 36988 }, { "epoch": 2.91, "learning_rate": 6.589645090499085e-07, "loss": 1.4542, "step": 36989 }, { "epoch": 2.91, "learning_rate": 6.578077548591576e-07, "loss": 1.4318, "step": 36990 }, { "epoch": 2.91, "learning_rate": 6.566520146194798e-07, "loss": 1.4868, "step": 36991 }, { "epoch": 2.91, "learning_rate": 6.554972883387189e-07, "loss": 1.4473, "step": 36992 }, { "epoch": 2.91, "learning_rate": 6.543435760247185e-07, "loss": 1.455, "step": 36993 }, { "epoch": 2.91, "learning_rate": 6.531908776853057e-07, "loss": 1.4594, "step": 36994 }, { "epoch": 2.91, "learning_rate": 6.520391933283076e-07, "loss": 1.402, "step": 36995 }, { "epoch": 2.91, "learning_rate": 6.508885229615512e-07, "loss": 1.4089, "step": 36996 }, { "epoch": 2.91, "learning_rate": 6.497388665928471e-07, "loss": 1.4798, "step": 36997 }, { "epoch": 2.91, "learning_rate": 6.48590224229989e-07, "loss": 1.4416, "step": 36998 }, { "epoch": 2.91, "learning_rate": 6.474425958808038e-07, "loss": 1.4478, "step": 36999 }, { "epoch": 2.91, "learning_rate": 6.462959815530522e-07, "loss": 1.4577, "step": 37000 }, { "epoch": 2.91, "learning_rate": 6.451503812545278e-07, "loss": 1.4983, "step": 37001 }, { "epoch": 2.91, "learning_rate": 6.440057949930078e-07, "loss": 1.4215, "step": 37002 }, { "epoch": 2.91, "learning_rate": 6.428622227762692e-07, "loss": 1.44, "step": 37003 }, { "epoch": 2.91, "learning_rate": 6.417196646120726e-07, "loss": 1.4452, "step": 37004 }, { "epoch": 2.91, "learning_rate": 6.405781205081784e-07, "loss": 1.4652, "step": 37005 }, { "epoch": 2.91, "learning_rate": 6.39437590472347e-07, "loss": 1.4743, "step": 37006 }, { "epoch": 2.91, "learning_rate": 6.382980745123056e-07, "loss": 1.4659, "step": 37007 }, { "epoch": 2.91, "learning_rate": 6.371595726357815e-07, "loss": 1.4185, "step": 37008 }, { "epoch": 2.91, "learning_rate": 6.360220848505349e-07, "loss": 1.3977, "step": 37009 }, { "epoch": 2.91, "learning_rate": 6.348856111642598e-07, "loss": 1.4341, "step": 37010 }, { "epoch": 2.91, "learning_rate": 6.337501515846998e-07, "loss": 1.4082, "step": 37011 }, { "epoch": 2.91, "learning_rate": 6.326157061195325e-07, "loss": 1.4359, "step": 37012 }, { "epoch": 2.91, "learning_rate": 6.314822747764847e-07, "loss": 1.4219, "step": 37013 }, { "epoch": 2.91, "learning_rate": 6.303498575632504e-07, "loss": 1.4351, "step": 37014 }, { "epoch": 2.91, "learning_rate": 6.292184544875067e-07, "loss": 1.4999, "step": 37015 }, { "epoch": 2.91, "learning_rate": 6.280880655569309e-07, "loss": 1.3828, "step": 37016 }, { "epoch": 2.91, "learning_rate": 6.269586907792168e-07, "loss": 1.4204, "step": 37017 }, { "epoch": 2.91, "learning_rate": 6.258303301620249e-07, "loss": 1.4672, "step": 37018 }, { "epoch": 2.91, "learning_rate": 6.247029837130158e-07, "loss": 1.4422, "step": 37019 }, { "epoch": 2.91, "learning_rate": 6.235766514398166e-07, "loss": 1.4198, "step": 37020 }, { "epoch": 2.91, "learning_rate": 6.224513333501213e-07, "loss": 1.3874, "step": 37021 }, { "epoch": 2.91, "learning_rate": 6.213270294515404e-07, "loss": 1.4794, "step": 37022 }, { "epoch": 2.91, "learning_rate": 6.202037397517346e-07, "loss": 1.4272, "step": 37023 }, { "epoch": 2.91, "learning_rate": 6.190814642582809e-07, "loss": 1.4457, "step": 37024 }, { "epoch": 2.91, "learning_rate": 6.1796020297884e-07, "loss": 1.4431, "step": 37025 }, { "epoch": 2.91, "learning_rate": 6.168399559210224e-07, "loss": 1.4162, "step": 37026 }, { "epoch": 2.91, "learning_rate": 6.157207230924222e-07, "loss": 1.436, "step": 37027 }, { "epoch": 2.91, "learning_rate": 6.146025045006331e-07, "loss": 1.4787, "step": 37028 }, { "epoch": 2.91, "learning_rate": 6.134853001532658e-07, "loss": 1.4056, "step": 37029 }, { "epoch": 2.91, "learning_rate": 6.123691100578976e-07, "loss": 1.4623, "step": 37030 }, { "epoch": 2.91, "learning_rate": 6.11253934222089e-07, "loss": 1.4417, "step": 37031 }, { "epoch": 2.91, "learning_rate": 6.101397726534341e-07, "loss": 1.4635, "step": 37032 }, { "epoch": 2.91, "learning_rate": 6.090266253594933e-07, "loss": 1.4466, "step": 37033 }, { "epoch": 2.91, "learning_rate": 6.079144923478108e-07, "loss": 1.4499, "step": 37034 }, { "epoch": 2.91, "learning_rate": 6.06803373625947e-07, "loss": 1.4623, "step": 37035 }, { "epoch": 2.91, "learning_rate": 6.056932692014627e-07, "loss": 1.481, "step": 37036 }, { "epoch": 2.91, "learning_rate": 6.045841790818684e-07, "loss": 1.4338, "step": 37037 }, { "epoch": 2.91, "learning_rate": 6.034761032747082e-07, "loss": 1.4517, "step": 37038 }, { "epoch": 2.91, "learning_rate": 6.023690417874926e-07, "loss": 1.4183, "step": 37039 }, { "epoch": 2.91, "learning_rate": 6.012629946277492e-07, "loss": 1.4401, "step": 37040 }, { "epoch": 2.91, "learning_rate": 6.001579618029884e-07, "loss": 1.4898, "step": 37041 }, { "epoch": 2.91, "learning_rate": 5.990539433207043e-07, "loss": 1.4228, "step": 37042 }, { "epoch": 2.91, "learning_rate": 5.979509391884074e-07, "loss": 1.4853, "step": 37043 }, { "epoch": 2.91, "learning_rate": 5.968489494135753e-07, "loss": 1.4005, "step": 37044 }, { "epoch": 2.91, "learning_rate": 5.957479740036853e-07, "loss": 1.3924, "step": 37045 }, { "epoch": 2.91, "learning_rate": 5.946480129662146e-07, "loss": 1.4571, "step": 37046 }, { "epoch": 2.91, "learning_rate": 5.935490663086572e-07, "loss": 1.4521, "step": 37047 }, { "epoch": 2.91, "learning_rate": 5.924511340384408e-07, "loss": 1.4679, "step": 37048 }, { "epoch": 2.92, "learning_rate": 5.913542161630092e-07, "loss": 1.4575, "step": 37049 }, { "epoch": 2.92, "learning_rate": 5.902583126898563e-07, "loss": 1.4975, "step": 37050 }, { "epoch": 2.92, "learning_rate": 5.891634236263931e-07, "loss": 1.4999, "step": 37051 }, { "epoch": 2.92, "learning_rate": 5.880695489800635e-07, "loss": 1.4208, "step": 37052 }, { "epoch": 2.92, "learning_rate": 5.869766887582783e-07, "loss": 1.434, "step": 37053 }, { "epoch": 2.92, "learning_rate": 5.858848429684648e-07, "loss": 1.469, "step": 37054 }, { "epoch": 2.92, "learning_rate": 5.847940116180505e-07, "loss": 1.4825, "step": 37055 }, { "epoch": 2.92, "learning_rate": 5.837041947144294e-07, "loss": 1.4325, "step": 37056 }, { "epoch": 2.92, "learning_rate": 5.826153922650123e-07, "loss": 1.4666, "step": 37057 }, { "epoch": 2.92, "learning_rate": 5.815276042771599e-07, "loss": 1.4528, "step": 37058 }, { "epoch": 2.92, "learning_rate": 5.80440830758283e-07, "loss": 1.4158, "step": 37059 }, { "epoch": 2.92, "learning_rate": 5.793550717157758e-07, "loss": 1.4388, "step": 37060 }, { "epoch": 2.92, "learning_rate": 5.782703271569822e-07, "loss": 1.4198, "step": 37061 }, { "epoch": 2.92, "learning_rate": 5.77186597089263e-07, "loss": 1.4711, "step": 37062 }, { "epoch": 2.92, "learning_rate": 5.761038815199958e-07, "loss": 1.4473, "step": 37063 }, { "epoch": 2.92, "learning_rate": 5.750221804565247e-07, "loss": 1.4619, "step": 37064 }, { "epoch": 2.92, "learning_rate": 5.739414939061937e-07, "loss": 1.4291, "step": 37065 }, { "epoch": 2.92, "learning_rate": 5.72861821876347e-07, "loss": 1.4304, "step": 37066 }, { "epoch": 2.92, "learning_rate": 5.717831643742954e-07, "loss": 1.465, "step": 37067 }, { "epoch": 2.92, "learning_rate": 5.70705521407383e-07, "loss": 1.3993, "step": 37068 }, { "epoch": 2.92, "learning_rate": 5.696288929829206e-07, "loss": 1.4516, "step": 37069 }, { "epoch": 2.92, "learning_rate": 5.685532791082026e-07, "loss": 1.4203, "step": 37070 }, { "epoch": 2.92, "learning_rate": 5.674786797905562e-07, "loss": 1.4729, "step": 37071 }, { "epoch": 2.92, "learning_rate": 5.664050950372589e-07, "loss": 1.4207, "step": 37072 }, { "epoch": 2.92, "learning_rate": 5.653325248556051e-07, "loss": 1.4549, "step": 37073 }, { "epoch": 2.92, "learning_rate": 5.642609692528888e-07, "loss": 1.3821, "step": 37074 }, { "epoch": 2.92, "learning_rate": 5.631904282363709e-07, "loss": 1.463, "step": 37075 }, { "epoch": 2.92, "learning_rate": 5.621209018133121e-07, "loss": 1.4691, "step": 37076 }, { "epoch": 2.92, "learning_rate": 5.610523899910068e-07, "loss": 1.4933, "step": 37077 }, { "epoch": 2.92, "learning_rate": 5.599848927766826e-07, "loss": 1.4488, "step": 37078 }, { "epoch": 2.92, "learning_rate": 5.589184101775835e-07, "loss": 1.4079, "step": 37079 }, { "epoch": 2.92, "learning_rate": 5.578529422009537e-07, "loss": 1.4486, "step": 37080 }, { "epoch": 2.92, "learning_rate": 5.567884888540542e-07, "loss": 1.4937, "step": 37081 }, { "epoch": 2.92, "learning_rate": 5.557250501440791e-07, "loss": 1.4054, "step": 37082 }, { "epoch": 2.92, "learning_rate": 5.546626260782561e-07, "loss": 1.4805, "step": 37083 }, { "epoch": 2.92, "learning_rate": 5.536012166638127e-07, "loss": 1.5109, "step": 37084 }, { "epoch": 2.92, "learning_rate": 5.52540821907943e-07, "loss": 1.4892, "step": 37085 }, { "epoch": 2.92, "learning_rate": 5.514814418178581e-07, "loss": 1.3923, "step": 37086 }, { "epoch": 2.92, "learning_rate": 5.504230764007355e-07, "loss": 1.4524, "step": 37087 }, { "epoch": 2.92, "learning_rate": 5.49365725663753e-07, "loss": 1.4126, "step": 37088 }, { "epoch": 2.92, "learning_rate": 5.483093896141211e-07, "loss": 1.4253, "step": 37089 }, { "epoch": 2.92, "learning_rate": 5.472540682589843e-07, "loss": 1.4637, "step": 37090 }, { "epoch": 2.92, "learning_rate": 5.461997616055203e-07, "loss": 1.4524, "step": 37091 }, { "epoch": 2.92, "learning_rate": 5.451464696608898e-07, "loss": 1.4123, "step": 37092 }, { "epoch": 2.92, "learning_rate": 5.440941924322373e-07, "loss": 1.4494, "step": 37093 }, { "epoch": 2.92, "learning_rate": 5.43042929926707e-07, "loss": 1.4365, "step": 37094 }, { "epoch": 2.92, "learning_rate": 5.419926821514431e-07, "loss": 1.3675, "step": 37095 }, { "epoch": 2.92, "learning_rate": 5.409434491135567e-07, "loss": 1.4774, "step": 37096 }, { "epoch": 2.92, "learning_rate": 5.39895230820192e-07, "loss": 1.4244, "step": 37097 }, { "epoch": 2.92, "learning_rate": 5.388480272784601e-07, "loss": 1.4559, "step": 37098 }, { "epoch": 2.92, "learning_rate": 5.378018384954719e-07, "loss": 1.43, "step": 37099 }, { "epoch": 2.92, "learning_rate": 5.367566644783383e-07, "loss": 1.4426, "step": 37100 }, { "epoch": 2.92, "learning_rate": 5.357125052341371e-07, "loss": 1.3898, "step": 37101 }, { "epoch": 2.92, "learning_rate": 5.346693607699625e-07, "loss": 1.4483, "step": 37102 }, { "epoch": 2.92, "learning_rate": 5.336272310929091e-07, "loss": 1.409, "step": 37103 }, { "epoch": 2.92, "learning_rate": 5.325861162100375e-07, "loss": 1.4351, "step": 37104 }, { "epoch": 2.92, "learning_rate": 5.315460161284423e-07, "loss": 1.4556, "step": 37105 }, { "epoch": 2.92, "learning_rate": 5.305069308551513e-07, "loss": 1.4258, "step": 37106 }, { "epoch": 2.92, "learning_rate": 5.294688603972253e-07, "loss": 1.4185, "step": 37107 }, { "epoch": 2.92, "learning_rate": 5.284318047617254e-07, "loss": 1.4559, "step": 37108 }, { "epoch": 2.92, "learning_rate": 5.273957639556958e-07, "loss": 1.4549, "step": 37109 }, { "epoch": 2.92, "learning_rate": 5.263607379861645e-07, "loss": 1.4439, "step": 37110 }, { "epoch": 2.92, "learning_rate": 5.25326726860159e-07, "loss": 1.4388, "step": 37111 }, { "epoch": 2.92, "learning_rate": 5.242937305846906e-07, "loss": 1.464, "step": 37112 }, { "epoch": 2.92, "learning_rate": 5.232617491667701e-07, "loss": 1.4145, "step": 37113 }, { "epoch": 2.92, "learning_rate": 5.222307826134253e-07, "loss": 1.4871, "step": 37114 }, { "epoch": 2.92, "learning_rate": 5.212008309316506e-07, "loss": 1.4486, "step": 37115 }, { "epoch": 2.92, "learning_rate": 5.201718941284239e-07, "loss": 1.4812, "step": 37116 }, { "epoch": 2.92, "learning_rate": 5.191439722107393e-07, "loss": 1.4507, "step": 37117 }, { "epoch": 2.92, "learning_rate": 5.181170651855915e-07, "loss": 1.39, "step": 37118 }, { "epoch": 2.92, "learning_rate": 5.170911730599248e-07, "loss": 1.4342, "step": 37119 }, { "epoch": 2.92, "learning_rate": 5.160662958407335e-07, "loss": 1.4156, "step": 37120 }, { "epoch": 2.92, "learning_rate": 5.150424335349457e-07, "loss": 1.4235, "step": 37121 }, { "epoch": 2.92, "learning_rate": 5.140195861495223e-07, "loss": 1.4332, "step": 37122 }, { "epoch": 2.92, "learning_rate": 5.129977536914242e-07, "loss": 1.4721, "step": 37123 }, { "epoch": 2.92, "learning_rate": 5.119769361675629e-07, "loss": 1.4313, "step": 37124 }, { "epoch": 2.92, "learning_rate": 5.109571335848994e-07, "loss": 1.4262, "step": 37125 }, { "epoch": 2.92, "learning_rate": 5.099383459503448e-07, "loss": 1.4431, "step": 37126 }, { "epoch": 2.92, "learning_rate": 5.089205732707935e-07, "loss": 1.4663, "step": 37127 }, { "epoch": 2.92, "learning_rate": 5.0790381555319e-07, "loss": 1.4663, "step": 37128 }, { "epoch": 2.92, "learning_rate": 5.068880728044289e-07, "loss": 1.4676, "step": 37129 }, { "epoch": 2.92, "learning_rate": 5.058733450313878e-07, "loss": 1.4346, "step": 37130 }, { "epoch": 2.92, "learning_rate": 5.048596322409615e-07, "loss": 1.4981, "step": 37131 }, { "epoch": 2.92, "learning_rate": 5.038469344400609e-07, "loss": 1.4702, "step": 37132 }, { "epoch": 2.92, "learning_rate": 5.028352516355305e-07, "loss": 1.4501, "step": 37133 }, { "epoch": 2.92, "learning_rate": 5.018245838342483e-07, "loss": 1.4182, "step": 37134 }, { "epoch": 2.92, "learning_rate": 5.008149310430753e-07, "loss": 1.4625, "step": 37135 }, { "epoch": 2.92, "learning_rate": 4.998062932688728e-07, "loss": 1.4457, "step": 37136 }, { "epoch": 2.92, "learning_rate": 4.987986705184854e-07, "loss": 1.4733, "step": 37137 }, { "epoch": 2.92, "learning_rate": 4.977920627987575e-07, "loss": 1.4629, "step": 37138 }, { "epoch": 2.92, "learning_rate": 4.96786470116517e-07, "loss": 1.4296, "step": 37139 }, { "epoch": 2.92, "learning_rate": 4.957818924785917e-07, "loss": 1.4247, "step": 37140 }, { "epoch": 2.92, "learning_rate": 4.947783298917929e-07, "loss": 1.4485, "step": 37141 }, { "epoch": 2.92, "learning_rate": 4.937757823629651e-07, "loss": 1.4458, "step": 37142 }, { "epoch": 2.92, "learning_rate": 4.927742498988862e-07, "loss": 1.4407, "step": 37143 }, { "epoch": 2.92, "learning_rate": 4.917737325063675e-07, "loss": 1.4231, "step": 37144 }, { "epoch": 2.92, "learning_rate": 4.907742301921868e-07, "loss": 1.4765, "step": 37145 }, { "epoch": 2.92, "learning_rate": 4.897757429631555e-07, "loss": 1.416, "step": 37146 }, { "epoch": 2.92, "learning_rate": 4.887782708260346e-07, "loss": 1.4343, "step": 37147 }, { "epoch": 2.92, "learning_rate": 4.877818137876022e-07, "loss": 1.4919, "step": 37148 }, { "epoch": 2.92, "learning_rate": 4.867863718546361e-07, "loss": 1.4254, "step": 37149 }, { "epoch": 2.92, "learning_rate": 4.85791945033881e-07, "loss": 1.4077, "step": 37150 }, { "epoch": 2.92, "learning_rate": 4.847985333320647e-07, "loss": 1.3866, "step": 37151 }, { "epoch": 2.92, "learning_rate": 4.83806136755982e-07, "loss": 1.45, "step": 37152 }, { "epoch": 2.92, "learning_rate": 4.82814755312344e-07, "loss": 1.4375, "step": 37153 }, { "epoch": 2.92, "learning_rate": 4.818243890078788e-07, "loss": 1.3966, "step": 37154 }, { "epoch": 2.92, "learning_rate": 4.808350378493142e-07, "loss": 1.4056, "step": 37155 }, { "epoch": 2.92, "learning_rate": 4.798467018433616e-07, "loss": 1.4295, "step": 37156 }, { "epoch": 2.92, "learning_rate": 4.788593809967489e-07, "loss": 1.4658, "step": 37157 }, { "epoch": 2.92, "learning_rate": 4.778730753161542e-07, "loss": 1.4316, "step": 37158 }, { "epoch": 2.92, "learning_rate": 4.768877848083052e-07, "loss": 1.4337, "step": 37159 }, { "epoch": 2.92, "learning_rate": 4.7590350947986353e-07, "loss": 1.4507, "step": 37160 }, { "epoch": 2.92, "learning_rate": 4.749202493375237e-07, "loss": 1.4959, "step": 37161 }, { "epoch": 2.92, "learning_rate": 4.739380043879637e-07, "loss": 1.3826, "step": 37162 }, { "epoch": 2.92, "learning_rate": 4.729567746378449e-07, "loss": 1.3945, "step": 37163 }, { "epoch": 2.92, "learning_rate": 4.719765600938452e-07, "loss": 1.4555, "step": 37164 }, { "epoch": 2.92, "learning_rate": 4.7099736076259274e-07, "loss": 1.451, "step": 37165 }, { "epoch": 2.92, "learning_rate": 4.700191766507655e-07, "loss": 1.4414, "step": 37166 }, { "epoch": 2.92, "learning_rate": 4.6904200776499145e-07, "loss": 1.4778, "step": 37167 }, { "epoch": 2.92, "learning_rate": 4.680658541118987e-07, "loss": 1.4237, "step": 37168 }, { "epoch": 2.92, "learning_rate": 4.6709071569811517e-07, "loss": 1.429, "step": 37169 }, { "epoch": 2.92, "learning_rate": 4.66116592530269e-07, "loss": 1.5003, "step": 37170 }, { "epoch": 2.92, "learning_rate": 4.651434846149715e-07, "loss": 1.4308, "step": 37171 }, { "epoch": 2.92, "learning_rate": 4.641713919588341e-07, "loss": 1.4922, "step": 37172 }, { "epoch": 2.92, "learning_rate": 4.6320031456845153e-07, "loss": 1.4255, "step": 37173 }, { "epoch": 2.92, "learning_rate": 4.6223025245041844e-07, "loss": 1.4273, "step": 37174 }, { "epoch": 2.92, "learning_rate": 4.6126120561131296e-07, "loss": 1.4606, "step": 37175 }, { "epoch": 2.93, "learning_rate": 4.602931740577298e-07, "loss": 1.4497, "step": 37176 }, { "epoch": 2.93, "learning_rate": 4.5932615779621373e-07, "loss": 1.4498, "step": 37177 }, { "epoch": 2.93, "learning_rate": 4.5836015683337615e-07, "loss": 1.4704, "step": 37178 }, { "epoch": 2.93, "learning_rate": 4.5739517117572843e-07, "loss": 1.4413, "step": 37179 }, { "epoch": 2.93, "learning_rate": 4.5643120082984874e-07, "loss": 1.4706, "step": 37180 }, { "epoch": 2.93, "learning_rate": 4.554682458022818e-07, "loss": 1.4637, "step": 37181 }, { "epoch": 2.93, "learning_rate": 4.5450630609955576e-07, "loss": 1.4302, "step": 37182 }, { "epoch": 2.93, "learning_rate": 4.535453817282153e-07, "loss": 1.4441, "step": 37183 }, { "epoch": 2.93, "learning_rate": 4.52585472694772e-07, "loss": 1.4677, "step": 37184 }, { "epoch": 2.93, "learning_rate": 4.5162657900573717e-07, "loss": 1.424, "step": 37185 }, { "epoch": 2.93, "learning_rate": 4.5066870066763904e-07, "loss": 1.5204, "step": 37186 }, { "epoch": 2.93, "learning_rate": 4.497118376869724e-07, "loss": 1.4127, "step": 37187 }, { "epoch": 2.93, "learning_rate": 4.48755990070232e-07, "loss": 1.4797, "step": 37188 }, { "epoch": 2.93, "learning_rate": 4.47801157823896e-07, "loss": 1.437, "step": 37189 }, { "epoch": 2.93, "learning_rate": 4.4684734095447595e-07, "loss": 1.4762, "step": 37190 }, { "epoch": 2.93, "learning_rate": 4.4589453946843323e-07, "loss": 1.4072, "step": 37191 }, { "epoch": 2.93, "learning_rate": 4.4494275337221274e-07, "loss": 1.413, "step": 37192 }, { "epoch": 2.93, "learning_rate": 4.4399198267232593e-07, "loss": 1.5018, "step": 37193 }, { "epoch": 2.93, "learning_rate": 4.4304222737520103e-07, "loss": 1.4073, "step": 37194 }, { "epoch": 2.93, "learning_rate": 4.4209348748726614e-07, "loss": 1.4792, "step": 37195 }, { "epoch": 2.93, "learning_rate": 4.411457630149995e-07, "loss": 1.4646, "step": 37196 }, { "epoch": 2.93, "learning_rate": 4.4019905396482923e-07, "loss": 1.4644, "step": 37197 }, { "epoch": 2.93, "learning_rate": 4.392533603431503e-07, "loss": 1.4648, "step": 37198 }, { "epoch": 2.93, "learning_rate": 4.383086821564241e-07, "loss": 1.4486, "step": 37199 }, { "epoch": 2.93, "learning_rate": 4.3736501941104565e-07, "loss": 1.4675, "step": 37200 }, { "epoch": 2.93, "learning_rate": 4.364223721134097e-07, "loss": 1.4173, "step": 37201 }, { "epoch": 2.93, "learning_rate": 4.354807402699445e-07, "loss": 1.4745, "step": 37202 }, { "epoch": 2.93, "learning_rate": 4.3454012388701163e-07, "loss": 1.4129, "step": 37203 }, { "epoch": 2.93, "learning_rate": 4.3360052297102264e-07, "loss": 1.4639, "step": 37204 }, { "epoch": 2.93, "learning_rate": 4.3266193752835575e-07, "loss": 1.4686, "step": 37205 }, { "epoch": 2.93, "learning_rate": 4.3172436756537254e-07, "loss": 1.5114, "step": 37206 }, { "epoch": 2.93, "learning_rate": 4.307878130884346e-07, "loss": 1.4785, "step": 37207 }, { "epoch": 2.93, "learning_rate": 4.298522741039201e-07, "loss": 1.4548, "step": 37208 }, { "epoch": 2.93, "learning_rate": 4.289177506181574e-07, "loss": 1.4722, "step": 37209 }, { "epoch": 2.93, "learning_rate": 4.2798424263750795e-07, "loss": 1.4418, "step": 37210 }, { "epoch": 2.93, "learning_rate": 4.270517501683168e-07, "loss": 1.3994, "step": 37211 }, { "epoch": 2.93, "learning_rate": 4.261202732168789e-07, "loss": 1.432, "step": 37212 }, { "epoch": 2.93, "learning_rate": 4.251898117895558e-07, "loss": 1.4217, "step": 37213 }, { "epoch": 2.93, "learning_rate": 4.242603658926591e-07, "loss": 1.4339, "step": 37214 }, { "epoch": 2.93, "learning_rate": 4.2333193553248377e-07, "loss": 1.3771, "step": 37215 }, { "epoch": 2.93, "learning_rate": 4.2240452071534146e-07, "loss": 1.4398, "step": 37216 }, { "epoch": 2.93, "learning_rate": 4.214781214475271e-07, "loss": 1.3488, "step": 37217 }, { "epoch": 2.93, "learning_rate": 4.205527377353357e-07, "loss": 1.4545, "step": 37218 }, { "epoch": 2.93, "learning_rate": 4.196283695850455e-07, "loss": 1.3792, "step": 37219 }, { "epoch": 2.93, "learning_rate": 4.187050170029349e-07, "loss": 1.4696, "step": 37220 }, { "epoch": 2.93, "learning_rate": 4.177826799952655e-07, "loss": 1.4637, "step": 37221 }, { "epoch": 2.93, "learning_rate": 4.168613585683156e-07, "loss": 1.4415, "step": 37222 }, { "epoch": 2.93, "learning_rate": 4.1594105272833024e-07, "loss": 1.4392, "step": 37223 }, { "epoch": 2.93, "learning_rate": 4.1502176248153776e-07, "loss": 1.4373, "step": 37224 }, { "epoch": 2.93, "learning_rate": 4.141034878342164e-07, "loss": 1.397, "step": 37225 }, { "epoch": 2.93, "learning_rate": 4.1318622879257803e-07, "loss": 1.4312, "step": 37226 }, { "epoch": 2.93, "learning_rate": 4.122699853628675e-07, "loss": 1.442, "step": 37227 }, { "epoch": 2.93, "learning_rate": 4.113547575512799e-07, "loss": 1.4736, "step": 37228 }, { "epoch": 2.93, "learning_rate": 4.1044054536406025e-07, "loss": 1.4194, "step": 37229 }, { "epoch": 2.93, "learning_rate": 4.0952734880738694e-07, "loss": 1.4727, "step": 37230 }, { "epoch": 2.93, "learning_rate": 4.0861516788747163e-07, "loss": 1.4687, "step": 37231 }, { "epoch": 2.93, "learning_rate": 4.077040026105094e-07, "loss": 1.4144, "step": 37232 }, { "epoch": 2.93, "learning_rate": 4.0679385298267866e-07, "loss": 1.4423, "step": 37233 }, { "epoch": 2.93, "learning_rate": 4.058847190101744e-07, "loss": 1.4576, "step": 37234 }, { "epoch": 2.93, "learning_rate": 4.0497660069917505e-07, "loss": 1.4478, "step": 37235 }, { "epoch": 2.93, "learning_rate": 4.04069498055809e-07, "loss": 1.4251, "step": 37236 }, { "epoch": 2.93, "learning_rate": 4.031634110862547e-07, "loss": 1.4677, "step": 37237 }, { "epoch": 2.93, "learning_rate": 4.022583397966739e-07, "loss": 1.4543, "step": 37238 }, { "epoch": 2.93, "learning_rate": 4.013542841932116e-07, "loss": 1.4707, "step": 37239 }, { "epoch": 2.93, "learning_rate": 4.004512442819796e-07, "loss": 1.4627, "step": 37240 }, { "epoch": 2.93, "learning_rate": 3.995492200691397e-07, "loss": 1.4609, "step": 37241 }, { "epoch": 2.93, "learning_rate": 3.9864821156082026e-07, "loss": 1.428, "step": 37242 }, { "epoch": 2.93, "learning_rate": 3.9774821876309984e-07, "loss": 1.4563, "step": 37243 }, { "epoch": 2.93, "learning_rate": 3.968492416821234e-07, "loss": 1.4583, "step": 37244 }, { "epoch": 2.93, "learning_rate": 3.959512803239695e-07, "loss": 1.4215, "step": 37245 }, { "epoch": 2.93, "learning_rate": 3.950543346947499e-07, "loss": 1.4582, "step": 37246 }, { "epoch": 2.93, "learning_rate": 3.941584048005597e-07, "loss": 1.4176, "step": 37247 }, { "epoch": 2.93, "learning_rate": 3.932634906474774e-07, "loss": 1.4238, "step": 37248 }, { "epoch": 2.93, "learning_rate": 3.923695922415815e-07, "loss": 1.3941, "step": 37249 }, { "epoch": 2.93, "learning_rate": 3.9147670958891706e-07, "loss": 1.4525, "step": 37250 }, { "epoch": 2.93, "learning_rate": 3.905848426955793e-07, "loss": 1.3849, "step": 37251 }, { "epoch": 2.93, "learning_rate": 3.8969399156761336e-07, "loss": 1.4508, "step": 37252 }, { "epoch": 2.93, "learning_rate": 3.8880415621104776e-07, "loss": 1.4119, "step": 37253 }, { "epoch": 2.93, "learning_rate": 3.879153366319443e-07, "loss": 1.4133, "step": 37254 }, { "epoch": 2.93, "learning_rate": 3.8702753283633147e-07, "loss": 1.4335, "step": 37255 }, { "epoch": 2.93, "learning_rate": 3.861407448302545e-07, "loss": 1.5, "step": 37256 }, { "epoch": 2.93, "learning_rate": 3.8525497261969187e-07, "loss": 1.4712, "step": 37257 }, { "epoch": 2.93, "learning_rate": 3.843702162107054e-07, "loss": 1.4124, "step": 37258 }, { "epoch": 2.93, "learning_rate": 3.834864756092737e-07, "loss": 1.4538, "step": 37259 }, { "epoch": 2.93, "learning_rate": 3.8260375082139193e-07, "loss": 1.5048, "step": 37260 }, { "epoch": 2.93, "learning_rate": 3.8172204185308865e-07, "loss": 1.3976, "step": 37261 }, { "epoch": 2.93, "learning_rate": 3.80841348710309e-07, "loss": 1.4549, "step": 37262 }, { "epoch": 2.93, "learning_rate": 3.7996167139904833e-07, "loss": 1.4656, "step": 37263 }, { "epoch": 2.93, "learning_rate": 3.7908300992530174e-07, "loss": 1.4238, "step": 37264 }, { "epoch": 2.93, "learning_rate": 3.782053642949978e-07, "loss": 1.4509, "step": 37265 }, { "epoch": 2.93, "learning_rate": 3.773287345140985e-07, "loss": 1.4515, "step": 37266 }, { "epoch": 2.93, "learning_rate": 3.7645312058858234e-07, "loss": 1.4263, "step": 37267 }, { "epoch": 2.93, "learning_rate": 3.7557852252439457e-07, "loss": 1.4285, "step": 37268 }, { "epoch": 2.93, "learning_rate": 3.747049403274471e-07, "loss": 1.4508, "step": 37269 }, { "epoch": 2.93, "learning_rate": 3.738323740036686e-07, "loss": 1.4589, "step": 37270 }, { "epoch": 2.93, "learning_rate": 3.7296082355900426e-07, "loss": 1.4899, "step": 37271 }, { "epoch": 2.93, "learning_rate": 3.7209028899938265e-07, "loss": 1.4417, "step": 37272 }, { "epoch": 2.93, "learning_rate": 3.712207703306824e-07, "loss": 1.3617, "step": 37273 }, { "epoch": 2.93, "learning_rate": 3.7035226755881553e-07, "loss": 1.451, "step": 37274 }, { "epoch": 2.93, "learning_rate": 3.694847806896939e-07, "loss": 1.4395, "step": 37275 }, { "epoch": 2.93, "learning_rate": 3.6861830972919614e-07, "loss": 1.4541, "step": 37276 }, { "epoch": 2.93, "learning_rate": 3.677528546832176e-07, "loss": 1.428, "step": 37277 }, { "epoch": 2.93, "learning_rate": 3.6688841555760353e-07, "loss": 1.4204, "step": 37278 }, { "epoch": 2.93, "learning_rate": 3.6602499235824924e-07, "loss": 1.3997, "step": 37279 }, { "epoch": 2.93, "learning_rate": 3.651625850910167e-07, "loss": 1.4565, "step": 37280 }, { "epoch": 2.93, "learning_rate": 3.643011937617513e-07, "loss": 1.3966, "step": 37281 }, { "epoch": 2.93, "learning_rate": 3.6344081837629823e-07, "loss": 1.424, "step": 37282 }, { "epoch": 2.93, "learning_rate": 3.625814589405196e-07, "loss": 1.39, "step": 37283 }, { "epoch": 2.93, "learning_rate": 3.6172311546022737e-07, "loss": 1.473, "step": 37284 }, { "epoch": 2.93, "learning_rate": 3.6086578794126684e-07, "loss": 1.4305, "step": 37285 }, { "epoch": 2.93, "learning_rate": 3.6000947638943347e-07, "loss": 1.4625, "step": 37286 }, { "epoch": 2.93, "learning_rate": 3.591541808105558e-07, "loss": 1.4044, "step": 37287 }, { "epoch": 2.93, "learning_rate": 3.582999012104626e-07, "loss": 1.4579, "step": 37288 }, { "epoch": 2.93, "learning_rate": 3.5744663759491586e-07, "loss": 1.4914, "step": 37289 }, { "epoch": 2.93, "learning_rate": 3.5659438996974434e-07, "loss": 1.4681, "step": 37290 }, { "epoch": 2.93, "learning_rate": 3.5574315834071e-07, "loss": 1.4817, "step": 37291 }, { "epoch": 2.93, "learning_rate": 3.548929427135916e-07, "loss": 1.4407, "step": 37292 }, { "epoch": 2.93, "learning_rate": 3.540437430941678e-07, "loss": 1.441, "step": 37293 }, { "epoch": 2.93, "learning_rate": 3.5319555948821745e-07, "loss": 1.4626, "step": 37294 }, { "epoch": 2.93, "learning_rate": 3.5234839190148577e-07, "loss": 1.398, "step": 37295 }, { "epoch": 2.93, "learning_rate": 3.515022403397183e-07, "loss": 1.4629, "step": 37296 }, { "epoch": 2.93, "learning_rate": 3.5065710480867704e-07, "loss": 1.4695, "step": 37297 }, { "epoch": 2.93, "learning_rate": 3.498129853140741e-07, "loss": 1.4604, "step": 37298 }, { "epoch": 2.93, "learning_rate": 3.489698818616715e-07, "loss": 1.4729, "step": 37299 }, { "epoch": 2.93, "learning_rate": 3.481277944571814e-07, "loss": 1.4923, "step": 37300 }, { "epoch": 2.93, "learning_rate": 3.472867231063159e-07, "loss": 1.4314, "step": 37301 }, { "epoch": 2.93, "learning_rate": 3.4644666781478705e-07, "loss": 1.4817, "step": 37302 }, { "epoch": 2.94, "learning_rate": 3.456076285882903e-07, "loss": 1.4097, "step": 37303 }, { "epoch": 2.94, "learning_rate": 3.447696054325377e-07, "loss": 1.4018, "step": 37304 }, { "epoch": 2.94, "learning_rate": 3.4393259835322485e-07, "loss": 1.427, "step": 37305 }, { "epoch": 2.94, "learning_rate": 3.4309660735601374e-07, "loss": 1.4767, "step": 37306 }, { "epoch": 2.94, "learning_rate": 3.4226163244658323e-07, "loss": 1.4864, "step": 37307 }, { "epoch": 2.94, "learning_rate": 3.414276736306121e-07, "loss": 1.4556, "step": 37308 }, { "epoch": 2.94, "learning_rate": 3.4059473091376243e-07, "loss": 1.4413, "step": 37309 }, { "epoch": 2.94, "learning_rate": 3.397628043016798e-07, "loss": 1.3895, "step": 37310 }, { "epoch": 2.94, "learning_rate": 3.389318938000263e-07, "loss": 1.463, "step": 37311 }, { "epoch": 2.94, "learning_rate": 3.381019994144307e-07, "loss": 1.4357, "step": 37312 }, { "epoch": 2.94, "learning_rate": 3.37273121150522e-07, "loss": 1.3704, "step": 37313 }, { "epoch": 2.94, "learning_rate": 3.364452590139455e-07, "loss": 1.4502, "step": 37314 }, { "epoch": 2.94, "learning_rate": 3.356184130103301e-07, "loss": 1.5115, "step": 37315 }, { "epoch": 2.94, "learning_rate": 3.347925831452547e-07, "loss": 1.4662, "step": 37316 }, { "epoch": 2.94, "learning_rate": 3.3396776942434813e-07, "loss": 1.4141, "step": 37317 }, { "epoch": 2.94, "learning_rate": 3.331439718532225e-07, "loss": 1.5025, "step": 37318 }, { "epoch": 2.94, "learning_rate": 3.323211904374401e-07, "loss": 1.4572, "step": 37319 }, { "epoch": 2.94, "learning_rate": 3.3149942518261305e-07, "loss": 1.4081, "step": 37320 }, { "epoch": 2.94, "learning_rate": 3.3067867609430363e-07, "loss": 1.4517, "step": 37321 }, { "epoch": 2.94, "learning_rate": 3.298589431780907e-07, "loss": 1.5046, "step": 37322 }, { "epoch": 2.94, "learning_rate": 3.290402264395531e-07, "loss": 1.4393, "step": 37323 }, { "epoch": 2.94, "learning_rate": 3.282225258842197e-07, "loss": 1.4451, "step": 37324 }, { "epoch": 2.94, "learning_rate": 3.2740584151766947e-07, "loss": 1.4396, "step": 37325 }, { "epoch": 2.94, "learning_rate": 3.265901733454479e-07, "loss": 1.4464, "step": 37326 }, { "epoch": 2.94, "learning_rate": 3.257755213730673e-07, "loss": 1.4093, "step": 37327 }, { "epoch": 2.94, "learning_rate": 3.2496188560607317e-07, "loss": 1.4501, "step": 37328 }, { "epoch": 2.94, "learning_rate": 3.2414926604999446e-07, "loss": 1.488, "step": 37329 }, { "epoch": 2.94, "learning_rate": 3.2333766271034345e-07, "loss": 1.4263, "step": 37330 }, { "epoch": 2.94, "learning_rate": 3.2252707559263237e-07, "loss": 1.4527, "step": 37331 }, { "epoch": 2.94, "learning_rate": 3.2171750470237343e-07, "loss": 1.492, "step": 37332 }, { "epoch": 2.94, "learning_rate": 3.2090895004504567e-07, "loss": 1.4574, "step": 37333 }, { "epoch": 2.94, "learning_rate": 3.2010141162614465e-07, "loss": 1.4508, "step": 37334 }, { "epoch": 2.94, "learning_rate": 3.1929488945114933e-07, "loss": 1.4543, "step": 37335 }, { "epoch": 2.94, "learning_rate": 3.1848938352553865e-07, "loss": 1.4397, "step": 37336 }, { "epoch": 2.94, "learning_rate": 3.1768489385479154e-07, "loss": 1.428, "step": 37337 }, { "epoch": 2.94, "learning_rate": 3.1688142044437035e-07, "loss": 1.4226, "step": 37338 }, { "epoch": 2.94, "learning_rate": 3.160789632997207e-07, "loss": 1.4188, "step": 37339 }, { "epoch": 2.94, "learning_rate": 3.1527752242628824e-07, "loss": 1.4026, "step": 37340 }, { "epoch": 2.94, "learning_rate": 3.144770978295019e-07, "loss": 1.4878, "step": 37341 }, { "epoch": 2.94, "learning_rate": 3.1367768951484073e-07, "loss": 1.4021, "step": 37342 }, { "epoch": 2.94, "learning_rate": 3.128792974876837e-07, "loss": 1.4217, "step": 37343 }, { "epoch": 2.94, "learning_rate": 3.1208192175347647e-07, "loss": 1.4511, "step": 37344 }, { "epoch": 2.94, "learning_rate": 3.1128556231763134e-07, "loss": 1.4397, "step": 37345 }, { "epoch": 2.94, "learning_rate": 3.104902191855607e-07, "loss": 1.4243, "step": 37346 }, { "epoch": 2.94, "learning_rate": 3.096958923626436e-07, "loss": 1.4893, "step": 37347 }, { "epoch": 2.94, "learning_rate": 3.089025818542923e-07, "loss": 1.4416, "step": 37348 }, { "epoch": 2.94, "learning_rate": 3.0811028766588585e-07, "loss": 1.4512, "step": 37349 }, { "epoch": 2.94, "learning_rate": 3.073190098027867e-07, "loss": 1.4862, "step": 37350 }, { "epoch": 2.94, "learning_rate": 3.0652874827040705e-07, "loss": 1.4501, "step": 37351 }, { "epoch": 2.94, "learning_rate": 3.0573950307407614e-07, "loss": 1.4205, "step": 37352 }, { "epoch": 2.94, "learning_rate": 3.0495127421917285e-07, "loss": 1.5091, "step": 37353 }, { "epoch": 2.94, "learning_rate": 3.0416406171104303e-07, "loss": 1.4897, "step": 37354 }, { "epoch": 2.94, "learning_rate": 3.033778655550323e-07, "loss": 1.4575, "step": 37355 }, { "epoch": 2.94, "learning_rate": 3.025926857564698e-07, "loss": 1.5006, "step": 37356 }, { "epoch": 2.94, "learning_rate": 3.018085223206845e-07, "loss": 1.3943, "step": 37357 }, { "epoch": 2.94, "learning_rate": 3.010253752530223e-07, "loss": 1.4588, "step": 37358 }, { "epoch": 2.94, "learning_rate": 3.002432445587788e-07, "loss": 1.4743, "step": 37359 }, { "epoch": 2.94, "learning_rate": 2.994621302432831e-07, "loss": 1.47, "step": 37360 }, { "epoch": 2.94, "learning_rate": 2.986820323118311e-07, "loss": 1.4332, "step": 37361 }, { "epoch": 2.94, "learning_rate": 2.9790295076970175e-07, "loss": 1.4056, "step": 37362 }, { "epoch": 2.94, "learning_rate": 2.9712488562220747e-07, "loss": 1.4811, "step": 37363 }, { "epoch": 2.94, "learning_rate": 2.963478368746108e-07, "loss": 1.4382, "step": 37364 }, { "epoch": 2.94, "learning_rate": 2.955718045322075e-07, "loss": 1.4338, "step": 37365 }, { "epoch": 2.94, "learning_rate": 2.9479678860026e-07, "loss": 1.4269, "step": 37366 }, { "epoch": 2.94, "learning_rate": 2.9402278908403074e-07, "loss": 1.4388, "step": 37367 }, { "epoch": 2.94, "learning_rate": 2.932498059887656e-07, "loss": 1.3933, "step": 37368 }, { "epoch": 2.94, "learning_rate": 2.924778393197269e-07, "loss": 1.4438, "step": 37369 }, { "epoch": 2.94, "learning_rate": 2.917068890821439e-07, "loss": 1.4701, "step": 37370 }, { "epoch": 2.94, "learning_rate": 2.909369552812457e-07, "loss": 1.4494, "step": 37371 }, { "epoch": 2.94, "learning_rate": 2.9016803792227815e-07, "loss": 1.4151, "step": 37372 }, { "epoch": 2.94, "learning_rate": 2.894001370104537e-07, "loss": 1.477, "step": 37373 }, { "epoch": 2.94, "learning_rate": 2.8863325255098493e-07, "loss": 1.4342, "step": 37374 }, { "epoch": 2.94, "learning_rate": 2.8786738454906754e-07, "loss": 1.4373, "step": 37375 }, { "epoch": 2.94, "learning_rate": 2.871025330099308e-07, "loss": 1.3971, "step": 37376 }, { "epoch": 2.94, "learning_rate": 2.8633869793873723e-07, "loss": 1.3755, "step": 37377 }, { "epoch": 2.94, "learning_rate": 2.8557587934069923e-07, "loss": 1.4173, "step": 37378 }, { "epoch": 2.94, "learning_rate": 2.848140772209628e-07, "loss": 1.4574, "step": 37379 }, { "epoch": 2.94, "learning_rate": 2.8405329158474044e-07, "loss": 1.4627, "step": 37380 }, { "epoch": 2.94, "learning_rate": 2.8329352243714466e-07, "loss": 1.431, "step": 37381 }, { "epoch": 2.94, "learning_rate": 2.8253476978338797e-07, "loss": 1.4331, "step": 37382 }, { "epoch": 2.94, "learning_rate": 2.817770336285996e-07, "loss": 1.4476, "step": 37383 }, { "epoch": 2.94, "learning_rate": 2.8102031397792546e-07, "loss": 1.471, "step": 37384 }, { "epoch": 2.94, "learning_rate": 2.802646108364948e-07, "loss": 1.4476, "step": 37385 }, { "epoch": 2.94, "learning_rate": 2.7950992420943677e-07, "loss": 1.4332, "step": 37386 }, { "epoch": 2.94, "learning_rate": 2.787562541018973e-07, "loss": 1.4458, "step": 37387 }, { "epoch": 2.94, "learning_rate": 2.780036005189723e-07, "loss": 1.4457, "step": 37388 }, { "epoch": 2.94, "learning_rate": 2.7725196346579104e-07, "loss": 1.4549, "step": 37389 }, { "epoch": 2.94, "learning_rate": 2.7650134294743273e-07, "loss": 1.4257, "step": 37390 }, { "epoch": 2.94, "learning_rate": 2.7575173896901005e-07, "loss": 1.4164, "step": 37391 }, { "epoch": 2.94, "learning_rate": 2.750031515356188e-07, "loss": 1.4965, "step": 37392 }, { "epoch": 2.94, "learning_rate": 2.7425558065232165e-07, "loss": 1.4255, "step": 37393 }, { "epoch": 2.94, "learning_rate": 2.735090263241979e-07, "loss": 1.4932, "step": 37394 }, { "epoch": 2.94, "learning_rate": 2.727634885563268e-07, "loss": 1.4696, "step": 37395 }, { "epoch": 2.94, "learning_rate": 2.720189673537709e-07, "loss": 1.5018, "step": 37396 }, { "epoch": 2.94, "learning_rate": 2.7127546272155966e-07, "loss": 1.4669, "step": 37397 }, { "epoch": 2.94, "learning_rate": 2.7053297466478885e-07, "loss": 1.424, "step": 37398 }, { "epoch": 2.94, "learning_rate": 2.6979150318845454e-07, "loss": 1.465, "step": 37399 }, { "epoch": 2.94, "learning_rate": 2.6905104829760273e-07, "loss": 1.4629, "step": 37400 }, { "epoch": 2.94, "learning_rate": 2.683116099972793e-07, "loss": 1.4684, "step": 37401 }, { "epoch": 2.94, "learning_rate": 2.675731882924803e-07, "loss": 1.4786, "step": 37402 }, { "epoch": 2.94, "learning_rate": 2.668357831882517e-07, "loss": 1.4695, "step": 37403 }, { "epoch": 2.94, "learning_rate": 2.660993946895562e-07, "loss": 1.4507, "step": 37404 }, { "epoch": 2.94, "learning_rate": 2.653640228014231e-07, "loss": 1.4401, "step": 37405 }, { "epoch": 2.94, "learning_rate": 2.6462966752883175e-07, "loss": 1.4791, "step": 37406 }, { "epoch": 2.94, "learning_rate": 2.6389632887679477e-07, "loss": 1.4587, "step": 37407 }, { "epoch": 2.94, "learning_rate": 2.631640068502583e-07, "loss": 1.4485, "step": 37408 }, { "epoch": 2.94, "learning_rate": 2.6243270145420157e-07, "loss": 1.4915, "step": 37409 }, { "epoch": 2.94, "learning_rate": 2.617024126935874e-07, "loss": 1.4473, "step": 37410 }, { "epoch": 2.94, "learning_rate": 2.6097314057339503e-07, "loss": 1.4122, "step": 37411 }, { "epoch": 2.94, "learning_rate": 2.602448850985539e-07, "loss": 1.4401, "step": 37412 }, { "epoch": 2.94, "learning_rate": 2.595176462740267e-07, "loss": 1.4694, "step": 37413 }, { "epoch": 2.94, "learning_rate": 2.5879142410474286e-07, "loss": 1.4639, "step": 37414 }, { "epoch": 2.94, "learning_rate": 2.5806621859561507e-07, "loss": 1.4459, "step": 37415 }, { "epoch": 2.94, "learning_rate": 2.5734202975158933e-07, "loss": 1.4815, "step": 37416 }, { "epoch": 2.94, "learning_rate": 2.566188575775785e-07, "loss": 1.4006, "step": 37417 }, { "epoch": 2.94, "learning_rate": 2.5589670207849524e-07, "loss": 1.4035, "step": 37418 }, { "epoch": 2.94, "learning_rate": 2.551755632592356e-07, "loss": 1.4545, "step": 37419 }, { "epoch": 2.94, "learning_rate": 2.5445544112469574e-07, "loss": 1.4076, "step": 37420 }, { "epoch": 2.94, "learning_rate": 2.537363356797717e-07, "loss": 1.4655, "step": 37421 }, { "epoch": 2.94, "learning_rate": 2.530182469293429e-07, "loss": 1.4563, "step": 37422 }, { "epoch": 2.94, "learning_rate": 2.523011748782722e-07, "loss": 1.4806, "step": 37423 }, { "epoch": 2.94, "learning_rate": 2.515851195314389e-07, "loss": 1.4214, "step": 37424 }, { "epoch": 2.94, "learning_rate": 2.508700808937059e-07, "loss": 1.4459, "step": 37425 }, { "epoch": 2.94, "learning_rate": 2.5015605896993585e-07, "loss": 1.4751, "step": 37426 }, { "epoch": 2.94, "learning_rate": 2.494430537649583e-07, "loss": 1.4391, "step": 37427 }, { "epoch": 2.94, "learning_rate": 2.4873106528363605e-07, "loss": 1.4506, "step": 37428 }, { "epoch": 2.94, "learning_rate": 2.480200935307819e-07, "loss": 1.4823, "step": 37429 }, { "epoch": 2.95, "learning_rate": 2.473101385112253e-07, "loss": 1.4716, "step": 37430 }, { "epoch": 2.95, "learning_rate": 2.466012002297957e-07, "loss": 1.4997, "step": 37431 }, { "epoch": 2.95, "learning_rate": 2.458932786913059e-07, "loss": 1.4547, "step": 37432 }, { "epoch": 2.95, "learning_rate": 2.4518637390055215e-07, "loss": 1.4593, "step": 37433 }, { "epoch": 2.95, "learning_rate": 2.4448048586234724e-07, "loss": 1.5219, "step": 37434 }, { "epoch": 2.95, "learning_rate": 2.437756145814873e-07, "loss": 1.4553, "step": 37435 }, { "epoch": 2.95, "learning_rate": 2.4307176006273523e-07, "loss": 1.4523, "step": 37436 }, { "epoch": 2.95, "learning_rate": 2.423689223108871e-07, "loss": 1.4483, "step": 37437 }, { "epoch": 2.95, "learning_rate": 2.416671013307059e-07, "loss": 1.4249, "step": 37438 }, { "epoch": 2.95, "learning_rate": 2.40966297126971e-07, "loss": 1.3747, "step": 37439 }, { "epoch": 2.95, "learning_rate": 2.402665097044287e-07, "loss": 1.4535, "step": 37440 }, { "epoch": 2.95, "learning_rate": 2.3956773906784186e-07, "loss": 1.3786, "step": 37441 }, { "epoch": 2.95, "learning_rate": 2.3886998522192334e-07, "loss": 1.4038, "step": 37442 }, { "epoch": 2.95, "learning_rate": 2.3817324817145267e-07, "loss": 1.4606, "step": 37443 }, { "epoch": 2.95, "learning_rate": 2.3747752792112608e-07, "loss": 1.4485, "step": 37444 }, { "epoch": 2.95, "learning_rate": 2.3678282447568974e-07, "loss": 1.4851, "step": 37445 }, { "epoch": 2.95, "learning_rate": 2.3608913783983995e-07, "loss": 1.4343, "step": 37446 }, { "epoch": 2.95, "learning_rate": 2.3539646801830624e-07, "loss": 1.4261, "step": 37447 }, { "epoch": 2.95, "learning_rate": 2.3470481501578486e-07, "loss": 1.4645, "step": 37448 }, { "epoch": 2.95, "learning_rate": 2.3401417883697205e-07, "loss": 1.4435, "step": 37449 }, { "epoch": 2.95, "learning_rate": 2.3332455948656404e-07, "loss": 1.4413, "step": 37450 }, { "epoch": 2.95, "learning_rate": 2.3263595696922377e-07, "loss": 1.3938, "step": 37451 }, { "epoch": 2.95, "learning_rate": 2.3194837128963085e-07, "loss": 1.4195, "step": 37452 }, { "epoch": 2.95, "learning_rate": 2.3126180245246485e-07, "loss": 1.4114, "step": 37453 }, { "epoch": 2.95, "learning_rate": 2.305762504623887e-07, "loss": 1.4453, "step": 37454 }, { "epoch": 2.95, "learning_rate": 2.2989171532403206e-07, "loss": 1.4995, "step": 37455 }, { "epoch": 2.95, "learning_rate": 2.292081970420745e-07, "loss": 1.405, "step": 37456 }, { "epoch": 2.95, "learning_rate": 2.2852569562114564e-07, "loss": 1.456, "step": 37457 }, { "epoch": 2.95, "learning_rate": 2.2784421106587514e-07, "loss": 1.4058, "step": 37458 }, { "epoch": 2.95, "learning_rate": 2.2716374338089261e-07, "loss": 1.4232, "step": 37459 }, { "epoch": 2.95, "learning_rate": 2.26484292570811e-07, "loss": 1.47, "step": 37460 }, { "epoch": 2.95, "learning_rate": 2.2580585864024337e-07, "loss": 1.3986, "step": 37461 }, { "epoch": 2.95, "learning_rate": 2.2512844159380262e-07, "loss": 1.4062, "step": 37462 }, { "epoch": 2.95, "learning_rate": 2.2445204143610174e-07, "loss": 1.4866, "step": 37463 }, { "epoch": 2.95, "learning_rate": 2.2377665817170375e-07, "loss": 1.4386, "step": 37464 }, { "epoch": 2.95, "learning_rate": 2.2310229180522166e-07, "loss": 1.4953, "step": 37465 }, { "epoch": 2.95, "learning_rate": 2.2242894234121845e-07, "loss": 1.4382, "step": 37466 }, { "epoch": 2.95, "learning_rate": 2.2175660978425714e-07, "loss": 1.427, "step": 37467 }, { "epoch": 2.95, "learning_rate": 2.2108529413893405e-07, "loss": 1.4132, "step": 37468 }, { "epoch": 2.95, "learning_rate": 2.2041499540976226e-07, "loss": 1.4598, "step": 37469 }, { "epoch": 2.95, "learning_rate": 2.1974571360133808e-07, "loss": 1.4309, "step": 37470 }, { "epoch": 2.95, "learning_rate": 2.1907744871817457e-07, "loss": 1.5215, "step": 37471 }, { "epoch": 2.95, "learning_rate": 2.1841020076481807e-07, "loss": 1.3913, "step": 37472 }, { "epoch": 2.95, "learning_rate": 2.1774396974581499e-07, "loss": 1.4406, "step": 37473 }, { "epoch": 2.95, "learning_rate": 2.170787556656617e-07, "loss": 1.4476, "step": 37474 }, { "epoch": 2.95, "learning_rate": 2.1641455852888788e-07, "loss": 1.4589, "step": 37475 }, { "epoch": 2.95, "learning_rate": 2.1575137833999e-07, "loss": 1.4342, "step": 37476 }, { "epoch": 2.95, "learning_rate": 2.1508921510349775e-07, "loss": 1.4184, "step": 37477 }, { "epoch": 2.95, "learning_rate": 2.1442806882389084e-07, "loss": 1.4283, "step": 37478 }, { "epoch": 2.95, "learning_rate": 2.1376793950564908e-07, "loss": 1.4632, "step": 37479 }, { "epoch": 2.95, "learning_rate": 2.1310882715326883e-07, "loss": 1.3676, "step": 37480 }, { "epoch": 2.95, "learning_rate": 2.1245073177122986e-07, "loss": 1.4404, "step": 37481 }, { "epoch": 2.95, "learning_rate": 2.117936533639786e-07, "loss": 1.4406, "step": 37482 }, { "epoch": 2.95, "learning_rate": 2.1113759193599477e-07, "loss": 1.4419, "step": 37483 }, { "epoch": 2.95, "learning_rate": 2.1048254749172488e-07, "loss": 1.426, "step": 37484 }, { "epoch": 2.95, "learning_rate": 2.0982852003561535e-07, "loss": 1.4737, "step": 37485 }, { "epoch": 2.95, "learning_rate": 2.091755095721126e-07, "loss": 1.4511, "step": 37486 }, { "epoch": 2.95, "learning_rate": 2.0852351610564644e-07, "loss": 1.4251, "step": 37487 }, { "epoch": 2.95, "learning_rate": 2.0787253964064664e-07, "loss": 1.4394, "step": 37488 }, { "epoch": 2.95, "learning_rate": 2.0722258018152637e-07, "loss": 1.4607, "step": 37489 }, { "epoch": 2.95, "learning_rate": 2.0657363773269876e-07, "loss": 1.4843, "step": 37490 }, { "epoch": 2.95, "learning_rate": 2.0592571229857692e-07, "loss": 1.4151, "step": 37491 }, { "epoch": 2.95, "learning_rate": 2.0527880388355732e-07, "loss": 1.3983, "step": 37492 }, { "epoch": 2.95, "learning_rate": 2.0463291249201984e-07, "loss": 1.4785, "step": 37493 }, { "epoch": 2.95, "learning_rate": 2.039880381283776e-07, "loss": 1.4071, "step": 37494 }, { "epoch": 2.95, "learning_rate": 2.0334418079699378e-07, "loss": 1.4598, "step": 37495 }, { "epoch": 2.95, "learning_rate": 2.0270134050223154e-07, "loss": 1.4949, "step": 37496 }, { "epoch": 2.95, "learning_rate": 2.0205951724845405e-07, "loss": 1.456, "step": 37497 }, { "epoch": 2.95, "learning_rate": 2.014187110400245e-07, "loss": 1.4683, "step": 37498 }, { "epoch": 2.95, "learning_rate": 2.0077892188132273e-07, "loss": 1.4186, "step": 37499 }, { "epoch": 2.95, "learning_rate": 2.0014014977664528e-07, "loss": 1.4957, "step": 37500 }, { "epoch": 2.95, "learning_rate": 1.9950239473035533e-07, "loss": 1.4108, "step": 37501 }, { "epoch": 2.95, "learning_rate": 1.9886565674676614e-07, "loss": 1.4589, "step": 37502 }, { "epoch": 2.95, "learning_rate": 1.9822993583022419e-07, "loss": 1.4582, "step": 37503 }, { "epoch": 2.95, "learning_rate": 1.9759523198502603e-07, "loss": 1.4194, "step": 37504 }, { "epoch": 2.95, "learning_rate": 1.9696154521550157e-07, "loss": 1.4238, "step": 37505 }, { "epoch": 2.95, "learning_rate": 1.9632887552593068e-07, "loss": 1.4424, "step": 37506 }, { "epoch": 2.95, "learning_rate": 1.9569722292060995e-07, "loss": 1.4343, "step": 37507 }, { "epoch": 2.95, "learning_rate": 1.9506658740385262e-07, "loss": 1.4424, "step": 37508 }, { "epoch": 2.95, "learning_rate": 1.9443696897992188e-07, "loss": 1.4663, "step": 37509 }, { "epoch": 2.95, "learning_rate": 1.9380836765308106e-07, "loss": 1.3837, "step": 37510 }, { "epoch": 2.95, "learning_rate": 1.9318078342762667e-07, "loss": 1.4436, "step": 37511 }, { "epoch": 2.95, "learning_rate": 1.9255421630778867e-07, "loss": 1.4273, "step": 37512 }, { "epoch": 2.95, "learning_rate": 1.91928666297847e-07, "loss": 1.4415, "step": 37513 }, { "epoch": 2.95, "learning_rate": 1.913041334020482e-07, "loss": 1.4213, "step": 37514 }, { "epoch": 2.95, "learning_rate": 1.9068061762460561e-07, "loss": 1.4328, "step": 37515 }, { "epoch": 2.95, "learning_rate": 1.9005811896978252e-07, "loss": 1.4754, "step": 37516 }, { "epoch": 2.95, "learning_rate": 1.8943663744179217e-07, "loss": 1.4916, "step": 37517 }, { "epoch": 2.95, "learning_rate": 1.8881617304484786e-07, "loss": 1.415, "step": 37518 }, { "epoch": 2.95, "learning_rate": 1.8819672578316291e-07, "loss": 1.4325, "step": 37519 }, { "epoch": 2.95, "learning_rate": 1.8757829566096728e-07, "loss": 1.408, "step": 37520 }, { "epoch": 2.95, "learning_rate": 1.8696088268242427e-07, "loss": 1.4897, "step": 37521 }, { "epoch": 2.95, "learning_rate": 1.863444868517472e-07, "loss": 1.5002, "step": 37522 }, { "epoch": 2.95, "learning_rate": 1.8572910817311604e-07, "loss": 1.4895, "step": 37523 }, { "epoch": 2.95, "learning_rate": 1.8511474665072746e-07, "loss": 1.4764, "step": 37524 }, { "epoch": 2.95, "learning_rate": 1.8450140228871147e-07, "loss": 1.4519, "step": 37525 }, { "epoch": 2.95, "learning_rate": 1.8388907509126472e-07, "loss": 1.4576, "step": 37526 }, { "epoch": 2.95, "learning_rate": 1.8327776506255055e-07, "loss": 1.4406, "step": 37527 }, { "epoch": 2.95, "learning_rate": 1.826674722066823e-07, "loss": 1.4291, "step": 37528 }, { "epoch": 2.95, "learning_rate": 1.8205819652784004e-07, "loss": 1.4184, "step": 37529 }, { "epoch": 2.95, "learning_rate": 1.8144993803013708e-07, "loss": 1.4415, "step": 37530 }, { "epoch": 2.95, "learning_rate": 1.8084269671772012e-07, "loss": 1.4293, "step": 37531 }, { "epoch": 2.95, "learning_rate": 1.8023647259470254e-07, "loss": 1.4444, "step": 37532 }, { "epoch": 2.95, "learning_rate": 1.796312656651977e-07, "loss": 1.4376, "step": 37533 }, { "epoch": 2.95, "learning_rate": 1.79027075933319e-07, "loss": 1.4194, "step": 37534 }, { "epoch": 2.95, "learning_rate": 1.784239034031798e-07, "loss": 1.4133, "step": 37535 }, { "epoch": 2.95, "learning_rate": 1.7782174807886017e-07, "loss": 1.4646, "step": 37536 }, { "epoch": 2.95, "learning_rate": 1.7722060996444022e-07, "loss": 1.4582, "step": 37537 }, { "epoch": 2.95, "learning_rate": 1.766204890640166e-07, "loss": 1.4407, "step": 37538 }, { "epoch": 2.95, "learning_rate": 1.7602138538166942e-07, "loss": 1.4699, "step": 37539 }, { "epoch": 2.95, "learning_rate": 1.7542329892144547e-07, "loss": 1.4886, "step": 37540 }, { "epoch": 2.95, "learning_rate": 1.7482622968742477e-07, "loss": 1.4422, "step": 37541 }, { "epoch": 2.95, "learning_rate": 1.742301776836541e-07, "loss": 1.4619, "step": 37542 }, { "epoch": 2.95, "learning_rate": 1.7363514291418023e-07, "loss": 1.4732, "step": 37543 }, { "epoch": 2.95, "learning_rate": 1.7304112538303327e-07, "loss": 1.4602, "step": 37544 }, { "epoch": 2.95, "learning_rate": 1.7244812509425998e-07, "loss": 1.3959, "step": 37545 }, { "epoch": 2.95, "learning_rate": 1.7185614205189047e-07, "loss": 1.4714, "step": 37546 }, { "epoch": 2.95, "learning_rate": 1.7126517625993818e-07, "loss": 1.451, "step": 37547 }, { "epoch": 2.95, "learning_rate": 1.7067522772239995e-07, "loss": 1.44, "step": 37548 }, { "epoch": 2.95, "learning_rate": 1.7008629644330586e-07, "loss": 1.4227, "step": 37549 }, { "epoch": 2.95, "learning_rate": 1.6949838242663605e-07, "loss": 1.3973, "step": 37550 }, { "epoch": 2.95, "learning_rate": 1.6891148567638734e-07, "loss": 1.4607, "step": 37551 }, { "epoch": 2.95, "learning_rate": 1.683256061965399e-07, "loss": 1.4232, "step": 37552 }, { "epoch": 2.95, "learning_rate": 1.677407439910905e-07, "loss": 1.4922, "step": 37553 }, { "epoch": 2.95, "learning_rate": 1.6715689906400265e-07, "loss": 1.4511, "step": 37554 }, { "epoch": 2.95, "learning_rate": 1.665740714192232e-07, "loss": 1.5123, "step": 37555 }, { "epoch": 2.95, "learning_rate": 1.659922610607156e-07, "loss": 1.4787, "step": 37556 }, { "epoch": 2.96, "learning_rate": 1.6541146799244344e-07, "loss": 1.4527, "step": 37557 }, { "epoch": 2.96, "learning_rate": 1.648316922183368e-07, "loss": 1.4966, "step": 37558 }, { "epoch": 2.96, "learning_rate": 1.6425293374234262e-07, "loss": 1.4293, "step": 37559 }, { "epoch": 2.96, "learning_rate": 1.63675192568391e-07, "loss": 1.4052, "step": 37560 }, { "epoch": 2.96, "learning_rate": 1.6309846870039556e-07, "loss": 1.4002, "step": 37561 }, { "epoch": 2.96, "learning_rate": 1.6252276214225314e-07, "loss": 1.4343, "step": 37562 }, { "epoch": 2.96, "learning_rate": 1.6194807289791058e-07, "loss": 1.4325, "step": 37563 }, { "epoch": 2.96, "learning_rate": 1.6137440097126475e-07, "loss": 1.5096, "step": 37564 }, { "epoch": 2.96, "learning_rate": 1.6080174636617927e-07, "loss": 1.4295, "step": 37565 }, { "epoch": 2.96, "learning_rate": 1.6023010908656764e-07, "loss": 1.4361, "step": 37566 }, { "epoch": 2.96, "learning_rate": 1.5965948913631011e-07, "loss": 1.4939, "step": 37567 }, { "epoch": 2.96, "learning_rate": 1.5908988651927023e-07, "loss": 1.4627, "step": 37568 }, { "epoch": 2.96, "learning_rate": 1.5852130123932826e-07, "loss": 1.4854, "step": 37569 }, { "epoch": 2.96, "learning_rate": 1.5795373330033112e-07, "loss": 1.4455, "step": 37570 }, { "epoch": 2.96, "learning_rate": 1.5738718270614236e-07, "loss": 1.4477, "step": 37571 }, { "epoch": 2.96, "learning_rate": 1.5682164946060894e-07, "loss": 1.4399, "step": 37572 }, { "epoch": 2.96, "learning_rate": 1.562571335675611e-07, "loss": 1.4528, "step": 37573 }, { "epoch": 2.96, "learning_rate": 1.556936350308291e-07, "loss": 1.4926, "step": 37574 }, { "epoch": 2.96, "learning_rate": 1.551311538542599e-07, "loss": 1.4228, "step": 37575 }, { "epoch": 2.96, "learning_rate": 1.5456969004165044e-07, "loss": 1.4507, "step": 37576 }, { "epoch": 2.96, "learning_rate": 1.5400924359681433e-07, "loss": 1.418, "step": 37577 }, { "epoch": 2.96, "learning_rate": 1.5344981452358185e-07, "loss": 1.4568, "step": 37578 }, { "epoch": 2.96, "learning_rate": 1.5289140282571667e-07, "loss": 1.4132, "step": 37579 }, { "epoch": 2.96, "learning_rate": 1.5233400850703236e-07, "loss": 1.4155, "step": 37580 }, { "epoch": 2.96, "learning_rate": 1.5177763157130928e-07, "loss": 1.4271, "step": 37581 }, { "epoch": 2.96, "learning_rate": 1.5122227202231107e-07, "loss": 1.433, "step": 37582 }, { "epoch": 2.96, "learning_rate": 1.5066792986383468e-07, "loss": 1.4629, "step": 37583 }, { "epoch": 2.96, "learning_rate": 1.5011460509962713e-07, "loss": 1.4384, "step": 37584 }, { "epoch": 2.96, "learning_rate": 1.4956229773345207e-07, "loss": 1.4426, "step": 37585 }, { "epoch": 2.96, "learning_rate": 1.4901100776903986e-07, "loss": 1.4305, "step": 37586 }, { "epoch": 2.96, "learning_rate": 1.484607352101541e-07, "loss": 1.4574, "step": 37587 }, { "epoch": 2.96, "learning_rate": 1.4791148006052522e-07, "loss": 1.4243, "step": 37588 }, { "epoch": 2.96, "learning_rate": 1.4736324232388353e-07, "loss": 1.4479, "step": 37589 }, { "epoch": 2.96, "learning_rate": 1.4681602200395936e-07, "loss": 1.443, "step": 37590 }, { "epoch": 2.96, "learning_rate": 1.4626981910444978e-07, "loss": 1.3833, "step": 37591 }, { "epoch": 2.96, "learning_rate": 1.457246336290685e-07, "loss": 1.453, "step": 37592 }, { "epoch": 2.96, "learning_rate": 1.4518046558152917e-07, "loss": 1.4158, "step": 37593 }, { "epoch": 2.96, "learning_rate": 1.4463731496551224e-07, "loss": 1.4389, "step": 37594 }, { "epoch": 2.96, "learning_rate": 1.4409518178471468e-07, "loss": 1.4421, "step": 37595 }, { "epoch": 2.96, "learning_rate": 1.4355406604280027e-07, "loss": 1.4493, "step": 37596 }, { "epoch": 2.96, "learning_rate": 1.4301396774346607e-07, "loss": 1.428, "step": 37597 }, { "epoch": 2.96, "learning_rate": 1.4247488689037578e-07, "loss": 1.459, "step": 37598 }, { "epoch": 2.96, "learning_rate": 1.419368234871765e-07, "loss": 1.4475, "step": 37599 }, { "epoch": 2.96, "learning_rate": 1.4139977753753195e-07, "loss": 1.3941, "step": 37600 }, { "epoch": 2.96, "learning_rate": 1.4086374904507258e-07, "loss": 1.4412, "step": 37601 }, { "epoch": 2.96, "learning_rate": 1.4032873801346212e-07, "loss": 1.4601, "step": 37602 }, { "epoch": 2.96, "learning_rate": 1.3979474444631433e-07, "loss": 1.4079, "step": 37603 }, { "epoch": 2.96, "learning_rate": 1.3926176834725966e-07, "loss": 1.431, "step": 37604 }, { "epoch": 2.96, "learning_rate": 1.3872980971991188e-07, "loss": 1.5127, "step": 37605 }, { "epoch": 2.96, "learning_rate": 1.3819886856790142e-07, "loss": 1.4549, "step": 37606 }, { "epoch": 2.96, "learning_rate": 1.3766894489480872e-07, "loss": 1.467, "step": 37607 }, { "epoch": 2.96, "learning_rate": 1.3714003870424763e-07, "loss": 1.4347, "step": 37608 }, { "epoch": 2.96, "learning_rate": 1.3661214999981518e-07, "loss": 1.4252, "step": 37609 }, { "epoch": 2.96, "learning_rate": 1.3608527878505858e-07, "loss": 1.4546, "step": 37610 }, { "epoch": 2.96, "learning_rate": 1.355594250636083e-07, "loss": 1.4271, "step": 37611 }, { "epoch": 2.96, "learning_rate": 1.3503458883899477e-07, "loss": 1.4335, "step": 37612 }, { "epoch": 2.96, "learning_rate": 1.345107701147985e-07, "loss": 1.4523, "step": 37613 }, { "epoch": 2.96, "learning_rate": 1.3398796889456665e-07, "loss": 1.4418, "step": 37614 }, { "epoch": 2.96, "learning_rate": 1.3346618518184637e-07, "loss": 1.4183, "step": 37615 }, { "epoch": 2.96, "learning_rate": 1.329454189802015e-07, "loss": 1.4477, "step": 37616 }, { "epoch": 2.96, "learning_rate": 1.324256702931459e-07, "loss": 1.4165, "step": 37617 }, { "epoch": 2.96, "learning_rate": 1.3190693912422668e-07, "loss": 1.4795, "step": 37618 }, { "epoch": 2.96, "learning_rate": 1.3138922547694107e-07, "loss": 1.4461, "step": 37619 }, { "epoch": 2.96, "learning_rate": 1.308725293548196e-07, "loss": 1.4266, "step": 37620 }, { "epoch": 2.96, "learning_rate": 1.3035685076137615e-07, "loss": 1.4203, "step": 37621 }, { "epoch": 2.96, "learning_rate": 1.2984218970010783e-07, "loss": 1.4411, "step": 37622 }, { "epoch": 2.96, "learning_rate": 1.2932854617449527e-07, "loss": 1.4698, "step": 37623 }, { "epoch": 2.96, "learning_rate": 1.288159201880523e-07, "loss": 1.4595, "step": 37624 }, { "epoch": 2.96, "learning_rate": 1.2830431174422617e-07, "loss": 1.4951, "step": 37625 }, { "epoch": 2.96, "learning_rate": 1.2779372084651406e-07, "loss": 1.395, "step": 37626 }, { "epoch": 2.96, "learning_rate": 1.2728414749837989e-07, "loss": 1.4579, "step": 37627 }, { "epoch": 2.96, "learning_rate": 1.2677559170327088e-07, "loss": 1.4509, "step": 37628 }, { "epoch": 2.96, "learning_rate": 1.2626805346466762e-07, "loss": 1.4553, "step": 37629 }, { "epoch": 2.96, "learning_rate": 1.25761532785984e-07, "loss": 1.4513, "step": 37630 }, { "epoch": 2.96, "learning_rate": 1.2525602967066729e-07, "loss": 1.5002, "step": 37631 }, { "epoch": 2.96, "learning_rate": 1.247515441221647e-07, "loss": 1.4626, "step": 37632 }, { "epoch": 2.96, "learning_rate": 1.2424807614387355e-07, "loss": 1.3921, "step": 37633 }, { "epoch": 2.96, "learning_rate": 1.2374562573924106e-07, "loss": 1.4885, "step": 37634 }, { "epoch": 2.96, "learning_rate": 1.232441929116812e-07, "loss": 1.4849, "step": 37635 }, { "epoch": 2.96, "learning_rate": 1.227437776645579e-07, "loss": 1.4307, "step": 37636 }, { "epoch": 2.96, "learning_rate": 1.2224438000131843e-07, "loss": 1.4242, "step": 37637 }, { "epoch": 2.96, "learning_rate": 1.217459999253101e-07, "loss": 1.4335, "step": 37638 }, { "epoch": 2.96, "learning_rate": 1.2124863743996348e-07, "loss": 1.47, "step": 37639 }, { "epoch": 2.96, "learning_rate": 1.2075229254860929e-07, "loss": 1.4474, "step": 37640 }, { "epoch": 2.96, "learning_rate": 1.2025696525462813e-07, "loss": 1.4106, "step": 37641 }, { "epoch": 2.96, "learning_rate": 1.1976265556141728e-07, "loss": 1.4656, "step": 37642 }, { "epoch": 2.96, "learning_rate": 1.1926936347229078e-07, "loss": 1.3565, "step": 37643 }, { "epoch": 2.96, "learning_rate": 1.1877708899061256e-07, "loss": 1.3927, "step": 37644 }, { "epoch": 2.96, "learning_rate": 1.1828583211972998e-07, "loss": 1.5004, "step": 37645 }, { "epoch": 2.96, "learning_rate": 1.1779559286297369e-07, "loss": 1.4453, "step": 37646 }, { "epoch": 2.96, "learning_rate": 1.1730637122367436e-07, "loss": 1.4699, "step": 37647 }, { "epoch": 2.96, "learning_rate": 1.1681816720516269e-07, "loss": 1.5039, "step": 37648 }, { "epoch": 2.96, "learning_rate": 1.16330980810736e-07, "loss": 1.4713, "step": 37649 }, { "epoch": 2.96, "learning_rate": 1.1584481204370833e-07, "loss": 1.4366, "step": 37650 }, { "epoch": 2.96, "learning_rate": 1.1535966090737702e-07, "loss": 1.4159, "step": 37651 }, { "epoch": 2.96, "learning_rate": 1.1487552740503946e-07, "loss": 1.4056, "step": 37652 }, { "epoch": 2.96, "learning_rate": 1.1439241153999301e-07, "loss": 1.4253, "step": 37653 }, { "epoch": 2.96, "learning_rate": 1.1391031331550171e-07, "loss": 1.444, "step": 37654 }, { "epoch": 2.96, "learning_rate": 1.1342923273484628e-07, "loss": 1.5204, "step": 37655 }, { "epoch": 2.96, "learning_rate": 1.1294916980129076e-07, "loss": 1.4966, "step": 37656 }, { "epoch": 2.96, "learning_rate": 1.1247012451809923e-07, "loss": 1.4241, "step": 37657 }, { "epoch": 2.96, "learning_rate": 1.1199209688851906e-07, "loss": 1.4014, "step": 37658 }, { "epoch": 2.96, "learning_rate": 1.1151508691581435e-07, "loss": 1.4524, "step": 37659 }, { "epoch": 2.96, "learning_rate": 1.110390946031825e-07, "loss": 1.4831, "step": 37660 }, { "epoch": 2.96, "learning_rate": 1.1056411995388759e-07, "loss": 1.3916, "step": 37661 }, { "epoch": 2.96, "learning_rate": 1.100901629711437e-07, "loss": 1.4525, "step": 37662 }, { "epoch": 2.96, "learning_rate": 1.096172236581816e-07, "loss": 1.432, "step": 37663 }, { "epoch": 2.96, "learning_rate": 1.0914530201819871e-07, "loss": 1.4153, "step": 37664 }, { "epoch": 2.96, "learning_rate": 1.0867439805439248e-07, "loss": 1.3847, "step": 37665 }, { "epoch": 2.96, "learning_rate": 1.0820451176997702e-07, "loss": 1.4648, "step": 37666 }, { "epoch": 2.96, "learning_rate": 1.077356431681331e-07, "loss": 1.4804, "step": 37667 }, { "epoch": 2.96, "learning_rate": 1.0726779225205818e-07, "loss": 1.405, "step": 37668 }, { "epoch": 2.96, "learning_rate": 1.0680095902489971e-07, "loss": 1.4483, "step": 37669 }, { "epoch": 2.96, "learning_rate": 1.0633514348985516e-07, "loss": 1.4364, "step": 37670 }, { "epoch": 2.96, "learning_rate": 1.0587034565008867e-07, "loss": 1.3979, "step": 37671 }, { "epoch": 2.96, "learning_rate": 1.0540656550873105e-07, "loss": 1.4196, "step": 37672 }, { "epoch": 2.96, "learning_rate": 1.0494380306894645e-07, "loss": 1.4178, "step": 37673 }, { "epoch": 2.96, "learning_rate": 1.0448205833386569e-07, "loss": 1.4115, "step": 37674 }, { "epoch": 2.96, "learning_rate": 1.0402133130663626e-07, "loss": 1.4283, "step": 37675 }, { "epoch": 2.96, "learning_rate": 1.0356162199038897e-07, "loss": 1.4617, "step": 37676 }, { "epoch": 2.96, "learning_rate": 1.0310293038823802e-07, "loss": 1.3731, "step": 37677 }, { "epoch": 2.96, "learning_rate": 1.0264525650329757e-07, "loss": 1.4455, "step": 37678 }, { "epoch": 2.96, "learning_rate": 1.0218860033866517e-07, "loss": 1.3884, "step": 37679 }, { "epoch": 2.96, "learning_rate": 1.0173296189745495e-07, "loss": 1.4651, "step": 37680 }, { "epoch": 2.96, "learning_rate": 1.0127834118276445e-07, "loss": 1.4585, "step": 37681 }, { "epoch": 2.96, "learning_rate": 1.0082473819767456e-07, "loss": 1.4522, "step": 37682 }, { "epoch": 2.96, "learning_rate": 1.0037215294526613e-07, "loss": 1.4596, "step": 37683 }, { "epoch": 2.97, "learning_rate": 9.992058542858672e-08, "loss": 1.4408, "step": 37684 }, { "epoch": 2.97, "learning_rate": 9.947003565075052e-08, "loss": 1.486, "step": 37685 }, { "epoch": 2.97, "learning_rate": 9.902050361478842e-08, "loss": 1.4455, "step": 37686 }, { "epoch": 2.97, "learning_rate": 9.857198932374799e-08, "loss": 1.4115, "step": 37687 }, { "epoch": 2.97, "learning_rate": 9.81244927806768e-08, "loss": 1.4268, "step": 37688 }, { "epoch": 2.97, "learning_rate": 9.767801398862241e-08, "loss": 1.4318, "step": 37689 }, { "epoch": 2.97, "learning_rate": 9.723255295061572e-08, "loss": 1.4596, "step": 37690 }, { "epoch": 2.97, "learning_rate": 9.678810966965434e-08, "loss": 1.4035, "step": 37691 }, { "epoch": 2.97, "learning_rate": 9.634468414880247e-08, "loss": 1.505, "step": 37692 }, { "epoch": 2.97, "learning_rate": 9.590227639104109e-08, "loss": 1.4522, "step": 37693 }, { "epoch": 2.97, "learning_rate": 9.546088639938443e-08, "loss": 1.4365, "step": 37694 }, { "epoch": 2.97, "learning_rate": 9.502051417681344e-08, "loss": 1.4028, "step": 37695 }, { "epoch": 2.97, "learning_rate": 9.458115972632574e-08, "loss": 1.4424, "step": 37696 }, { "epoch": 2.97, "learning_rate": 9.414282305091891e-08, "loss": 1.4885, "step": 37697 }, { "epoch": 2.97, "learning_rate": 9.370550415355726e-08, "loss": 1.4109, "step": 37698 }, { "epoch": 2.97, "learning_rate": 9.326920303720508e-08, "loss": 1.4333, "step": 37699 }, { "epoch": 2.97, "learning_rate": 9.283391970482667e-08, "loss": 1.3784, "step": 37700 }, { "epoch": 2.97, "learning_rate": 9.239965415938633e-08, "loss": 1.4523, "step": 37701 }, { "epoch": 2.97, "learning_rate": 9.196640640383169e-08, "loss": 1.4274, "step": 37702 }, { "epoch": 2.97, "learning_rate": 9.153417644109374e-08, "loss": 1.3814, "step": 37703 }, { "epoch": 2.97, "learning_rate": 9.110296427410347e-08, "loss": 1.4323, "step": 37704 }, { "epoch": 2.97, "learning_rate": 9.067276990580851e-08, "loss": 1.4823, "step": 37705 }, { "epoch": 2.97, "learning_rate": 9.024359333910657e-08, "loss": 1.4748, "step": 37706 }, { "epoch": 2.97, "learning_rate": 8.981543457692863e-08, "loss": 1.4338, "step": 37707 }, { "epoch": 2.97, "learning_rate": 8.938829362218903e-08, "loss": 1.4635, "step": 37708 }, { "epoch": 2.97, "learning_rate": 8.896217047776877e-08, "loss": 1.4656, "step": 37709 }, { "epoch": 2.97, "learning_rate": 8.853706514656556e-08, "loss": 1.4653, "step": 37710 }, { "epoch": 2.97, "learning_rate": 8.811297763146041e-08, "loss": 1.4876, "step": 37711 }, { "epoch": 2.97, "learning_rate": 8.768990793535103e-08, "loss": 1.4516, "step": 37712 }, { "epoch": 2.97, "learning_rate": 8.726785606108511e-08, "loss": 1.348, "step": 37713 }, { "epoch": 2.97, "learning_rate": 8.684682201156034e-08, "loss": 1.4463, "step": 37714 }, { "epoch": 2.97, "learning_rate": 8.642680578960781e-08, "loss": 1.4533, "step": 37715 }, { "epoch": 2.97, "learning_rate": 8.600780739807523e-08, "loss": 1.4329, "step": 37716 }, { "epoch": 2.97, "learning_rate": 8.558982683984361e-08, "loss": 1.459, "step": 37717 }, { "epoch": 2.97, "learning_rate": 8.517286411771074e-08, "loss": 1.4414, "step": 37718 }, { "epoch": 2.97, "learning_rate": 8.475691923452432e-08, "loss": 1.4863, "step": 37719 }, { "epoch": 2.97, "learning_rate": 8.434199219311544e-08, "loss": 1.4375, "step": 37720 }, { "epoch": 2.97, "learning_rate": 8.39280829962985e-08, "loss": 1.4234, "step": 37721 }, { "epoch": 2.97, "learning_rate": 8.351519164687126e-08, "loss": 1.4499, "step": 37722 }, { "epoch": 2.97, "learning_rate": 8.310331814764814e-08, "loss": 1.4397, "step": 37723 }, { "epoch": 2.97, "learning_rate": 8.269246250142691e-08, "loss": 1.449, "step": 37724 }, { "epoch": 2.97, "learning_rate": 8.228262471098868e-08, "loss": 1.4447, "step": 37725 }, { "epoch": 2.97, "learning_rate": 8.187380477911454e-08, "loss": 1.4801, "step": 37726 }, { "epoch": 2.97, "learning_rate": 8.146600270858561e-08, "loss": 1.4415, "step": 37727 }, { "epoch": 2.97, "learning_rate": 8.1059218502183e-08, "loss": 1.4557, "step": 37728 }, { "epoch": 2.97, "learning_rate": 8.065345216263786e-08, "loss": 1.4529, "step": 37729 }, { "epoch": 2.97, "learning_rate": 8.024870369274793e-08, "loss": 1.4393, "step": 37730 }, { "epoch": 2.97, "learning_rate": 7.98449730952111e-08, "loss": 1.4943, "step": 37731 }, { "epoch": 2.97, "learning_rate": 7.944226037280843e-08, "loss": 1.4111, "step": 37732 }, { "epoch": 2.97, "learning_rate": 7.904056552825444e-08, "loss": 1.4167, "step": 37733 }, { "epoch": 2.97, "learning_rate": 7.863988856429692e-08, "loss": 1.4579, "step": 37734 }, { "epoch": 2.97, "learning_rate": 7.824022948361708e-08, "loss": 1.4711, "step": 37735 }, { "epoch": 2.97, "learning_rate": 7.78415882889627e-08, "loss": 1.4029, "step": 37736 }, { "epoch": 2.97, "learning_rate": 7.744396498303162e-08, "loss": 1.4563, "step": 37737 }, { "epoch": 2.97, "learning_rate": 7.70473595685217e-08, "loss": 1.4244, "step": 37738 }, { "epoch": 2.97, "learning_rate": 7.665177204813078e-08, "loss": 1.4646, "step": 37739 }, { "epoch": 2.97, "learning_rate": 7.625720242454003e-08, "loss": 1.4246, "step": 37740 }, { "epoch": 2.97, "learning_rate": 7.5863650700414e-08, "loss": 1.4354, "step": 37741 }, { "epoch": 2.97, "learning_rate": 7.547111687845054e-08, "loss": 1.4011, "step": 37742 }, { "epoch": 2.97, "learning_rate": 7.50796009612975e-08, "loss": 1.4615, "step": 37743 }, { "epoch": 2.97, "learning_rate": 7.468910295161945e-08, "loss": 1.4545, "step": 37744 }, { "epoch": 2.97, "learning_rate": 7.429962285206426e-08, "loss": 1.4191, "step": 37745 }, { "epoch": 2.97, "learning_rate": 7.391116066529646e-08, "loss": 1.446, "step": 37746 }, { "epoch": 2.97, "learning_rate": 7.352371639391396e-08, "loss": 1.4539, "step": 37747 }, { "epoch": 2.97, "learning_rate": 7.313729004058133e-08, "loss": 1.4399, "step": 37748 }, { "epoch": 2.97, "learning_rate": 7.275188160789647e-08, "loss": 1.4286, "step": 37749 }, { "epoch": 2.97, "learning_rate": 7.236749109850725e-08, "loss": 1.3982, "step": 37750 }, { "epoch": 2.97, "learning_rate": 7.198411851499497e-08, "loss": 1.4587, "step": 37751 }, { "epoch": 2.97, "learning_rate": 7.160176385997418e-08, "loss": 1.4157, "step": 37752 }, { "epoch": 2.97, "learning_rate": 7.122042713604281e-08, "loss": 1.4729, "step": 37753 }, { "epoch": 2.97, "learning_rate": 7.084010834579879e-08, "loss": 1.452, "step": 37754 }, { "epoch": 2.97, "learning_rate": 7.046080749179006e-08, "loss": 1.4499, "step": 37755 }, { "epoch": 2.97, "learning_rate": 7.008252457663122e-08, "loss": 1.4328, "step": 37756 }, { "epoch": 2.97, "learning_rate": 6.970525960287021e-08, "loss": 1.5185, "step": 37757 }, { "epoch": 2.97, "learning_rate": 6.932901257305501e-08, "loss": 1.4076, "step": 37758 }, { "epoch": 2.97, "learning_rate": 6.895378348978353e-08, "loss": 1.4241, "step": 37759 }, { "epoch": 2.97, "learning_rate": 6.857957235555378e-08, "loss": 1.453, "step": 37760 }, { "epoch": 2.97, "learning_rate": 6.820637917294702e-08, "loss": 1.4481, "step": 37761 }, { "epoch": 2.97, "learning_rate": 6.783420394447791e-08, "loss": 1.4712, "step": 37762 }, { "epoch": 2.97, "learning_rate": 6.746304667266111e-08, "loss": 1.3746, "step": 37763 }, { "epoch": 2.97, "learning_rate": 6.709290736004457e-08, "loss": 1.4336, "step": 37764 }, { "epoch": 2.97, "learning_rate": 6.672378600912632e-08, "loss": 1.4664, "step": 37765 }, { "epoch": 2.97, "learning_rate": 6.635568262240431e-08, "loss": 1.4169, "step": 37766 }, { "epoch": 2.97, "learning_rate": 6.598859720239325e-08, "loss": 1.3887, "step": 37767 }, { "epoch": 2.97, "learning_rate": 6.56225297515911e-08, "loss": 1.4542, "step": 37768 }, { "epoch": 2.97, "learning_rate": 6.525748027244593e-08, "loss": 1.4289, "step": 37769 }, { "epoch": 2.97, "learning_rate": 6.489344876748903e-08, "loss": 1.4469, "step": 37770 }, { "epoch": 2.97, "learning_rate": 6.45304352391518e-08, "loss": 1.4631, "step": 37771 }, { "epoch": 2.97, "learning_rate": 6.416843968989893e-08, "loss": 1.4561, "step": 37772 }, { "epoch": 2.97, "learning_rate": 6.380746212221177e-08, "loss": 1.4797, "step": 37773 }, { "epoch": 2.97, "learning_rate": 6.344750253853837e-08, "loss": 1.452, "step": 37774 }, { "epoch": 2.97, "learning_rate": 6.308856094131009e-08, "loss": 1.436, "step": 37775 }, { "epoch": 2.97, "learning_rate": 6.273063733295836e-08, "loss": 1.4552, "step": 37776 }, { "epoch": 2.97, "learning_rate": 6.237373171593119e-08, "loss": 1.4412, "step": 37777 }, { "epoch": 2.97, "learning_rate": 6.201784409264333e-08, "loss": 1.3912, "step": 37778 }, { "epoch": 2.97, "learning_rate": 6.16629744655095e-08, "loss": 1.4261, "step": 37779 }, { "epoch": 2.97, "learning_rate": 6.130912283694444e-08, "loss": 1.4497, "step": 37780 }, { "epoch": 2.97, "learning_rate": 6.095628920934625e-08, "loss": 1.4524, "step": 37781 }, { "epoch": 2.97, "learning_rate": 6.0604473585113e-08, "loss": 1.4349, "step": 37782 }, { "epoch": 2.97, "learning_rate": 6.025367596664276e-08, "loss": 1.4474, "step": 37783 }, { "epoch": 2.97, "learning_rate": 5.990389635628368e-08, "loss": 1.5089, "step": 37784 }, { "epoch": 2.97, "learning_rate": 5.955513475645046e-08, "loss": 1.4657, "step": 37785 }, { "epoch": 2.97, "learning_rate": 5.9207391169491244e-08, "loss": 1.4431, "step": 37786 }, { "epoch": 2.97, "learning_rate": 5.886066559775415e-08, "loss": 1.3905, "step": 37787 }, { "epoch": 2.97, "learning_rate": 5.8514958043620607e-08, "loss": 1.4023, "step": 37788 }, { "epoch": 2.97, "learning_rate": 5.817026850943873e-08, "loss": 1.434, "step": 37789 }, { "epoch": 2.97, "learning_rate": 5.782659699752334e-08, "loss": 1.4183, "step": 37790 }, { "epoch": 2.97, "learning_rate": 5.7483943510222563e-08, "loss": 1.4594, "step": 37791 }, { "epoch": 2.97, "learning_rate": 5.7142308049851206e-08, "loss": 1.4297, "step": 37792 }, { "epoch": 2.97, "learning_rate": 5.6801690618740735e-08, "loss": 1.3873, "step": 37793 }, { "epoch": 2.97, "learning_rate": 5.646209121920597e-08, "loss": 1.4629, "step": 37794 }, { "epoch": 2.97, "learning_rate": 5.612350985356173e-08, "loss": 1.453, "step": 37795 }, { "epoch": 2.97, "learning_rate": 5.578594652407287e-08, "loss": 1.4209, "step": 37796 }, { "epoch": 2.97, "learning_rate": 5.5449401233054195e-08, "loss": 1.4761, "step": 37797 }, { "epoch": 2.97, "learning_rate": 5.511387398278722e-08, "loss": 1.4493, "step": 37798 }, { "epoch": 2.97, "learning_rate": 5.47793647755701e-08, "loss": 1.4411, "step": 37799 }, { "epoch": 2.97, "learning_rate": 5.4445873613634394e-08, "loss": 1.4469, "step": 37800 }, { "epoch": 2.97, "learning_rate": 5.4113400499261605e-08, "loss": 1.4152, "step": 37801 }, { "epoch": 2.97, "learning_rate": 5.3781945434733245e-08, "loss": 1.4492, "step": 37802 }, { "epoch": 2.97, "learning_rate": 5.345150842224755e-08, "loss": 1.4586, "step": 37803 }, { "epoch": 2.97, "learning_rate": 5.312208946410268e-08, "loss": 1.439, "step": 37804 }, { "epoch": 2.97, "learning_rate": 5.279368856251354e-08, "loss": 1.4399, "step": 37805 }, { "epoch": 2.97, "learning_rate": 5.246630571969501e-08, "loss": 1.4541, "step": 37806 }, { "epoch": 2.97, "learning_rate": 5.2139940937878657e-08, "loss": 1.3772, "step": 37807 }, { "epoch": 2.97, "learning_rate": 5.181459421929601e-08, "loss": 1.4984, "step": 37808 }, { "epoch": 2.97, "learning_rate": 5.149026556614533e-08, "loss": 1.4598, "step": 37809 }, { "epoch": 2.97, "learning_rate": 5.1166954980608186e-08, "loss": 1.4423, "step": 37810 }, { "epoch": 2.98, "learning_rate": 5.084466246491614e-08, "loss": 1.4699, "step": 37811 }, { "epoch": 2.98, "learning_rate": 5.052338802123412e-08, "loss": 1.4324, "step": 37812 }, { "epoch": 2.98, "learning_rate": 5.0203131651760375e-08, "loss": 1.4351, "step": 37813 }, { "epoch": 2.98, "learning_rate": 4.988389335864318e-08, "loss": 1.3565, "step": 37814 }, { "epoch": 2.98, "learning_rate": 4.9565673144064125e-08, "loss": 1.4158, "step": 37815 }, { "epoch": 2.98, "learning_rate": 4.9248471010204795e-08, "loss": 1.4662, "step": 37816 }, { "epoch": 2.98, "learning_rate": 4.8932286959180165e-08, "loss": 1.4833, "step": 37817 }, { "epoch": 2.98, "learning_rate": 4.861712099315518e-08, "loss": 1.4266, "step": 37818 }, { "epoch": 2.98, "learning_rate": 4.830297311427811e-08, "loss": 1.4373, "step": 37819 }, { "epoch": 2.98, "learning_rate": 4.798984332466393e-08, "loss": 1.4239, "step": 37820 }, { "epoch": 2.98, "learning_rate": 4.767773162646094e-08, "loss": 1.4588, "step": 37821 }, { "epoch": 2.98, "learning_rate": 4.736663802176744e-08, "loss": 1.3971, "step": 37822 }, { "epoch": 2.98, "learning_rate": 4.705656251271506e-08, "loss": 1.4958, "step": 37823 }, { "epoch": 2.98, "learning_rate": 4.674750510138548e-08, "loss": 1.4435, "step": 37824 }, { "epoch": 2.98, "learning_rate": 4.643946578989366e-08, "loss": 1.4687, "step": 37825 }, { "epoch": 2.98, "learning_rate": 4.613244458032128e-08, "loss": 1.3965, "step": 37826 }, { "epoch": 2.98, "learning_rate": 4.582644147476666e-08, "loss": 1.4661, "step": 37827 }, { "epoch": 2.98, "learning_rate": 4.552145647529482e-08, "loss": 1.4604, "step": 37828 }, { "epoch": 2.98, "learning_rate": 4.521748958397076e-08, "loss": 1.4265, "step": 37829 }, { "epoch": 2.98, "learning_rate": 4.4914540802892804e-08, "loss": 1.4036, "step": 37830 }, { "epoch": 2.98, "learning_rate": 4.461261013407602e-08, "loss": 1.4727, "step": 37831 }, { "epoch": 2.98, "learning_rate": 4.431169757958542e-08, "loss": 1.4327, "step": 37832 }, { "epoch": 2.98, "learning_rate": 4.401180314146935e-08, "loss": 1.4551, "step": 37833 }, { "epoch": 2.98, "learning_rate": 4.371292682175953e-08, "loss": 1.4411, "step": 37834 }, { "epoch": 2.98, "learning_rate": 4.3415068622487667e-08, "loss": 1.4566, "step": 37835 }, { "epoch": 2.98, "learning_rate": 4.3118228545685474e-08, "loss": 1.4516, "step": 37836 }, { "epoch": 2.98, "learning_rate": 4.282240659333469e-08, "loss": 1.4046, "step": 37837 }, { "epoch": 2.98, "learning_rate": 4.2527602767483683e-08, "loss": 1.4644, "step": 37838 }, { "epoch": 2.98, "learning_rate": 4.2233817070114195e-08, "loss": 1.3998, "step": 37839 }, { "epoch": 2.98, "learning_rate": 4.1941049503224634e-08, "loss": 1.511, "step": 37840 }, { "epoch": 2.98, "learning_rate": 4.1649300068796745e-08, "loss": 1.4367, "step": 37841 }, { "epoch": 2.98, "learning_rate": 4.1358568768812275e-08, "loss": 1.3848, "step": 37842 }, { "epoch": 2.98, "learning_rate": 4.106885560525297e-08, "loss": 1.4081, "step": 37843 }, { "epoch": 2.98, "learning_rate": 4.078016058008393e-08, "loss": 1.386, "step": 37844 }, { "epoch": 2.98, "learning_rate": 4.049248369527025e-08, "loss": 1.4411, "step": 37845 }, { "epoch": 2.98, "learning_rate": 4.020582495274372e-08, "loss": 1.4533, "step": 37846 }, { "epoch": 2.98, "learning_rate": 3.992018435446942e-08, "loss": 1.4474, "step": 37847 }, { "epoch": 2.98, "learning_rate": 3.963556190239581e-08, "loss": 1.4579, "step": 37848 }, { "epoch": 2.98, "learning_rate": 3.9351957598421356e-08, "loss": 1.4605, "step": 37849 }, { "epoch": 2.98, "learning_rate": 3.9069371444511164e-08, "loss": 1.4499, "step": 37850 }, { "epoch": 2.98, "learning_rate": 3.8787803442547064e-08, "loss": 1.4977, "step": 37851 }, { "epoch": 2.98, "learning_rate": 3.850725359446083e-08, "loss": 1.412, "step": 37852 }, { "epoch": 2.98, "learning_rate": 3.822772190216761e-08, "loss": 1.4566, "step": 37853 }, { "epoch": 2.98, "learning_rate": 3.794920836754922e-08, "loss": 1.4429, "step": 37854 }, { "epoch": 2.98, "learning_rate": 3.76717129924875e-08, "loss": 1.4368, "step": 37855 }, { "epoch": 2.98, "learning_rate": 3.739523577889758e-08, "loss": 1.3997, "step": 37856 }, { "epoch": 2.98, "learning_rate": 3.7119776728627984e-08, "loss": 1.4176, "step": 37857 }, { "epoch": 2.98, "learning_rate": 3.684533584354388e-08, "loss": 1.4173, "step": 37858 }, { "epoch": 2.98, "learning_rate": 3.657191312554375e-08, "loss": 1.4873, "step": 37859 }, { "epoch": 2.98, "learning_rate": 3.6299508576459465e-08, "loss": 1.5565, "step": 37860 }, { "epoch": 2.98, "learning_rate": 3.602812219813955e-08, "loss": 1.4664, "step": 37861 }, { "epoch": 2.98, "learning_rate": 3.5757753992432524e-08, "loss": 1.4097, "step": 37862 }, { "epoch": 2.98, "learning_rate": 3.548840396118691e-08, "loss": 1.4998, "step": 37863 }, { "epoch": 2.98, "learning_rate": 3.522007210620126e-08, "loss": 1.4422, "step": 37864 }, { "epoch": 2.98, "learning_rate": 3.49527584293241e-08, "loss": 1.472, "step": 37865 }, { "epoch": 2.98, "learning_rate": 3.4686462932354e-08, "loss": 1.4483, "step": 37866 }, { "epoch": 2.98, "learning_rate": 3.442118561710616e-08, "loss": 1.4437, "step": 37867 }, { "epoch": 2.98, "learning_rate": 3.4156926485379157e-08, "loss": 1.4401, "step": 37868 }, { "epoch": 2.98, "learning_rate": 3.389368553897154e-08, "loss": 1.4507, "step": 37869 }, { "epoch": 2.98, "learning_rate": 3.363146277966522e-08, "loss": 1.4686, "step": 37870 }, { "epoch": 2.98, "learning_rate": 3.337025820924211e-08, "loss": 1.4719, "step": 37871 }, { "epoch": 2.98, "learning_rate": 3.311007182946745e-08, "loss": 1.4569, "step": 37872 }, { "epoch": 2.98, "learning_rate": 3.2850903642139826e-08, "loss": 1.3915, "step": 37873 }, { "epoch": 2.98, "learning_rate": 3.259275364897451e-08, "loss": 1.4642, "step": 37874 }, { "epoch": 2.98, "learning_rate": 3.233562185175342e-08, "loss": 1.4674, "step": 37875 }, { "epoch": 2.98, "learning_rate": 3.207950825222516e-08, "loss": 1.4692, "step": 37876 }, { "epoch": 2.98, "learning_rate": 3.182441285210502e-08, "loss": 1.4146, "step": 37877 }, { "epoch": 2.98, "learning_rate": 3.15703356531416e-08, "loss": 1.4473, "step": 37878 }, { "epoch": 2.98, "learning_rate": 3.13172766570502e-08, "loss": 1.4337, "step": 37879 }, { "epoch": 2.98, "learning_rate": 3.106523586556275e-08, "loss": 1.4501, "step": 37880 }, { "epoch": 2.98, "learning_rate": 3.0814213280377917e-08, "loss": 1.4118, "step": 37881 }, { "epoch": 2.98, "learning_rate": 3.0564208903210986e-08, "loss": 1.4938, "step": 37882 }, { "epoch": 2.98, "learning_rate": 3.031522273576059e-08, "loss": 1.4491, "step": 37883 }, { "epoch": 2.98, "learning_rate": 3.0067254779692076e-08, "loss": 1.4348, "step": 37884 }, { "epoch": 2.98, "learning_rate": 2.9820305036720724e-08, "loss": 1.4882, "step": 37885 }, { "epoch": 2.98, "learning_rate": 2.957437350849523e-08, "loss": 1.4376, "step": 37886 }, { "epoch": 2.98, "learning_rate": 2.9329460196697573e-08, "loss": 1.4646, "step": 37887 }, { "epoch": 2.98, "learning_rate": 2.9085565103009745e-08, "loss": 1.4507, "step": 37888 }, { "epoch": 2.98, "learning_rate": 2.884268822906377e-08, "loss": 1.4251, "step": 37889 }, { "epoch": 2.98, "learning_rate": 2.8600829576508333e-08, "loss": 1.435, "step": 37890 }, { "epoch": 2.98, "learning_rate": 2.8359989146992113e-08, "loss": 1.4713, "step": 37891 }, { "epoch": 2.98, "learning_rate": 2.812016694216379e-08, "loss": 1.4392, "step": 37892 }, { "epoch": 2.98, "learning_rate": 2.788136296362209e-08, "loss": 1.4019, "step": 37893 }, { "epoch": 2.98, "learning_rate": 2.7643577213015687e-08, "loss": 1.4459, "step": 37894 }, { "epoch": 2.98, "learning_rate": 2.740680969194331e-08, "loss": 1.4746, "step": 37895 }, { "epoch": 2.98, "learning_rate": 2.7171060402003675e-08, "loss": 1.399, "step": 37896 }, { "epoch": 2.98, "learning_rate": 2.693632934482881e-08, "loss": 1.4152, "step": 37897 }, { "epoch": 2.98, "learning_rate": 2.6702616521984134e-08, "loss": 1.4483, "step": 37898 }, { "epoch": 2.98, "learning_rate": 2.6469921935085016e-08, "loss": 1.4942, "step": 37899 }, { "epoch": 2.98, "learning_rate": 2.623824558568022e-08, "loss": 1.4488, "step": 37900 }, { "epoch": 2.98, "learning_rate": 2.600758747535181e-08, "loss": 1.4497, "step": 37901 }, { "epoch": 2.98, "learning_rate": 2.5777947605665205e-08, "loss": 1.4387, "step": 37902 }, { "epoch": 2.98, "learning_rate": 2.554932597818582e-08, "loss": 1.4012, "step": 37903 }, { "epoch": 2.98, "learning_rate": 2.5321722594479067e-08, "loss": 1.4961, "step": 37904 }, { "epoch": 2.98, "learning_rate": 2.50951374560604e-08, "loss": 1.424, "step": 37905 }, { "epoch": 2.98, "learning_rate": 2.4869570564495233e-08, "loss": 1.4283, "step": 37906 }, { "epoch": 2.98, "learning_rate": 2.464502192128237e-08, "loss": 1.4328, "step": 37907 }, { "epoch": 2.98, "learning_rate": 2.4421491527987226e-08, "loss": 1.4066, "step": 37908 }, { "epoch": 2.98, "learning_rate": 2.4198979386091945e-08, "loss": 1.461, "step": 37909 }, { "epoch": 2.98, "learning_rate": 2.3977485497128636e-08, "loss": 1.4443, "step": 37910 }, { "epoch": 2.98, "learning_rate": 2.37570098625961e-08, "loss": 1.437, "step": 37911 }, { "epoch": 2.98, "learning_rate": 2.353755248399314e-08, "loss": 1.4287, "step": 37912 }, { "epoch": 2.98, "learning_rate": 2.33191133628019e-08, "loss": 1.4432, "step": 37913 }, { "epoch": 2.98, "learning_rate": 2.310169250050453e-08, "loss": 1.4788, "step": 37914 }, { "epoch": 2.98, "learning_rate": 2.2885289898583183e-08, "loss": 1.4898, "step": 37915 }, { "epoch": 2.98, "learning_rate": 2.2669905558503343e-08, "loss": 1.3773, "step": 37916 }, { "epoch": 2.98, "learning_rate": 2.2455539481747164e-08, "loss": 1.4354, "step": 37917 }, { "epoch": 2.98, "learning_rate": 2.2242191669746833e-08, "loss": 1.4718, "step": 37918 }, { "epoch": 2.98, "learning_rate": 2.2029862123951193e-08, "loss": 1.4605, "step": 37919 }, { "epoch": 2.98, "learning_rate": 2.181855084580908e-08, "loss": 1.4477, "step": 37920 }, { "epoch": 2.98, "learning_rate": 2.1608257836752684e-08, "loss": 1.4668, "step": 37921 }, { "epoch": 2.98, "learning_rate": 2.1398983098214195e-08, "loss": 1.3788, "step": 37922 }, { "epoch": 2.98, "learning_rate": 2.1190726631609145e-08, "loss": 1.4801, "step": 37923 }, { "epoch": 2.98, "learning_rate": 2.0983488438369723e-08, "loss": 1.4893, "step": 37924 }, { "epoch": 2.98, "learning_rate": 2.07772685198615e-08, "loss": 1.3803, "step": 37925 }, { "epoch": 2.98, "learning_rate": 2.057206687753332e-08, "loss": 1.472, "step": 37926 }, { "epoch": 2.98, "learning_rate": 2.036788351275076e-08, "loss": 1.4632, "step": 37927 }, { "epoch": 2.98, "learning_rate": 2.0164718426896044e-08, "loss": 1.4827, "step": 37928 }, { "epoch": 2.98, "learning_rate": 1.9962571621351398e-08, "loss": 1.4198, "step": 37929 }, { "epoch": 2.98, "learning_rate": 1.9761443097515707e-08, "loss": 1.4412, "step": 37930 }, { "epoch": 2.98, "learning_rate": 1.9561332856721236e-08, "loss": 1.3954, "step": 37931 }, { "epoch": 2.98, "learning_rate": 1.936224090033356e-08, "loss": 1.4513, "step": 37932 }, { "epoch": 2.98, "learning_rate": 1.9164167229718253e-08, "loss": 1.4307, "step": 37933 }, { "epoch": 2.98, "learning_rate": 1.8967111846207582e-08, "loss": 1.4847, "step": 37934 }, { "epoch": 2.98, "learning_rate": 1.8771074751150472e-08, "loss": 1.5143, "step": 37935 }, { "epoch": 2.98, "learning_rate": 1.8576055945862533e-08, "loss": 1.4997, "step": 37936 }, { "epoch": 2.98, "learning_rate": 1.8382055431692687e-08, "loss": 1.4458, "step": 37937 }, { "epoch": 2.99, "learning_rate": 1.8189073209923244e-08, "loss": 1.4213, "step": 37938 }, { "epoch": 2.99, "learning_rate": 1.7997109281886467e-08, "loss": 1.4659, "step": 37939 }, { "epoch": 2.99, "learning_rate": 1.7806163648897975e-08, "loss": 1.445, "step": 37940 }, { "epoch": 2.99, "learning_rate": 1.761623631222342e-08, "loss": 1.423, "step": 37941 }, { "epoch": 2.99, "learning_rate": 1.7427327273161762e-08, "loss": 1.3874, "step": 37942 }, { "epoch": 2.99, "learning_rate": 1.7239436533011963e-08, "loss": 1.4502, "step": 37943 }, { "epoch": 2.99, "learning_rate": 1.7052564093039678e-08, "loss": 1.4494, "step": 37944 }, { "epoch": 2.99, "learning_rate": 1.686670995451056e-08, "loss": 1.5077, "step": 37945 }, { "epoch": 2.99, "learning_rate": 1.6681874118690263e-08, "loss": 1.4187, "step": 37946 }, { "epoch": 2.99, "learning_rate": 1.6498056586844445e-08, "loss": 1.4348, "step": 37947 }, { "epoch": 2.99, "learning_rate": 1.6315257360188793e-08, "loss": 1.4656, "step": 37948 }, { "epoch": 2.99, "learning_rate": 1.6133476439988967e-08, "loss": 1.4393, "step": 37949 }, { "epoch": 2.99, "learning_rate": 1.5952713827477314e-08, "loss": 1.4082, "step": 37950 }, { "epoch": 2.99, "learning_rate": 1.577296952388618e-08, "loss": 1.4331, "step": 37951 }, { "epoch": 2.99, "learning_rate": 1.5594243530414608e-08, "loss": 1.4907, "step": 37952 }, { "epoch": 2.99, "learning_rate": 1.5416535848311595e-08, "loss": 1.4214, "step": 37953 }, { "epoch": 2.99, "learning_rate": 1.523984647874288e-08, "loss": 1.4156, "step": 37954 }, { "epoch": 2.99, "learning_rate": 1.506417542292415e-08, "loss": 1.4866, "step": 37955 }, { "epoch": 2.99, "learning_rate": 1.4889522682071108e-08, "loss": 1.4543, "step": 37956 }, { "epoch": 2.99, "learning_rate": 1.4715888257332831e-08, "loss": 1.4028, "step": 37957 }, { "epoch": 2.99, "learning_rate": 1.4543272149908358e-08, "loss": 1.4373, "step": 37958 }, { "epoch": 2.99, "learning_rate": 1.4371674360963426e-08, "loss": 1.3944, "step": 37959 }, { "epoch": 2.99, "learning_rate": 1.420109489168042e-08, "loss": 1.461, "step": 37960 }, { "epoch": 2.99, "learning_rate": 1.403153374319177e-08, "loss": 1.4466, "step": 37961 }, { "epoch": 2.99, "learning_rate": 1.3862990916646555e-08, "loss": 1.4301, "step": 37962 }, { "epoch": 2.99, "learning_rate": 1.3695466413227163e-08, "loss": 1.5027, "step": 37963 }, { "epoch": 2.99, "learning_rate": 1.3528960234032716e-08, "loss": 1.436, "step": 37964 }, { "epoch": 2.99, "learning_rate": 1.3363472380212292e-08, "loss": 1.4582, "step": 37965 }, { "epoch": 2.99, "learning_rate": 1.3199002852881669e-08, "loss": 1.4109, "step": 37966 }, { "epoch": 2.99, "learning_rate": 1.3035551653156617e-08, "loss": 1.4031, "step": 37967 }, { "epoch": 2.99, "learning_rate": 1.2873118782152914e-08, "loss": 1.411, "step": 37968 }, { "epoch": 2.99, "learning_rate": 1.2711704240986331e-08, "loss": 1.491, "step": 37969 }, { "epoch": 2.99, "learning_rate": 1.2551308030722684e-08, "loss": 1.4548, "step": 37970 }, { "epoch": 2.99, "learning_rate": 1.2391930152461093e-08, "loss": 1.4543, "step": 37971 }, { "epoch": 2.99, "learning_rate": 1.223357060730068e-08, "loss": 1.5027, "step": 37972 }, { "epoch": 2.99, "learning_rate": 1.2076229396290605e-08, "loss": 1.4319, "step": 37973 }, { "epoch": 2.99, "learning_rate": 1.1919906520513333e-08, "loss": 1.442, "step": 37974 }, { "epoch": 2.99, "learning_rate": 1.1764601981051336e-08, "loss": 1.4177, "step": 37975 }, { "epoch": 2.99, "learning_rate": 1.1610315778920464e-08, "loss": 1.4563, "step": 37976 }, { "epoch": 2.99, "learning_rate": 1.1457047915186535e-08, "loss": 1.4334, "step": 37977 }, { "epoch": 2.99, "learning_rate": 1.1304798390882052e-08, "loss": 1.4156, "step": 37978 }, { "epoch": 2.99, "learning_rate": 1.115356720705618e-08, "loss": 1.4608, "step": 37979 }, { "epoch": 2.99, "learning_rate": 1.100335436472477e-08, "loss": 1.4209, "step": 37980 }, { "epoch": 2.99, "learning_rate": 1.0854159864903678e-08, "loss": 1.4855, "step": 37981 }, { "epoch": 2.99, "learning_rate": 1.0705983708625409e-08, "loss": 1.3926, "step": 37982 }, { "epoch": 2.99, "learning_rate": 1.0558825896872514e-08, "loss": 1.4074, "step": 37983 }, { "epoch": 2.99, "learning_rate": 1.0412686430660844e-08, "loss": 1.4612, "step": 37984 }, { "epoch": 2.99, "learning_rate": 1.0267565310972948e-08, "loss": 1.4523, "step": 37985 }, { "epoch": 2.99, "learning_rate": 1.0123462538791372e-08, "loss": 1.4596, "step": 37986 }, { "epoch": 2.99, "learning_rate": 9.980378115115317e-09, "loss": 1.4833, "step": 37987 }, { "epoch": 2.99, "learning_rate": 9.838312040894025e-09, "loss": 1.4459, "step": 37988 }, { "epoch": 2.99, "learning_rate": 9.69726431709339e-09, "loss": 1.4929, "step": 37989 }, { "epoch": 2.99, "learning_rate": 9.557234944679303e-09, "loss": 1.4778, "step": 37990 }, { "epoch": 2.99, "learning_rate": 9.418223924601009e-09, "loss": 1.4439, "step": 37991 }, { "epoch": 2.99, "learning_rate": 9.280231257791093e-09, "loss": 1.4462, "step": 37992 }, { "epoch": 2.99, "learning_rate": 9.14325694521545e-09, "loss": 1.4235, "step": 37993 }, { "epoch": 2.99, "learning_rate": 9.007300987773358e-09, "loss": 1.4243, "step": 37994 }, { "epoch": 2.99, "learning_rate": 8.872363386397407e-09, "loss": 1.4101, "step": 37995 }, { "epoch": 2.99, "learning_rate": 8.738444142020184e-09, "loss": 1.4576, "step": 37996 }, { "epoch": 2.99, "learning_rate": 8.605543255524316e-09, "loss": 1.4726, "step": 37997 }, { "epoch": 2.99, "learning_rate": 8.473660727825737e-09, "loss": 1.4671, "step": 37998 }, { "epoch": 2.99, "learning_rate": 8.342796559823727e-09, "loss": 1.4382, "step": 37999 }, { "epoch": 2.99, "learning_rate": 8.212950752400915e-09, "loss": 1.4031, "step": 38000 }, { "epoch": 2.99, "learning_rate": 8.084123306439926e-09, "loss": 1.4139, "step": 38001 }, { "epoch": 2.99, "learning_rate": 7.956314222806737e-09, "loss": 1.4402, "step": 38002 }, { "epoch": 2.99, "learning_rate": 7.829523502383973e-09, "loss": 1.4882, "step": 38003 }, { "epoch": 2.99, "learning_rate": 7.703751146037606e-09, "loss": 1.4801, "step": 38004 }, { "epoch": 2.99, "learning_rate": 7.578997154600308e-09, "loss": 1.3937, "step": 38005 }, { "epoch": 2.99, "learning_rate": 7.455261528921398e-09, "loss": 1.4379, "step": 38006 }, { "epoch": 2.99, "learning_rate": 7.3325442698668465e-09, "loss": 1.426, "step": 38007 }, { "epoch": 2.99, "learning_rate": 7.210845378236019e-09, "loss": 1.421, "step": 38008 }, { "epoch": 2.99, "learning_rate": 7.090164854878233e-09, "loss": 1.4281, "step": 38009 }, { "epoch": 2.99, "learning_rate": 6.9705027005928506e-09, "loss": 1.4262, "step": 38010 }, { "epoch": 2.99, "learning_rate": 6.851858916212538e-09, "loss": 1.4594, "step": 38011 }, { "epoch": 2.99, "learning_rate": 6.734233502536657e-09, "loss": 1.4774, "step": 38012 }, { "epoch": 2.99, "learning_rate": 6.617626460364567e-09, "loss": 1.4472, "step": 38013 }, { "epoch": 2.99, "learning_rate": 6.502037790495629e-09, "loss": 1.4285, "step": 38014 }, { "epoch": 2.99, "learning_rate": 6.387467493679244e-09, "loss": 1.4472, "step": 38015 }, { "epoch": 2.99, "learning_rate": 6.273915570731425e-09, "loss": 1.4322, "step": 38016 }, { "epoch": 2.99, "learning_rate": 6.1613820224182265e-09, "loss": 1.4273, "step": 38017 }, { "epoch": 2.99, "learning_rate": 6.049866849489049e-09, "loss": 1.3849, "step": 38018 }, { "epoch": 2.99, "learning_rate": 5.939370052709946e-09, "loss": 1.4195, "step": 38019 }, { "epoch": 2.99, "learning_rate": 5.829891632813666e-09, "loss": 1.4458, "step": 38020 }, { "epoch": 2.99, "learning_rate": 5.721431590582914e-09, "loss": 1.4901, "step": 38021 }, { "epoch": 2.99, "learning_rate": 5.613989926717133e-09, "loss": 1.4249, "step": 38022 }, { "epoch": 2.99, "learning_rate": 5.507566641949068e-09, "loss": 1.3829, "step": 38023 }, { "epoch": 2.99, "learning_rate": 5.402161737028121e-09, "loss": 1.3889, "step": 38024 }, { "epoch": 2.99, "learning_rate": 5.297775212637079e-09, "loss": 1.5098, "step": 38025 }, { "epoch": 2.99, "learning_rate": 5.194407069508688e-09, "loss": 1.4516, "step": 38026 }, { "epoch": 2.99, "learning_rate": 5.09205730834239e-09, "loss": 1.4932, "step": 38027 }, { "epoch": 2.99, "learning_rate": 4.990725929820971e-09, "loss": 1.452, "step": 38028 }, { "epoch": 2.99, "learning_rate": 4.890412934643873e-09, "loss": 1.4619, "step": 38029 }, { "epoch": 2.99, "learning_rate": 4.791118323477228e-09, "loss": 1.4159, "step": 38030 }, { "epoch": 2.99, "learning_rate": 4.692842097003824e-09, "loss": 1.463, "step": 38031 }, { "epoch": 2.99, "learning_rate": 4.5955842559064485e-09, "loss": 1.3856, "step": 38032 }, { "epoch": 2.99, "learning_rate": 4.499344800817928e-09, "loss": 1.485, "step": 38033 }, { "epoch": 2.99, "learning_rate": 4.404123732404397e-09, "loss": 1.4056, "step": 38034 }, { "epoch": 2.99, "learning_rate": 4.3099210513153345e-09, "loss": 1.4465, "step": 38035 }, { "epoch": 2.99, "learning_rate": 4.216736758200223e-09, "loss": 1.4484, "step": 38036 }, { "epoch": 2.99, "learning_rate": 4.124570853658582e-09, "loss": 1.4459, "step": 38037 }, { "epoch": 2.99, "learning_rate": 4.0334233383398914e-09, "loss": 1.4482, "step": 38038 }, { "epoch": 2.99, "learning_rate": 3.94329421287698e-09, "loss": 1.4513, "step": 38039 }, { "epoch": 2.99, "learning_rate": 3.854183477836059e-09, "loss": 1.4061, "step": 38040 }, { "epoch": 2.99, "learning_rate": 3.766091133866611e-09, "loss": 1.4005, "step": 38041 }, { "epoch": 2.99, "learning_rate": 3.6790171815515024e-09, "loss": 1.3993, "step": 38042 }, { "epoch": 2.99, "learning_rate": 3.5929616214902533e-09, "loss": 1.4311, "step": 38043 }, { "epoch": 2.99, "learning_rate": 3.507924454249078e-09, "loss": 1.4015, "step": 38044 }, { "epoch": 2.99, "learning_rate": 3.4239056804108435e-09, "loss": 1.4475, "step": 38045 }, { "epoch": 2.99, "learning_rate": 3.340905300541763e-09, "loss": 1.4553, "step": 38046 }, { "epoch": 2.99, "learning_rate": 3.258923315224704e-09, "loss": 1.4472, "step": 38047 }, { "epoch": 2.99, "learning_rate": 3.177959725009227e-09, "loss": 1.4285, "step": 38048 }, { "epoch": 2.99, "learning_rate": 3.0980145304282387e-09, "loss": 1.4256, "step": 38049 }, { "epoch": 2.99, "learning_rate": 3.0190877320479534e-09, "loss": 1.4341, "step": 38050 }, { "epoch": 2.99, "learning_rate": 2.941179330384624e-09, "loss": 1.3726, "step": 38051 }, { "epoch": 2.99, "learning_rate": 2.8642893259711585e-09, "loss": 1.4355, "step": 38052 }, { "epoch": 2.99, "learning_rate": 2.788417719340463e-09, "loss": 1.4111, "step": 38053 }, { "epoch": 2.99, "learning_rate": 2.713564511008792e-09, "loss": 1.4348, "step": 38054 }, { "epoch": 2.99, "learning_rate": 2.6397297014590923e-09, "loss": 1.4392, "step": 38055 }, { "epoch": 2.99, "learning_rate": 2.566913291224271e-09, "loss": 1.481, "step": 38056 }, { "epoch": 2.99, "learning_rate": 2.495115280770621e-09, "loss": 1.447, "step": 38057 }, { "epoch": 2.99, "learning_rate": 2.424335670614397e-09, "loss": 1.4176, "step": 38058 }, { "epoch": 2.99, "learning_rate": 2.354574461221892e-09, "loss": 1.4493, "step": 38059 }, { "epoch": 2.99, "learning_rate": 2.2858316530594e-09, "loss": 1.476, "step": 38060 }, { "epoch": 2.99, "learning_rate": 2.2181072465932147e-09, "loss": 1.4594, "step": 38061 }, { "epoch": 2.99, "learning_rate": 2.1514012423062833e-09, "loss": 1.4045, "step": 38062 }, { "epoch": 2.99, "learning_rate": 2.085713640631592e-09, "loss": 1.4645, "step": 38063 }, { "epoch": 2.99, "learning_rate": 2.021044442018782e-09, "loss": 1.4029, "step": 38064 }, { "epoch": 3.0, "learning_rate": 1.95739364690084e-09, "loss": 1.422, "step": 38065 }, { "epoch": 3.0, "learning_rate": 1.894761255710753e-09, "loss": 1.3974, "step": 38066 }, { "epoch": 3.0, "learning_rate": 1.8331472688981607e-09, "loss": 1.4811, "step": 38067 }, { "epoch": 3.0, "learning_rate": 1.772551686846091e-09, "loss": 1.4983, "step": 38068 }, { "epoch": 3.0, "learning_rate": 1.7129745099875302e-09, "loss": 1.4089, "step": 38069 }, { "epoch": 3.0, "learning_rate": 1.6544157387388124e-09, "loss": 1.4513, "step": 38070 }, { "epoch": 3.0, "learning_rate": 1.5968753734496575e-09, "loss": 1.4888, "step": 38071 }, { "epoch": 3.0, "learning_rate": 1.540353414569706e-09, "loss": 1.4227, "step": 38072 }, { "epoch": 3.0, "learning_rate": 1.4848498624320248e-09, "loss": 1.4201, "step": 38073 }, { "epoch": 3.0, "learning_rate": 1.4303647174529475e-09, "loss": 1.4273, "step": 38074 }, { "epoch": 3.0, "learning_rate": 1.3768979799821945e-09, "loss": 1.3795, "step": 38075 }, { "epoch": 3.0, "learning_rate": 1.324449650386139e-09, "loss": 1.4576, "step": 38076 }, { "epoch": 3.0, "learning_rate": 1.2730197290145016e-09, "loss": 1.4191, "step": 38077 }, { "epoch": 3.0, "learning_rate": 1.222608216233656e-09, "loss": 1.4711, "step": 38078 }, { "epoch": 3.0, "learning_rate": 1.1732151123600153e-09, "loss": 1.4533, "step": 38079 }, { "epoch": 3.0, "learning_rate": 1.1248404177599536e-09, "loss": 1.4689, "step": 38080 }, { "epoch": 3.0, "learning_rate": 1.0774841327332306e-09, "loss": 1.4377, "step": 38081 }, { "epoch": 3.0, "learning_rate": 1.0311462576295671e-09, "loss": 1.4845, "step": 38082 }, { "epoch": 3.0, "learning_rate": 9.858267927320695e-10, "loss": 1.4464, "step": 38083 }, { "epoch": 3.0, "learning_rate": 9.41525738373805e-10, "loss": 1.3995, "step": 38084 }, { "epoch": 3.0, "learning_rate": 8.982430948378805e-10, "loss": 1.4929, "step": 38085 }, { "epoch": 3.0, "learning_rate": 8.559788624407094e-10, "loss": 1.4295, "step": 38086 }, { "epoch": 3.0, "learning_rate": 8.147330414320918e-10, "loss": 1.4512, "step": 38087 }, { "epoch": 3.0, "learning_rate": 7.745056321450948e-10, "loss": 1.4853, "step": 38088 }, { "epoch": 3.0, "learning_rate": 7.352966347962119e-10, "loss": 1.4643, "step": 38089 }, { "epoch": 3.0, "learning_rate": 6.971060496852033e-10, "loss": 1.4783, "step": 38090 }, { "epoch": 3.0, "learning_rate": 6.599338770785223e-10, "loss": 1.4419, "step": 38091 }, { "epoch": 3.0, "learning_rate": 6.237801171926626e-10, "loss": 1.4038, "step": 38092 }, { "epoch": 3.0, "learning_rate": 5.886447703107311e-10, "loss": 1.4419, "step": 38093 }, { "epoch": 3.0, "learning_rate": 5.545278366492211e-10, "loss": 1.4464, "step": 38094 }, { "epoch": 3.0, "learning_rate": 5.214293164579331e-10, "loss": 1.4558, "step": 38095 }, { "epoch": 3.0, "learning_rate": 4.893492099367069e-10, "loss": 1.3968, "step": 38096 }, { "epoch": 3.0, "learning_rate": 4.582875173186895e-10, "loss": 1.4312, "step": 38097 }, { "epoch": 3.0, "learning_rate": 4.2824423880372104e-10, "loss": 1.3819, "step": 38098 }, { "epoch": 3.0, "learning_rate": 3.9921937462494835e-10, "loss": 1.4538, "step": 38099 }, { "epoch": 3.0, "learning_rate": 3.7121292493225153e-10, "loss": 1.5402, "step": 38100 }, { "epoch": 3.0, "learning_rate": 3.442248899587774e-10, "loss": 1.4314, "step": 38101 }, { "epoch": 3.0, "learning_rate": 3.182552698710594e-10, "loss": 1.4789, "step": 38102 }, { "epoch": 3.0, "learning_rate": 2.9330406485228444e-10, "loss": 1.4952, "step": 38103 }, { "epoch": 3.0, "learning_rate": 2.693712750523325e-10, "loss": 1.4511, "step": 38104 }, { "epoch": 3.0, "learning_rate": 2.464569006543904e-10, "loss": 1.4643, "step": 38105 }, { "epoch": 3.0, "learning_rate": 2.2456094180833828e-10, "loss": 1.4974, "step": 38106 }, { "epoch": 3.0, "learning_rate": 2.036833986474029e-10, "loss": 1.425, "step": 38107 }, { "epoch": 3.0, "learning_rate": 1.8382427133811773e-10, "loss": 1.4331, "step": 38108 }, { "epoch": 3.0, "learning_rate": 1.6498355999705614e-10, "loss": 1.4042, "step": 38109 }, { "epoch": 3.0, "learning_rate": 1.4716126477409828e-10, "loss": 1.4844, "step": 38110 }, { "epoch": 3.0, "learning_rate": 1.3035738575251088e-10, "loss": 1.4571, "step": 38111 }, { "epoch": 3.0, "learning_rate": 1.14571923082174e-10, "loss": 1.4909, "step": 38112 }, { "epoch": 3.0, "learning_rate": 9.980487686300776e-11, "loss": 1.4658, "step": 38113 }, { "epoch": 3.0, "learning_rate": 8.605624717827886e-11, "loss": 1.4182, "step": 38114 }, { "epoch": 3.0, "learning_rate": 7.332603412790738e-11, "loss": 1.4711, "step": 38115 }, { "epoch": 3.0, "learning_rate": 6.161423781181341e-11, "loss": 1.4193, "step": 38116 }, { "epoch": 3.0, "learning_rate": 5.0920858313263645e-11, "loss": 1.4367, "step": 38117 }, { "epoch": 3.0, "learning_rate": 4.12458956655648e-11, "loss": 1.4355, "step": 38118 }, { "epoch": 3.0, "learning_rate": 3.258934998529028e-11, "loss": 1.482, "step": 38119 }, { "epoch": 3.0, "learning_rate": 2.495122128909344e-11, "loss": 1.4803, "step": 38120 }, { "epoch": 3.0, "learning_rate": 1.8331509660240994e-11, "loss": 1.4884, "step": 38121 }, { "epoch": 3.0, "learning_rate": 1.27302151153863e-11, "loss": 1.4714, "step": 38122 }, { "epoch": 3.0, "learning_rate": 8.147337721142733e-12, "loss": 1.3664, "step": 38123 }, { "epoch": 3.0, "learning_rate": 4.582877477510294e-12, "loss": 1.4175, "step": 38124 }, { "epoch": 3.0, "learning_rate": 2.036834451102365e-12, "loss": 1.4506, "step": 38125 }, { "epoch": 3.0, "learning_rate": 5.092086086122549e-13, "loss": 1.424, "step": 38126 }, { "epoch": 3.0, "learning_rate": 0.0, "loss": 1.4081, "step": 38127 }, { "epoch": 3.0, "step": 38127, "total_flos": 2.6896453959942144e+16, "train_loss": 1.6263817286927247, "train_runtime": 649257.4466, "train_samples_per_second": 60.135, "train_steps_per_second": 0.059 } ], "logging_steps": 1.0, "max_steps": 38127, "num_input_tokens_seen": 0, "num_train_epochs": 3, "save_steps": 500, "total_flos": 2.6896453959942144e+16, "train_batch_size": 64, "trial_name": null, "trial_params": null }